From 267bec31f3ef96665e534220334a97c42ae64b18 Mon Sep 17 00:00:00 2001 From: Misipuk Date: Sun, 25 May 2025 10:57:24 +0200 Subject: [PATCH 01/14] adapting iwae to the new code --- .../conv15_sigma_0.01_kl_0.01_lr_0.1.yaml | 63 ++++++++++ core/objective/IWAEObjective.py | 113 ++++++++++++++++++ core/training.py | 32 +++-- scripts/utils/factory/ObjectiveFactory.py | 2 + 4 files changed, 203 insertions(+), 7 deletions(-) create mode 100644 config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1.yaml create mode 100644 core/objective/IWAEObjective.py diff --git a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1.yaml b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1.yaml new file mode 100644 index 0000000..3bb3103 --- /dev/null +++ b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1.yaml @@ -0,0 +1,63 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: iwae # adapted + params: + delta: 0.025 + kl_penalty: 1.0 + prior_objective: + name: iwae # adapted + params: + delta: 0.025 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 3000 # adapted +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 # adapted + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0005 # adapted + momentum: 0.95 + seed: 1135 +sigma: 0.01 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 diff --git a/core/objective/IWAEObjective.py b/core/objective/IWAEObjective.py new file mode 100644 index 0000000..e7ce0ee --- /dev/null +++ b/core/objective/IWAEObjective.py @@ -0,0 +1,113 @@ +import logging, math +from typing import Dict, Optional + +import torch, torch.distributions as dists, wandb +from torch import nn, Tensor + +from core.model import bounded_call +from core.layer.utils import get_torch_layers +from core.objective import AbstractObjective + + +class IWAEObjective(AbstractObjective): + def __init__(self, kl_penalty: float, n: int, temperature: float = 1.0) -> None: + self.kl_penalty = kl_penalty # usually 1 / |D| + self.temperature = temperature + + # -------- helpers to compute log p(w) and log q(w) ------------------- + @staticmethod + def _log_prior(model: nn.Module, eps: float = 1e-6) -> Tensor: + device = next(model.parameters()).device + dtype = next(model.parameters()).dtype + s = torch.zeros(1, device=device, dtype=dtype) + + for _, l in get_torch_layers(model): + s += dists.Normal(l._prior_weight_dist.mu, + l._prior_weight_dist.sigma + eps + ).log_prob(l._sampled_weight).sum() + s += dists.Normal(l._prior_bias_dist.mu, + l._prior_bias_dist.sigma + eps + ).log_prob(l._sampled_bias).sum() + return s + + @staticmethod + def _log_post(model: nn.Module, eps: float = 1e-6) -> Tensor: + device = next(model.parameters()).device + dtype = next(model.parameters()).dtype + s = torch.zeros(1, device=device, dtype=dtype) + + for _, l in get_torch_layers(model): + s += dists.Normal(l._weight_dist.mu, + l._weight_dist.sigma + eps + ).log_prob(l._sampled_weight).sum() + s += dists.Normal(l._bias_dist.mu, + l._bias_dist.sigma + eps + ).log_prob(l._sampled_bias).sum() + return s + + # -------------------------------------------------------------------- + def calculate( + self, + model: nn.Module, + data: Tensor, + target: Tensor, + epoch: int, + batch_idx: int, + dataset_size: int, + pmin: Optional[float] = None, + wandb_params: Optional[Dict] = None, + ) -> Tensor: + + + batch_size = data.size(0) + scale = dataset_size / batch_size # N / |B| + log_ws = [] # list[k] of scalars + + kl_pen = 1 / dataset_size + temp = 1.0 + self.k = 20 + + for l in range(self.k): + # sample w and compute log p(x|w) + logits = bounded_call(model, data, pmin) if pmin is not None else model(data) + + if torch.isnan(logits).any() or torch.isinf(logits).any(): + logging.warning(f"NaN/Inf in logits at epoch {epoch}, batch {batch_idx}") + logits = torch.where(torch.isfinite(logits), logits, torch.zeros_like(logits)) + + log_px = dists.Categorical(logits=logits).log_prob(target) # (batch,) + log_lik = scale * log_px.sum() # scalar + + # global KL part + kl = (self._log_prior(model) - self._log_post(model)) * kl_pen + log_w = log_lik + temp * kl # scalar + log_ws.append(log_w) + + # -------------------- per-sample logging -------------------- + if wandb_params and wandb_params.get("log_wandb", False): + tag = wandb_params["name_wandb"] + wandb.log({ + f"{tag}/epoch": epoch, + f"{tag}/batch": batch_idx, + f"{tag}/sample": l, + f"{tag}/log_likelihood": log_lik.detach(), + f"{tag}/kl": kl.detach(), + f"{tag}/log_weight": log_w.detach(), + }) + + # ----------- PB-IWAE loss (one scalar) --------------------------- + log_ws_tensor = torch.stack(log_ws) # (k,) + loss = -(torch.logsumexp(log_ws_tensor, dim=0) - math.log(self.k)) + + # ----------- final logging -------------------------------------- + if wandb_params and wandb_params.get("log_wandb", False): + wandb.log({f"{wandb_params['name_wandb']}/iwae_loss": loss}) + + if batch_idx == 0: + logging.info( + f"[Epoch {epoch:03d} | Batch {batch_idx:04d}] " + f"IWAE-loss {loss.item():.4f} " + f"| mean log_px {(log_px.mean()).item():.4f} " + f"| KL {kl.item():.2f}" + ) + return loss diff --git a/core/training.py b/core/training.py index e5ed2cb..507f2a6 100644 --- a/core/training.py +++ b/core/training.py @@ -8,7 +8,7 @@ import wandb from core.distribution.utils import DistributionT, compute_kl from core.model import bounded_call -from core.objective import AbstractObjective +from core.objective import AbstractObjective, IWAEObjective def __raise_exception_on_invalid_value(value: torch.Tensor): @@ -75,9 +75,13 @@ def train( None: The model (and its posterior) are updated in-place over the specified epochs. """ criterion = torch.nn.NLLLoss() - optimizer = torch.optim.SGD( - model.parameters(), lr=parameters["lr"], momentum=parameters["momentum"] - ) + #optimizer = torch.optim.SGD( + # model.parameters(), lr=parameters["lr"], momentum=parameters["momentum"] + #) + + optimizer = torch.optim.Adam(model.parameters(), + lr=parameters['lr']) + dataset_size = len(train_loader.dataset) if "seed" in parameters: torch.manual_seed(parameters["seed"]) @@ -89,11 +93,25 @@ def train( output = bounded_call(model, data, parameters["pmin"]) else: output = model(data) - kl = compute_kl(posterior, prior) - loss = criterion(output, target) - objective_value = objective.calculate(loss, kl, parameters["num_samples"]) + if isinstance(objective, IWAEObjective): + objective_value = objective.calculate(model, + data, + target, + epoch=epoch, + batch_idx=_i, + dataset_size=dataset_size, + pmin=parameters.get('pmin', None), + wandb_params=wandb_params) + with torch.no_grad(): + loss = criterion(model(data), target) + kl = compute_kl(posterior, prior) + else: + kl = compute_kl(posterior, prior) + loss = criterion(output, target) + objective_value = objective.calculate(loss, kl, parameters["num_samples"]) __raise_exception_on_invalid_value(objective_value) objective_value.backward() + torch.nn.utils.clip_grad_norm_(model.parameters(), max_norm=5.0) optimizer.step() logging.info( f"Epoch: {epoch}, Objective: {objective_value}, Loss: {loss}, KL/n: {kl / parameters['num_samples']}" diff --git a/scripts/utils/factory/ObjectiveFactory.py b/scripts/utils/factory/ObjectiveFactory.py index 59e6aad..7c187a8 100644 --- a/scripts/utils/factory/ObjectiveFactory.py +++ b/scripts/utils/factory/ObjectiveFactory.py @@ -5,6 +5,7 @@ FQuadObjective, McAllesterObjective, TolstikhinObjective, + IWAEObjective ) from scripts.utils.factory import AbstractFactory @@ -17,3 +18,4 @@ def __init__(self) -> None: self.register_creator("fquad", FQuadObjective) self.register_creator("mcallester", McAllesterObjective) self.register_creator("tolstikhin", TolstikhinObjective) + self.register_creator("iwae", IWAEObjective) From 53ba96434a2383011c30a1e5a00d6388fbdd0dcf Mon Sep 17 00:00:00 2001 From: Misipuk Date: Sun, 25 May 2025 17:49:43 +0200 Subject: [PATCH 02/14] added new configs --- ...onv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml} | 15 +++-- ...conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml | 62 +++++++++++++++++++ core/objective/IWAEObjective.py | 10 +-- 3 files changed, 75 insertions(+), 12 deletions(-) rename config/iwae_test_configs/{conv15_sigma_0.01_kl_0.01_lr_0.1.yaml => conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml} (82%) create mode 100644 config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml diff --git a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1.yaml b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml similarity index 82% rename from config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1.yaml rename to config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml index 3bb3103..0f617c5 100644 --- a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1.yaml +++ b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml @@ -26,28 +26,27 @@ factory: dataset: cifar10 in_channels: 3 posterior_objective: - name: iwae # adapted + name: bbb params: - delta: 0.025 kl_penalty: 1.0 prior_objective: - name: iwae # adapted + name: iwae params: - delta: 0.025 + n: 10 kl_penalty: 0.01 log_wandb: true -mcsamples: 3000 # adapted +mcsamples: 3000 pmin: 5.0e-05 posterior: training: epochs: 1 - lr: 0.0001 # adapted + lr: 0.0001 momentum: 0.9 seed: 1135 prior: training: epochs: 100 - lr: 0.0005 # adapted + lr: 0.0005 momentum: 0.95 seed: 1135 sigma: 0.01 @@ -60,4 +59,4 @@ split_strategy: prior_type: learnt self_certified: true train_percent: 1.0 - val_percent: 0.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml new file mode 100644 index 0000000..50eb546 --- /dev/null +++ b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 20 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 3000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0005 + momentum: 0.95 + seed: 1135 +sigma: 0.01 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/core/objective/IWAEObjective.py b/core/objective/IWAEObjective.py index e7ce0ee..5e972bb 100644 --- a/core/objective/IWAEObjective.py +++ b/core/objective/IWAEObjective.py @@ -13,6 +13,9 @@ class IWAEObjective(AbstractObjective): def __init__(self, kl_penalty: float, n: int, temperature: float = 1.0) -> None: self.kl_penalty = kl_penalty # usually 1 / |D| self.temperature = temperature + self.k=n + print(self.temperature) + print(self.k) # -------- helpers to compute log p(w) and log q(w) ------------------- @staticmethod @@ -63,9 +66,8 @@ def calculate( scale = dataset_size / batch_size # N / |B| log_ws = [] # list[k] of scalars - kl_pen = 1 / dataset_size - temp = 1.0 - self.k = 20 + temp = self.temperature + # self.k = 20 for l in range(self.k): # sample w and compute log p(x|w) @@ -79,7 +81,7 @@ def calculate( log_lik = scale * log_px.sum() # scalar # global KL part - kl = (self._log_prior(model) - self._log_post(model)) * kl_pen + kl = self._log_prior(model) - self._log_post(model) log_w = log_lik + temp * kl # scalar log_ws.append(log_w) From 7a94253b0a20e4a39e7450c6c19af5dbe266610b Mon Sep 17 00:00:00 2001 From: Misipuk Date: Sun, 25 May 2025 18:12:42 +0200 Subject: [PATCH 03/14] fixed init --- core/objective/__init__.py | 1 + 1 file changed, 1 insertion(+) diff --git a/core/objective/__init__.py b/core/objective/__init__.py index 6ff21a5..d909d87 100644 --- a/core/objective/__init__.py +++ b/core/objective/__init__.py @@ -17,3 +17,4 @@ from core.objective.FQuadObjective import FQuadObjective from core.objective.McAllesterObjective import McAllesterObjective from core.objective.TolstikhinObjective import TolstikhinObjective +from core.objective.IWAEObjective import IWAEObjective From cd38adc1584d5e022349f10a2e5e41b111d566f7 Mon Sep 17 00:00:00 2001 From: Misipuk Date: Sun, 25 May 2025 18:28:45 +0200 Subject: [PATCH 04/14] added inner vars for prob layer --- core/layer/AbstractProbLayer.py | 6 +++++- 1 file changed, 5 insertions(+), 1 deletion(-) diff --git a/core/layer/AbstractProbLayer.py b/core/layer/AbstractProbLayer.py index fbc9bd0..407c6f2 100644 --- a/core/layer/AbstractProbLayer.py +++ b/core/layer/AbstractProbLayer.py @@ -19,6 +19,8 @@ class AbstractProbLayer(nn.Module, ABC): _bias_dist: AbstractVariable _prior_weight_dist: AbstractVariable _prior_bias_dist: AbstractVariable + _sampled_weight: Tensor + _sampled_bias: Tensor def probabilistic(self, mode: bool = True): """ @@ -64,4 +66,6 @@ def sample_from_distribution(self) -> tuple[Tensor, Tensor]: sampled_bias = self._bias_dist.mu if self._bias_dist else None else: raise ValueError("Only training with probabilistic mode is allowed") - return sampled_weight, sampled_bias + self._sampled_weight = sampled_weight + self._sampled_bias = sampled_bias + return sampled_weight, sampled_bias \ No newline at end of file From 97b6e4d34d4e70f713753a930ec20b201db31f96 Mon Sep 17 00:00:00 2001 From: Misipuk Date: Sun, 25 May 2025 18:59:53 +0200 Subject: [PATCH 05/14] adding beta --- .../conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml | 2 +- .../conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml | 2 +- core/objective/IWAEObjective.py | 4 ++-- 3 files changed, 4 insertions(+), 4 deletions(-) diff --git a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml index 0f617c5..4708058 100644 --- a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml +++ b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml @@ -49,7 +49,7 @@ prior: lr: 0.0005 momentum: 0.95 seed: 1135 -sigma: 0.01 +sigma: 0.005 split_config: batch_size: 250 dataset_loader_seed: 112 diff --git a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml index 50eb546..042b1a7 100644 --- a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml +++ b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml @@ -49,7 +49,7 @@ prior: lr: 0.0005 momentum: 0.95 seed: 1135 -sigma: 0.01 +sigma: 0.005 split_config: batch_size: 250 dataset_loader_seed: 112 diff --git a/core/objective/IWAEObjective.py b/core/objective/IWAEObjective.py index 5e972bb..27f5dc9 100644 --- a/core/objective/IWAEObjective.py +++ b/core/objective/IWAEObjective.py @@ -67,7 +67,7 @@ def calculate( log_ws = [] # list[k] of scalars temp = self.temperature - # self.k = 20 + beta = min(1.0, epoch / 20) for l in range(self.k): # sample w and compute log p(x|w) @@ -81,7 +81,7 @@ def calculate( log_lik = scale * log_px.sum() # scalar # global KL part - kl = self._log_prior(model) - self._log_post(model) + kl = beta * (self._log_prior(model) - self._log_post(model)) log_w = log_lik + temp * kl # scalar log_ws.append(log_w) From 534e9d212f5258a5be1f93b267df29dfd9048919 Mon Sep 17 00:00:00 2001 From: Misipuk Date: Sun, 25 May 2025 19:20:13 +0200 Subject: [PATCH 06/14] fix --- core/objective/IWAEObjective.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/core/objective/IWAEObjective.py b/core/objective/IWAEObjective.py index 27f5dc9..5664bad 100644 --- a/core/objective/IWAEObjective.py +++ b/core/objective/IWAEObjective.py @@ -67,7 +67,7 @@ def calculate( log_ws = [] # list[k] of scalars temp = self.temperature - beta = min(1.0, epoch / 20) + beta = min(1.0, (epoch / 40) ** 2) for l in range(self.k): # sample w and compute log p(x|w) From cdb89cbee6a4b02e98184a46b4688ea8512a4984 Mon Sep 17 00:00:00 2001 From: Misipuk Date: Sun, 25 May 2025 20:48:48 +0200 Subject: [PATCH 07/14] hyp fixes --- .../conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml | 2 +- .../conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml | 2 +- core/objective/IWAEObjective.py | 2 +- 3 files changed, 3 insertions(+), 3 deletions(-) diff --git a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml index 4708058..89ad595 100644 --- a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml +++ b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_10.yaml @@ -46,7 +46,7 @@ posterior: prior: training: epochs: 100 - lr: 0.0005 + lr: 0.0001 momentum: 0.95 seed: 1135 sigma: 0.005 diff --git a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml index 042b1a7..5fc4dc6 100644 --- a/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml +++ b/config/iwae_test_configs/conv15_sigma_0.01_kl_0.01_lr_0.1_n_20.yaml @@ -46,7 +46,7 @@ posterior: prior: training: epochs: 100 - lr: 0.0005 + lr: 0.0001 momentum: 0.95 seed: 1135 sigma: 0.005 diff --git a/core/objective/IWAEObjective.py b/core/objective/IWAEObjective.py index 5664bad..3f478d4 100644 --- a/core/objective/IWAEObjective.py +++ b/core/objective/IWAEObjective.py @@ -67,7 +67,7 @@ def calculate( log_ws = [] # list[k] of scalars temp = self.temperature - beta = min(1.0, (epoch / 40) ** 2) + beta = min(1.0, (epoch / 70) ** 2) for l in range(self.k): # sample w and compute log p(x|w) From 1c884a6ba4fed6d9c0ad51b327c2f81bd93b8a54 Mon Sep 17 00:00:00 2001 From: yauhenii Date: Sun, 25 May 2025 22:03:21 +0200 Subject: [PATCH 08/14] add mnist iwae --- config/iwae_test_configs_mnist/test_conv.yaml | 62 ++++++++++++++++++ config/iwae_test_configs_mnist/test_nn.yaml | 63 +++++++++++++++++++ core/objective/IWAEObjective.py | 25 ++++---- scripts/generic_train.py | 24 +++---- 4 files changed, 149 insertions(+), 25 deletions(-) create mode 100644 config/iwae_test_configs_mnist/test_conv.yaml create mode 100644 config/iwae_test_configs_mnist/test_nn.yaml diff --git a/config/iwae_test_configs_mnist/test_conv.yaml b/config/iwae_test_configs_mnist/test_conv.yaml new file mode 100644 index 0000000..0746c1f --- /dev/null +++ b/config/iwae_test_configs_mnist/test_conv.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv + params: + dataset: mnist + in_channels: 1 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.01 +log_wandb: false +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 25 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 10 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_nn.yaml b/config/iwae_test_configs_mnist/test_nn.yaml new file mode 100644 index 0000000..af2fa98 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_nn.yaml @@ -0,0 +1,63 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: nn + params: + input_dim: 784 + hidden_dim: 100 + output_dim: 10 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.01 +log_wandb: false +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 25 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/core/objective/IWAEObjective.py b/core/objective/IWAEObjective.py index 3f478d4..f0d5797 100644 --- a/core/objective/IWAEObjective.py +++ b/core/objective/IWAEObjective.py @@ -13,9 +13,9 @@ class IWAEObjective(AbstractObjective): def __init__(self, kl_penalty: float, n: int, temperature: float = 1.0) -> None: self.kl_penalty = kl_penalty # usually 1 / |D| self.temperature = temperature - self.k=n - print(self.temperature) - print(self.k) + self.k = n + logging.debug(f"IWAE temperature {self.temperature}") + logging.debug(f"IWAE k {self.k}") # -------- helpers to compute log p(w) and log q(w) ------------------- @staticmethod @@ -61,7 +61,6 @@ def calculate( wandb_params: Optional[Dict] = None, ) -> Tensor: - batch_size = data.size(0) scale = dataset_size / batch_size # N / |B| log_ws = [] # list[k] of scalars @@ -86,7 +85,7 @@ def calculate( log_ws.append(log_w) # -------------------- per-sample logging -------------------- - if wandb_params and wandb_params.get("log_wandb", False): + if wandb_params and wandb_params.get("log_wandb", False) and False: tag = wandb_params["name_wandb"] wandb.log({ f"{tag}/epoch": epoch, @@ -96,20 +95,20 @@ def calculate( f"{tag}/kl": kl.detach(), f"{tag}/log_weight": log_w.detach(), }) + # logging.info(f"[Inner Log] Epoch {epoch}, Batch {batch_idx}, Sample {l} | log_lik={log_lik.item():.4f}, kl={kl.item():.4f}, log_w={log_w.item():.4f}") # ----------- PB-IWAE loss (one scalar) --------------------------- log_ws_tensor = torch.stack(log_ws) # (k,) loss = -(torch.logsumexp(log_ws_tensor, dim=0) - math.log(self.k)) # ----------- final logging -------------------------------------- - if wandb_params and wandb_params.get("log_wandb", False): + if wandb_params and wandb_params.get("log_wandb", False) and False: wandb.log({f"{wandb_params['name_wandb']}/iwae_loss": loss}) - if batch_idx == 0: - logging.info( - f"[Epoch {epoch:03d} | Batch {batch_idx:04d}] " - f"IWAE-loss {loss.item():.4f} " - f"| mean log_px {(log_px.mean()).item():.4f} " - f"| KL {kl.item():.2f}" - ) + logging.info( + f"[Epoch {epoch:03d} | Batch {batch_idx:04d}] " + f"IWAE-loss {loss.item():.4f} " + f"| mean log_px {(log_px.mean()).item():.4f} " + f"| KL {kl.item():.2f}" + ) return loss diff --git a/scripts/generic_train.py b/scripts/generic_train.py index fe2082d..712c8fa 100644 --- a/scripts/generic_train.py +++ b/scripts/generic_train.py @@ -136,18 +136,18 @@ def main(config: dict, config_path: str): }, ) - _ = certify_risk( - model=model, - bounds=bounds, - losses=losses, - posterior=prior, - prior=prior_prior, - bound_loader=strategy.bound_loader, - num_samples_loss=config["mcsamples"], - device=device, - pmin=config["pmin"], - wandb_params={"log_wandb": config["log_wandb"], "name_wandb": "Prior Bound"}, - ) + # _ = certify_risk( + # model=model, + # bounds=bounds, + # losses=losses, + # posterior=prior, + # prior=prior_prior, + # bound_loader=strategy.bound_loader, + # num_samples_loss=config["mcsamples"], + # device=device, + # pmin=config["pmin"], + # wandb_params={"log_wandb": config["log_wandb"], "name_wandb": "Prior Bound"}, + # ) posterior_prior = from_copy( dist=prior, distribution=GaussianVariable, requires_grad=False From c50413fa5aa4e4c49d6bcae42395fd01c3a4474e Mon Sep 17 00:00:00 2001 From: yauhenii Date: Sun, 25 May 2025 22:07:13 +0200 Subject: [PATCH 09/14] log wandb --- config/iwae_test_configs_mnist/test_conv.yaml | 2 +- config/iwae_test_configs_mnist/test_nn.yaml | 2 +- core/objective/IWAEObjective.py | 13 +++++++------ 3 files changed, 9 insertions(+), 8 deletions(-) diff --git a/config/iwae_test_configs_mnist/test_conv.yaml b/config/iwae_test_configs_mnist/test_conv.yaml index 0746c1f..24b040a 100644 --- a/config/iwae_test_configs_mnist/test_conv.yaml +++ b/config/iwae_test_configs_mnist/test_conv.yaml @@ -34,7 +34,7 @@ factory: params: n: 10 kl_penalty: 0.01 -log_wandb: false +log_wandb: true mcsamples: 1000 pmin: 5.0e-05 posterior: diff --git a/config/iwae_test_configs_mnist/test_nn.yaml b/config/iwae_test_configs_mnist/test_nn.yaml index af2fa98..0e6795a 100644 --- a/config/iwae_test_configs_mnist/test_nn.yaml +++ b/config/iwae_test_configs_mnist/test_nn.yaml @@ -35,7 +35,7 @@ factory: params: n: 10 kl_penalty: 0.01 -log_wandb: false +log_wandb: true mcsamples: 1000 pmin: 5.0e-05 posterior: diff --git a/core/objective/IWAEObjective.py b/core/objective/IWAEObjective.py index f0d5797..539a781 100644 --- a/core/objective/IWAEObjective.py +++ b/core/objective/IWAEObjective.py @@ -105,10 +105,11 @@ def calculate( if wandb_params and wandb_params.get("log_wandb", False) and False: wandb.log({f"{wandb_params['name_wandb']}/iwae_loss": loss}) - logging.info( - f"[Epoch {epoch:03d} | Batch {batch_idx:04d}] " - f"IWAE-loss {loss.item():.4f} " - f"| mean log_px {(log_px.mean()).item():.4f} " - f"| KL {kl.item():.2f}" - ) + if batch_idx % 50 == 0: + logging.info( + f"[Epoch {epoch:03d} | Batch {batch_idx:04d}] " + f"IWAE-loss {loss.item():.4f} " + f"| mean log_px {(log_px.mean()).item():.4f} " + f"| KL {kl.item():.2f}" + ) return loss From 5874bdbe6c598cf746d07495d28d2575b298e190 Mon Sep 17 00:00:00 2001 From: yauhenii Date: Sun, 25 May 2025 22:36:05 +0200 Subject: [PATCH 10/14] add experiments --- .../test_conv_100.yaml | 62 ++++++++++++++++++ .../test_conv_100_3.yaml | 62 ++++++++++++++++++ .../test_conv_100_bbb.yaml | 61 ++++++++++++++++++ .../test_conv_100_n_1.yaml | 62 ++++++++++++++++++ .../{test_conv.yaml => test_conv_25.yaml} | 4 +- .../iwae_test_configs_mnist/test_conv_70.yaml | 62 ++++++++++++++++++ .../test_conv_best.yaml | 61 ++++++++++++++++++ .../iwae_test_configs_mnist/test_nn_100.yaml | 63 +++++++++++++++++++ .../test_nn_100_3.yaml | 63 +++++++++++++++++++ .../test_nn_100_bbb.yaml | 62 ++++++++++++++++++ .../test_nn_100_like_best.yaml | 63 +++++++++++++++++++ .../test_nn_100_n_1.yaml | 63 +++++++++++++++++++ .../{test_nn.yaml => test_nn_25.yaml} | 0 .../iwae_test_configs_mnist/test_nn_70.yaml | 63 +++++++++++++++++++ .../iwae_test_configs_mnist/test_nn_best.yaml | 62 ++++++++++++++++++ scripts/generic_train.py | 2 +- 16 files changed, 812 insertions(+), 3 deletions(-) create mode 100644 config/iwae_test_configs_mnist/test_conv_100.yaml create mode 100644 config/iwae_test_configs_mnist/test_conv_100_3.yaml create mode 100644 config/iwae_test_configs_mnist/test_conv_100_bbb.yaml create mode 100644 config/iwae_test_configs_mnist/test_conv_100_n_1.yaml rename config/iwae_test_configs_mnist/{test_conv.yaml => test_conv_25.yaml} (98%) create mode 100644 config/iwae_test_configs_mnist/test_conv_70.yaml create mode 100644 config/iwae_test_configs_mnist/test_conv_best.yaml create mode 100644 config/iwae_test_configs_mnist/test_nn_100.yaml create mode 100644 config/iwae_test_configs_mnist/test_nn_100_3.yaml create mode 100644 config/iwae_test_configs_mnist/test_nn_100_bbb.yaml create mode 100644 config/iwae_test_configs_mnist/test_nn_100_like_best.yaml create mode 100644 config/iwae_test_configs_mnist/test_nn_100_n_1.yaml rename config/iwae_test_configs_mnist/{test_nn.yaml => test_nn_25.yaml} (100%) create mode 100644 config/iwae_test_configs_mnist/test_nn_70.yaml create mode 100644 config/iwae_test_configs_mnist/test_nn_best.yaml diff --git a/config/iwae_test_configs_mnist/test_conv_100.yaml b/config/iwae_test_configs_mnist/test_conv_100.yaml new file mode 100644 index 0000000..045602f --- /dev/null +++ b/config/iwae_test_configs_mnist/test_conv_100.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv + params: + dataset: mnist + in_channels: 1 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_conv_100_3.yaml b/config/iwae_test_configs_mnist/test_conv_100_3.yaml new file mode 100644 index 0000000..1334bd5 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_conv_100_3.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv + params: + dataset: mnist + in_channels: 1 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 3 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_conv_100_bbb.yaml b/config/iwae_test_configs_mnist/test_conv_100_bbb.yaml new file mode 100644 index 0000000..56ce9c4 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_conv_100_bbb.yaml @@ -0,0 +1,61 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv + params: + dataset: mnist + in_channels: 1 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: bbb + params: + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_conv_100_n_1.yaml b/config/iwae_test_configs_mnist/test_conv_100_n_1.yaml new file mode 100644 index 0000000..2c0081a --- /dev/null +++ b/config/iwae_test_configs_mnist/test_conv_100_n_1.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv + params: + dataset: mnist + in_channels: 1 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 1 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_conv.yaml b/config/iwae_test_configs_mnist/test_conv_25.yaml similarity index 98% rename from config/iwae_test_configs_mnist/test_conv.yaml rename to config/iwae_test_configs_mnist/test_conv_25.yaml index 24b040a..98880a0 100644 --- a/config/iwae_test_configs_mnist/test_conv.yaml +++ b/config/iwae_test_configs_mnist/test_conv_25.yaml @@ -39,13 +39,13 @@ mcsamples: 1000 pmin: 5.0e-05 posterior: training: - epochs: 25 + epochs: 1 lr: 0.0001 momentum: 0.9 seed: 1135 prior: training: - epochs: 10 + epochs: 25 lr: 0.0001 momentum: 0.95 seed: 1135 diff --git a/config/iwae_test_configs_mnist/test_conv_70.yaml b/config/iwae_test_configs_mnist/test_conv_70.yaml new file mode 100644 index 0000000..d9b5617 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_conv_70.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv + params: + dataset: mnist + in_channels: 1 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 70 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_conv_best.yaml b/config/iwae_test_configs_mnist/test_conv_best.yaml new file mode 100644 index 0000000..2105be3 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_conv_best.yaml @@ -0,0 +1,61 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv + params: + dataset: mnist + in_channels: 1 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: bbb + params: + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.001 + momentum: 0.95 + seed: 1135 +sigma: 0.01 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_nn_100.yaml b/config/iwae_test_configs_mnist/test_nn_100.yaml new file mode 100644 index 0000000..ccecc94 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_nn_100.yaml @@ -0,0 +1,63 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: nn + params: + input_dim: 784 + hidden_dim: 100 + output_dim: 10 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_nn_100_3.yaml b/config/iwae_test_configs_mnist/test_nn_100_3.yaml new file mode 100644 index 0000000..ccecc94 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_nn_100_3.yaml @@ -0,0 +1,63 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: nn + params: + input_dim: 784 + hidden_dim: 100 + output_dim: 10 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_nn_100_bbb.yaml b/config/iwae_test_configs_mnist/test_nn_100_bbb.yaml new file mode 100644 index 0000000..edfbc77 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_nn_100_bbb.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: nn + params: + input_dim: 784 + hidden_dim: 100 + output_dim: 10 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: bbb + params: + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_nn_100_like_best.yaml b/config/iwae_test_configs_mnist/test_nn_100_like_best.yaml new file mode 100644 index 0000000..ccecc94 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_nn_100_like_best.yaml @@ -0,0 +1,63 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: nn + params: + input_dim: 784 + hidden_dim: 100 + output_dim: 10 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_nn_100_n_1.yaml b/config/iwae_test_configs_mnist/test_nn_100_n_1.yaml new file mode 100644 index 0000000..babdaae --- /dev/null +++ b/config/iwae_test_configs_mnist/test_nn_100_n_1.yaml @@ -0,0 +1,63 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: nn + params: + input_dim: 784 + hidden_dim: 100 + output_dim: 10 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 1 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_nn.yaml b/config/iwae_test_configs_mnist/test_nn_25.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_nn.yaml rename to config/iwae_test_configs_mnist/test_nn_25.yaml diff --git a/config/iwae_test_configs_mnist/test_nn_70.yaml b/config/iwae_test_configs_mnist/test_nn_70.yaml new file mode 100644 index 0000000..0787e95 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_nn_70.yaml @@ -0,0 +1,63 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: nn + params: + input_dim: 784 + hidden_dim: 100 + output_dim: 10 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.01 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 70 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/config/iwae_test_configs_mnist/test_nn_best.yaml b/config/iwae_test_configs_mnist/test_nn_best.yaml new file mode 100644 index 0000000..bbf1816 --- /dev/null +++ b/config/iwae_test_configs_mnist/test_nn_best.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: nn + params: + input_dim: 784 + hidden_dim: 100 + output_dim: 10 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: bbb + params: + kl_penalty: 0.001 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 25 + lr: 0.001 + momentum: 0.95 + seed: 1135 +sigma: 0.01 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file diff --git a/scripts/generic_train.py b/scripts/generic_train.py index 712c8fa..9ee3b8a 100644 --- a/scripts/generic_train.py +++ b/scripts/generic_train.py @@ -24,7 +24,7 @@ def main(config: dict, config_path: str): if config["log_wandb"]: - wandb.init(project="pbb_paper", config=config, name=get_wandb_name(config_path)) + wandb.init(project="pbb_iwae", config=config, name=get_wandb_name(config_path)) device = torch.device("cuda" if torch.cuda.is_available() else "cpu") logging.info(f"Device {device}") # Losses From 41950c5c9ecbf4fd04de633741c7e4b9d61a0a22 Mon Sep 17 00:00:00 2001 From: maxtretiakov Date: Mon, 26 May 2025 08:52:30 +0000 Subject: [PATCH 11/14] iwae using kl penalty --- .../test_conv_100.yaml | 0 .../test_conv_100_3.yaml | 0 .../test_conv_100_bbb.yaml | 0 .../test_conv_100_n_1.yaml | 0 .../test_conv_25.yaml | 0 .../test_conv_70.yaml | 0 .../test_conv_best.yaml | 0 .../test_nn_100.yaml | 0 .../test_nn_100_3.yaml | 0 .../test_nn_100_bbb.yaml | 0 .../test_nn_100_like_best.yaml | 0 .../test_nn_100_n_1.yaml | 0 .../test_nn_25.yaml | 0 .../test_nn_70.yaml | 0 .../test_nn_best.yaml | 0 .../IWAEObjective-checkpoint.py | 115 + core/objective/IWAEObjective.py | 2 +- output.txt | 6540 +++++++++++++++++ 18 files changed, 6656 insertions(+), 1 deletion(-) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_conv_100.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_conv_100_3.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_conv_100_bbb.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_conv_100_n_1.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_conv_25.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_conv_70.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_conv_best.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_nn_100.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_nn_100_3.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_nn_100_bbb.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_nn_100_like_best.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_nn_100_n_1.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_nn_25.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_nn_70.yaml (100%) rename config/{iwae_test_configs_mnist => iwae_test_configs_mnist_penalty}/test_nn_best.yaml (100%) create mode 100644 core/objective/.ipynb_checkpoints/IWAEObjective-checkpoint.py create mode 100644 output.txt diff --git a/config/iwae_test_configs_mnist/test_conv_100.yaml b/config/iwae_test_configs_mnist_penalty/test_conv_100.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_conv_100.yaml rename to config/iwae_test_configs_mnist_penalty/test_conv_100.yaml diff --git a/config/iwae_test_configs_mnist/test_conv_100_3.yaml b/config/iwae_test_configs_mnist_penalty/test_conv_100_3.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_conv_100_3.yaml rename to config/iwae_test_configs_mnist_penalty/test_conv_100_3.yaml diff --git a/config/iwae_test_configs_mnist/test_conv_100_bbb.yaml b/config/iwae_test_configs_mnist_penalty/test_conv_100_bbb.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_conv_100_bbb.yaml rename to config/iwae_test_configs_mnist_penalty/test_conv_100_bbb.yaml diff --git a/config/iwae_test_configs_mnist/test_conv_100_n_1.yaml b/config/iwae_test_configs_mnist_penalty/test_conv_100_n_1.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_conv_100_n_1.yaml rename to config/iwae_test_configs_mnist_penalty/test_conv_100_n_1.yaml diff --git a/config/iwae_test_configs_mnist/test_conv_25.yaml b/config/iwae_test_configs_mnist_penalty/test_conv_25.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_conv_25.yaml rename to config/iwae_test_configs_mnist_penalty/test_conv_25.yaml diff --git a/config/iwae_test_configs_mnist/test_conv_70.yaml b/config/iwae_test_configs_mnist_penalty/test_conv_70.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_conv_70.yaml rename to config/iwae_test_configs_mnist_penalty/test_conv_70.yaml diff --git a/config/iwae_test_configs_mnist/test_conv_best.yaml b/config/iwae_test_configs_mnist_penalty/test_conv_best.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_conv_best.yaml rename to config/iwae_test_configs_mnist_penalty/test_conv_best.yaml diff --git a/config/iwae_test_configs_mnist/test_nn_100.yaml b/config/iwae_test_configs_mnist_penalty/test_nn_100.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_nn_100.yaml rename to config/iwae_test_configs_mnist_penalty/test_nn_100.yaml diff --git a/config/iwae_test_configs_mnist/test_nn_100_3.yaml b/config/iwae_test_configs_mnist_penalty/test_nn_100_3.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_nn_100_3.yaml rename to config/iwae_test_configs_mnist_penalty/test_nn_100_3.yaml diff --git a/config/iwae_test_configs_mnist/test_nn_100_bbb.yaml b/config/iwae_test_configs_mnist_penalty/test_nn_100_bbb.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_nn_100_bbb.yaml rename to config/iwae_test_configs_mnist_penalty/test_nn_100_bbb.yaml diff --git a/config/iwae_test_configs_mnist/test_nn_100_like_best.yaml b/config/iwae_test_configs_mnist_penalty/test_nn_100_like_best.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_nn_100_like_best.yaml rename to config/iwae_test_configs_mnist_penalty/test_nn_100_like_best.yaml diff --git a/config/iwae_test_configs_mnist/test_nn_100_n_1.yaml b/config/iwae_test_configs_mnist_penalty/test_nn_100_n_1.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_nn_100_n_1.yaml rename to config/iwae_test_configs_mnist_penalty/test_nn_100_n_1.yaml diff --git a/config/iwae_test_configs_mnist/test_nn_25.yaml b/config/iwae_test_configs_mnist_penalty/test_nn_25.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_nn_25.yaml rename to config/iwae_test_configs_mnist_penalty/test_nn_25.yaml diff --git a/config/iwae_test_configs_mnist/test_nn_70.yaml b/config/iwae_test_configs_mnist_penalty/test_nn_70.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_nn_70.yaml rename to config/iwae_test_configs_mnist_penalty/test_nn_70.yaml diff --git a/config/iwae_test_configs_mnist/test_nn_best.yaml b/config/iwae_test_configs_mnist_penalty/test_nn_best.yaml similarity index 100% rename from config/iwae_test_configs_mnist/test_nn_best.yaml rename to config/iwae_test_configs_mnist_penalty/test_nn_best.yaml diff --git a/core/objective/.ipynb_checkpoints/IWAEObjective-checkpoint.py b/core/objective/.ipynb_checkpoints/IWAEObjective-checkpoint.py new file mode 100644 index 0000000..7274302 --- /dev/null +++ b/core/objective/.ipynb_checkpoints/IWAEObjective-checkpoint.py @@ -0,0 +1,115 @@ +import logging, math +from typing import Dict, Optional + +import torch, torch.distributions as dists, wandb +from torch import nn, Tensor + +from core.model import bounded_call +from core.layer.utils import get_torch_layers +from core.objective import AbstractObjective + + +class IWAEObjective(AbstractObjective): + def __init__(self, kl_penalty: float, n: int, temperature: float = 1.0) -> None: + self.kl_penalty = kl_penalty # usually 1 / |D| + self.temperature = temperature + self.k = n + logging.debug(f"IWAE temperature {self.temperature}") + logging.debug(f"IWAE k {self.k}") + + # -------- helpers to compute log p(w) and log q(w) ------------------- + @staticmethod + def _log_prior(model: nn.Module, eps: float = 1e-6) -> Tensor: + device = next(model.parameters()).device + dtype = next(model.parameters()).dtype + s = torch.zeros(1, device=device, dtype=dtype) + + for _, l in get_torch_layers(model): + s += dists.Normal(l._prior_weight_dist.mu, + l._prior_weight_dist.sigma + eps + ).log_prob(l._sampled_weight).sum() + s += dists.Normal(l._prior_bias_dist.mu, + l._prior_bias_dist.sigma + eps + ).log_prob(l._sampled_bias).sum() + return s + + @staticmethod + def _log_post(model: nn.Module, eps: float = 1e-6) -> Tensor: + device = next(model.parameters()).device + dtype = next(model.parameters()).dtype + s = torch.zeros(1, device=device, dtype=dtype) + + for _, l in get_torch_layers(model): + s += dists.Normal(l._weight_dist.mu, + l._weight_dist.sigma + eps + ).log_prob(l._sampled_weight).sum() + s += dists.Normal(l._bias_dist.mu, + l._bias_dist.sigma + eps + ).log_prob(l._sampled_bias).sum() + return s + + # -------------------------------------------------------------------- + def calculate( + self, + model: nn.Module, + data: Tensor, + target: Tensor, + epoch: int, + batch_idx: int, + dataset_size: int, + pmin: Optional[float] = None, + wandb_params: Optional[Dict] = None, + ) -> Tensor: + + batch_size = data.size(0) + scale = dataset_size / batch_size # N / |B| + log_ws = [] # list[k] of scalars + + temp = self.temperature + beta = 0.001 + + for l in range(self.k): + # sample w and compute log p(x|w) + logits = bounded_call(model, data, pmin) if pmin is not None else model(data) + + if torch.isnan(logits).any() or torch.isinf(logits).any(): + logging.warning(f"NaN/Inf in logits at epoch {epoch}, batch {batch_idx}") + logits = torch.where(torch.isfinite(logits), logits, torch.zeros_like(logits)) + + log_px = dists.Categorical(logits=logits).log_prob(target) # (batch,) + log_lik = scale * log_px.sum() # scalar + + # global KL part + kl = beta * (self._log_prior(model) - self._log_post(model)) + log_w = log_lik + temp * kl # scalar + log_ws.append(log_w) + + # -------------------- per-sample logging -------------------- + if wandb_params and wandb_params.get("log_wandb", False) and False: + tag = wandb_params["name_wandb"] + wandb.log({ + f"{tag}/epoch": epoch, + f"{tag}/batch": batch_idx, + f"{tag}/sample": l, + f"{tag}/log_likelihood": log_lik.detach(), + f"{tag}/kl": kl.detach(), + f"{tag}/log_weight": log_w.detach(), + }) + # logging.info(f"[Inner Log] Epoch {epoch}, Batch {batch_idx}, Sample {l} | log_lik={log_lik.item():.4f}, kl={kl.item():.4f}, log_w={log_w.item():.4f}") + + # ----------- PB-IWAE loss (one scalar) --------------------------- + log_ws_tensor = torch.stack(log_ws) # (k,) + loss = -(torch.logsumexp(log_ws_tensor, dim=0) - math.log(self.k)) + + # ----------- final logging -------------------------------------- + if wandb_params and wandb_params.get("log_wandb", False) and False: + wandb.log({f"{wandb_params['name_wandb']}/iwae_loss": loss}) + + if batch_idx % 50 == 0: + logging.info( + f"[Epoch {epoch:03d} | Batch {batch_idx:04d}] " + f"IWAE-loss {loss.item():.4f} " + f"| mean log_px {(log_px.mean()).item():.4f} " + f"| KL {kl.item():.2f}" + ) + return loss diff --git a/core/objective/IWAEObjective.py b/core/objective/IWAEObjective.py index 539a781..7274302 100644 --- a/core/objective/IWAEObjective.py +++ b/core/objective/IWAEObjective.py @@ -66,7 +66,7 @@ def calculate( log_ws = [] # list[k] of scalars temp = self.temperature - beta = min(1.0, (epoch / 70) ** 2) + beta = 0.001 for l in range(self.k): # sample w and compute log p(x|w) diff --git a/output.txt b/output.txt new file mode 100644 index 0000000..572cd29 --- /dev/null +++ b/output.txt @@ -0,0 +1,6540 @@ +Running experiment with config: ./config/iwae_test_configs_mnist_penalty/test_conv_100.yaml +2025-05-25 21:28:40,304 - INFO - Logging setup complete. Logs will be saved to logs/iwae_test_configs_mnist_penalty/test_conv_100.log +wandb: Currently logged in as: m-tretiakov (pac-bayes) to https://api.wandb.ai. Use `wandb login --relogin` to force relogin +wandb: Tracking run with wandb version 0.19.11 +wandb: Run data is saved locally in /pacbb/wandb/run-20250525_212840-k0dq01yv +wandb: Run `wandb offline` to turn off syncing. +wandb: Syncing run iwae_test_configs_mnist_penalty/test_conv_100_2505_2128 +wandb: ⭐️ View project at https://wandb.ai/pac-bayes/pbb_iwae +wandb: 🚀 View run at https://wandb.ai/pac-bayes/pbb_iwae/runs/k0dq01yv +2025-05-25 21:28:41,851 - INFO - Device cuda +2025-05-25 21:28:41,851 - INFO - Selected losses: ['nll_loss', 'scaled_nll_loss', '01_loss'] +2025-05-25 21:28:41,851 - INFO - Select metrics: ['accuracy_micro_metric', 'accuracy_macro_metric', 'f1_micro_metric', 'f1_macro_metric'] +2025-05-25 21:28:41,851 - INFO - Selected bounds: ['kl', 'mcallester'] +2025-05-25 21:28:41,851 - INFO - Selected data loader: {'name': 'mnist', 'params': {'dataset_path': './data/mnist'}} +Downloading http://yann.lecun.com/exdb/mnist/train-images-idx3-ubyte.gz +Failed to download (trying next): +HTTP Error 404: Not Found + +Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-images-idx3-ubyte.gz +Downloading https://ossci-datasets.s3.amazonaws.com/mnist/train-images-idx3-ubyte.gz to ./data/mnist/MNIST/raw/train-images-idx3-ubyte.gz + 0%| | 0/9912422 [00:00), Loss: 0.11140021681785583, KL/n: 71.59821319580078 + 0it [00:00, ?it/s]2025-05-25 21:29:35,288 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 11894.2480 | mean log_px -0.1369 | KL -3499.28 + 1it [00:00, 3.15it/s] 2it [00:00, 3.72it/s] 3it [00:00, 3.93it/s] 4it [00:01, 4.09it/s] 5it [00:01, 4.18it/s] 6it [00:01, 4.32it/s] 7it [00:01, 4.16it/s] 8it [00:01, 4.28it/s] 9it [00:02, 4.41it/s] 10it [00:02, 4.49it/s] 11it [00:02, 4.58it/s] 12it [00:02, 4.44it/s] 13it [00:03, 4.55it/s] 14it [00:03, 4.46it/s] 15it [00:03, 4.39it/s] 16it [00:03, 4.46it/s] 17it [00:03, 4.43it/s] 18it [00:04, 4.51it/s] 19it [00:04, 4.56it/s] 20it [00:04, 4.57it/s] 21it [00:04, 4.47it/s] 22it [00:05, 4.44it/s] 23it [00:05, 4.52it/s] 24it [00:05, 4.46it/s] 25it [00:05, 4.52it/s] 26it [00:05, 4.57it/s] 27it [00:06, 4.30it/s] 28it [00:06, 4.43it/s] 29it [00:06, 4.38it/s] 30it [00:06, 4.44it/s] 31it [00:07, 4.39it/s] 32it [00:07, 4.41it/s] 33it [00:07, 4.38it/s] 34it [00:07, 4.23it/s] 35it [00:08, 4.26it/s] 36it [00:08, 4.24it/s] 37it [00:08, 4.28it/s] 38it [00:08, 4.41it/s] 39it [00:08, 4.50it/s] 40it [00:09, 4.41it/s] 41it [00:09, 4.41it/s] 42it [00:09, 4.48it/s] 43it [00:09, 4.39it/s] 44it [00:10, 4.47it/s] 45it [00:10, 4.38it/s] 46it [00:10, 4.48it/s] 47it [00:10, 4.39it/s] 48it [00:10, 4.37it/s] 49it [00:11, 4.38it/s] 50it [00:11, 4.34it/s]2025-05-25 21:29:46,627 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 11227.0039 | mean log_px -0.1305 | KL -3490.07 + 51it [00:11, 4.20it/s] 52it [00:11, 4.23it/s] 53it [00:12, 4.27it/s] 54it [00:12, 4.40it/s] 55it [00:12, 4.37it/s] 56it [00:12, 4.32it/s] 57it [00:13, 4.33it/s] 58it [00:13, 4.43it/s] 59it [00:13, 4.49it/s] 60it [00:13, 4.41it/s] 61it [00:13, 4.40it/s] 62it [00:14, 4.30it/s] 63it [00:14, 4.32it/s] 64it [00:14, 4.34it/s] 65it [00:14, 4.43it/s] 66it [00:15, 4.37it/s] 67it [00:15, 4.35it/s] 68it [00:15, 4.36it/s] 69it [00:15, 4.37it/s] 70it [00:16, 4.34it/s] 71it [00:16, 4.19it/s] 72it [00:16, 4.23it/s] 73it [00:16, 4.26it/s] 74it [00:16, 4.28it/s] 75it [00:17, 4.31it/s] 76it [00:17, 4.35it/s] 77it [00:17, 4.33it/s] 78it [00:17, 4.36it/s] 79it [00:18, 4.36it/s] 80it [00:18, 4.33it/s] 81it [00:18, 4.29it/s] 82it [00:18, 4.38it/s] 83it [00:19, 4.45it/s] 84it [00:19, 4.25it/s] 85it [00:19, 4.29it/s] 86it [00:19, 4.30it/s] 87it [00:19, 4.32it/s] 88it [00:20, 4.30it/s] 89it [00:20, 4.33it/s] 90it [00:20, 4.31it/s] 91it [00:20, 4.31it/s] 92it [00:21, 4.32it/s] 93it [00:21, 4.31it/s] 94it [00:21, 4.36it/s] 95it [00:21, 4.25it/s] 96it [00:22, 4.26it/s] 97it [00:22, 4.26it/s] 98it [00:22, 4.30it/s] 99it [00:22, 4.18it/s] 100it [00:23, 4.30it/s]2025-05-25 21:29:58,190 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 8575.6543 | mean log_px -0.0730 | KL -3466.15 + 101it [00:23, 4.41it/s] 102it [00:23, 4.47it/s] 103it [00:23, 4.39it/s] 104it [00:23, 4.19it/s] 105it [00:24, 4.29it/s] 106it [00:24, 4.26it/s] 107it [00:24, 4.27it/s] 108it [00:24, 4.29it/s] 109it [00:25, 4.34it/s] 110it [00:25, 4.18it/s] 111it [00:25, 4.23it/s] 112it [00:25, 4.25it/s] 113it [00:26, 4.29it/s] 114it [00:26, 4.28it/s] 115it [00:26, 4.11it/s] 116it [00:26, 4.12it/s] 117it [00:27, 4.15it/s] 118it [00:27, 4.20it/s] 119it [00:27, 4.14it/s] 120it [00:27, 4.22it/s] 121it [00:27, 4.24it/s] 122it [00:28, 4.31it/s] 123it [00:28, 4.31it/s] 124it [00:28, 4.34it/s] 125it [00:28, 4.31it/s] 126it [00:29, 4.17it/s] 127it [00:29, 4.21it/s] 128it [00:29, 4.27it/s] 129it [00:29, 4.36it/s] 130it [00:30, 4.32it/s] 131it [00:30, 4.35it/s] 132it [00:30, 4.33it/s] 133it [00:30, 4.21it/s] 134it [00:30, 4.36it/s] 135it [00:31, 4.47it/s] 136it [00:31, 4.51it/s] 137it [00:31, 4.44it/s] 138it [00:31, 4.36it/s] 139it [00:32, 4.34it/s] 140it [00:32, 4.34it/s] 141it [00:32, 4.34it/s] 142it [00:32, 4.30it/s] 143it [00:33, 4.27it/s] 144it [00:33, 4.19it/s] 145it [00:33, 4.24it/s] 146it [00:33, 4.33it/s] 147it [00:33, 4.35it/s] 148it [00:34, 4.45it/s] 149it [00:34, 4.47it/s] 150it [00:34, 4.47it/s]2025-05-25 21:30:09,826 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 10918.8730 | mean log_px -0.1088 | KL -3451.89 + 151it [00:34, 4.36it/s] 152it [00:35, 4.46it/s] 153it [00:35, 4.37it/s] 154it [00:35, 4.36it/s] 155it [00:35, 4.17it/s] 156it [00:36, 4.22it/s] 157it [00:36, 4.22it/s] 158it [00:36, 4.21it/s] 159it [00:36, 4.28it/s] 160it [00:36, 4.28it/s] 161it [00:37, 4.13it/s] 162it [00:37, 4.17it/s] 163it [00:37, 4.21it/s] 164it [00:37, 4.35it/s] 165it [00:38, 4.36it/s] 166it [00:38, 4.36it/s] 167it [00:38, 4.31it/s] 168it [00:38, 4.34it/s] 169it [00:39, 4.39it/s] 170it [00:39, 4.32it/s] 171it [00:39, 4.32it/s] 172it [00:39, 4.42it/s] 173it [00:39, 4.49it/s] 174it [00:40, 4.46it/s] 175it [00:40, 4.38it/s] 176it [00:40, 4.19it/s] 177it [00:40, 4.21it/s] 178it [00:41, 4.24it/s] 179it [00:41, 4.23it/s] 180it [00:41, 4.25it/s] 181it [00:41, 4.29it/s] 182it [00:42, 4.36it/s] 183it [00:42, 4.40it/s] 184it [00:42, 4.48it/s] 185it [00:42, 4.42it/s] 186it [00:42, 4.42it/s] 187it [00:43, 4.40it/s] 188it [00:43, 4.47it/s] 189it [00:43, 4.55it/s] 190it [00:43, 4.44it/s] 191it [00:44, 4.29it/s] 192it [00:44, 4.33it/s] 193it [00:44, 4.31it/s] 194it [00:44, 4.35it/s] 195it [00:45, 4.31it/s] 196it [00:45, 4.36it/s] 196it [00:45, 4.33it/s] +2025-05-25 21:30:20,343 - INFO - Epoch: 1, Objective: tensor([9172.7520], device='cuda:0', grad_fn=), Loss: 0.07874009013175964, KL/n: 70.15756225585938 + 0it [00:00, ?it/s]2025-05-25 21:30:20,883 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 7225.7852 | mean log_px -0.0616 | KL -3439.12 + 1it [00:00, 3.05it/s] 2it [00:00, 3.87it/s] 3it [00:00, 4.23it/s] 4it [00:00, 4.41it/s] 5it [00:01, 4.52it/s] 6it [00:01, 4.59it/s] 7it [00:01, 4.64it/s] 8it [00:01, 4.66it/s] 9it [00:02, 4.69it/s] 10it [00:02, 4.70it/s] 11it [00:02, 4.72it/s] 12it [00:02, 4.71it/s] 13it [00:02, 4.73it/s] 14it [00:03, 4.73it/s] 15it [00:03, 4.73it/s] 16it [00:03, 4.72it/s] 17it [00:03, 4.56it/s] 18it [00:03, 4.62it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.67it/s] 21it [00:04, 4.70it/s] 22it [00:04, 4.70it/s] 23it [00:04, 4.72it/s] 24it [00:05, 4.71it/s] 25it [00:05, 4.72it/s] 26it [00:05, 4.72it/s] 27it [00:05, 4.72it/s] 28it [00:06, 4.55it/s] 29it [00:06, 4.62it/s] 30it [00:06, 4.64it/s] 31it [00:06, 4.68it/s] 32it [00:06, 4.69it/s] 33it [00:07, 4.66it/s] 34it [00:07, 4.67it/s] 35it [00:07, 4.57it/s] 36it [00:07, 4.37it/s] 37it [00:08, 4.49it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.61it/s] 40it [00:08, 4.64it/s] 41it [00:08, 4.63it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.64it/s] 44it [00:09, 4.63it/s] 45it [00:09, 4.41it/s] 46it [00:10, 4.50it/s] 47it [00:10, 4.54it/s] 48it [00:10, 4.57it/s] 49it [00:10, 4.60it/s] 50it [00:10, 4.55it/s]2025-05-25 21:30:31,674 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 7740.6035 | mean log_px -0.0618 | KL -3413.71 + 51it [00:11, 4.61it/s] 52it [00:11, 4.59it/s] 53it [00:11, 4.62it/s] 54it [00:11, 4.62it/s] 55it [00:11, 4.48it/s] 56it [00:12, 4.53it/s] 57it [00:12, 4.57it/s] 58it [00:12, 4.58it/s] 59it [00:12, 4.62it/s] 60it [00:13, 4.48it/s] 61it [00:13, 4.53it/s] 62it [00:13, 4.56it/s] 63it [00:13, 4.58it/s] 64it [00:13, 4.57it/s] 65it [00:14, 4.59it/s] 66it [00:14, 4.60it/s] 67it [00:14, 4.62it/s] 68it [00:14, 4.48it/s] 69it [00:15, 4.54it/s] 70it [00:15, 4.57it/s] 71it [00:15, 4.59it/s] 72it [00:15, 4.60it/s] 73it [00:15, 4.60it/s] 74it [00:16, 4.62it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.62it/s] 77it [00:16, 4.64it/s] 78it [00:16, 4.65it/s] 79it [00:17, 4.64it/s] 80it [00:17, 4.64it/s] 81it [00:17, 4.64it/s] 82it [00:17, 4.50it/s] 83it [00:18, 4.54it/s] 84it [00:18, 4.53it/s] 85it [00:18, 4.56it/s] 86it [00:18, 4.57it/s] 87it [00:18, 4.59it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.60it/s] 90it [00:19, 4.61it/s] 91it [00:19, 4.62it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.58it/s] 94it [00:20, 4.58it/s] 95it [00:20, 4.60it/s] 96it [00:20, 4.61it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.63it/s] 100it [00:21, 4.64it/s]2025-05-25 21:30:42,567 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 10890.5635 | mean log_px -0.1134 | KL -3399.14 + 101it [00:22, 4.50it/s] 102it [00:22, 4.54it/s] 103it [00:22, 4.59it/s] 104it [00:22, 4.59it/s] 105it [00:22, 4.60it/s] 106it [00:23, 4.61it/s] 107it [00:23, 4.63it/s] 108it [00:23, 4.62it/s] 109it [00:23, 4.62it/s] 110it [00:23, 4.50it/s] 111it [00:24, 4.54it/s] 112it [00:24, 4.57it/s] 113it [00:24, 4.59it/s] 114it [00:24, 4.61it/s] 115it [00:25, 4.63it/s] 116it [00:25, 4.64it/s] 117it [00:25, 4.64it/s] 118it [00:25, 4.63it/s] 119it [00:25, 4.50it/s] 120it [00:26, 4.55it/s] 121it [00:26, 4.58it/s] 122it [00:26, 4.59it/s] 123it [00:26, 4.60it/s] 124it [00:27, 4.61it/s] 125it [00:27, 4.63it/s] 126it [00:27, 4.63it/s] 127it [00:27, 4.64it/s] 128it [00:27, 4.51it/s] 129it [00:28, 4.56it/s] 130it [00:28, 4.57it/s] 131it [00:28, 4.59it/s] 132it [00:28, 4.60it/s] 133it [00:28, 4.62it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.61it/s] 137it [00:29, 4.62it/s] 138it [00:30, 4.48it/s] 139it [00:30, 4.54it/s] 140it [00:30, 4.57it/s] 141it [00:30, 4.59it/s] 142it [00:30, 4.60it/s] 143it [00:31, 4.58it/s] 144it [00:31, 4.60it/s] 145it [00:31, 4.60it/s] 146it [00:31, 4.60it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.62it/s] 149it [00:32, 4.63it/s] 150it [00:32, 4.61it/s]2025-05-25 21:30:53,461 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 6388.3467 | mean log_px -0.0455 | KL -3380.82 + 151it [00:32, 4.49it/s] 152it [00:33, 4.52it/s] 153it [00:33, 4.56it/s] 154it [00:33, 4.59it/s] 155it [00:33, 4.60it/s] 156it [00:33, 4.54it/s] 157it [00:34, 4.58it/s] 158it [00:34, 4.57it/s] 159it [00:34, 4.59it/s] 160it [00:34, 4.59it/s] 161it [00:35, 4.61it/s] 162it [00:35, 4.62it/s] 163it [00:35, 4.63it/s] 164it [00:35, 4.64it/s] 165it [00:35, 4.65it/s] 166it [00:36, 4.64it/s] 167it [00:36, 4.64it/s] 168it [00:36, 4.64it/s] 169it [00:36, 4.63it/s] 170it [00:37, 4.63it/s] 171it [00:37, 4.59it/s] 172it [00:37, 4.59it/s] 173it [00:37, 4.60it/s] 174it [00:37, 4.60it/s] 175it [00:38, 4.60it/s] 176it [00:38, 4.61it/s] 177it [00:38, 4.62it/s] 178it [00:38, 4.57it/s] 179it [00:38, 4.57it/s] 180it [00:39, 4.59it/s] 181it [00:39, 4.61it/s] 182it [00:39, 4.61it/s] 183it [00:39, 4.49it/s] 184it [00:40, 4.54it/s] 185it [00:40, 4.57it/s] 186it [00:40, 4.60it/s] 187it [00:40, 4.61it/s] 188it [00:40, 4.61it/s] 189it [00:41, 4.59it/s] 190it [00:41, 4.38it/s] 191it [00:41, 4.45it/s] 192it [00:41, 4.50it/s] 193it [00:42, 4.55it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.38it/s] 196it [00:42, 4.46it/s] 196it [00:42, 4.58it/s] +2025-05-25 21:31:03,450 - INFO - Epoch: 2, Objective: tensor([7126.1548], device='cuda:0', grad_fn=), Loss: 0.05375305190682411, KL/n: 68.71427154541016 + 0it [00:00, ?it/s]2025-05-25 21:31:03,819 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 6548.8511 | mean log_px -0.0590 | KL -3364.44 + 1it [00:00, 3.34it/s] 2it [00:00, 4.00it/s] 3it [00:00, 4.29it/s] 4it [00:00, 4.25it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.47it/s] 7it [00:01, 4.52it/s] 8it [00:01, 4.55it/s] 9it [00:02, 4.58it/s] 10it [00:02, 4.59it/s] 11it [00:02, 4.61it/s] 12it [00:02, 4.62it/s] 13it [00:02, 4.64it/s] 14it [00:03, 4.64it/s] 15it [00:03, 4.64it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.63it/s] 18it [00:03, 4.63it/s] 19it [00:04, 4.64it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.63it/s] 23it [00:05, 4.64it/s] 24it [00:05, 4.63it/s] 25it [00:05, 4.64it/s] 26it [00:05, 4.50it/s] 27it [00:05, 4.55it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.59it/s] 30it [00:06, 4.60it/s] 31it [00:06, 4.63it/s] 32it [00:07, 4.49it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.59it/s] 36it [00:07, 4.61it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.63it/s] 40it [00:08, 4.61it/s] 41it [00:09, 4.49it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.55it/s] 45it [00:09, 4.56it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.56it/s] 48it [00:10, 4.57it/s] 49it [00:10, 4.57it/s] 50it [00:10, 4.43it/s]2025-05-25 21:31:14,734 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 6395.8638 | mean log_px -0.0435 | KL -3348.27 + 51it [00:11, 4.45it/s] 52it [00:11, 4.49it/s] 53it [00:11, 4.51it/s] 54it [00:11, 4.53it/s] 55it [00:12, 4.53it/s] 56it [00:12, 4.40it/s] 57it [00:12, 4.45it/s] 58it [00:12, 4.45it/s] 59it [00:13, 4.47it/s] 60it [00:13, 4.51it/s] 61it [00:13, 4.55it/s] 62it [00:13, 4.41it/s] 63it [00:13, 4.48it/s] 64it [00:14, 4.51it/s] 65it [00:14, 4.53it/s] 66it [00:14, 4.55it/s] 67it [00:14, 4.56it/s] 68it [00:14, 4.56it/s] 69it [00:15, 4.58it/s] 70it [00:15, 4.55it/s] 71it [00:15, 4.42it/s] 72it [00:15, 4.45it/s] 73it [00:16, 4.47it/s] 74it [00:16, 4.51it/s] 75it [00:16, 4.54it/s] 76it [00:16, 4.57it/s] 77it [00:17, 3.69it/s] 78it [00:17, 3.93it/s] 79it [00:17, 4.12it/s] 80it [00:17, 4.17it/s] 81it [00:18, 4.32it/s] 82it [00:18, 4.40it/s] 83it [00:18, 4.47it/s] 84it [00:18, 4.52it/s] 85it [00:18, 4.56it/s] 86it [00:19, 4.57it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.46it/s] 90it [00:19, 4.53it/s] 91it [00:20, 4.58it/s] 92it [00:20, 4.62it/s] 93it [00:20, 4.65it/s] 94it [00:20, 4.65it/s] 95it [00:21, 4.63it/s] 96it [00:21, 4.63it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.50it/s] 99it [00:21, 4.58it/s] 100it [00:22, 4.61it/s]2025-05-25 21:31:25,885 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 6408.8643 | mean log_px -0.0460 | KL -3327.64 + 101it [00:22, 4.64it/s] 102it [00:22, 4.66it/s] 103it [00:22, 4.68it/s] 104it [00:23, 4.52it/s] 105it [00:23, 4.59it/s] 106it [00:23, 4.62it/s] 107it [00:23, 4.49it/s] 108it [00:23, 4.56it/s] 109it [00:24, 4.60it/s] 110it [00:24, 4.63it/s] 111it [00:24, 4.66it/s] 112it [00:24, 4.68it/s] 113it [00:24, 4.52it/s] 114it [00:25, 4.59it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.64it/s] 117it [00:25, 4.66it/s] 118it [00:26, 4.66it/s] 119it [00:26, 4.53it/s] 120it [00:26, 4.59it/s] 121it [00:26, 4.62it/s] 122it [00:26, 4.64it/s] 123it [00:27, 4.66it/s] 124it [00:27, 4.68it/s] 125it [00:27, 4.70it/s] 126it [00:27, 4.57it/s] 127it [00:27, 4.63it/s] 128it [00:28, 4.64it/s] 129it [00:28, 4.66it/s] 130it [00:28, 4.67it/s] 131it [00:28, 4.69it/s] 132it [00:29, 4.53it/s] 133it [00:29, 4.60it/s] 134it [00:29, 4.63it/s] 135it [00:29, 4.59it/s] 136it [00:29, 4.51it/s] 137it [00:30, 4.56it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.64it/s] 140it [00:30, 4.65it/s] 141it [00:31, 4.50it/s] 142it [00:31, 4.56it/s] 143it [00:31, 4.61it/s] 144it [00:31, 4.63it/s] 145it [00:31, 4.66it/s] 146it [00:32, 4.67it/s] 147it [00:32, 4.68it/s] 148it [00:32, 4.68it/s] 149it [00:32, 4.51it/s] 150it [00:32, 4.57it/s]2025-05-25 21:31:36,731 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 6867.9688 | mean log_px -0.0538 | KL -3303.91 + 151it [00:33, 4.60it/s] 152it [00:33, 4.62it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.66it/s] 155it [00:34, 4.57it/s] 156it [00:34, 4.62it/s] 157it [00:34, 4.65it/s] 158it [00:34, 4.67it/s] 159it [00:34, 4.53it/s] 160it [00:35, 4.59it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.65it/s] 163it [00:35, 4.67it/s] 164it [00:36, 4.68it/s] 165it [00:36, 4.52it/s] 166it [00:36, 4.59it/s] 167it [00:36, 4.63it/s] 168it [00:36, 4.65it/s] 169it [00:37, 4.67it/s] 170it [00:37, 4.68it/s] 171it [00:37, 4.68it/s] 172it [00:37, 4.54it/s] 173it [00:37, 4.60it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.65it/s] 176it [00:38, 4.67it/s] 177it [00:38, 4.68it/s] 178it [00:39, 4.49it/s] 179it [00:39, 4.57it/s] 180it [00:39, 4.61it/s] 181it [00:39, 4.64it/s] 182it [00:39, 4.66it/s] 183it [00:40, 4.67it/s] 184it [00:40, 4.67it/s] 185it [00:40, 4.69it/s] 186it [00:40, 4.52it/s] 187it [00:40, 4.58it/s] 188it [00:41, 4.61it/s] 189it [00:41, 4.63it/s] 190it [00:41, 4.65it/s] 191it [00:41, 4.66it/s] 192it [00:42, 4.67it/s] 193it [00:42, 4.52it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.38it/s] 196it [00:42, 4.41it/s] 196it [00:43, 4.55it/s] +2025-05-25 21:31:46,642 - INFO - Epoch: 3, Objective: tensor([5746.6787], device='cuda:0', grad_fn=), Loss: 0.046654097735881805, KL/n: 67.17630004882812 + 0it [00:00, ?it/s]2025-05-25 21:31:47,004 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 5883.0645 | mean log_px -0.0408 | KL -3290.14 + 1it [00:00, 3.60it/s] 2it [00:00, 3.91it/s] 3it [00:00, 4.24it/s] 4it [00:00, 4.34it/s] 5it [00:01, 4.47it/s] 6it [00:01, 4.55it/s] 7it [00:01, 4.61it/s] 8it [00:01, 4.63it/s] 9it [00:02, 4.66it/s] 10it [00:02, 4.67it/s] 11it [00:02, 4.67it/s] 12it [00:02, 4.67it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.64it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.66it/s] 17it [00:03, 4.59it/s] 18it [00:03, 4.63it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.65it/s] 21it [00:04, 4.65it/s] 22it [00:04, 4.65it/s] 23it [00:05, 4.47it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.61it/s] 26it [00:05, 4.63it/s] 27it [00:05, 4.64it/s] 28it [00:06, 4.66it/s] 29it [00:06, 4.68it/s] 30it [00:06, 4.68it/s] 31it [00:06, 4.70it/s] 32it [00:06, 4.70it/s] 33it [00:07, 4.71it/s] 34it [00:07, 4.52it/s] 35it [00:07, 4.59it/s] 36it [00:07, 4.62it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.66it/s] 41it [00:08, 4.67it/s] 42it [00:09, 4.48it/s] 43it [00:09, 4.54it/s] 44it [00:09, 4.57it/s] 45it [00:09, 4.59it/s] 46it [00:10, 4.61it/s] 47it [00:10, 4.63it/s] 48it [00:10, 4.63it/s] 49it [00:10, 4.65it/s] 50it [00:10, 4.66it/s]2025-05-25 21:31:57,811 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 4895.3418 | mean log_px -0.0286 | KL -3262.91 + 51it [00:11, 4.49it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.52it/s] 54it [00:11, 4.50it/s] 55it [00:12, 4.42it/s] 56it [00:12, 4.43it/s] 57it [00:12, 4.37it/s] 58it [00:12, 4.45it/s] 59it [00:12, 4.52it/s] 60it [00:13, 4.55it/s] 61it [00:13, 4.57it/s] 62it [00:13, 4.59it/s] 63it [00:13, 4.52it/s] 64it [00:13, 4.56it/s] 65it [00:14, 4.59it/s] 66it [00:14, 4.60it/s] 67it [00:14, 4.59it/s] 68it [00:14, 4.46it/s] 69it [00:15, 4.52it/s] 70it [00:15, 4.56it/s] 71it [00:15, 4.59it/s] 72it [00:15, 4.59it/s] 73it [00:15, 4.60it/s] 74it [00:16, 4.48it/s] 75it [00:16, 4.53it/s] 76it [00:16, 4.56it/s] 77it [00:16, 4.57it/s] 78it [00:17, 4.57it/s] 79it [00:17, 4.47it/s] 80it [00:17, 4.52it/s] 81it [00:17, 4.55it/s] 82it [00:17, 4.41it/s] 83it [00:18, 4.49it/s] 84it [00:18, 4.53it/s] 85it [00:18, 4.57it/s] 86it [00:18, 4.45it/s] 87it [00:19, 4.51it/s] 88it [00:19, 4.55it/s] 89it [00:19, 4.58it/s] 90it [00:19, 4.61it/s] 91it [00:19, 4.62it/s] 92it [00:20, 4.48it/s] 93it [00:20, 4.55it/s] 94it [00:20, 4.57it/s] 95it [00:20, 4.59it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.63it/s] 99it [00:21, 4.64it/s] 100it [00:21, 4.64it/s]2025-05-25 21:32:08,829 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 5435.9736 | mean log_px -0.0313 | KL -3245.03 + 101it [00:22, 4.50it/s] 102it [00:22, 4.55it/s] 103it [00:22, 4.58it/s] 104it [00:22, 4.60it/s] 105it [00:22, 4.62it/s] 106it [00:23, 4.61it/s] 107it [00:23, 4.48it/s] 108it [00:23, 4.50it/s] 109it [00:23, 4.55it/s] 110it [00:24, 4.58it/s] 111it [00:24, 4.60it/s] 112it [00:24, 4.61it/s] 113it [00:24, 4.48it/s] 114it [00:24, 4.53it/s] 115it [00:25, 4.56it/s] 116it [00:25, 4.57it/s] 117it [00:25, 4.58it/s] 118it [00:25, 4.59it/s] 119it [00:26, 4.47it/s] 120it [00:26, 4.52it/s] 121it [00:26, 4.56it/s] 122it [00:26, 4.58it/s] 123it [00:26, 4.46it/s] 124it [00:27, 4.52it/s] 125it [00:27, 4.55it/s] 126it [00:27, 4.57it/s] 127it [00:27, 4.53it/s] 128it [00:28, 4.57it/s] 129it [00:28, 4.60it/s] 130it [00:28, 4.47it/s] 131it [00:28, 4.53it/s] 132it [00:28, 4.56it/s] 133it [00:29, 4.59it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.60it/s] 137it [00:30, 4.62it/s] 138it [00:30, 4.63it/s] 139it [00:30, 4.49it/s] 140it [00:30, 4.55it/s] 141it [00:30, 4.56it/s] 142it [00:31, 4.58it/s] 143it [00:31, 4.61it/s] 144it [00:31, 4.47it/s] 145it [00:31, 4.50it/s] 146it [00:31, 4.55it/s] 147it [00:32, 4.58it/s] 148it [00:32, 4.50it/s] 149it [00:32, 4.41it/s] 150it [00:32, 4.49it/s]2025-05-25 21:32:19,836 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 4805.7720 | mean log_px -0.0276 | KL -3228.11 + 151it [00:33, 4.54it/s] 152it [00:33, 4.58it/s] 153it [00:33, 4.46it/s] 154it [00:33, 4.52it/s] 155it [00:33, 4.58it/s] 156it [00:34, 4.60it/s] 157it [00:34, 4.61it/s] 158it [00:34, 4.49it/s] 159it [00:34, 4.55it/s] 160it [00:35, 4.55it/s] 161it [00:35, 4.58it/s] 162it [00:35, 4.59it/s] 163it [00:35, 4.61it/s] 164it [00:35, 4.63it/s] 165it [00:36, 4.64it/s] 166it [00:36, 4.64it/s] 167it [00:36, 4.50it/s] 168it [00:36, 4.55it/s] 169it [00:37, 4.59it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.62it/s] 172it [00:37, 4.62it/s] 173it [00:37, 4.64it/s] 174it [00:38, 4.65it/s] 175it [00:38, 4.65it/s] 176it [00:38, 4.49it/s] 177it [00:38, 4.56it/s] 178it [00:38, 4.58it/s] 179it [00:39, 4.61it/s] 180it [00:39, 4.61it/s] 181it [00:39, 4.55it/s] 182it [00:39, 4.59it/s] 183it [00:40, 4.49it/s] 184it [00:40, 4.55it/s] 185it [00:40, 4.57it/s] 186it [00:40, 4.59it/s] 187it [00:40, 4.61it/s] 188it [00:41, 4.62it/s] 189it [00:41, 4.63it/s] 190it [00:41, 4.48it/s] 191it [00:41, 4.54it/s] 192it [00:42, 4.58it/s] 193it [00:42, 4.60it/s] 194it [00:42, 4.61it/s] 195it [00:42, 4.36it/s] 196it [00:42, 4.38it/s] 196it [00:43, 4.55it/s] +2025-05-25 21:32:29,827 - INFO - Epoch: 4, Objective: tensor([5635.8784], device='cuda:0', grad_fn=), Loss: 0.03690037503838539, KL/n: 65.52703094482422 + 0it [00:00, ?it/s]2025-05-25 21:32:30,383 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 6954.7480 | mean log_px -0.0605 | KL -3211.71 + 1it [00:00, 2.99it/s] 2it [00:00, 3.81it/s] 3it [00:00, 4.16it/s] 4it [00:00, 4.33it/s] 5it [00:01, 4.45it/s] 6it [00:01, 4.52it/s] 7it [00:01, 4.40it/s] 8it [00:01, 4.49it/s] 9it [00:02, 4.55it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.61it/s] 15it [00:03, 4.45it/s] 16it [00:03, 4.51it/s] 17it [00:03, 4.56it/s] 18it [00:04, 4.58it/s] 19it [00:04, 4.61it/s] 20it [00:04, 4.60it/s] 21it [00:04, 4.47it/s] 22it [00:04, 4.46it/s] 23it [00:05, 4.52it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.58it/s] 26it [00:05, 4.59it/s] 27it [00:06, 4.33it/s] 28it [00:06, 4.43it/s] 29it [00:06, 4.50it/s] 30it [00:06, 4.55it/s] 31it [00:06, 4.59it/s] 32it [00:07, 4.45it/s] 33it [00:07, 4.53it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.60it/s] 36it [00:08, 4.62it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.66it/s] 41it [00:09, 4.66it/s] 42it [00:09, 4.66it/s] 43it [00:09, 4.49it/s] 44it [00:09, 4.55it/s] 45it [00:09, 4.59it/s] 46it [00:10, 4.62it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.64it/s] 49it [00:10, 4.65it/s] 50it [00:11, 4.65it/s]2025-05-25 21:32:41,324 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 6567.6064 | mean log_px -0.0585 | KL -3187.38 + 51it [00:11, 4.65it/s] 52it [00:11, 4.65it/s] 53it [00:11, 4.65it/s] 54it [00:11, 4.65it/s] 55it [00:12, 4.66it/s] 56it [00:12, 4.65it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.65it/s] 59it [00:12, 4.66it/s] 60it [00:13, 4.66it/s] 61it [00:13, 4.67it/s] 62it [00:13, 4.67it/s] 63it [00:13, 4.68it/s] 64it [00:14, 4.67it/s] 65it [00:14, 4.67it/s] 66it [00:14, 4.67it/s] 67it [00:14, 4.62it/s] 68it [00:14, 4.49it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.62it/s] 73it [00:15, 4.64it/s] 74it [00:16, 4.64it/s] 75it [00:16, 4.66it/s] 76it [00:16, 4.66it/s] 77it [00:16, 4.67it/s] 78it [00:17, 4.66it/s] 79it [00:17, 4.66it/s] 80it [00:17, 4.66it/s] 81it [00:17, 4.53it/s] 82it [00:17, 4.58it/s] 83it [00:18, 4.61it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.64it/s] 86it [00:18, 4.65it/s] 87it [00:19, 4.66it/s] 88it [00:19, 4.66it/s] 89it [00:19, 4.66it/s] 90it [00:19, 4.51it/s] 91it [00:19, 4.57it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.65it/s] 96it [00:20, 4.66it/s] 97it [00:21, 4.67it/s] 98it [00:21, 4.67it/s] 99it [00:21, 4.67it/s] 100it [00:21, 4.67it/s]2025-05-25 21:32:52,106 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 5110.2051 | mean log_px -0.0323 | KL -3168.64 + 101it [00:22, 4.66it/s] 102it [00:22, 4.66it/s] 103it [00:22, 4.67it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.68it/s] 106it [00:23, 4.67it/s] 107it [00:23, 4.67it/s] 108it [00:23, 4.68it/s] 109it [00:23, 4.53it/s] 110it [00:23, 4.58it/s] 111it [00:24, 4.61it/s] 112it [00:24, 4.63it/s] 113it [00:24, 4.64it/s] 114it [00:24, 4.65it/s] 115it [00:25, 4.66it/s] 116it [00:25, 4.66it/s] 117it [00:25, 4.67it/s] 118it [00:25, 4.52it/s] 119it [00:25, 4.58it/s] 120it [00:26, 4.55it/s] 121it [00:26, 4.60it/s] 122it [00:26, 4.60it/s] 123it [00:26, 4.62it/s] 124it [00:27, 4.63it/s] 125it [00:27, 4.64it/s] 126it [00:27, 4.52it/s] 127it [00:27, 4.57it/s] 128it [00:27, 4.60it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.64it/s] 132it [00:28, 4.65it/s] 133it [00:28, 4.66it/s] 134it [00:29, 4.66it/s] 135it [00:29, 4.66it/s] 136it [00:29, 4.66it/s] 137it [00:29, 4.66it/s] 138it [00:30, 4.52it/s] 139it [00:30, 4.58it/s] 140it [00:30, 4.60it/s] 141it [00:30, 4.62it/s] 142it [00:30, 4.63it/s] 143it [00:31, 4.64it/s] 144it [00:31, 4.62it/s] 145it [00:31, 4.64it/s] 146it [00:31, 4.49it/s] 147it [00:32, 4.54it/s] 148it [00:32, 4.58it/s] 149it [00:32, 4.60it/s] 150it [00:32, 4.62it/s]2025-05-25 21:33:02,940 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 3932.0217 | mean log_px -0.0119 | KL -3150.20 + 151it [00:32, 4.63it/s] 152it [00:33, 4.64it/s] 153it [00:33, 4.65it/s] 154it [00:33, 4.65it/s] 155it [00:33, 4.51it/s] 156it [00:33, 4.57it/s] 157it [00:34, 4.60it/s] 158it [00:34, 4.60it/s] 159it [00:34, 4.59it/s] 160it [00:34, 4.61it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.61it/s] 163it [00:35, 4.64it/s] 164it [00:35, 4.51it/s] 165it [00:35, 4.56it/s] 166it [00:36, 4.59it/s] 167it [00:36, 4.61it/s] 168it [00:36, 4.62it/s] 169it [00:36, 4.63it/s] 170it [00:36, 4.62it/s] 171it [00:37, 4.48it/s] 172it [00:37, 4.52it/s] 173it [00:37, 4.42it/s] 174it [00:37, 4.46it/s] 175it [00:38, 4.52it/s] 176it [00:38, 4.56it/s] 177it [00:38, 4.59it/s] 178it [00:38, 4.47it/s] 179it [00:38, 4.55it/s] 180it [00:39, 4.58it/s] 181it [00:39, 4.60it/s] 182it [00:39, 4.62it/s] 183it [00:39, 4.64it/s] 184it [00:40, 4.45it/s] 185it [00:40, 4.50it/s] 186it [00:40, 4.56it/s] 187it [00:40, 4.60it/s] 188it [00:40, 4.62it/s] 189it [00:41, 4.63it/s] 190it [00:41, 4.48it/s] 191it [00:41, 4.54it/s] 192it [00:41, 4.57it/s] 193it [00:42, 4.59it/s] 194it [00:42, 4.61it/s] 195it [00:42, 4.37it/s] 196it [00:42, 4.47it/s] 196it [00:42, 4.58it/s] +2025-05-25 21:33:12,929 - INFO - Epoch: 5, Objective: tensor([4262.7358], device='cuda:0', grad_fn=), Loss: 0.01855652406811714, KL/n: 64.05235290527344 + 0it [00:00, ?it/s]2025-05-25 21:33:13,301 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 4869.3335 | mean log_px -0.0318 | KL -3135.65 + 1it [00:00, 3.32it/s] 2it [00:00, 3.79it/s] 3it [00:00, 4.18it/s] 4it [00:00, 4.36it/s] 5it [00:01, 4.47it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.58it/s] 8it [00:01, 4.60it/s] 9it [00:02, 4.63it/s] 10it [00:02, 4.62it/s] 11it [00:02, 4.50it/s] 12it [00:02, 4.53it/s] 13it [00:02, 4.59it/s] 14it [00:03, 4.61it/s] 15it [00:03, 4.63it/s] 16it [00:03, 4.47it/s] 17it [00:03, 4.53it/s] 18it [00:04, 4.41it/s] 19it [00:04, 4.50it/s] 20it [00:04, 4.55it/s] 21it [00:04, 4.59it/s] 22it [00:04, 4.60it/s] 23it [00:05, 4.63it/s] 24it [00:05, 4.48it/s] 25it [00:05, 4.55it/s] 26it [00:05, 3.66it/s] 27it [00:06, 3.91it/s] 28it [00:06, 4.11it/s] 29it [00:06, 4.27it/s] 30it [00:06, 4.25it/s] 31it [00:07, 4.37it/s] 32it [00:07, 4.45it/s] 33it [00:07, 4.52it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.59it/s] 36it [00:08, 4.46it/s] 37it [00:08, 4.52it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.48it/s] 40it [00:09, 4.54it/s] 41it [00:09, 4.59it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.63it/s] 44it [00:09, 4.48it/s] 45it [00:10, 4.55it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.64it/s] 50it [00:11, 4.49it/s]2025-05-25 21:33:24,425 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 7057.3750 | mean log_px -0.0627 | KL -3113.32 + 51it [00:11, 4.56it/s] 52it [00:11, 4.59it/s] 53it [00:11, 4.61it/s] 54it [00:12, 4.63it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.49it/s] 57it [00:12, 4.55it/s] 58it [00:12, 4.59it/s] 59it [00:13, 4.62it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.48it/s] 63it [00:14, 4.55it/s] 64it [00:14, 4.58it/s] 65it [00:14, 4.61it/s] 66it [00:14, 4.62it/s] 67it [00:14, 4.64it/s] 68it [00:15, 4.48it/s] 69it [00:15, 4.55it/s] 70it [00:15, 4.58it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.63it/s] 73it [00:16, 4.63it/s] 74it [00:16, 4.66it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.48it/s] 77it [00:17, 4.56it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.59it/s] 80it [00:17, 4.61it/s] 81it [00:17, 4.49it/s] 82it [00:18, 4.54it/s] 83it [00:18, 4.59it/s] 84it [00:18, 4.60it/s] 85it [00:18, 4.62it/s] 86it [00:19, 4.63it/s] 87it [00:19, 4.65it/s] 88it [00:19, 4.66it/s] 89it [00:19, 4.67it/s] 90it [00:19, 4.52it/s] 91it [00:20, 4.57it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.50it/s] 95it [00:21, 4.56it/s] 96it [00:21, 4.60it/s] 97it [00:21, 4.63it/s] 98it [00:21, 4.64it/s] 99it [00:21, 4.66it/s] 100it [00:22, 4.51it/s]2025-05-25 21:33:35,320 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 6381.2471 | mean log_px -0.0664 | KL -3103.59 + 101it [00:22, 4.57it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.64it/s] 105it [00:23, 4.66it/s] 106it [00:23, 4.66it/s] 107it [00:23, 4.67it/s] 108it [00:23, 4.67it/s] 109it [00:24, 4.53it/s] 110it [00:24, 4.57it/s] 111it [00:24, 4.61it/s] 112it [00:24, 4.63it/s] 113it [00:24, 4.65it/s] 114it [00:25, 4.51it/s] 115it [00:25, 4.57it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.64it/s] 119it [00:26, 4.56it/s] 120it [00:26, 4.52it/s] 121it [00:26, 4.52it/s] 122it [00:26, 4.43it/s] 123it [00:27, 4.47it/s] 124it [00:27, 4.48it/s] 125it [00:27, 4.54it/s] 126it [00:27, 4.58it/s] 127it [00:27, 4.61it/s] 128it [00:28, 4.49it/s] 129it [00:28, 4.56it/s] 130it [00:28, 4.54it/s] 131it [00:28, 4.58it/s] 132it [00:29, 4.60it/s] 133it [00:29, 4.63it/s] 134it [00:29, 4.64it/s] 135it [00:29, 4.65it/s] 136it [00:29, 4.66it/s] 137it [00:30, 4.52it/s] 138it [00:30, 4.57it/s] 139it [00:30, 4.61it/s] 140it [00:30, 4.63it/s] 141it [00:31, 4.64it/s] 142it [00:31, 4.65it/s] 143it [00:31, 4.66it/s] 144it [00:31, 4.67it/s] 145it [00:31, 4.68it/s] 146it [00:32, 4.52it/s] 147it [00:32, 4.58it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.63it/s] 150it [00:32, 4.64it/s]2025-05-25 21:33:46,194 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 4548.9775 | mean log_px -0.0281 | KL -3080.35 + 151it [00:33, 4.50it/s] 152it [00:33, 4.56it/s] 153it [00:33, 4.60it/s] 154it [00:33, 4.61it/s] 155it [00:34, 4.64it/s] 156it [00:34, 4.55it/s] 157it [00:34, 4.60it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.65it/s] 160it [00:35, 4.65it/s] 161it [00:35, 4.52it/s] 162it [00:35, 4.57it/s] 163it [00:35, 4.59it/s] 164it [00:36, 4.62it/s] 165it [00:36, 4.64it/s] 166it [00:36, 4.50it/s] 167it [00:36, 4.57it/s] 168it [00:36, 4.60it/s] 169it [00:37, 4.62it/s] 170it [00:37, 4.63it/s] 171it [00:37, 4.65it/s] 172it [00:37, 4.65it/s] 173it [00:37, 4.67it/s] 174it [00:38, 4.65it/s] 175it [00:38, 4.68it/s] 176it [00:38, 4.68it/s] 177it [00:38, 4.54it/s] 178it [00:39, 4.59it/s] 179it [00:39, 4.62it/s] 180it [00:39, 4.63it/s] 181it [00:39, 4.65it/s] 182it [00:39, 4.61it/s] 183it [00:40, 4.38it/s] 184it [00:40, 4.45it/s] 185it [00:40, 4.54it/s] 186it [00:40, 4.57it/s] 187it [00:41, 4.57it/s] 188it [00:41, 4.46it/s] 189it [00:41, 4.53it/s] 190it [00:41, 4.55it/s] 191it [00:41, 4.60it/s] 192it [00:42, 4.62it/s] 193it [00:42, 4.63it/s] 194it [00:42, 4.51it/s] 195it [00:42, 4.27it/s] 196it [00:43, 4.31it/s] 196it [00:43, 4.54it/s] +2025-05-25 21:33:56,210 - INFO - Epoch: 6, Objective: tensor([7316.6924], device='cuda:0', grad_fn=), Loss: 0.06832034140825272, KL/n: 62.47688674926758 + 0it [00:00, ?it/s]2025-05-25 21:33:56,621 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 5764.2217 | mean log_px -0.0439 | KL -3059.68 + 1it [00:00, 2.99it/s] 2it [00:00, 3.78it/s] 3it [00:00, 4.01it/s] 4it [00:00, 4.26it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.49it/s] 7it [00:01, 4.57it/s] 8it [00:01, 4.60it/s] 9it [00:02, 4.63it/s] 10it [00:02, 4.48it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.63it/s] 15it [00:03, 4.64it/s] 16it [00:03, 4.65it/s] 17it [00:03, 4.66it/s] 18it [00:04, 4.67it/s] 19it [00:04, 4.53it/s] 20it [00:04, 4.57it/s] 21it [00:04, 4.61it/s] 22it [00:04, 4.62it/s] 23it [00:05, 4.63it/s] 24it [00:05, 4.64it/s] 25it [00:05, 4.51it/s] 26it [00:05, 4.56it/s] 27it [00:05, 4.59it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.64it/s] 31it [00:06, 4.51it/s] 32it [00:07, 4.56it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.61it/s] 35it [00:07, 4.63it/s] 36it [00:07, 4.64it/s] 37it [00:08, 4.63it/s] 38it [00:08, 4.49it/s] 39it [00:08, 4.56it/s] 40it [00:08, 4.57it/s] 41it [00:09, 4.49it/s] 42it [00:09, 4.44it/s] 43it [00:09, 4.52it/s] 44it [00:09, 4.55it/s] 45it [00:09, 4.44it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.62it/s] 50it [00:11, 4.64it/s]2025-05-25 21:34:07,517 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 4438.1538 | mean log_px -0.0305 | KL -3042.06 + 51it [00:11, 4.50it/s] 52it [00:11, 4.56it/s] 53it [00:11, 4.60it/s] 54it [00:11, 4.62it/s] 55it [00:12, 4.63it/s] 56it [00:12, 4.65it/s] 57it [00:12, 4.50it/s] 58it [00:12, 4.56it/s] 59it [00:12, 4.58it/s] 60it [00:13, 4.54it/s] 61it [00:13, 4.58it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.62it/s] 64it [00:14, 4.64it/s] 65it [00:14, 4.42it/s] 66it [00:14, 4.50it/s] 67it [00:14, 4.56it/s] 68it [00:14, 4.59it/s] 69it [00:15, 4.63it/s] 70it [00:15, 4.62it/s] 71it [00:15, 4.64it/s] 72it [00:15, 4.49it/s] 73it [00:16, 4.55it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.62it/s] 77it [00:16, 4.64it/s] 78it [00:17, 4.53it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.59it/s] 81it [00:17, 4.62it/s] 82it [00:17, 4.63it/s] 83it [00:18, 4.65it/s] 84it [00:18, 4.50it/s] 85it [00:18, 4.57it/s] 86it [00:18, 4.60it/s] 87it [00:19, 4.62it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.63it/s] 91it [00:19, 4.50it/s] 92it [00:20, 4.56it/s] 93it [00:20, 4.59it/s] 94it [00:20, 4.60it/s] 95it [00:20, 4.61it/s] 96it [00:21, 4.62it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.49it/s] 99it [00:21, 4.55it/s] 100it [00:21, 4.58it/s]2025-05-25 21:34:18,434 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 3706.3210 | mean log_px -0.0132 | KL -3016.29 + 101it [00:22, 4.60it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.64it/s] 104it [00:22, 4.64it/s] 105it [00:23, 4.50it/s] 106it [00:23, 4.54it/s] 107it [00:23, 4.49it/s] 108it [00:23, 4.55it/s] 109it [00:23, 4.60it/s] 110it [00:24, 4.63it/s] 111it [00:24, 4.51it/s] 112it [00:24, 4.58it/s] 113it [00:24, 4.62it/s] 114it [00:25, 4.50it/s] 115it [00:25, 4.57it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.65it/s] 119it [00:26, 4.67it/s] 120it [00:26, 4.65it/s] 121it [00:26, 4.63it/s] 122it [00:26, 4.62it/s] 123it [00:26, 4.62it/s] 124it [00:27, 4.61it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.62it/s] 127it [00:27, 4.47it/s] 128it [00:28, 4.54it/s] 129it [00:28, 4.60it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.62it/s] 133it [00:29, 4.65it/s] 134it [00:29, 4.66it/s] 135it [00:29, 4.68it/s] 136it [00:29, 4.69it/s] 137it [00:29, 4.69it/s] 138it [00:30, 4.69it/s] 139it [00:30, 4.67it/s] 140it [00:30, 4.69it/s] 141it [00:30, 4.70it/s] 142it [00:31, 4.66it/s] 143it [00:31, 4.67it/s] 144it [00:31, 4.52it/s] 145it [00:31, 4.59it/s] 146it [00:31, 4.63it/s] 147it [00:32, 4.67it/s] 148it [00:32, 4.69it/s] 149it [00:32, 4.70it/s] 150it [00:32, 4.70it/s]2025-05-25 21:34:29,248 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 6590.7559 | mean log_px -0.0561 | KL -2995.29 + 151it [00:32, 4.54it/s] 152it [00:33, 4.61it/s] 153it [00:33, 4.65it/s] 154it [00:33, 4.67it/s] 155it [00:33, 4.69it/s] 156it [00:34, 4.54it/s] 157it [00:34, 4.61it/s] 158it [00:34, 4.64it/s] 159it [00:34, 4.67it/s] 160it [00:34, 4.68it/s] 161it [00:35, 4.70it/s] 162it [00:35, 4.71it/s] 163it [00:35, 4.71it/s] 164it [00:35, 4.71it/s] 165it [00:35, 4.72it/s] 166it [00:36, 4.72it/s] 167it [00:36, 4.55it/s] 168it [00:36, 4.62it/s] 169it [00:36, 4.65it/s] 170it [00:37, 4.67it/s] 171it [00:37, 4.69it/s] 172it [00:37, 4.69it/s] 173it [00:37, 4.71it/s] 174it [00:37, 4.71it/s] 175it [00:38, 4.72it/s] 176it [00:38, 4.56it/s] 177it [00:38, 4.62it/s] 178it [00:38, 4.65it/s] 179it [00:38, 4.68it/s] 180it [00:39, 4.69it/s] 181it [00:39, 4.70it/s] 182it [00:39, 4.71it/s] 183it [00:39, 4.72it/s] 184it [00:40, 4.72it/s] 185it [00:40, 4.72it/s] 186it [00:40, 4.55it/s] 187it [00:40, 4.62it/s] 188it [00:40, 4.65it/s] 189it [00:41, 4.67it/s] 190it [00:41, 4.66it/s] 191it [00:41, 4.70it/s] 192it [00:41, 4.70it/s] 193it [00:41, 4.71it/s] 194it [00:42, 4.71it/s] 195it [00:42, 4.40it/s] 196it [00:42, 4.52it/s] 196it [00:42, 4.59it/s] +2025-05-25 21:34:39,052 - INFO - Epoch: 7, Objective: tensor([5831.9897], device='cuda:0', grad_fn=), Loss: 0.03322037681937218, KL/n: 60.5771369934082 + 0it [00:00, ?it/s]2025-05-25 21:34:39,615 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 3881.9414 | mean log_px -0.0130 | KL -2970.20 + 1it [00:00, 3.17it/s] 2it [00:00, 3.86it/s] 3it [00:00, 4.05it/s] 4it [00:01, 4.02it/s] 5it [00:01, 4.24it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.50it/s] 8it [00:01, 4.54it/s] 9it [00:02, 4.56it/s] 10it [00:02, 4.50it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.49it/s] 13it [00:02, 4.51it/s] 14it [00:03, 4.54it/s] 15it [00:03, 4.39it/s] 16it [00:03, 4.47it/s] 17it [00:03, 4.48it/s] 18it [00:04, 4.47it/s] 19it [00:04, 4.54it/s] 20it [00:04, 4.59it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.65it/s] 23it [00:05, 4.67it/s] 24it [00:05, 4.65it/s] 25it [00:05, 4.67it/s] 26it [00:05, 4.69it/s] 27it [00:06, 4.55it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.67it/s] 32it [00:07, 4.68it/s] 33it [00:07, 4.69it/s] 34it [00:07, 4.70it/s] 35it [00:07, 4.71it/s] 36it [00:07, 4.71it/s] 37it [00:08, 4.71it/s] 38it [00:08, 4.71it/s] 39it [00:08, 4.72it/s] 40it [00:08, 4.71it/s] 41it [00:09, 4.72it/s] 42it [00:09, 4.72it/s] 43it [00:09, 4.72it/s] 44it [00:09, 4.71it/s] 45it [00:09, 4.72it/s] 46it [00:10, 4.71it/s] 47it [00:10, 4.72it/s] 48it [00:10, 4.72it/s] 49it [00:10, 4.68it/s] 50it [00:10, 4.68it/s]2025-05-25 21:34:50,434 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 4140.3315 | mean log_px -0.0194 | KL -2946.16 + 51it [00:11, 4.69it/s] 52it [00:11, 4.69it/s] 53it [00:11, 4.71it/s] 54it [00:11, 4.70it/s] 55it [00:11, 4.71it/s] 56it [00:12, 4.71it/s] 57it [00:12, 4.69it/s] 58it [00:12, 4.69it/s] 59it [00:12, 4.70it/s] 60it [00:13, 4.70it/s] 61it [00:13, 4.70it/s] 62it [00:13, 4.71it/s] 63it [00:13, 4.71it/s] 64it [00:13, 4.71it/s] 65it [00:14, 4.72it/s] 66it [00:14, 4.70it/s] 67it [00:14, 4.71it/s] 68it [00:14, 4.71it/s] 69it [00:14, 4.72it/s] 70it [00:15, 4.71it/s] 71it [00:15, 4.72it/s] 72it [00:15, 4.71it/s] 73it [00:15, 4.72it/s] 74it [00:16, 4.72it/s] 75it [00:16, 4.72it/s] 76it [00:16, 4.72it/s] 77it [00:16, 4.74it/s] 78it [00:16, 4.71it/s] 79it [00:17, 4.71it/s] 80it [00:17, 4.70it/s] 81it [00:17, 4.70it/s] 82it [00:17, 4.68it/s] 83it [00:17, 4.68it/s] 84it [00:18, 4.69it/s] 85it [00:18, 4.70it/s] 86it [00:18, 4.70it/s] 87it [00:18, 4.71it/s] 88it [00:18, 4.70it/s] 89it [00:19, 4.71it/s] 90it [00:19, 4.68it/s] 91it [00:19, 4.69it/s] 92it [00:19, 4.70it/s] 93it [00:20, 4.71it/s] 94it [00:20, 4.71it/s] 95it [00:20, 4.71it/s] 96it [00:20, 4.71it/s] 97it [00:20, 4.71it/s] 98it [00:21, 4.73it/s] 99it [00:21, 4.73it/s] 100it [00:21, 4.73it/s]2025-05-25 21:35:01,055 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 3203.0884 | mean log_px -0.0045 | KL -2923.38 + 101it [00:21, 4.56it/s] 102it [00:21, 4.59it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.60it/s] 105it [00:22, 4.63it/s] 106it [00:22, 4.65it/s] 107it [00:23, 4.60it/s] 108it [00:23, 4.64it/s] 109it [00:23, 4.67it/s] 110it [00:23, 4.68it/s] 111it [00:23, 4.70it/s] 112it [00:24, 4.70it/s] 113it [00:24, 4.71it/s] 114it [00:24, 4.71it/s] 115it [00:24, 4.73it/s] 116it [00:24, 4.72it/s] 117it [00:25, 4.73it/s] 118it [00:25, 4.55it/s] 119it [00:25, 4.62it/s] 120it [00:25, 4.65it/s] 121it [00:26, 4.68it/s] 122it [00:26, 4.69it/s] 123it [00:26, 4.70it/s] 124it [00:26, 4.71it/s] 125it [00:26, 4.72it/s] 126it [00:27, 4.71it/s] 127it [00:27, 4.55it/s] 128it [00:27, 4.61it/s] 129it [00:27, 4.64it/s] 130it [00:27, 4.66it/s] 131it [00:28, 4.68it/s] 132it [00:28, 4.68it/s] 133it [00:28, 4.70it/s] 134it [00:28, 4.70it/s] 135it [00:29, 4.71it/s] 136it [00:29, 4.71it/s] 137it [00:29, 4.72it/s] 138it [00:29, 4.72it/s] 139it [00:29, 4.72it/s] 140it [00:30, 4.55it/s] 141it [00:30, 4.60it/s] 142it [00:30, 4.63it/s] 143it [00:30, 4.66it/s] 144it [00:30, 4.67it/s] 145it [00:31, 4.69it/s] 146it [00:31, 4.70it/s] 147it [00:31, 4.71it/s] 148it [00:31, 4.71it/s] 149it [00:32, 4.56it/s] 150it [00:32, 4.61it/s]2025-05-25 21:35:11,792 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 3672.0759 | mean log_px -0.0163 | KL -2904.56 + 151it [00:32, 4.64it/s] 152it [00:32, 4.67it/s] 153it [00:32, 4.69it/s] 154it [00:33, 4.69it/s] 155it [00:33, 4.50it/s] 156it [00:33, 4.52it/s] 157it [00:33, 4.58it/s] 158it [00:34, 4.61it/s] 159it [00:34, 4.65it/s] 160it [00:34, 4.66it/s] 161it [00:34, 4.67it/s] 162it [00:34, 4.51it/s] 163it [00:35, 4.34it/s] 164it [00:35, 4.46it/s] 165it [00:35, 4.54it/s] 166it [00:35, 4.59it/s] 167it [00:35, 4.63it/s] 168it [00:36, 4.65it/s] 169it [00:36, 4.67it/s] 170it [00:36, 4.68it/s] 171it [00:36, 4.69it/s] 172it [00:37, 4.70it/s] 173it [00:37, 4.71it/s] 174it [00:37, 4.72it/s] 175it [00:37, 4.72it/s] 176it [00:37, 4.72it/s] 177it [00:38, 4.72it/s] 178it [00:38, 4.72it/s] 179it [00:38, 4.72it/s] 180it [00:38, 4.73it/s] 181it [00:38, 4.73it/s] 182it [00:39, 4.73it/s] 183it [00:39, 4.72it/s] 184it [00:39, 4.72it/s] 185it [00:39, 4.72it/s] 186it [00:40, 4.72it/s] 187it [00:40, 4.73it/s] 188it [00:40, 4.73it/s] 189it [00:40, 4.73it/s] 190it [00:40, 4.72it/s] 191it [00:41, 4.72it/s] 192it [00:41, 4.73it/s] 193it [00:41, 4.73it/s] 194it [00:41, 4.72it/s] 195it [00:41, 4.53it/s] 196it [00:42, 4.41it/s] 196it [00:42, 4.64it/s] +2025-05-25 21:35:21,613 - INFO - Epoch: 8, Objective: tensor([4215.5410], device='cuda:0', grad_fn=), Loss: 0.014363881200551987, KL/n: 58.71515655517578 + 0it [00:00, ?it/s]2025-05-25 21:35:22,021 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 3831.5950 | mean log_px -0.0261 | KL -2873.97 + 1it [00:00, 2.96it/s] 2it [00:00, 3.79it/s] 3it [00:00, 4.18it/s] 4it [00:00, 4.37it/s] 5it [00:01, 4.50it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.62it/s] 8it [00:01, 4.66it/s] 9it [00:02, 4.68it/s] 10it [00:02, 4.69it/s] 11it [00:02, 3.63it/s] 12it [00:02, 3.91it/s] 13it [00:03, 4.13it/s] 14it [00:03, 4.29it/s] 15it [00:03, 4.42it/s] 16it [00:03, 4.31it/s] 17it [00:03, 4.44it/s] 18it [00:04, 4.52it/s] 19it [00:04, 4.59it/s] 20it [00:04, 4.62it/s] 21it [00:04, 4.66it/s] 22it [00:05, 4.68it/s] 23it [00:05, 4.70it/s] 24it [00:05, 4.70it/s] 25it [00:05, 4.71it/s] 26it [00:05, 4.71it/s] 27it [00:06, 4.72it/s] 28it [00:06, 4.71it/s] 29it [00:06, 4.72it/s] 30it [00:06, 4.72it/s] 31it [00:06, 4.72it/s] 32it [00:07, 4.73it/s] 33it [00:07, 4.73it/s] 34it [00:07, 4.72it/s] 35it [00:07, 4.73it/s] 36it [00:07, 4.72it/s] 37it [00:08, 4.73it/s] 38it [00:08, 4.71it/s] 39it [00:08, 4.74it/s] 40it [00:08, 4.74it/s] 41it [00:09, 4.74it/s] 42it [00:09, 4.73it/s] 43it [00:09, 4.74it/s] 44it [00:09, 4.73it/s] 45it [00:09, 4.73it/s] 46it [00:10, 4.73it/s] 47it [00:10, 4.74it/s] 48it [00:10, 4.73it/s] 49it [00:10, 4.74it/s] 50it [00:10, 4.73it/s]2025-05-25 21:35:32,839 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 3554.7034 | mean log_px -0.0139 | KL -2847.36 + 51it [00:11, 4.55it/s] 52it [00:11, 4.61it/s] 53it [00:11, 4.65it/s] 54it [00:11, 4.67it/s] 55it [00:12, 4.68it/s] 56it [00:12, 4.51it/s] 57it [00:12, 4.58it/s] 58it [00:12, 4.62it/s] 59it [00:12, 4.61it/s] 60it [00:13, 4.63it/s] 61it [00:13, 4.67it/s] 62it [00:13, 4.68it/s] 63it [00:13, 4.70it/s] 64it [00:13, 4.70it/s] 65it [00:14, 4.71it/s] 66it [00:14, 4.71it/s] 67it [00:14, 4.72it/s] 68it [00:14, 4.72it/s] 69it [00:15, 4.70it/s] 70it [00:15, 4.72it/s] 71it [00:15, 4.73it/s] 72it [00:15, 4.72it/s] 73it [00:15, 4.73it/s] 74it [00:16, 4.73it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.64it/s] 77it [00:16, 4.68it/s] 78it [00:16, 4.69it/s] 79it [00:17, 4.70it/s] 80it [00:17, 4.70it/s] 81it [00:17, 4.71it/s] 82it [00:17, 4.71it/s] 83it [00:17, 4.72it/s] 84it [00:18, 4.72it/s] 85it [00:18, 4.73it/s] 86it [00:18, 4.72it/s] 87it [00:18, 4.73it/s] 88it [00:19, 4.72it/s] 89it [00:19, 4.73it/s] 90it [00:19, 4.73it/s] 91it [00:19, 4.73it/s] 92it [00:19, 4.59it/s] 93it [00:20, 4.65it/s] 94it [00:20, 4.67it/s] 95it [00:20, 4.69it/s] 96it [00:20, 4.70it/s] 97it [00:20, 4.70it/s] 98it [00:21, 4.71it/s] 99it [00:21, 4.72it/s] 100it [00:21, 4.71it/s]2025-05-25 21:35:43,517 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 3406.7056 | mean log_px -0.0110 | KL -2821.77 + 101it [00:21, 4.55it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.65it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.68it/s] 106it [00:22, 4.69it/s] 107it [00:23, 4.54it/s] 108it [00:23, 4.61it/s] 109it [00:23, 4.65it/s] 110it [00:23, 4.67it/s] 111it [00:24, 4.60it/s] 112it [00:24, 4.60it/s] 113it [00:24, 4.64it/s] 114it [00:24, 4.66it/s] 115it [00:24, 4.68it/s] 116it [00:25, 4.68it/s] 117it [00:25, 4.71it/s] 118it [00:25, 4.53it/s] 119it [00:25, 4.60it/s] 120it [00:25, 4.64it/s] 121it [00:26, 4.67it/s] 122it [00:26, 4.68it/s] 123it [00:26, 4.50it/s] 124it [00:26, 4.57it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.65it/s] 127it [00:27, 4.67it/s] 128it [00:27, 4.68it/s] 129it [00:27, 4.70it/s] 130it [00:28, 4.71it/s] 131it [00:28, 4.71it/s] 132it [00:28, 4.72it/s] 133it [00:28, 4.72it/s] 134it [00:28, 4.72it/s] 135it [00:29, 4.73it/s] 136it [00:29, 4.73it/s] 137it [00:29, 4.73it/s] 138it [00:29, 4.72it/s] 139it [00:29, 4.70it/s] 140it [00:30, 4.70it/s] 141it [00:30, 4.71it/s] 142it [00:30, 4.71it/s] 143it [00:30, 4.72it/s] 144it [00:31, 4.71it/s] 145it [00:31, 4.72it/s] 146it [00:31, 4.60it/s] 147it [00:31, 4.66it/s] 148it [00:31, 4.67it/s] 149it [00:32, 4.69it/s] 150it [00:32, 4.70it/s]2025-05-25 21:35:54,242 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 5147.5215 | mean log_px -0.0361 | KL -2803.57 + 151it [00:32, 4.54it/s] 152it [00:32, 4.61it/s] 153it [00:32, 4.65it/s] 154it [00:33, 4.66it/s] 155it [00:33, 4.68it/s] 156it [00:33, 4.69it/s] 157it [00:33, 4.71it/s] 158it [00:34, 4.71it/s] 159it [00:34, 4.72it/s] 160it [00:34, 4.72it/s] 161it [00:34, 4.72it/s] 162it [00:34, 4.71it/s] 163it [00:35, 4.60it/s] 164it [00:35, 4.66it/s] 165it [00:35, 4.68it/s] 166it [00:35, 4.69it/s] 167it [00:35, 4.70it/s] 168it [00:36, 4.71it/s] 169it [00:36, 4.72it/s] 170it [00:36, 4.71it/s] 171it [00:36, 4.72it/s] 172it [00:37, 4.72it/s] 173it [00:37, 4.72it/s] 174it [00:37, 4.72it/s] 175it [00:37, 4.71it/s] 176it [00:37, 4.51it/s] 177it [00:38, 4.54it/s] 178it [00:38, 4.58it/s] 179it [00:38, 4.63it/s] 180it [00:38, 4.66it/s] 181it [00:38, 4.68it/s] 182it [00:39, 4.69it/s] 183it [00:39, 4.70it/s] 184it [00:39, 4.70it/s] 185it [00:39, 4.71it/s] 186it [00:40, 4.52it/s] 187it [00:40, 4.60it/s] 188it [00:40, 4.63it/s] 189it [00:40, 4.66it/s] 190it [00:40, 4.68it/s] 191it [00:41, 4.69it/s] 192it [00:41, 4.70it/s] 193it [00:41, 4.51it/s] 194it [00:41, 4.59it/s] 195it [00:42, 4.44it/s] 196it [00:42, 4.42it/s] 196it [00:42, 4.63it/s] +2025-05-25 21:36:04,079 - INFO - Epoch: 9, Objective: tensor([4143.1064], device='cuda:0', grad_fn=), Loss: 0.02341052144765854, KL/n: 56.89252471923828 + 0it [00:00, ?it/s]2025-05-25 21:36:04,460 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 3292.7747 | mean log_px -0.0090 | KL -2785.48 + 1it [00:00, 3.23it/s] 2it [00:00, 3.96it/s] 3it [00:00, 4.05it/s] 4it [00:00, 4.33it/s] 5it [00:01, 4.43it/s] 6it [00:01, 4.52it/s] 7it [00:01, 4.60it/s] 8it [00:01, 4.64it/s] 9it [00:02, 4.68it/s] 10it [00:02, 4.68it/s] 11it [00:02, 4.71it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.66it/s] 14it [00:03, 4.68it/s] 15it [00:03, 4.70it/s] 16it [00:03, 4.72it/s] 17it [00:03, 4.74it/s] 18it [00:03, 4.73it/s] 19it [00:04, 4.74it/s] 20it [00:04, 4.73it/s] 21it [00:04, 4.74it/s] 22it [00:04, 4.73it/s] 23it [00:04, 4.74it/s] 24it [00:05, 4.74it/s] 25it [00:05, 4.74it/s] 26it [00:05, 4.74it/s] 27it [00:05, 4.74it/s] 28it [00:06, 4.57it/s] 29it [00:06, 4.64it/s] 30it [00:06, 4.67it/s] 31it [00:06, 4.70it/s] 32it [00:06, 4.67it/s] 33it [00:07, 4.70it/s] 34it [00:07, 4.71it/s] 35it [00:07, 4.72it/s] 36it [00:07, 4.71it/s] 37it [00:07, 4.73it/s] 38it [00:08, 4.73it/s] 39it [00:08, 4.73it/s] 40it [00:08, 4.73it/s] 41it [00:08, 4.74it/s] 42it [00:09, 4.73it/s] 43it [00:09, 4.73it/s] 44it [00:09, 4.56it/s] 45it [00:09, 4.64it/s] 46it [00:09, 4.66it/s] 47it [00:10, 4.69it/s] 48it [00:10, 4.70it/s] 49it [00:10, 4.55it/s] 50it [00:10, 4.62it/s]2025-05-25 21:36:15,136 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 3255.0281 | mean log_px -0.0100 | KL -2764.80 + 51it [00:10, 4.65it/s] 52it [00:11, 4.67it/s] 53it [00:11, 4.69it/s] 54it [00:11, 4.70it/s] 55it [00:11, 4.72it/s] 56it [00:12, 4.72it/s] 57it [00:12, 4.73it/s] 58it [00:12, 4.56it/s] 59it [00:12, 4.62it/s] 60it [00:12, 4.57it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.66it/s] 63it [00:13, 4.69it/s] 64it [00:13, 4.70it/s] 65it [00:13, 4.70it/s] 66it [00:14, 4.71it/s] 67it [00:14, 4.72it/s] 68it [00:14, 4.72it/s] 69it [00:14, 4.73it/s] 70it [00:15, 4.71it/s] 71it [00:15, 4.72it/s] 72it [00:15, 4.73it/s] 73it [00:15, 4.74it/s] 74it [00:15, 4.73it/s] 75it [00:16, 4.74it/s] 76it [00:16, 4.73it/s] 77it [00:16, 4.74it/s] 78it [00:16, 4.74it/s] 79it [00:16, 4.74it/s] 80it [00:17, 4.74it/s] 81it [00:17, 4.74it/s] 82it [00:17, 4.74it/s] 83it [00:17, 4.74it/s] 84it [00:17, 4.74it/s] 85it [00:18, 4.74it/s] 86it [00:18, 4.67it/s] 87it [00:18, 4.69it/s] 88it [00:18, 4.71it/s] 89it [00:19, 4.72it/s] 90it [00:19, 4.72it/s] 91it [00:19, 4.56it/s] 92it [00:19, 4.63it/s] 93it [00:19, 4.66it/s] 94it [00:20, 4.69it/s] 95it [00:20, 4.70it/s] 96it [00:20, 4.47it/s] 97it [00:20, 4.56it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.65it/s] 100it [00:21, 4.68it/s]2025-05-25 21:36:25,795 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 3816.2234 | mean log_px -0.0176 | KL -2740.36 + 101it [00:21, 4.53it/s] 102it [00:21, 4.61it/s] 103it [00:22, 4.65it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.68it/s] 106it [00:22, 4.69it/s] 107it [00:22, 4.71it/s] 108it [00:23, 4.71it/s] 109it [00:23, 4.74it/s] 110it [00:23, 4.74it/s] 111it [00:23, 4.74it/s] 112it [00:23, 4.75it/s] 113it [00:24, 4.75it/s] 114it [00:24, 4.75it/s] 115it [00:24, 4.75it/s] 116it [00:24, 4.75it/s] 117it [00:25, 4.75it/s] 118it [00:25, 4.75it/s] 119it [00:25, 4.75it/s] 120it [00:25, 4.74it/s] 121it [00:25, 4.75it/s] 122it [00:26, 4.74it/s] 123it [00:26, 4.75it/s] 124it [00:26, 4.75it/s] 125it [00:26, 4.75it/s] 126it [00:26, 4.75it/s] 127it [00:27, 4.76it/s] 128it [00:27, 4.75it/s] 129it [00:27, 4.75it/s] 130it [00:27, 4.75it/s] 131it [00:27, 4.75it/s] 132it [00:28, 4.75it/s] 133it [00:28, 4.75it/s] 134it [00:28, 4.75it/s] 135it [00:28, 4.75it/s] 136it [00:29, 4.75it/s] 137it [00:29, 4.75it/s] 138it [00:29, 4.58it/s] 139it [00:29, 4.61it/s] 140it [00:29, 4.66it/s] 141it [00:30, 4.69it/s] 142it [00:30, 4.70it/s] 143it [00:30, 4.55it/s] 144it [00:30, 4.62it/s] 145it [00:30, 4.64it/s] 146it [00:31, 4.66it/s] 147it [00:31, 4.69it/s] 148it [00:31, 4.70it/s] 149it [00:31, 4.71it/s] 150it [00:32, 4.71it/s]2025-05-25 21:36:36,410 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 4118.2427 | mean log_px -0.0299 | KL -2717.40 + 151it [00:32, 4.55it/s] 152it [00:32, 4.62it/s] 153it [00:32, 4.66it/s] 154it [00:32, 4.68it/s] 155it [00:33, 4.70it/s] 156it [00:33, 4.72it/s] 157it [00:33, 4.56it/s] 158it [00:33, 4.63it/s] 159it [00:33, 4.67it/s] 160it [00:34, 4.69it/s] 161it [00:34, 4.70it/s] 162it [00:34, 4.72it/s] 163it [00:34, 4.73it/s] 164it [00:35, 4.74it/s] 165it [00:35, 4.74it/s] 166it [00:35, 4.74it/s] 167it [00:35, 4.74it/s] 168it [00:35, 4.75it/s] 169it [00:36, 4.75it/s] 170it [00:36, 4.75it/s] 171it [00:36, 4.76it/s] 172it [00:36, 4.74it/s] 173it [00:36, 4.75it/s] 174it [00:37, 4.75it/s] 175it [00:37, 4.75it/s] 176it [00:37, 4.74it/s] 177it [00:37, 4.74it/s] 178it [00:38, 4.57it/s] 179it [00:38, 4.63it/s] 180it [00:38, 4.66it/s] 181it [00:38, 4.69it/s] 182it [00:38, 4.70it/s] 183it [00:39, 4.72it/s] 184it [00:39, 4.72it/s] 185it [00:39, 4.56it/s] 186it [00:39, 4.63it/s] 187it [00:39, 4.67it/s] 188it [00:40, 4.69it/s] 189it [00:40, 4.71it/s] 190it [00:40, 4.71it/s] 191it [00:40, 4.73it/s] 192it [00:40, 4.73it/s] 193it [00:41, 4.51it/s] 194it [00:41, 4.59it/s] 195it [00:41, 4.55it/s] 196it [00:41, 4.47it/s] 196it [00:41, 4.67it/s] +2025-05-25 21:36:46,179 - INFO - Epoch: 10, Objective: tensor([2976.3257], device='cuda:0', grad_fn=), Loss: 0.00489531084895134, KL/n: 55.191680908203125 + 0it [00:00, ?it/s]2025-05-25 21:36:46,747 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 3065.4336 | mean log_px -0.0064 | KL -2701.94 + 1it [00:00, 3.08it/s] 2it [00:00, 3.73it/s] 3it [00:00, 4.02it/s] 4it [00:01, 4.03it/s] 5it [00:01, 4.15it/s] 6it [00:01, 4.24it/s] 7it [00:01, 4.32it/s] 8it [00:01, 4.38it/s] 9it [00:02, 4.16it/s] 10it [00:02, 4.19it/s] 11it [00:02, 4.33it/s] 12it [00:02, 4.30it/s] 13it [00:03, 4.21it/s] 14it [00:03, 4.23it/s] 15it [00:03, 4.24it/s] 16it [00:03, 4.30it/s] 17it [00:04, 4.40it/s] 18it [00:04, 4.40it/s] 19it [00:04, 4.45it/s] 20it [00:04, 4.37it/s] 21it [00:04, 4.21it/s] 22it [00:05, 4.27it/s] 23it [00:05, 4.26it/s] 24it [00:05, 4.30it/s] 25it [00:05, 4.33it/s] 26it [00:06, 4.32it/s] 27it [00:06, 4.35it/s] 28it [00:06, 4.32it/s] 29it [00:06, 4.35it/s] 30it [00:07, 4.25it/s] 31it [00:07, 4.27it/s] 32it [00:07, 4.27it/s] 33it [00:07, 4.30it/s] 34it [00:07, 4.39it/s] 35it [00:08, 4.33it/s] 36it [00:08, 4.33it/s] 37it [00:08, 4.36it/s] 38it [00:08, 4.43it/s] 39it [00:09, 4.38it/s] 40it [00:09, 4.36it/s] 41it [00:09, 4.37it/s] 42it [00:09, 4.34it/s] 43it [00:10, 4.46it/s] 44it [00:10, 4.28it/s] 45it [00:10, 4.31it/s] 46it [00:10, 4.27it/s] 47it [00:10, 4.27it/s] 48it [00:11, 4.30it/s] 49it [00:11, 4.40it/s] 50it [00:11, 4.33it/s]2025-05-25 21:36:58,320 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 3133.4580 | mean log_px -0.0073 | KL -2682.37 + 51it [00:11, 4.31it/s] 52it [00:12, 4.33it/s] 53it [00:12, 4.34it/s] 54it [00:12, 4.33it/s] 55it [00:12, 4.43it/s] 56it [00:13, 4.50it/s] 57it [00:13, 4.41it/s] 58it [00:13, 4.38it/s] 59it [00:13, 4.39it/s] 60it [00:13, 4.36it/s] 61it [00:14, 4.34it/s] 62it [00:14, 4.35it/s] 63it [00:14, 4.44it/s] 64it [00:14, 4.49it/s] 65it [00:15, 4.51it/s] 66it [00:15, 4.31it/s] 67it [00:15, 4.30it/s] 68it [00:15, 4.34it/s] 69it [00:16, 4.32it/s] 70it [00:16, 4.42it/s] 71it [00:16, 4.28it/s] 72it [00:16, 4.29it/s] 73it [00:16, 4.31it/s] 74it [00:17, 4.32it/s] 75it [00:17, 4.34it/s] 76it [00:17, 4.43it/s] 77it [00:17, 4.52it/s] 78it [00:18, 4.53it/s] 79it [00:18, 4.49it/s] 80it [00:18, 4.28it/s] 81it [00:18, 4.32it/s] 82it [00:18, 4.31it/s] 83it [00:19, 4.39it/s] 84it [00:19, 4.34it/s] 85it [00:19, 4.35it/s] 86it [00:19, 4.45it/s] 87it [00:20, 4.53it/s] 88it [00:20, 4.50it/s] 89it [00:20, 4.39it/s] 90it [00:20, 4.37it/s] 91it [00:21, 4.35it/s] 92it [00:21, 4.45it/s] 93it [00:21, 4.46it/s] 94it [00:21, 4.26it/s] 95it [00:21, 4.32it/s] 96it [00:22, 4.44it/s] 97it [00:22, 4.34it/s] 98it [00:22, 4.29it/s] 99it [00:22, 4.24it/s] 100it [00:23, 4.24it/s]2025-05-25 21:37:09,766 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 4312.6279 | mean log_px -0.0334 | KL -2658.71 + 101it [00:23, 4.25it/s] 102it [00:23, 4.20it/s] 103it [00:23, 4.23it/s] 104it [00:24, 4.29it/s] 105it [00:24, 4.30it/s] 106it [00:24, 4.18it/s] 107it [00:24, 4.22it/s] 108it [00:24, 4.26it/s] 109it [00:25, 4.37it/s] 110it [00:25, 4.33it/s] 111it [00:25, 4.41it/s] 112it [00:25, 4.48it/s] 113it [00:26, 4.51it/s] 114it [00:26, 4.46it/s] 115it [00:26, 4.53it/s] 116it [00:26, 4.49it/s] 117it [00:26, 4.45it/s] 118it [00:27, 4.54it/s] 119it [00:27, 4.55it/s] 120it [00:27, 4.51it/s] 121it [00:27, 4.45it/s] 122it [00:28, 4.42it/s] 123it [00:28, 4.46it/s] 124it [00:28, 4.53it/s] 125it [00:28, 4.59it/s] 126it [00:28, 4.50it/s] 127it [00:29, 4.45it/s] 128it [00:29, 4.40it/s] 129it [00:29, 4.40it/s] 130it [00:29, 4.39it/s] 131it [00:30, 4.46it/s] 132it [00:30, 4.41it/s] 133it [00:30, 4.40it/s] 134it [00:30, 4.38it/s] 135it [00:31, 4.38it/s] 136it [00:31, 4.37it/s] 137it [00:31, 4.47it/s] 138it [00:31, 4.54it/s] 139it [00:31, 4.55it/s] 140it [00:32, 4.58it/s] 141it [00:32, 4.53it/s] 142it [00:32, 4.60it/s] 143it [00:32, 4.61it/s] 144it [00:32, 4.63it/s] 145it [00:33, 4.43it/s] 146it [00:33, 4.35it/s] 147it [00:33, 4.28it/s] 148it [00:33, 4.29it/s] 149it [00:34, 4.40it/s] 150it [00:34, 4.33it/s]2025-05-25 21:37:21,054 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 3104.3960 | mean log_px -0.0096 | KL -2631.08 + 151it [00:34, 4.27it/s] 152it [00:34, 4.29it/s] 153it [00:35, 4.41it/s] 154it [00:35, 4.46it/s] 155it [00:35, 4.49it/s] 156it [00:35, 4.51it/s] 157it [00:35, 4.54it/s] 158it [00:36, 4.46it/s] 159it [00:36, 4.45it/s] 160it [00:36, 4.44it/s] 161it [00:36, 4.50it/s] 162it [00:37, 4.47it/s] 163it [00:37, 4.56it/s] 164it [00:37, 4.47it/s] 165it [00:37, 4.38it/s] 166it [00:38, 4.39it/s] 167it [00:38, 4.39it/s] 168it [00:38, 4.37it/s] 169it [00:38, 4.35it/s] 170it [00:38, 4.36it/s] 171it [00:39, 4.37it/s] 172it [00:39, 4.37it/s] 173it [00:39, 4.46it/s] 174it [00:39, 4.52it/s] 175it [00:40, 4.49it/s] 176it [00:40, 4.34it/s] 177it [00:40, 4.26it/s] 178it [00:40, 4.29it/s] 179it [00:40, 4.34it/s] 180it [00:41, 4.32it/s] 181it [00:41, 4.31it/s] 182it [00:41, 4.20it/s] 183it [00:41, 4.27it/s] 184it [00:42, 4.30it/s] 185it [00:42, 4.38it/s] 186it [00:42, 4.38it/s] 187it [00:42, 4.36it/s] 188it [00:43, 4.32it/s] 189it [00:43, 4.39it/s] 190it [00:43, 4.35it/s] 191it [00:43, 4.21it/s] 192it [00:43, 4.36it/s] 193it [00:44, 4.39it/s] 194it [00:44, 4.43it/s] 195it [00:44, 4.33it/s] 196it [00:44, 4.42it/s] 196it [00:44, 4.36it/s] +2025-05-25 21:37:31,448 - INFO - Epoch: 11, Objective: tensor([4247.3716], device='cuda:0', grad_fn=), Loss: 0.031174693256616592, KL/n: 53.34761047363281 + 0it [00:00, ?it/s]2025-05-25 21:37:31,854 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 3012.1206 | mean log_px -0.0057 | KL -2611.20 + 1it [00:00, 2.82it/s] 2it [00:00, 3.63it/s] 3it [00:00, 4.06it/s] 4it [00:01, 4.27it/s] 5it [00:01, 4.42it/s] 6it [00:01, 4.27it/s] 7it [00:01, 4.41it/s] 8it [00:02, 3.53it/s] 9it [00:02, 3.83it/s] 10it [00:02, 4.04it/s] 11it [00:02, 4.14it/s] 12it [00:02, 4.20it/s] 13it [00:03, 4.29it/s] 14it [00:03, 4.18it/s] 15it [00:03, 4.30it/s] 16it [00:03, 4.37it/s] 17it [00:04, 4.46it/s] 18it [00:04, 4.52it/s] 19it [00:04, 4.47it/s] 20it [00:04, 4.49it/s] 21it [00:04, 4.55it/s] 22it [00:05, 4.43it/s] 23it [00:05, 4.41it/s] 24it [00:05, 4.36it/s] 25it [00:05, 4.36it/s] 26it [00:06, 4.37it/s] 27it [00:06, 4.40it/s] 28it [00:06, 4.47it/s] 29it [00:06, 4.47it/s] 30it [00:07, 4.44it/s] 31it [00:07, 4.41it/s] 32it [00:07, 4.40it/s] 33it [00:07, 4.34it/s] 34it [00:07, 4.19it/s] 35it [00:08, 4.23it/s] 36it [00:08, 4.22it/s] 37it [00:08, 4.35it/s] 38it [00:08, 4.33it/s] 39it [00:09, 4.29it/s] 40it [00:09, 4.13it/s] 41it [00:09, 4.21it/s] 42it [00:09, 4.31it/s] 43it [00:10, 4.37it/s] 44it [00:10, 4.29it/s] 45it [00:10, 4.41it/s] 46it [00:10, 4.42it/s] 47it [00:11, 4.18it/s] 48it [00:11, 4.14it/s] 49it [00:11, 4.31it/s] 50it [00:11, 4.28it/s]2025-05-25 21:37:43,446 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 3992.2141 | mean log_px -0.0251 | KL -2592.65 + 51it [00:11, 4.39it/s] 52it [00:12, 4.47it/s] 53it [00:12, 4.53it/s] 54it [00:12, 4.50it/s] 55it [00:12, 4.56it/s] 56it [00:13, 4.55it/s] 57it [00:13, 4.43it/s] 58it [00:13, 4.37it/s] 59it [00:13, 4.39it/s] 60it [00:13, 4.39it/s] 61it [00:14, 4.49it/s] 62it [00:14, 4.42it/s] 63it [00:14, 4.46it/s] 64it [00:14, 4.51it/s] 65it [00:15, 4.32it/s] 66it [00:15, 4.41it/s] 67it [00:15, 4.48it/s] 68it [00:15, 4.54it/s] 69it [00:15, 4.59it/s] 70it [00:16, 4.62it/s] 71it [00:16, 4.64it/s] 72it [00:16, 4.60it/s] 73it [00:16, 4.63it/s] 74it [00:17, 4.49it/s] 75it [00:17, 4.47it/s] 76it [00:17, 4.49it/s] 77it [00:17, 4.55it/s] 78it [00:17, 4.50it/s] 79it [00:18, 4.58it/s] 80it [00:18, 4.58it/s] 81it [00:18, 4.59it/s] 82it [00:18, 4.47it/s] 83it [00:19, 4.45it/s] 84it [00:19, 4.40it/s] 85it [00:19, 4.40it/s] 86it [00:19, 4.17it/s] 87it [00:19, 4.25it/s] 88it [00:20, 4.24it/s] 89it [00:20, 4.26it/s] 90it [00:20, 4.28it/s] 91it [00:20, 4.31it/s] 92it [00:21, 4.37it/s] 93it [00:21, 4.46it/s] 94it [00:21, 4.38it/s] 95it [00:21, 4.39it/s] 96it [00:22, 4.23it/s] 97it [00:22, 4.36it/s] 98it [00:22, 4.42it/s] 99it [00:22, 4.50it/s] 100it [00:22, 4.40it/s]2025-05-25 21:37:54,682 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 7227.1890 | mean log_px -0.0753 | KL -2570.68 + 101it [00:23, 4.49it/s] 102it [00:23, 4.46it/s] 103it [00:23, 4.51it/s] 104it [00:23, 4.51it/s] 105it [00:24, 4.56it/s] 106it [00:24, 4.29it/s] 107it [00:24, 4.29it/s] 108it [00:24, 4.35it/s] 109it [00:24, 4.45it/s] 110it [00:25, 4.37it/s] 111it [00:25, 4.36it/s] 112it [00:25, 4.23it/s] 113it [00:25, 4.24it/s] 114it [00:26, 4.23it/s] 115it [00:26, 4.35it/s] 116it [00:26, 4.43it/s] 117it [00:26, 4.42it/s] 118it [00:27, 4.39it/s] 119it [00:27, 4.40it/s] 120it [00:27, 4.45it/s] 121it [00:27, 4.40it/s] 122it [00:27, 4.44it/s] 123it [00:28, 4.51it/s] 124it [00:28, 4.48it/s] 125it [00:28, 4.54it/s] 126it [00:28, 4.44it/s] 127it [00:29, 4.27it/s] 128it [00:29, 4.37it/s] 129it [00:29, 4.34it/s] 130it [00:29, 4.38it/s] 131it [00:29, 4.45it/s] 132it [00:30, 4.43it/s] 133it [00:30, 4.33it/s] 134it [00:30, 4.31it/s] 135it [00:30, 4.32it/s] 136it [00:31, 4.33it/s] 137it [00:31, 4.44it/s] 138it [00:31, 4.49it/s] 139it [00:31, 4.48it/s] 140it [00:32, 4.35it/s] 141it [00:32, 4.35it/s] 142it [00:32, 4.34it/s] 143it [00:32, 4.38it/s] 144it [00:32, 4.33it/s] 145it [00:33, 4.37it/s] 146it [00:33, 4.42it/s] 147it [00:33, 4.35it/s] 148it [00:33, 4.22it/s] 149it [00:34, 4.35it/s] 150it [00:34, 4.27it/s]2025-05-25 21:38:06,114 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 3201.9055 | mean log_px -0.0163 | KL -2551.84 + 151it [00:34, 4.32it/s] 152it [00:34, 4.38it/s] 153it [00:35, 4.43it/s] 154it [00:35, 4.50it/s] 155it [00:35, 4.47it/s] 156it [00:35, 4.39it/s] 157it [00:35, 4.47it/s] 158it [00:36, 4.54it/s] 159it [00:36, 4.44it/s] 160it [00:36, 4.41it/s] 161it [00:36, 4.24it/s] 162it [00:37, 4.28it/s] 163it [00:37, 4.32it/s] 164it [00:37, 4.31it/s] 165it [00:37, 4.36it/s] 166it [00:38, 4.34it/s] 167it [00:38, 4.36it/s] 168it [00:38, 4.37it/s] 169it [00:38, 4.33it/s] 170it [00:38, 4.33it/s] 171it [00:39, 4.34it/s] 172it [00:39, 4.44it/s] 173it [00:39, 4.50it/s] 174it [00:39, 4.53it/s] 175it [00:40, 4.46it/s] 176it [00:40, 4.45it/s] 177it [00:40, 4.54it/s] 178it [00:40, 4.43it/s] 179it [00:40, 4.43it/s] 180it [00:41, 4.45it/s] 181it [00:41, 4.52it/s] 182it [00:41, 4.56it/s] 183it [00:41, 4.60it/s] 184it [00:42, 4.60it/s] 185it [00:42, 4.63it/s] 186it [00:42, 4.44it/s] 187it [00:42, 4.40it/s] 188it [00:42, 4.37it/s] 189it [00:43, 4.48it/s] 190it [00:43, 4.52it/s] 191it [00:43, 4.57it/s] 192it [00:43, 4.53it/s] 193it [00:44, 4.48it/s] 194it [00:44, 4.51it/s] 195it [00:44, 4.42it/s] 196it [00:44, 4.40it/s] 196it [00:44, 4.38it/s] +2025-05-25 21:38:16,375 - INFO - Epoch: 12, Objective: tensor([2863.8979], device='cuda:0', grad_fn=), Loss: 0.006043643224984407, KL/n: 51.6978874206543 + 0it [00:00, ?it/s]2025-05-25 21:38:16,736 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 2755.2402 | mean log_px -0.0041 | KL -2532.30 + 1it [00:00, 3.52it/s] 2it [00:00, 4.14it/s] 3it [00:00, 4.39it/s] 4it [00:00, 4.51it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.53it/s] 8it [00:01, 4.58it/s] 9it [00:02, 4.62it/s] 10it [00:02, 4.49it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.64it/s] 14it [00:03, 4.66it/s] 15it [00:03, 4.68it/s] 16it [00:03, 4.69it/s] 17it [00:03, 4.70it/s] 18it [00:03, 4.70it/s] 19it [00:04, 4.71it/s] 20it [00:04, 4.71it/s] 21it [00:04, 4.71it/s] 22it [00:04, 4.71it/s] 23it [00:05, 4.71it/s] 24it [00:05, 4.70it/s] 25it [00:05, 4.70it/s] 26it [00:05, 4.70it/s] 27it [00:05, 4.71it/s] 28it [00:06, 4.70it/s] 29it [00:06, 4.47it/s] 30it [00:06, 4.52it/s] 31it [00:06, 4.57it/s] 32it [00:06, 4.59it/s] 33it [00:07, 4.61it/s] 34it [00:07, 4.61it/s] 35it [00:07, 4.63it/s] 36it [00:07, 4.50it/s] 37it [00:08, 4.58it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.65it/s] 40it [00:08, 4.65it/s] 41it [00:08, 4.67it/s] 42it [00:09, 4.68it/s] 43it [00:09, 4.69it/s] 44it [00:09, 4.69it/s] 45it [00:09, 4.68it/s] 46it [00:09, 4.50it/s] 47it [00:10, 4.54it/s] 48it [00:10, 4.56it/s] 49it [00:10, 4.61it/s] 50it [00:10, 4.60it/s]2025-05-25 21:38:27,527 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 2921.4778 | mean log_px -0.0094 | KL -2503.91 + 51it [00:11, 4.62it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.61it/s] 54it [00:11, 4.63it/s] 55it [00:11, 4.48it/s] 56it [00:12, 4.56it/s] 57it [00:12, 4.58it/s] 58it [00:12, 4.61it/s] 59it [00:12, 4.63it/s] 60it [00:13, 4.48it/s] 61it [00:13, 4.56it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.64it/s] 64it [00:13, 4.65it/s] 65it [00:14, 4.67it/s] 66it [00:14, 4.67it/s] 67it [00:14, 4.69it/s] 68it [00:14, 4.69it/s] 69it [00:14, 4.70it/s] 70it [00:15, 4.70it/s] 71it [00:15, 4.70it/s] 72it [00:15, 4.70it/s] 73it [00:15, 4.71it/s] 74it [00:16, 4.71it/s] 75it [00:16, 4.71it/s] 76it [00:16, 4.70it/s] 77it [00:16, 4.71it/s] 78it [00:16, 4.60it/s] 79it [00:17, 4.65it/s] 80it [00:17, 4.66it/s] 81it [00:17, 4.68it/s] 82it [00:17, 4.69it/s] 83it [00:17, 4.69it/s] 84it [00:18, 4.54it/s] 85it [00:18, 4.60it/s] 86it [00:18, 4.63it/s] 87it [00:18, 4.66it/s] 88it [00:19, 4.67it/s] 89it [00:19, 4.53it/s] 90it [00:19, 4.59it/s] 91it [00:19, 4.63it/s] 92it [00:19, 4.65it/s] 93it [00:20, 4.67it/s] 94it [00:20, 4.68it/s] 95it [00:20, 4.69it/s] 96it [00:20, 4.69it/s] 97it [00:20, 4.55it/s] 98it [00:21, 4.60it/s] 99it [00:21, 4.63it/s] 100it [00:21, 4.65it/s]2025-05-25 21:38:38,299 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 3051.0591 | mean log_px -0.0105 | KL -2480.72 + 101it [00:21, 4.67it/s] 102it [00:22, 4.68it/s] 103it [00:22, 4.69it/s] 104it [00:22, 4.70it/s] 105it [00:22, 4.70it/s] 106it [00:22, 4.49it/s] 107it [00:23, 4.57it/s] 108it [00:23, 4.61it/s] 109it [00:23, 4.64it/s] 110it [00:23, 4.66it/s] 111it [00:24, 4.67it/s] 112it [00:24, 4.68it/s] 113it [00:24, 4.68it/s] 114it [00:24, 4.69it/s] 115it [00:24, 4.70it/s] 116it [00:25, 4.70it/s] 117it [00:25, 4.69it/s] 118it [00:25, 4.69it/s] 119it [00:25, 4.70it/s] 120it [00:25, 4.69it/s] 121it [00:26, 4.59it/s] 122it [00:26, 4.64it/s] 123it [00:26, 4.66it/s] 124it [00:26, 4.65it/s] 125it [00:26, 4.67it/s] 126it [00:27, 4.68it/s] 127it [00:27, 4.69it/s] 128it [00:27, 4.69it/s] 129it [00:27, 4.69it/s] 130it [00:28, 4.70it/s] 131it [00:28, 4.55it/s] 132it [00:28, 4.61it/s] 133it [00:28, 4.64it/s] 134it [00:28, 4.65it/s] 135it [00:29, 4.66it/s] 136it [00:29, 4.68it/s] 137it [00:29, 4.69it/s] 138it [00:29, 4.70it/s] 139it [00:29, 4.70it/s] 140it [00:30, 4.55it/s] 141it [00:30, 4.61it/s] 142it [00:30, 4.64it/s] 143it [00:30, 4.65it/s] 144it [00:31, 4.67it/s] 145it [00:31, 4.68it/s] 146it [00:31, 4.69it/s] 147it [00:31, 4.69it/s] 148it [00:31, 4.70it/s] 149it [00:32, 4.55it/s] 150it [00:32, 4.61it/s]2025-05-25 21:38:49,042 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 2694.3430 | mean log_px -0.0060 | KL -2454.87 + 151it [00:32, 4.64it/s] 152it [00:32, 4.66it/s] 153it [00:33, 4.66it/s] 154it [00:33, 4.67it/s] 155it [00:33, 4.68it/s] 156it [00:33, 4.69it/s] 157it [00:33, 4.69it/s] 158it [00:34, 4.70it/s] 159it [00:34, 4.50it/s] 160it [00:34, 4.58it/s] 161it [00:34, 4.62it/s] 162it [00:34, 4.63it/s] 163it [00:35, 4.66it/s] 164it [00:35, 4.67it/s] 165it [00:35, 4.69it/s] 166it [00:35, 4.69it/s] 167it [00:36, 4.70it/s] 168it [00:36, 4.69it/s] 169it [00:36, 4.71it/s] 170it [00:36, 4.70it/s] 171it [00:36, 4.70it/s] 172it [00:37, 4.59it/s] 173it [00:37, 4.65it/s] 174it [00:37, 4.66it/s] 175it [00:37, 4.56it/s] 176it [00:37, 4.60it/s] 177it [00:38, 4.62it/s] 178it [00:38, 4.63it/s] 179it [00:38, 4.64it/s] 180it [00:38, 4.49it/s] 181it [00:39, 4.49it/s] 182it [00:39, 4.56it/s] 183it [00:39, 4.58it/s] 184it [00:39, 4.62it/s] 185it [00:39, 4.64it/s] 186it [00:40, 4.65it/s] 187it [00:40, 4.52it/s] 188it [00:40, 4.59it/s] 189it [00:40, 4.62it/s] 190it [00:41, 4.63it/s] 191it [00:41, 4.66it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.68it/s] 194it [00:41, 4.68it/s] 195it [00:42, 4.42it/s] 196it [00:42, 4.37it/s] 196it [00:42, 4.62it/s] +2025-05-25 21:38:58,931 - INFO - Epoch: 13, Objective: tensor([4922.8945], device='cuda:0', grad_fn=), Loss: 0.041003212332725525, KL/n: 49.89161682128906 + 0it [00:00, ?it/s]2025-05-25 21:38:59,491 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 2859.6846 | mean log_px -0.0121 | KL -2441.73 + 1it [00:00, 3.24it/s] 2it [00:00, 3.87it/s] 3it [00:00, 4.21it/s] 4it [00:00, 4.19it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.42it/s] 7it [00:01, 4.36it/s] 8it [00:01, 4.34it/s] 9it [00:02, 4.24it/s] 10it [00:02, 4.33it/s] 11it [00:02, 4.26it/s] 12it [00:02, 4.35it/s] 13it [00:03, 4.31it/s] 14it [00:03, 4.31it/s] 15it [00:03, 4.30it/s] 16it [00:03, 4.36it/s] 17it [00:03, 4.32it/s] 18it [00:04, 4.37it/s] 19it [00:04, 4.44it/s] 20it [00:04, 4.50it/s] 21it [00:04, 4.49it/s] 22it [00:05, 4.38it/s] 23it [00:05, 4.39it/s] 24it [00:05, 4.36it/s] 25it [00:05, 4.34it/s] 26it [00:06, 4.39it/s] 27it [00:06, 4.34it/s] 28it [00:06, 4.19it/s] 29it [00:06, 4.28it/s] 30it [00:06, 4.25it/s] 31it [00:07, 4.29it/s] 32it [00:07, 4.33it/s] 33it [00:07, 4.21it/s] 34it [00:07, 4.27it/s] 35it [00:08, 4.35it/s] 36it [00:08, 4.42it/s] 37it [00:08, 4.36it/s] 38it [00:08, 4.24it/s] 39it [00:09, 4.37it/s] 40it [00:09, 4.43it/s] 41it [00:09, 4.50it/s] 42it [00:09, 4.40it/s] 43it [00:09, 4.48it/s] 44it [00:10, 4.53it/s] 45it [00:10, 4.55it/s] 46it [00:10, 4.60it/s] 47it [00:10, 4.62it/s] 48it [00:11, 4.61it/s] 49it [00:11, 4.53it/s] 50it [00:11, 4.45it/s]2025-05-25 21:39:10,866 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 3013.0603 | mean log_px -0.0122 | KL -2423.46 + 51it [00:11, 4.36it/s] 52it [00:11, 4.44it/s] 53it [00:12, 4.44it/s] 54it [00:12, 4.36it/s] 55it [00:12, 4.26it/s] 56it [00:12, 4.26it/s] 57it [00:13, 4.33it/s] 58it [00:13, 4.39it/s] 59it [00:13, 4.46it/s] 60it [00:13, 4.28it/s] 61it [00:13, 4.40it/s] 62it [00:14, 4.43it/s] 63it [00:14, 4.49it/s] 64it [00:14, 4.39it/s] 65it [00:14, 4.34it/s] 66it [00:15, 4.22it/s] 67it [00:15, 4.35it/s] 68it [00:15, 4.33it/s] 69it [00:15, 4.35it/s] 70it [00:16, 4.43it/s] 71it [00:16, 4.35it/s] 72it [00:16, 4.36it/s] 73it [00:16, 4.36it/s] 74it [00:16, 4.30it/s] 75it [00:17, 4.35it/s] 76it [00:17, 4.30it/s] 77it [00:17, 4.28it/s] 78it [00:17, 4.31it/s] 79it [00:18, 4.19it/s] 80it [00:18, 4.23it/s] 81it [00:18, 4.24it/s] 82it [00:18, 4.35it/s] 83it [00:19, 4.44it/s] 84it [00:19, 4.36it/s] 85it [00:19, 4.24it/s] 86it [00:19, 4.26it/s] 87it [00:20, 4.29it/s] 88it [00:20, 4.32it/s] 89it [00:20, 4.37it/s] 90it [00:20, 4.45it/s] 91it [00:20, 4.36it/s] 92it [00:21, 4.35it/s] 93it [00:21, 4.37it/s] 94it [00:21, 4.42it/s] 95it [00:21, 4.45it/s] 96it [00:22, 4.51it/s] 97it [00:22, 4.41it/s] 98it [00:22, 4.36it/s] 99it [00:22, 4.36it/s] 100it [00:22, 4.36it/s]2025-05-25 21:39:22,378 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 3804.5000 | mean log_px -0.0205 | KL -2399.92 + 101it [00:23, 4.37it/s] 102it [00:23, 4.36it/s] 103it [00:23, 4.45it/s] 104it [00:23, 4.45it/s] 105it [00:24, 4.43it/s] 106it [00:24, 4.37it/s] 107it [00:24, 4.36it/s] 108it [00:24, 4.44it/s] 109it [00:24, 4.49it/s] 110it [00:25, 4.53it/s] 111it [00:25, 4.57it/s] 112it [00:25, 4.60it/s] 113it [00:25, 4.48it/s] 114it [00:26, 4.47it/s] 115it [00:26, 4.46it/s] 116it [00:26, 4.46it/s] 117it [00:26, 4.38it/s] 118it [00:27, 4.34it/s] 119it [00:27, 4.41it/s] 120it [00:27, 4.34it/s] 121it [00:27, 4.29it/s] 122it [00:27, 4.31it/s] 123it [00:28, 4.30it/s] 124it [00:28, 4.24it/s] 125it [00:28, 4.29it/s] 126it [00:28, 4.40it/s] 127it [00:29, 4.45it/s] 128it [00:29, 4.42it/s] 129it [00:29, 4.28it/s] 130it [00:29, 4.38it/s] 131it [00:30, 4.37it/s] 132it [00:30, 4.43it/s] 133it [00:30, 4.36it/s] 134it [00:30, 4.45it/s] 135it [00:30, 4.43it/s] 136it [00:31, 4.24it/s] 137it [00:31, 4.38it/s] 138it [00:31, 4.44it/s] 139it [00:31, 4.51it/s] 140it [00:32, 4.53it/s] 141it [00:32, 4.59it/s] 142it [00:32, 4.61it/s] 143it [00:32, 4.63it/s] 144it [00:32, 4.64it/s] 145it [00:33, 4.36it/s] 146it [00:33, 4.33it/s] 147it [00:33, 4.31it/s] 148it [00:33, 4.30it/s] 149it [00:34, 4.31it/s] 150it [00:34, 4.31it/s]2025-05-25 21:39:33,721 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 3109.0154 | mean log_px -0.0184 | KL -2386.44 + 151it [00:34, 4.34it/s] 152it [00:34, 4.36it/s] 153it [00:34, 4.43it/s] 154it [00:35, 4.32it/s] 155it [00:35, 4.35it/s] 156it [00:35, 4.44it/s] 157it [00:35, 4.51it/s] 158it [00:36, 4.43it/s] 159it [00:36, 4.45it/s] 160it [00:36, 4.47it/s] 161it [00:36, 4.55it/s] 162it [00:36, 4.58it/s] 163it [00:37, 4.47it/s] 164it [00:37, 4.50it/s] 165it [00:37, 4.42it/s] 166it [00:37, 4.37it/s] 167it [00:38, 4.33it/s] 168it [00:38, 4.39it/s] 169it [00:38, 4.28it/s] 170it [00:38, 4.38it/s] 171it [00:39, 4.45it/s] 172it [00:39, 4.47it/s] 173it [00:39, 4.46it/s] 174it [00:39, 4.47it/s] 175it [00:39, 4.48it/s] 176it [00:40, 4.53it/s] 177it [00:40, 4.55it/s] 178it [00:40, 4.48it/s] 179it [00:40, 4.42it/s] 180it [00:41, 4.25it/s] 181it [00:41, 4.25it/s] 182it [00:41, 4.29it/s] 183it [00:41, 4.36it/s] 184it [00:42, 4.38it/s] 185it [00:42, 4.46it/s] 186it [00:42, 4.52it/s] 187it [00:42, 4.56it/s] 188it [00:42, 4.31it/s] 189it [00:43, 4.33it/s] 190it [00:43, 4.43it/s] 191it [00:43, 4.43it/s] 192it [00:43, 4.39it/s] 193it [00:44, 4.41it/s] 194it [00:44, 4.33it/s] 195it [00:44, 4.22it/s] 196it [00:44, 4.36it/s] 196it [00:44, 4.37it/s] +2025-05-25 21:39:44,055 - INFO - Epoch: 14, Objective: tensor([2733.1536], device='cuda:0', grad_fn=), Loss: 0.013086755760014057, KL/n: 48.29157638549805 + 0it [00:00, ?it/s]2025-05-25 21:39:44,461 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 3566.3582 | mean log_px -0.0216 | KL -2368.83 + 1it [00:00, 2.78it/s] 2it [00:00, 3.46it/s] 3it [00:00, 3.94it/s] 4it [00:01, 4.11it/s] 5it [00:01, 4.19it/s] 6it [00:01, 4.13it/s] 7it [00:01, 4.09it/s] 8it [00:02, 4.15it/s] 9it [00:02, 4.20it/s] 10it [00:02, 4.26it/s] 11it [00:02, 4.38it/s] 12it [00:02, 4.32it/s] 13it [00:03, 4.22it/s] 14it [00:03, 4.12it/s] 15it [00:03, 4.24it/s] 16it [00:03, 4.31it/s] 17it [00:04, 4.43it/s] 18it [00:04, 4.51it/s] 19it [00:04, 4.46it/s] 20it [00:04, 4.42it/s] 21it [00:04, 4.37it/s] 22it [00:05, 4.38it/s] 23it [00:05, 4.41it/s] 24it [00:05, 4.42it/s] 25it [00:05, 4.51it/s] 26it [00:06, 4.49it/s] 27it [00:06, 4.47it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.52it/s] 30it [00:06, 4.57it/s] 31it [00:07, 4.52it/s] 32it [00:07, 4.59it/s] 33it [00:07, 4.34it/s] 34it [00:07, 4.37it/s] 35it [00:08, 4.42it/s] 36it [00:08, 4.49it/s] 37it [00:08, 4.45it/s] 38it [00:08, 4.39it/s] 39it [00:09, 4.39it/s] 40it [00:09, 4.39it/s] 41it [00:09, 4.41it/s] 42it [00:09, 4.46it/s] 43it [00:09, 4.46it/s] 44it [00:10, 4.50it/s] 45it [00:10, 4.50it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.62it/s] 49it [00:11, 4.59it/s] 50it [00:11, 4.53it/s]2025-05-25 21:39:55,785 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 2586.0901 | mean log_px -0.0101 | KL -2342.14 + 51it [00:11, 4.59it/s] 52it [00:11, 4.63it/s] 53it [00:12, 4.67it/s] 54it [00:12, 4.39it/s] 55it [00:12, 4.50it/s] 56it [00:12, 4.54it/s] 57it [00:13, 4.33it/s] 58it [00:13, 4.34it/s] 59it [00:13, 4.36it/s] 60it [00:13, 4.34it/s] 61it [00:13, 4.32it/s] 62it [00:14, 4.34it/s] 63it [00:14, 4.42it/s] 64it [00:14, 4.37it/s] 65it [00:14, 4.36it/s] 66it [00:15, 4.33it/s] 67it [00:15, 4.41it/s] 68it [00:15, 4.39it/s] 69it [00:15, 4.40it/s] 70it [00:15, 4.36it/s] 71it [00:16, 4.40it/s] 72it [00:16, 4.41it/s] 73it [00:16, 4.50it/s] 74it [00:16, 4.44it/s] 75it [00:17, 4.32it/s] 76it [00:17, 4.30it/s] 77it [00:17, 3.48it/s] 78it [00:18, 3.65it/s] 79it [00:18, 3.89it/s] 80it [00:18, 4.08it/s] 81it [00:18, 4.19it/s] 82it [00:18, 4.22it/s] 83it [00:19, 4.21it/s] 84it [00:19, 4.35it/s] 85it [00:19, 4.46it/s] 86it [00:19, 4.40it/s] 87it [00:20, 4.49it/s] 88it [00:20, 4.54it/s] 89it [00:20, 4.59it/s] 90it [00:20, 4.39it/s] 91it [00:20, 4.51it/s] 92it [00:21, 4.57it/s] 93it [00:21, 4.49it/s] 94it [00:21, 4.43it/s] 95it [00:21, 4.38it/s] 96it [00:22, 4.46it/s] 97it [00:22, 4.46it/s] 98it [00:22, 4.50it/s] 99it [00:22, 4.32it/s] 100it [00:22, 4.42it/s]2025-05-25 21:40:07,299 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 2982.4482 | mean log_px -0.0107 | KL -2318.40 + 101it [00:23, 4.40it/s] 102it [00:23, 4.45it/s] 103it [00:23, 4.54it/s] 104it [00:23, 4.49it/s] 105it [00:24, 4.54it/s] 106it [00:24, 4.49it/s] 107it [00:24, 4.50it/s] 108it [00:24, 4.39it/s] 109it [00:24, 4.51it/s] 110it [00:25, 4.44it/s] 111it [00:25, 4.52it/s] 112it [00:25, 4.56it/s] 113it [00:25, 4.61it/s] 114it [00:26, 4.49it/s] 115it [00:26, 4.34it/s] 116it [00:26, 4.33it/s] 117it [00:26, 4.40it/s] 118it [00:26, 4.48it/s] 119it [00:27, 4.55it/s] 120it [00:27, 4.56it/s] 121it [00:27, 4.61it/s] 122it [00:27, 4.61it/s] 123it [00:28, 4.37it/s] 124it [00:28, 4.42it/s] 125it [00:28, 4.50it/s] 126it [00:28, 4.54it/s] 127it [00:28, 4.60it/s] 128it [00:29, 4.64it/s] 129it [00:29, 4.63it/s] 130it [00:29, 4.64it/s] 131it [00:29, 4.57it/s] 132it [00:30, 4.50it/s] 133it [00:30, 4.34it/s] 134it [00:30, 4.39it/s] 135it [00:30, 4.45it/s] 136it [00:30, 4.44it/s] 137it [00:31, 4.49it/s] 138it [00:31, 4.32it/s] 139it [00:31, 4.35it/s] 140it [00:31, 4.36it/s] 141it [00:32, 4.47it/s] 142it [00:32, 4.52it/s] 143it [00:32, 4.32it/s] 144it [00:32, 4.30it/s] 145it [00:33, 4.42it/s] 146it [00:33, 4.51it/s] 147it [00:33, 4.52it/s] 148it [00:33, 4.57it/s] 149it [00:33, 4.53it/s] 150it [00:34, 4.42it/s]2025-05-25 21:40:18,451 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 3421.2581 | mean log_px -0.0186 | KL -2299.48 + 151it [00:34, 4.51it/s] 152it [00:34, 4.46it/s] 153it [00:34, 4.44it/s] 154it [00:35, 4.38it/s] 155it [00:35, 4.47it/s] 156it [00:35, 4.54it/s] 157it [00:35, 4.57it/s] 158it [00:35, 4.55it/s] 159it [00:36, 4.36it/s] 160it [00:36, 4.34it/s] 161it [00:36, 4.45it/s] 162it [00:36, 4.47it/s] 163it [00:37, 4.55it/s] 164it [00:37, 4.31it/s] 165it [00:37, 4.37it/s] 166it [00:37, 4.33it/s] 167it [00:37, 4.35it/s] 168it [00:38, 4.38it/s] 169it [00:38, 4.40it/s] 170it [00:38, 4.30it/s] 171it [00:38, 4.37it/s] 172it [00:39, 4.41it/s] 173it [00:39, 4.39it/s] 174it [00:39, 4.44it/s] 175it [00:39, 4.41it/s] 176it [00:40, 4.36it/s] 177it [00:40, 4.24it/s] 178it [00:40, 4.27it/s] 179it [00:40, 4.38it/s] 180it [00:40, 4.45it/s] 181it [00:41, 4.42it/s] 182it [00:41, 4.41it/s] 183it [00:41, 4.25it/s] 184it [00:41, 4.26it/s] 185it [00:42, 4.28it/s] 186it [00:42, 4.28it/s] 187it [00:42, 4.29it/s] 188it [00:42, 4.27it/s] 189it [00:43, 4.29it/s] 190it [00:43, 4.25it/s] 191it [00:43, 4.30it/s] 192it [00:43, 4.34it/s] 193it [00:43, 4.41it/s] 194it [00:44, 4.34it/s] 195it [00:44, 4.01it/s] 196it [00:44, 4.19it/s] 196it [00:44, 4.38it/s] +2025-05-25 21:40:28,944 - INFO - Epoch: 15, Objective: tensor([2673.8301], device='cuda:0', grad_fn=), Loss: 0.006941231433302164, KL/n: 46.54920196533203 + 0it [00:00, ?it/s]2025-05-25 21:40:29,340 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 2568.5730 | mean log_px -0.0058 | KL -2277.45 + 1it [00:00, 3.08it/s] 2it [00:00, 3.66it/s] 3it [00:00, 4.10it/s] 4it [00:01, 4.18it/s] 5it [00:01, 4.32it/s] 6it [00:01, 4.44it/s] 7it [00:01, 4.37it/s] 8it [00:01, 4.49it/s] 9it [00:02, 4.43it/s] 10it [00:02, 4.48it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.46it/s] 13it [00:02, 4.53it/s] 14it [00:03, 4.43it/s] 15it [00:03, 4.39it/s] 16it [00:03, 4.22it/s] 17it [00:03, 4.37it/s] 18it [00:04, 4.33it/s] 19it [00:04, 4.32it/s] 20it [00:04, 4.40it/s] 21it [00:04, 4.43it/s] 22it [00:05, 4.51it/s] 23it [00:05, 4.42it/s] 24it [00:05, 4.50it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.52it/s] 27it [00:06, 4.57it/s] 28it [00:06, 4.47it/s] 29it [00:06, 4.42it/s] 30it [00:06, 4.36it/s] 31it [00:07, 4.45it/s] 32it [00:07, 4.36it/s] 33it [00:07, 4.48it/s] 34it [00:07, 4.54it/s] 35it [00:07, 4.59it/s] 36it [00:08, 4.61it/s] 37it [00:08, 4.55it/s] 38it [00:08, 4.45it/s] 39it [00:08, 4.53it/s] 40it [00:09, 4.56it/s] 41it [00:09, 4.45it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.63it/s] 45it [00:10, 4.66it/s] 46it [00:10, 4.66it/s] 47it [00:10, 4.68it/s] 48it [00:10, 4.68it/s] 49it [00:10, 4.70it/s] 50it [00:11, 4.54it/s]2025-05-25 21:40:40,470 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 2469.5354 | mean log_px -0.0050 | KL -2246.70 + 51it [00:11, 4.29it/s] 52it [00:11, 4.30it/s] 53it [00:11, 4.35it/s] 54it [00:12, 4.31it/s] 55it [00:12, 4.31it/s] 56it [00:12, 4.15it/s] 57it [00:12, 4.32it/s] 58it [00:13, 4.29it/s] 59it [00:13, 4.40it/s] 60it [00:13, 4.34it/s] 61it [00:13, 4.18it/s] 62it [00:14, 4.31it/s] 63it [00:14, 4.43it/s] 64it [00:14, 4.52it/s] 65it [00:14, 4.58it/s] 66it [00:14, 4.62it/s] 67it [00:15, 4.65it/s] 68it [00:15, 4.67it/s] 69it [00:15, 4.69it/s] 70it [00:15, 4.38it/s] 71it [00:15, 4.49it/s] 72it [00:16, 4.35it/s] 73it [00:16, 4.38it/s] 74it [00:16, 4.46it/s] 75it [00:16, 4.54it/s] 76it [00:17, 4.58it/s] 77it [00:17, 4.62it/s] 78it [00:17, 4.49it/s] 79it [00:17, 4.43it/s] 80it [00:18, 4.48it/s] 81it [00:18, 4.54it/s] 82it [00:18, 4.59it/s] 83it [00:18, 4.64it/s] 84it [00:18, 4.66it/s] 85it [00:19, 4.54it/s] 86it [00:19, 4.40it/s] 87it [00:19, 4.38it/s] 88it [00:19, 4.44it/s] 89it [00:20, 4.39it/s] 90it [00:20, 4.46it/s] 91it [00:20, 4.54it/s] 92it [00:20, 4.43it/s] 93it [00:20, 4.54it/s] 94it [00:21, 4.59it/s] 95it [00:21, 4.63it/s] 96it [00:21, 4.49it/s] 97it [00:21, 4.43it/s] 98it [00:22, 4.38it/s] 99it [00:22, 4.47it/s] 100it [00:22, 4.52it/s]2025-05-25 21:40:51,684 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 2823.7253 | mean log_px -0.0109 | KL -2227.54 + 101it [00:22, 4.34it/s] 102it [00:22, 4.43it/s] 103it [00:23, 4.38it/s] 104it [00:23, 4.34it/s] 105it [00:23, 4.36it/s] 106it [00:23, 4.45it/s] 107it [00:24, 4.53it/s] 108it [00:24, 4.57it/s] 109it [00:24, 4.46it/s] 110it [00:24, 4.38it/s] 111it [00:24, 4.42it/s] 112it [00:25, 4.49it/s] 113it [00:25, 4.56it/s] 114it [00:25, 4.60it/s] 115it [00:25, 4.64it/s] 116it [00:26, 4.50it/s] 117it [00:26, 4.49it/s] 118it [00:26, 4.26it/s] 119it [00:26, 4.28it/s] 120it [00:26, 4.37it/s] 121it [00:27, 4.47it/s] 122it [00:27, 4.52it/s] 123it [00:27, 4.55it/s] 124it [00:27, 4.61it/s] 125it [00:28, 4.50it/s] 126it [00:28, 4.41it/s] 127it [00:28, 4.23it/s] 128it [00:28, 4.24it/s] 129it [00:29, 4.25it/s] 130it [00:29, 4.25it/s] 131it [00:29, 4.25it/s] 132it [00:29, 4.35it/s] 133it [00:29, 4.33it/s] 134it [00:30, 4.29it/s] 135it [00:30, 4.21it/s] 136it [00:30, 4.33it/s] 137it [00:30, 4.43it/s] 138it [00:31, 4.49it/s] 139it [00:31, 4.54it/s] 140it [00:31, 4.57it/s] 141it [00:31, 4.56it/s] 142it [00:31, 4.38it/s] 143it [00:32, 4.35it/s] 144it [00:32, 4.30it/s] 145it [00:32, 4.42it/s] 146it [00:32, 4.32it/s] 147it [00:33, 4.34it/s] 148it [00:33, 4.14it/s] 149it [00:33, 4.15it/s] 150it [00:33, 4.15it/s]2025-05-25 21:41:03,119 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 2373.7930 | mean log_px -0.0035 | KL -2207.88 + 151it [00:34, 4.20it/s] 152it [00:34, 4.28it/s] 153it [00:34, 4.38it/s] 154it [00:34, 4.33it/s] 155it [00:35, 4.31it/s] 156it [00:35, 4.31it/s] 157it [00:35, 4.40it/s] 158it [00:35, 4.44it/s] 159it [00:35, 4.50it/s] 160it [00:36, 4.40it/s] 161it [00:36, 4.46it/s] 162it [00:36, 4.24it/s] 163it [00:36, 4.25it/s] 164it [00:37, 4.34it/s] 165it [00:37, 4.42it/s] 166it [00:37, 4.48it/s] 167it [00:37, 4.42it/s] 168it [00:37, 4.45it/s] 169it [00:38, 4.49it/s] 170it [00:38, 4.48it/s] 171it [00:38, 4.53it/s] 172it [00:38, 4.52it/s] 173it [00:39, 4.38it/s] 174it [00:39, 4.45it/s] 175it [00:39, 4.52it/s] 176it [00:39, 4.54it/s] 177it [00:39, 4.56it/s] 178it [00:40, 4.57it/s] 179it [00:40, 4.59it/s] 180it [00:40, 4.31it/s] 181it [00:40, 4.41it/s] 182it [00:41, 4.45it/s] 183it [00:41, 4.42it/s] 184it [00:41, 4.47it/s] 185it [00:41, 4.50it/s] 186it [00:41, 4.53it/s] 187it [00:42, 4.56it/s] 188it [00:42, 4.44it/s] 189it [00:42, 4.50it/s] 190it [00:42, 4.53it/s] 191it [00:43, 4.56it/s] 192it [00:43, 4.44it/s] 193it [00:43, 4.39it/s] 194it [00:43, 4.43it/s] 195it [00:44, 4.26it/s] 196it [00:44, 4.24it/s] 196it [00:44, 4.42it/s] +2025-05-25 21:41:13,397 - INFO - Epoch: 16, Objective: tensor([2848.4922], device='cuda:0', grad_fn=), Loss: 0.02026955410838127, KL/n: 44.883338928222656 + 0it [00:00, ?it/s]2025-05-25 21:41:13,936 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 2439.9866 | mean log_px -0.0047 | KL -2197.12 + 1it [00:00, 3.26it/s] 2it [00:00, 3.96it/s] 3it [00:00, 4.26it/s] 4it [00:00, 4.29it/s] 5it [00:01, 4.32it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.40it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.54it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.50it/s] 14it [00:03, 4.44it/s] 15it [00:03, 4.48it/s] 16it [00:03, 4.39it/s] 17it [00:03, 4.47it/s] 18it [00:04, 4.42it/s] 19it [00:04, 4.46it/s] 20it [00:04, 4.50it/s] 21it [00:04, 4.53it/s] 22it [00:04, 4.55it/s] 23it [00:05, 4.58it/s] 24it [00:05, 4.49it/s] 25it [00:05, 4.35it/s] 26it [00:05, 4.37it/s] 27it [00:06, 4.26it/s] 28it [00:06, 4.29it/s] 29it [00:06, 4.36it/s] 30it [00:06, 4.44it/s] 31it [00:07, 4.41it/s] 32it [00:07, 4.41it/s] 33it [00:07, 4.38it/s] 34it [00:07, 4.46it/s] 35it [00:07, 4.42it/s] 36it [00:08, 4.46it/s] 37it [00:08, 4.50it/s] 38it [00:08, 4.53it/s] 39it [00:08, 4.46it/s] 40it [00:09, 4.41it/s] 41it [00:09, 4.44it/s] 42it [00:09, 4.40it/s] 43it [00:09, 4.43it/s] 44it [00:09, 4.27it/s] 45it [00:10, 4.40it/s] 46it [00:10, 4.37it/s] 47it [00:10, 4.35it/s] 48it [00:10, 4.31it/s] 49it [00:11, 4.31it/s] 50it [00:11, 4.42it/s]2025-05-25 21:41:25,221 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 3817.5354 | mean log_px -0.0287 | KL -2182.09 + 51it [00:11, 4.37it/s] 52it [00:11, 4.36it/s] 53it [00:12, 4.34it/s] 54it [00:12, 4.43it/s] 55it [00:12, 4.49it/s] 56it [00:12, 4.42it/s] 57it [00:12, 4.32it/s] 58it [00:13, 4.18it/s] 59it [00:13, 4.11it/s] 60it [00:13, 4.14it/s] 61it [00:13, 4.27it/s] 62it [00:14, 4.38it/s] 63it [00:14, 4.47it/s] 64it [00:14, 4.42it/s] 65it [00:14, 4.47it/s] 66it [00:15, 4.40it/s] 67it [00:15, 4.34it/s] 68it [00:15, 4.45it/s] 69it [00:15, 4.50it/s] 70it [00:15, 4.38it/s] 71it [00:16, 4.36it/s] 72it [00:16, 4.45it/s] 73it [00:16, 4.50it/s] 74it [00:16, 4.48it/s] 75it [00:17, 4.55it/s] 76it [00:17, 4.54it/s] 77it [00:17, 4.42it/s] 78it [00:17, 4.51it/s] 79it [00:17, 4.55it/s] 80it [00:18, 4.58it/s] 81it [00:18, 4.58it/s] 82it [00:18, 4.40it/s] 83it [00:18, 4.34it/s] 84it [00:19, 4.29it/s] 85it [00:19, 4.12it/s] 86it [00:19, 4.24it/s] 87it [00:19, 4.31it/s] 88it [00:20, 4.41it/s] 89it [00:20, 4.48it/s] 90it [00:20, 4.53it/s] 91it [00:20, 4.46it/s] 92it [00:20, 4.41it/s] 93it [00:21, 4.38it/s] 94it [00:21, 4.47it/s] 95it [00:21, 4.51it/s] 96it [00:21, 4.45it/s] 97it [00:22, 4.39it/s] 98it [00:22, 4.39it/s] 99it [00:22, 4.37it/s] 100it [00:22, 4.37it/s]2025-05-25 21:41:36,578 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 2449.2668 | mean log_px -0.0059 | KL -2174.15 + 101it [00:22, 4.42it/s] 102it [00:23, 4.39it/s] 103it [00:23, 4.44it/s] 104it [00:23, 4.53it/s] 105it [00:23, 4.31it/s] 106it [00:24, 4.44it/s] 107it [00:24, 4.49it/s] 108it [00:24, 4.47it/s] 109it [00:24, 4.50it/s] 110it [00:24, 4.44it/s] 111it [00:25, 4.27it/s] 112it [00:25, 4.26it/s] 113it [00:25, 4.25it/s] 114it [00:25, 4.39it/s] 115it [00:26, 4.46it/s] 116it [00:26, 4.53it/s] 117it [00:26, 4.58it/s] 118it [00:26, 4.62it/s] 119it [00:26, 4.65it/s] 120it [00:27, 4.56it/s] 121it [00:27, 4.48it/s] 122it [00:27, 4.39it/s] 123it [00:27, 4.47it/s] 124it [00:28, 4.53it/s] 125it [00:28, 4.59it/s] 126it [00:28, 4.62it/s] 127it [00:28, 4.60it/s] 128it [00:28, 4.62it/s] 129it [00:29, 4.65it/s] 130it [00:29, 4.66it/s] 131it [00:29, 4.56it/s] 132it [00:29, 4.50it/s] 133it [00:30, 4.52it/s] 134it [00:30, 4.56it/s] 135it [00:30, 4.61it/s] 136it [00:30, 4.47it/s] 137it [00:30, 4.56it/s] 138it [00:31, 4.60it/s] 139it [00:31, 4.48it/s] 140it [00:31, 4.45it/s] 141it [00:31, 4.46it/s] 142it [00:32, 4.53it/s] 143it [00:32, 4.58it/s] 144it [00:32, 4.51it/s] 145it [00:32, 4.38it/s] 146it [00:32, 4.48it/s] 147it [00:33, 4.56it/s] 148it [00:33, 4.49it/s] 149it [00:33, 4.44it/s] 150it [00:33, 4.36it/s]2025-05-25 21:41:47,705 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 2379.8494 | mean log_px -0.0040 | KL -2152.76 + 151it [00:34, 4.48it/s] 152it [00:34, 4.54it/s] 153it [00:34, 4.59it/s] 154it [00:34, 4.63it/s] 155it [00:34, 4.66it/s] 156it [00:35, 4.56it/s] 157it [00:35, 4.58it/s] 158it [00:35, 4.51it/s] 159it [00:35, 4.38it/s] 160it [00:36, 4.45it/s] 161it [00:36, 4.52it/s] 162it [00:36, 4.56it/s] 163it [00:36, 4.61it/s] 164it [00:36, 4.64it/s] 165it [00:37, 4.66it/s] 166it [00:37, 4.57it/s] 167it [00:37, 4.59it/s] 168it [00:37, 4.35it/s] 169it [00:38, 4.45it/s] 170it [00:38, 4.51it/s] 171it [00:38, 4.46it/s] 172it [00:38, 4.54it/s] 173it [00:38, 4.56it/s] 174it [00:39, 4.60it/s] 175it [00:39, 4.63it/s] 176it [00:39, 4.55it/s] 177it [00:39, 4.56it/s] 178it [00:39, 4.46it/s] 179it [00:40, 4.43it/s] 180it [00:40, 4.41it/s] 181it [00:40, 4.23it/s] 182it [00:40, 4.38it/s] 183it [00:41, 4.36it/s] 184it [00:41, 4.46it/s] 185it [00:41, 4.43it/s] 186it [00:41, 4.28it/s] 187it [00:42, 4.37it/s] 188it [00:42, 4.37it/s] 189it [00:42, 4.36it/s] 190it [00:42, 4.36it/s] 191it [00:42, 4.43it/s] 192it [00:43, 4.35it/s] 193it [00:43, 4.46it/s] 194it [00:43, 4.52it/s] 195it [00:43, 4.45it/s] 196it [00:44, 4.39it/s] 196it [00:44, 4.44it/s] +2025-05-25 21:41:57,888 - INFO - Epoch: 17, Objective: tensor([2270.9153], device='cuda:0', grad_fn=), Loss: 0.004182320553809404, KL/n: 43.6452751159668 + 0it [00:00, ?it/s]2025-05-25 21:41:58,300 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 2706.3704 | mean log_px -0.0173 | KL -2135.82 + 1it [00:00, 2.96it/s] 2it [00:00, 3.75it/s] 3it [00:00, 4.14it/s] 4it [00:00, 4.33it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.25it/s] 8it [00:01, 4.40it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.51it/s] 12it [00:02, 4.57it/s] 13it [00:02, 4.54it/s] 14it [00:03, 4.47it/s] 15it [00:03, 4.52it/s] 16it [00:03, 4.51it/s] 17it [00:03, 4.52it/s] 18it [00:04, 4.39it/s] 19it [00:04, 4.47it/s] 20it [00:04, 4.42it/s] 21it [00:04, 4.43it/s] 22it [00:05, 4.42it/s] 23it [00:05, 4.31it/s] 24it [00:05, 4.38it/s] 25it [00:05, 3.53it/s] 26it [00:06, 3.74it/s] 27it [00:06, 3.83it/s] 28it [00:06, 3.97it/s] 29it [00:06, 4.12it/s] 30it [00:07, 4.17it/s] 31it [00:07, 4.26it/s] 32it [00:07, 4.14it/s] 33it [00:07, 4.24it/s] 34it [00:07, 4.28it/s] 35it [00:08, 4.34it/s] 36it [00:08, 4.46it/s] 37it [00:08, 4.47it/s] 38it [00:08, 4.44it/s] 39it [00:09, 4.53it/s] 40it [00:09, 4.46it/s] 41it [00:09, 4.45it/s] 42it [00:09, 4.43it/s] 43it [00:09, 4.50it/s] 44it [00:10, 4.47it/s] 45it [00:10, 4.38it/s] 46it [00:10, 4.37it/s] 47it [00:10, 4.42it/s] 48it [00:11, 4.46it/s] 49it [00:11, 4.52it/s] 50it [00:11, 4.59it/s]2025-05-25 21:42:09,723 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 2571.1865 | mean log_px -0.0093 | KL -2121.10 + 51it [00:11, 4.55it/s] 52it [00:11, 4.55it/s] 53it [00:12, 4.61it/s] 54it [00:12, 4.47it/s] 55it [00:12, 4.55it/s] 56it [00:12, 4.58it/s] 57it [00:13, 4.56it/s] 58it [00:13, 4.53it/s] 59it [00:13, 4.57it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.41it/s] 62it [00:14, 4.39it/s] 63it [00:14, 4.46it/s] 64it [00:14, 4.42it/s] 65it [00:14, 4.42it/s] 66it [00:15, 4.45it/s] 67it [00:15, 4.50it/s] 68it [00:15, 4.44it/s] 69it [00:15, 4.46it/s] 70it [00:15, 4.50it/s] 71it [00:16, 4.57it/s] 72it [00:16, 4.32it/s] 73it [00:16, 4.37it/s] 74it [00:16, 4.35it/s] 75it [00:17, 4.46it/s] 76it [00:17, 4.46it/s] 77it [00:17, 4.30it/s] 78it [00:17, 4.33it/s] 79it [00:18, 4.44it/s] 80it [00:18, 4.40it/s] 81it [00:18, 4.38it/s] 82it [00:18, 4.42it/s] 83it [00:18, 4.30it/s] 84it [00:19, 4.34it/s] 85it [00:19, 4.45it/s] 86it [00:19, 4.50it/s] 87it [00:19, 4.57it/s] 88it [00:20, 4.61it/s] 89it [00:20, 4.62it/s] 90it [00:20, 4.57it/s] 91it [00:20, 4.55it/s] 92it [00:20, 4.37it/s] 93it [00:21, 4.41it/s] 94it [00:21, 4.41it/s] 95it [00:21, 4.40it/s] 96it [00:21, 4.36it/s] 97it [00:22, 4.43it/s] 98it [00:22, 4.48it/s] 99it [00:22, 4.47it/s] 100it [00:22, 4.47it/s]2025-05-25 21:42:20,954 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 2327.6116 | mean log_px -0.0041 | KL -2106.47 + 101it [00:23, 4.28it/s] 102it [00:23, 4.41it/s] 103it [00:23, 4.50it/s] 104it [00:23, 4.49it/s] 105it [00:23, 4.31it/s] 106it [00:24, 4.34it/s] 107it [00:24, 4.41it/s] 108it [00:24, 4.49it/s] 109it [00:24, 4.43it/s] 110it [00:25, 4.44it/s] 111it [00:25, 4.47it/s] 112it [00:25, 4.47it/s] 113it [00:25, 4.31it/s] 114it [00:25, 4.36it/s] 115it [00:26, 4.37it/s] 116it [00:26, 4.41it/s] 117it [00:26, 4.44it/s] 118it [00:26, 4.48it/s] 119it [00:27, 4.53it/s] 120it [00:27, 4.60it/s] 121it [00:27, 4.55it/s] 122it [00:27, 4.60it/s] 123it [00:27, 4.54it/s] 124it [00:28, 4.56it/s] 125it [00:28, 4.45it/s] 126it [00:28, 4.42it/s] 127it [00:28, 4.31it/s] 128it [00:29, 4.34it/s] 129it [00:29, 4.34it/s] 130it [00:29, 4.44it/s] 131it [00:29, 4.33it/s] 132it [00:29, 4.38it/s] 133it [00:30, 4.40it/s] 134it [00:30, 4.40it/s] 135it [00:30, 4.42it/s] 136it [00:30, 4.40it/s] 137it [00:31, 4.45it/s] 138it [00:31, 4.52it/s] 139it [00:31, 4.58it/s] 140it [00:31, 4.57it/s] 141it [00:31, 4.60it/s] 142it [00:32, 4.63it/s] 143it [00:32, 4.56it/s] 144it [00:32, 4.62it/s] 145it [00:32, 4.62it/s] 146it [00:33, 4.56it/s] 147it [00:33, 4.58it/s] 148it [00:33, 4.44it/s] 149it [00:33, 4.53it/s] 150it [00:33, 4.50it/s]2025-05-25 21:42:32,148 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 3520.7913 | mean log_px -0.0254 | KL -2092.53 + 151it [00:34, 4.53it/s] 152it [00:34, 4.45it/s] 153it [00:34, 4.32it/s] 154it [00:34, 4.33it/s] 155it [00:35, 4.39it/s] 156it [00:35, 4.42it/s] 157it [00:35, 4.51it/s] 158it [00:35, 4.56it/s] 159it [00:35, 4.55it/s] 160it [00:36, 4.52it/s] 161it [00:36, 4.49it/s] 162it [00:36, 4.56it/s] 163it [00:36, 4.32it/s] 164it [00:37, 4.25it/s] 165it [00:37, 4.37it/s] 166it [00:37, 4.47it/s] 167it [00:37, 4.54it/s] 168it [00:38, 4.49it/s] 169it [00:38, 4.46it/s] 170it [00:38, 4.43it/s] 171it [00:38, 4.51it/s] 172it [00:38, 4.38it/s] 173it [00:39, 4.43it/s] 174it [00:39, 4.38it/s] 175it [00:39, 4.39it/s] 176it [00:39, 4.43it/s] 177it [00:40, 4.51it/s] 178it [00:40, 4.44it/s] 179it [00:40, 4.53it/s] 180it [00:40, 4.45it/s] 181it [00:40, 4.48it/s] 182it [00:41, 4.35it/s] 183it [00:41, 4.33it/s] 184it [00:41, 4.40it/s] 185it [00:41, 4.37it/s] 186it [00:42, 4.35it/s] 187it [00:42, 4.35it/s] 188it [00:42, 4.37it/s] 189it [00:42, 4.34it/s] 190it [00:43, 4.43it/s] 191it [00:43, 4.45it/s] 192it [00:43, 4.40it/s] 193it [00:43, 4.49it/s] 194it [00:43, 4.38it/s] 195it [00:44, 4.37it/s] 196it [00:44, 4.35it/s] 196it [00:44, 4.41it/s] +2025-05-25 21:42:42,478 - INFO - Epoch: 18, Objective: tensor([2600.6919], device='cuda:0', grad_fn=), Loss: 0.01254788413643837, KL/n: 42.441864013671875 + 0it [00:00, ?it/s]2025-05-25 21:42:42,882 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 2569.3970 | mean log_px -0.0069 | KL -2083.59 + 1it [00:00, 3.00it/s] 2it [00:00, 3.65it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.18it/s] 5it [00:01, 4.34it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.54it/s] 8it [00:01, 4.53it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.64it/s] 14it [00:03, 4.50it/s] 15it [00:03, 4.59it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.67it/s] 18it [00:04, 4.69it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.67it/s] 22it [00:04, 4.69it/s] 23it [00:05, 4.71it/s] 24it [00:05, 4.70it/s] 25it [00:05, 4.71it/s] 26it [00:05, 4.52it/s] 27it [00:05, 4.60it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.68it/s] 30it [00:06, 4.69it/s] 31it [00:06, 4.71it/s] 32it [00:07, 4.72it/s] 33it [00:07, 4.73it/s] 34it [00:07, 4.73it/s] 35it [00:07, 4.57it/s] 36it [00:07, 4.64it/s] 37it [00:08, 4.67it/s] 38it [00:08, 4.66it/s] 39it [00:08, 4.69it/s] 40it [00:08, 4.54it/s] 41it [00:08, 4.62it/s] 42it [00:09, 4.65it/s] 43it [00:09, 4.69it/s] 44it [00:09, 4.70it/s] 45it [00:09, 4.72it/s] 46it [00:10, 4.71it/s] 47it [00:10, 4.73it/s] 48it [00:10, 4.73it/s] 49it [00:10, 4.74it/s] 50it [00:10, 4.74it/s]2025-05-25 21:42:53,641 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 2562.2981 | mean log_px -0.0159 | KL -2057.50 + 51it [00:11, 4.74it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.70it/s] 54it [00:11, 4.71it/s] 55it [00:11, 4.72it/s] 56it [00:12, 4.56it/s] 57it [00:12, 4.63it/s] 58it [00:12, 4.67it/s] 59it [00:12, 4.69it/s] 60it [00:13, 4.71it/s] 61it [00:13, 4.72it/s] 62it [00:13, 4.72it/s] 63it [00:13, 4.73it/s] 64it [00:13, 4.73it/s] 65it [00:14, 4.61it/s] 66it [00:14, 4.66it/s] 67it [00:14, 4.69it/s] 68it [00:14, 4.71it/s] 69it [00:14, 4.72it/s] 70it [00:15, 4.72it/s] 71it [00:15, 4.74it/s] 72it [00:15, 4.73it/s] 73it [00:15, 4.55it/s] 74it [00:16, 4.63it/s] 75it [00:16, 4.66it/s] 76it [00:16, 4.69it/s] 77it [00:16, 4.70it/s] 78it [00:16, 4.72it/s] 79it [00:17, 4.55it/s] 80it [00:17, 4.61it/s] 81it [00:17, 4.66it/s] 82it [00:17, 4.69it/s] 83it [00:17, 4.71it/s] 84it [00:18, 4.71it/s] 85it [00:18, 4.73it/s] 86it [00:18, 4.73it/s] 87it [00:18, 4.74it/s] 88it [00:18, 4.74it/s] 89it [00:19, 4.73it/s] 90it [00:19, 4.73it/s] 91it [00:19, 4.71it/s] 92it [00:19, 4.72it/s] 93it [00:20, 4.72it/s] 94it [00:20, 4.73it/s] 95it [00:20, 4.74it/s] 96it [00:20, 4.74it/s] 97it [00:20, 4.74it/s] 98it [00:21, 4.73it/s] 99it [00:21, 4.75it/s] 100it [00:21, 4.74it/s]2025-05-25 21:43:04,287 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 2413.2510 | mean log_px -0.0084 | KL -2045.86 + 101it [00:21, 4.74it/s] 102it [00:21, 4.61it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.69it/s] 106it [00:22, 4.71it/s] 107it [00:23, 4.71it/s] 108it [00:23, 4.72it/s] 109it [00:23, 4.73it/s] 110it [00:23, 4.48it/s] 111it [00:23, 4.54it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.62it/s] 114it [00:24, 4.64it/s] 115it [00:24, 4.66it/s] 116it [00:24, 4.68it/s] 117it [00:25, 4.70it/s] 118it [00:25, 4.71it/s] 119it [00:25, 4.72it/s] 120it [00:25, 4.72it/s] 121it [00:26, 4.73it/s] 122it [00:26, 4.73it/s] 123it [00:26, 4.74it/s] 124it [00:26, 4.73it/s] 125it [00:26, 4.74it/s] 126it [00:27, 4.74it/s] 127it [00:27, 4.74it/s] 128it [00:27, 4.74it/s] 129it [00:27, 4.74it/s] 130it [00:27, 4.74it/s] 131it [00:28, 4.75it/s] 132it [00:28, 4.74it/s] 133it [00:28, 4.75it/s] 134it [00:28, 4.74it/s] 135it [00:28, 4.74it/s] 136it [00:29, 4.74it/s] 137it [00:29, 4.74it/s] 138it [00:29, 4.73it/s] 139it [00:29, 4.73it/s] 140it [00:30, 4.73it/s] 141it [00:30, 4.74it/s] 142it [00:30, 4.74it/s] 143it [00:30, 4.73it/s] 144it [00:30, 4.73it/s] 145it [00:31, 4.70it/s] 146it [00:31, 4.71it/s] 147it [00:31, 4.73it/s] 148it [00:31, 4.73it/s] 149it [00:31, 4.74it/s] 150it [00:32, 4.73it/s]2025-05-25 21:43:14,913 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 2499.8535 | mean log_px -0.0090 | KL -2029.06 + 151it [00:32, 4.73it/s] 152it [00:32, 4.73it/s] 153it [00:32, 4.74it/s] 154it [00:32, 4.74it/s] 155it [00:33, 4.73it/s] 156it [00:33, 4.73it/s] 157it [00:33, 4.73it/s] 158it [00:33, 4.73it/s] 159it [00:34, 4.74it/s] 160it [00:34, 4.73it/s] 161it [00:34, 4.74it/s] 162it [00:34, 4.74it/s] 163it [00:34, 4.74it/s] 164it [00:35, 4.74it/s] 165it [00:35, 4.75it/s] 166it [00:35, 4.75it/s] 167it [00:35, 4.75it/s] 168it [00:35, 4.74it/s] 169it [00:36, 4.75it/s] 170it [00:36, 4.74it/s] 171it [00:36, 4.75it/s] 172it [00:36, 4.74it/s] 173it [00:37, 4.74it/s] 174it [00:37, 4.74it/s] 175it [00:37, 4.75it/s] 176it [00:37, 4.74it/s] 177it [00:37, 4.74it/s] 178it [00:38, 4.74it/s] 179it [00:38, 4.74it/s] 180it [00:38, 4.74it/s] 181it [00:38, 4.74it/s] 182it [00:38, 4.74it/s] 183it [00:39, 4.74it/s] 184it [00:39, 4.74it/s] 185it [00:39, 4.74it/s] 186it [00:39, 4.74it/s] 187it [00:39, 4.74it/s] 188it [00:40, 4.73it/s] 189it [00:40, 4.74it/s] 190it [00:40, 4.74it/s] 191it [00:40, 4.74it/s] 192it [00:41, 4.74it/s] 193it [00:41, 4.74it/s] 194it [00:41, 4.74it/s] 195it [00:41, 4.55it/s] 196it [00:41, 4.49it/s] 196it [00:41, 4.67it/s] +2025-05-25 21:43:24,581 - INFO - Epoch: 19, Objective: tensor([2346.0564], device='cuda:0', grad_fn=), Loss: 0.010250546969473362, KL/n: 41.190834045410156 + 0it [00:00, ?it/s]2025-05-25 21:43:25,168 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 2297.0408 | mean log_px -0.0067 | KL -2018.12 + 1it [00:00, 2.95it/s] 2it [00:00, 3.60it/s] 3it [00:00, 3.91it/s] 4it [00:01, 4.09it/s] 5it [00:01, 4.19it/s] 6it [00:01, 4.28it/s] 7it [00:01, 4.38it/s] 8it [00:01, 4.37it/s] 9it [00:02, 4.43it/s] 10it [00:02, 4.41it/s] 11it [00:02, 4.38it/s] 12it [00:02, 4.39it/s] 13it [00:03, 4.43it/s] 14it [00:03, 4.43it/s] 15it [00:03, 4.40it/s] 16it [00:03, 4.49it/s] 17it [00:03, 4.54it/s] 18it [00:04, 4.59it/s] 19it [00:04, 4.59it/s] 20it [00:04, 4.53it/s] 21it [00:04, 4.45it/s] 22it [00:05, 4.43it/s] 23it [00:05, 4.49it/s] 24it [00:05, 4.41it/s] 25it [00:05, 4.42it/s] 26it [00:05, 4.48it/s] 27it [00:06, 4.45it/s] 28it [00:06, 4.44it/s] 29it [00:06, 4.46it/s] 30it [00:06, 4.40it/s] 31it [00:07, 4.43it/s] 32it [00:07, 4.37it/s] 33it [00:07, 4.38it/s] 34it [00:07, 4.37it/s] 35it [00:07, 4.43it/s] 36it [00:08, 4.39it/s] 37it [00:08, 4.43it/s] 38it [00:08, 4.43it/s] 39it [00:08, 4.47it/s] 40it [00:09, 4.50it/s] 41it [00:09, 4.55it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.51it/s] 45it [00:10, 4.57it/s] 46it [00:10, 4.57it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.55it/s] 49it [00:11, 4.61it/s] 50it [00:11, 4.55it/s]2025-05-25 21:43:36,349 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 2567.9041 | mean log_px -0.0136 | KL -1997.04 + 51it [00:11, 4.58it/s] 52it [00:11, 4.49it/s] 53it [00:11, 4.45it/s] 54it [00:12, 4.42it/s] 55it [00:12, 4.50it/s] 56it [00:12, 4.56it/s] 57it [00:12, 4.49it/s] 58it [00:13, 4.49it/s] 59it [00:13, 4.44it/s] 60it [00:13, 4.50it/s] 61it [00:13, 4.51it/s] 62it [00:13, 4.54it/s] 63it [00:14, 4.56it/s] 64it [00:14, 4.53it/s] 65it [00:14, 4.45it/s] 66it [00:14, 4.44it/s] 67it [00:15, 4.41it/s] 68it [00:15, 4.39it/s] 69it [00:15, 4.37it/s] 70it [00:15, 4.46it/s] 71it [00:16, 4.45it/s] 72it [00:16, 4.52it/s] 73it [00:16, 4.58it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.52it/s] 76it [00:17, 4.47it/s] 77it [00:17, 4.45it/s] 78it [00:17, 4.40it/s] 79it [00:17, 4.39it/s] 80it [00:18, 4.36it/s] 81it [00:18, 4.36it/s] 82it [00:18, 4.42it/s] 83it [00:18, 4.44it/s] 84it [00:18, 4.50it/s] 85it [00:19, 4.47it/s] 86it [00:19, 4.41it/s] 87it [00:19, 4.42it/s] 88it [00:19, 4.41it/s] 89it [00:20, 4.41it/s] 90it [00:20, 4.37it/s] 91it [00:20, 4.40it/s] 92it [00:20, 4.47it/s] 93it [00:20, 4.49it/s] 94it [00:21, 4.46it/s] 95it [00:21, 4.47it/s] 96it [00:21, 4.42it/s] 97it [00:21, 4.43it/s] 98it [00:22, 4.47it/s] 99it [00:22, 4.47it/s] 100it [00:22, 4.44it/s]2025-05-25 21:43:47,575 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 3235.3687 | mean log_px -0.0223 | KL -1973.44 + 101it [00:22, 4.49it/s] 102it [00:22, 4.44it/s] 103it [00:23, 4.38it/s] 104it [00:23, 4.40it/s] 105it [00:23, 4.39it/s] 106it [00:23, 4.38it/s] 107it [00:24, 4.41it/s] 108it [00:24, 4.49it/s] 109it [00:24, 4.48it/s] 110it [00:24, 4.54it/s] 111it [00:24, 4.47it/s] 112it [00:25, 4.53it/s] 113it [00:25, 4.46it/s] 114it [00:25, 4.44it/s] 115it [00:25, 4.41it/s] 116it [00:26, 4.49it/s] 117it [00:26, 4.40it/s] 118it [00:26, 4.41it/s] 119it [00:26, 4.41it/s] 120it [00:27, 4.44it/s] 121it [00:27, 4.46it/s] 122it [00:27, 4.53it/s] 123it [00:27, 4.46it/s] 124it [00:27, 4.42it/s] 125it [00:28, 4.33it/s] 126it [00:28, 4.34it/s] 127it [00:28, 4.44it/s] 128it [00:28, 4.39it/s] 129it [00:29, 4.30it/s] 130it [00:29, 4.32it/s] 131it [00:29, 4.33it/s] 132it [00:29, 4.31it/s] 133it [00:29, 4.40it/s] 134it [00:30, 4.46it/s] 135it [00:30, 4.37it/s] 136it [00:30, 4.40it/s] 137it [00:30, 4.43it/s] 138it [00:31, 4.39it/s] 139it [00:31, 4.34it/s] 140it [00:31, 4.33it/s] 141it [00:31, 4.35it/s] 142it [00:32, 4.33it/s] 143it [00:32, 4.36it/s] 144it [00:32, 4.30it/s] 145it [00:32, 4.37it/s] 146it [00:32, 4.34it/s] 147it [00:33, 4.37it/s] 148it [00:33, 4.39it/s] 149it [00:33, 4.41it/s] 150it [00:33, 4.37it/s]2025-05-25 21:43:58,941 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 2351.8418 | mean log_px -0.0055 | KL -1967.71 + 151it [00:34, 4.44it/s] 152it [00:34, 4.41it/s] 153it [00:34, 4.38it/s] 154it [00:34, 4.45it/s] 155it [00:35, 4.45it/s] 156it [00:35, 4.40it/s] 157it [00:35, 4.45it/s] 158it [00:35, 4.41it/s] 159it [00:35, 4.36it/s] 160it [00:36, 4.38it/s] 161it [00:36, 4.41it/s] 162it [00:36, 4.47it/s] 163it [00:36, 4.51it/s] 164it [00:37, 4.40it/s] 165it [00:37, 4.37it/s] 166it [00:37, 4.45it/s] 167it [00:37, 4.35it/s] 168it [00:37, 4.37it/s] 169it [00:38, 4.41it/s] 170it [00:38, 4.47it/s] 171it [00:38, 4.48it/s] 172it [00:38, 4.29it/s] 173it [00:39, 4.27it/s] 174it [00:39, 4.30it/s] 175it [00:39, 4.36it/s] 176it [00:39, 4.35it/s] 177it [00:40, 4.33it/s] 178it [00:40, 4.35it/s] 179it [00:40, 4.29it/s] 180it [00:40, 4.38it/s] 181it [00:40, 4.40it/s] 182it [00:41, 4.30it/s] 183it [00:41, 4.30it/s] 184it [00:41, 4.31it/s] 185it [00:41, 4.42it/s] 186it [00:42, 4.48it/s] 187it [00:42, 4.54it/s] 188it [00:42, 4.50it/s] 189it [00:42, 4.52it/s] 190it [00:42, 4.51it/s] 191it [00:43, 4.58it/s] 192it [00:43, 4.49it/s] 193it [00:43, 4.47it/s] 194it [00:43, 4.45it/s] 195it [00:44, 4.40it/s] 196it [00:44, 4.31it/s] 196it [00:44, 4.41it/s] +2025-05-25 21:44:09,298 - INFO - Epoch: 20, Objective: tensor([2321.2383], device='cuda:0', grad_fn=), Loss: 0.013511824421584606, KL/n: 39.98223876953125 + 0it [00:00, ?it/s]2025-05-25 21:44:09,674 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 2518.2864 | mean log_px -0.0100 | KL -1959.45 + 1it [00:00, 3.31it/s] 2it [00:00, 4.00it/s] 3it [00:00, 4.31it/s] 4it [00:00, 4.42it/s] 5it [00:01, 4.51it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.62it/s] 8it [00:01, 4.62it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.55it/s] 12it [00:02, 3.66it/s] 13it [00:03, 3.93it/s] 14it [00:03, 4.13it/s] 15it [00:03, 4.30it/s] 16it [00:03, 4.42it/s] 17it [00:03, 4.51it/s] 18it [00:04, 4.58it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.65it/s] 21it [00:04, 4.69it/s] 22it [00:04, 4.69it/s] 23it [00:05, 4.71it/s] 24it [00:05, 4.71it/s] 25it [00:05, 4.72it/s] 26it [00:05, 4.72it/s] 27it [00:06, 4.73it/s] 28it [00:06, 4.72it/s] 29it [00:06, 4.73it/s] 30it [00:06, 4.73it/s] 31it [00:06, 4.73it/s] 32it [00:07, 4.73it/s] 33it [00:07, 4.73it/s] 34it [00:07, 4.72it/s] 35it [00:07, 4.73it/s] 36it [00:07, 4.72it/s] 37it [00:08, 4.60it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.68it/s] 40it [00:08, 4.69it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.64it/s] 44it [00:09, 4.66it/s] 45it [00:09, 4.70it/s] 46it [00:10, 4.70it/s] 47it [00:10, 4.50it/s] 48it [00:10, 4.58it/s] 49it [00:10, 4.62it/s] 50it [00:10, 4.65it/s]2025-05-25 21:44:20,555 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 2608.6096 | mean log_px -0.0148 | KL -1939.67 + 51it [00:11, 4.68it/s] 52it [00:11, 4.68it/s] 53it [00:11, 4.70it/s] 54it [00:11, 4.71it/s] 55it [00:12, 4.72it/s] 56it [00:12, 4.72it/s] 57it [00:12, 4.72it/s] 58it [00:12, 4.72it/s] 59it [00:12, 4.73it/s] 60it [00:13, 4.67it/s] 61it [00:13, 4.69it/s] 62it [00:13, 4.69it/s] 63it [00:13, 4.71it/s] 64it [00:13, 4.71it/s] 65it [00:14, 4.72it/s] 66it [00:14, 4.71it/s] 67it [00:14, 4.72it/s] 68it [00:14, 4.72it/s] 69it [00:14, 4.73it/s] 70it [00:15, 4.72it/s] 71it [00:15, 4.72it/s] 72it [00:15, 4.71it/s] 73it [00:15, 4.72it/s] 74it [00:16, 4.73it/s] 75it [00:16, 4.73it/s] 76it [00:16, 4.72it/s] 77it [00:16, 4.72it/s] 78it [00:16, 4.73it/s] 79it [00:17, 4.74it/s] 80it [00:17, 4.73it/s] 81it [00:17, 4.73it/s] 82it [00:17, 4.72it/s] 83it [00:17, 4.73it/s] 84it [00:18, 4.72it/s] 85it [00:18, 4.72it/s] 86it [00:18, 4.72it/s] 87it [00:18, 4.73it/s] 88it [00:19, 4.73it/s] 89it [00:19, 4.74it/s] 90it [00:19, 4.72it/s] 91it [00:19, 4.73it/s] 92it [00:19, 4.72it/s] 93it [00:20, 4.73it/s] 94it [00:20, 4.73it/s] 95it [00:20, 4.73it/s] 96it [00:20, 4.73it/s] 97it [00:20, 4.72it/s] 98it [00:21, 4.73it/s] 99it [00:21, 4.74it/s] 100it [00:21, 4.73it/s]2025-05-25 21:44:31,142 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 2265.2100 | mean log_px -0.0051 | KL -1927.49 + 101it [00:21, 4.72it/s] 102it [00:21, 4.72it/s] 103it [00:22, 4.74it/s] 104it [00:22, 4.73it/s] 105it [00:22, 4.73it/s] 106it [00:22, 4.72it/s] 107it [00:23, 4.72it/s] 108it [00:23, 4.72it/s] 109it [00:23, 4.73it/s] 110it [00:23, 4.72it/s] 111it [00:23, 4.73it/s] 112it [00:24, 4.74it/s] 113it [00:24, 4.74it/s] 114it [00:24, 4.53it/s] 115it [00:24, 4.60it/s] 116it [00:24, 4.63it/s] 117it [00:25, 4.67it/s] 118it [00:25, 4.69it/s] 119it [00:25, 4.70it/s] 120it [00:25, 4.70it/s] 121it [00:26, 4.70it/s] 122it [00:26, 4.54it/s] 123it [00:26, 4.60it/s] 124it [00:26, 4.64it/s] 125it [00:26, 4.67it/s] 126it [00:27, 4.68it/s] 127it [00:27, 4.71it/s] 128it [00:27, 4.71it/s] 129it [00:27, 4.72it/s] 130it [00:27, 4.72it/s] 131it [00:28, 4.72it/s] 132it [00:28, 4.73it/s] 133it [00:28, 4.74it/s] 134it [00:28, 4.73it/s] 135it [00:29, 4.73it/s] 136it [00:29, 4.73it/s] 137it [00:29, 4.73it/s] 138it [00:29, 4.73it/s] 139it [00:29, 4.73it/s] 140it [00:30, 4.73it/s] 141it [00:30, 4.74it/s] 142it [00:30, 4.62it/s] 143it [00:30, 4.68it/s] 144it [00:30, 4.62it/s] 145it [00:31, 4.55it/s] 146it [00:31, 4.58it/s] 147it [00:31, 4.61it/s] 148it [00:31, 4.63it/s] 149it [00:32, 4.65it/s] 150it [00:32, 4.43it/s]2025-05-25 21:44:41,857 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 2249.6196 | mean log_px -0.0076 | KL -1918.02 + 151it [00:32, 4.41it/s] 152it [00:32, 4.51it/s] 153it [00:32, 4.57it/s] 154it [00:33, 4.61it/s] 155it [00:33, 4.64it/s] 156it [00:33, 4.66it/s] 157it [00:33, 4.68it/s] 158it [00:33, 4.69it/s] 159it [00:34, 4.70it/s] 160it [00:34, 4.70it/s] 161it [00:34, 4.71it/s] 162it [00:34, 4.71it/s] 163it [00:35, 4.70it/s] 164it [00:35, 4.70it/s] 165it [00:35, 4.71it/s] 166it [00:35, 4.70it/s] 167it [00:35, 4.70it/s] 168it [00:36, 4.70it/s] 169it [00:36, 4.54it/s] 170it [00:36, 4.61it/s] 171it [00:36, 4.64it/s] 172it [00:36, 4.66it/s] 173it [00:37, 4.69it/s] 174it [00:37, 4.70it/s] 175it [00:37, 4.71it/s] 176it [00:37, 4.70it/s] 177it [00:38, 4.71it/s] 178it [00:38, 4.54it/s] 179it [00:38, 4.61it/s] 180it [00:38, 4.64it/s] 181it [00:38, 4.68it/s] 182it [00:39, 4.69it/s] 183it [00:39, 4.70it/s] 184it [00:39, 4.70it/s] 185it [00:39, 4.71it/s] 186it [00:39, 4.71it/s] 187it [00:40, 4.71it/s] 188it [00:40, 4.72it/s] 189it [00:40, 4.59it/s] 190it [00:40, 4.64it/s] 191it [00:41, 4.68it/s] 192it [00:41, 4.69it/s] 193it [00:41, 4.68it/s] 194it [00:41, 4.68it/s] 195it [00:41, 4.61it/s] 196it [00:42, 4.49it/s] 196it [00:42, 4.64it/s] +2025-05-25 21:44:51,644 - INFO - Epoch: 21, Objective: tensor([2395.0178], device='cuda:0', grad_fn=), Loss: 0.009308933280408382, KL/n: 39.00183868408203 + 0it [00:00, ?it/s]2025-05-25 21:44:52,024 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 2293.9033 | mean log_px -0.0119 | KL -1907.14 + 1it [00:00, 3.30it/s] 2it [00:00, 3.89it/s] 3it [00:00, 4.19it/s] 4it [00:00, 4.35it/s] 5it [00:01, 4.45it/s] 6it [00:01, 4.52it/s] 7it [00:01, 4.55it/s] 8it [00:01, 4.57it/s] 9it [00:02, 4.59it/s] 10it [00:02, 4.58it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.57it/s] 13it [00:02, 4.59it/s] 14it [00:03, 4.60it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.60it/s] 17it [00:03, 4.60it/s] 18it [00:03, 4.61it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.62it/s] 21it [00:04, 4.60it/s] 22it [00:04, 4.57it/s] 23it [00:05, 4.43it/s] 24it [00:05, 4.38it/s] 25it [00:05, 4.32it/s] 26it [00:05, 4.40it/s] 27it [00:06, 4.47it/s] 28it [00:06, 4.51it/s] 29it [00:06, 4.55it/s] 30it [00:06, 4.56it/s] 31it [00:06, 4.58it/s] 32it [00:07, 4.58it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.60it/s] 36it [00:07, 4.60it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.60it/s] 39it [00:08, 4.48it/s] 40it [00:08, 4.48it/s] 41it [00:09, 4.51it/s] 42it [00:09, 4.53it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.58it/s] 45it [00:09, 4.56it/s] 46it [00:10, 4.39it/s] 47it [00:10, 4.45it/s] 48it [00:10, 4.49it/s] 49it [00:10, 4.49it/s] 50it [00:11, 4.48it/s]2025-05-25 21:45:03,027 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 2142.6248 | mean log_px -0.0071 | KL -1895.51 + 51it [00:11, 4.49it/s] 52it [00:11, 4.47it/s] 53it [00:11, 4.51it/s] 54it [00:11, 4.38it/s] 55it [00:12, 4.44it/s] 56it [00:12, 4.48it/s] 57it [00:12, 4.50it/s] 58it [00:12, 4.53it/s] 59it [00:13, 4.55it/s] 60it [00:13, 4.56it/s] 61it [00:13, 4.57it/s] 62it [00:13, 4.42it/s] 63it [00:13, 4.48it/s] 64it [00:14, 4.51it/s] 65it [00:14, 4.53it/s] 66it [00:14, 4.52it/s] 67it [00:14, 4.55it/s] 68it [00:15, 4.57it/s] 69it [00:15, 4.43it/s] 70it [00:15, 4.49it/s] 71it [00:15, 4.51it/s] 72it [00:15, 4.52it/s] 73it [00:16, 4.52it/s] 74it [00:16, 4.51it/s] 75it [00:16, 4.52it/s] 76it [00:16, 4.54it/s] 77it [00:17, 4.55it/s] 78it [00:17, 4.53it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.41it/s] 81it [00:17, 4.47it/s] 82it [00:18, 4.49it/s] 83it [00:18, 4.53it/s] 84it [00:18, 4.54it/s] 85it [00:18, 4.53it/s] 86it [00:19, 4.54it/s] 87it [00:19, 4.56it/s] 88it [00:19, 4.56it/s] 89it [00:19, 4.58it/s] 90it [00:19, 4.56it/s] 91it [00:20, 4.38it/s] 92it [00:20, 4.47it/s] 93it [00:20, 4.54it/s] 94it [00:20, 4.58it/s] 95it [00:21, 4.63it/s] 96it [00:21, 4.51it/s] 97it [00:21, 4.59it/s] 98it [00:21, 4.63it/s] 99it [00:21, 4.65it/s] 100it [00:22, 4.67it/s]2025-05-25 21:45:14,056 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 2433.9939 | mean log_px -0.0126 | KL -1877.79 + 101it [00:22, 4.52it/s] 102it [00:22, 4.59it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.65it/s] 105it [00:23, 4.68it/s] 106it [00:23, 4.69it/s] 107it [00:23, 4.70it/s] 108it [00:23, 4.70it/s] 109it [00:24, 4.71it/s] 110it [00:24, 4.71it/s] 111it [00:24, 4.72it/s] 112it [00:24, 4.71it/s] 113it [00:24, 4.73it/s] 114it [00:25, 4.72it/s] 115it [00:25, 4.73it/s] 116it [00:25, 4.74it/s] 117it [00:25, 4.73it/s] 118it [00:25, 4.72it/s] 119it [00:26, 4.73it/s] 120it [00:26, 4.73it/s] 121it [00:26, 4.73it/s] 122it [00:26, 4.73it/s] 123it [00:27, 4.73it/s] 124it [00:27, 4.72it/s] 125it [00:27, 4.69it/s] 126it [00:27, 4.71it/s] 127it [00:27, 4.72it/s] 128it [00:28, 4.71it/s] 129it [00:28, 4.72it/s] 130it [00:28, 4.72it/s] 131it [00:28, 4.72it/s] 132it [00:28, 4.72it/s] 133it [00:29, 4.56it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.65it/s] 136it [00:29, 4.68it/s] 137it [00:30, 4.70it/s] 138it [00:30, 4.70it/s] 139it [00:30, 4.71it/s] 140it [00:30, 4.71it/s] 141it [00:30, 4.72it/s] 142it [00:31, 4.72it/s] 143it [00:31, 4.72it/s] 144it [00:31, 4.71it/s] 145it [00:31, 4.73it/s] 146it [00:31, 4.72it/s] 147it [00:32, 4.73it/s] 148it [00:32, 4.52it/s] 149it [00:32, 4.59it/s] 150it [00:32, 4.63it/s]2025-05-25 21:45:24,719 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 2279.8452 | mean log_px -0.0095 | KL -1866.57 + 151it [00:32, 4.65it/s] 152it [00:33, 4.65it/s] 153it [00:33, 4.67it/s] 154it [00:33, 4.68it/s] 155it [00:33, 4.67it/s] 156it [00:34, 4.67it/s] 157it [00:34, 4.69it/s] 158it [00:34, 4.70it/s] 159it [00:34, 4.71it/s] 160it [00:34, 4.71it/s] 161it [00:35, 4.72it/s] 162it [00:35, 4.55it/s] 163it [00:35, 4.61it/s] 164it [00:35, 4.64it/s] 165it [00:35, 4.66it/s] 166it [00:36, 4.68it/s] 167it [00:36, 4.69it/s] 168it [00:36, 4.70it/s] 169it [00:36, 4.54it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.64it/s] 172it [00:37, 4.66it/s] 173it [00:37, 4.68it/s] 174it [00:37, 4.53it/s] 175it [00:38, 4.60it/s] 176it [00:38, 4.63it/s] 177it [00:38, 4.66it/s] 178it [00:38, 4.68it/s] 179it [00:39, 4.67it/s] 180it [00:39, 4.68it/s] 181it [00:39, 4.69it/s] 182it [00:39, 4.55it/s] 183it [00:39, 4.61it/s] 184it [00:40, 4.64it/s] 185it [00:40, 4.67it/s] 186it [00:40, 4.67it/s] 187it [00:40, 4.69it/s] 188it [00:40, 4.69it/s] 189it [00:41, 4.70it/s] 190it [00:41, 4.70it/s] 191it [00:41, 4.71it/s] 192it [00:41, 4.71it/s] 193it [00:42, 4.71it/s] 194it [00:42, 4.71it/s] 195it [00:42, 4.44it/s] 196it [00:42, 4.55it/s] 196it [00:42, 4.59it/s] +2025-05-25 21:45:34,521 - INFO - Epoch: 22, Objective: tensor([2321.2053], device='cuda:0', grad_fn=), Loss: 0.0126264663413167, KL/n: 37.90328598022461 + 0it [00:00, ?it/s]2025-05-25 21:45:35,083 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 2031.7919 | mean log_px -0.0048 | KL -1857.27 + 1it [00:00, 3.30it/s] 2it [00:00, 3.99it/s] 3it [00:00, 4.29it/s] 4it [00:00, 4.43it/s] 5it [00:01, 4.54it/s] 6it [00:01, 4.59it/s] 7it [00:01, 4.64it/s] 8it [00:01, 4.66it/s] 9it [00:02, 4.68it/s] 10it [00:02, 4.69it/s] 11it [00:02, 4.70it/s] 12it [00:02, 4.53it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.64it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.67it/s] 18it [00:03, 4.68it/s] 19it [00:04, 4.69it/s] 20it [00:04, 4.69it/s] 21it [00:04, 4.72it/s] 22it [00:04, 4.70it/s] 23it [00:05, 4.70it/s] 24it [00:05, 4.52it/s] 25it [00:05, 4.60it/s] 26it [00:05, 4.64it/s] 27it [00:05, 4.68it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.69it/s] 30it [00:06, 4.70it/s] 31it [00:06, 4.71it/s] 32it [00:06, 4.68it/s] 33it [00:07, 4.69it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.67it/s] 36it [00:07, 4.66it/s] 37it [00:08, 4.69it/s] 38it [00:08, 4.69it/s] 39it [00:08, 4.46it/s] 40it [00:08, 4.52it/s] 41it [00:08, 4.58it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.62it/s] 44it [00:09, 4.64it/s] 45it [00:09, 4.66it/s] 46it [00:09, 4.52it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.63it/s] 49it [00:10, 4.65it/s] 50it [00:10, 4.66it/s]2025-05-25 21:45:45,828 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 2093.6794 | mean log_px -0.0058 | KL -1840.02 + 51it [00:11, 4.52it/s] 52it [00:11, 4.58it/s] 53it [00:11, 4.62it/s] 54it [00:11, 4.63it/s] 55it [00:11, 4.66it/s] 56it [00:12, 4.68it/s] 57it [00:12, 4.70it/s] 58it [00:12, 4.70it/s] 59it [00:12, 4.71it/s] 60it [00:12, 4.71it/s] 61it [00:13, 4.73it/s] 62it [00:13, 4.72it/s] 63it [00:13, 4.72it/s] 64it [00:13, 4.71it/s] 65it [00:14, 4.72it/s] 66it [00:14, 4.72it/s] 67it [00:14, 4.72it/s] 68it [00:14, 4.69it/s] 69it [00:14, 4.46it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.58it/s] 72it [00:15, 4.61it/s] 73it [00:15, 4.64it/s] 74it [00:15, 4.64it/s] 75it [00:16, 4.68it/s] 76it [00:16, 4.68it/s] 77it [00:16, 4.70it/s] 78it [00:16, 4.72it/s] 79it [00:17, 4.72it/s] 80it [00:17, 4.72it/s] 81it [00:17, 4.74it/s] 82it [00:17, 4.73it/s] 83it [00:17, 4.73it/s] 84it [00:18, 4.55it/s] 85it [00:18, 4.63it/s] 86it [00:18, 4.61it/s] 87it [00:18, 4.67it/s] 88it [00:18, 4.69it/s] 89it [00:19, 4.70it/s] 90it [00:19, 4.69it/s] 91it [00:19, 4.70it/s] 92it [00:19, 4.70it/s] 93it [00:20, 4.72it/s] 94it [00:20, 4.71it/s] 95it [00:20, 4.72it/s] 96it [00:20, 4.71it/s] 97it [00:20, 4.55it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.64it/s] 100it [00:21, 4.65it/s]2025-05-25 21:45:56,543 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 2605.1060 | mean log_px -0.0202 | KL -1829.09 + 101it [00:21, 4.68it/s] 102it [00:21, 4.68it/s] 103it [00:22, 4.69it/s] 104it [00:22, 4.70it/s] 105it [00:22, 4.70it/s] 106it [00:22, 4.54it/s] 107it [00:23, 4.61it/s] 108it [00:23, 4.64it/s] 109it [00:23, 4.66it/s] 110it [00:23, 4.68it/s] 111it [00:23, 4.70it/s] 112it [00:24, 4.71it/s] 113it [00:24, 4.71it/s] 114it [00:24, 4.71it/s] 115it [00:24, 4.72it/s] 116it [00:24, 4.67it/s] 117it [00:25, 4.69it/s] 118it [00:25, 4.70it/s] 119it [00:25, 4.71it/s] 120it [00:25, 4.70it/s] 121it [00:26, 4.71it/s] 122it [00:26, 4.68it/s] 123it [00:26, 4.72it/s] 124it [00:26, 4.71it/s] 125it [00:26, 4.71it/s] 126it [00:27, 4.71it/s] 127it [00:27, 4.70it/s] 128it [00:27, 4.53it/s] 129it [00:27, 4.61it/s] 130it [00:27, 4.64it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.67it/s] 133it [00:28, 4.69it/s] 134it [00:28, 4.69it/s] 135it [00:29, 4.70it/s] 136it [00:29, 4.54it/s] 137it [00:29, 4.60it/s] 138it [00:29, 4.63it/s] 139it [00:29, 4.66it/s] 140it [00:30, 4.64it/s] 141it [00:30, 4.66it/s] 142it [00:30, 4.67it/s] 143it [00:30, 4.69it/s] 144it [00:30, 4.52it/s] 145it [00:31, 4.60it/s] 146it [00:31, 4.63it/s] 147it [00:31, 4.66it/s] 148it [00:31, 4.67it/s] 149it [00:32, 4.68it/s] 150it [00:32, 4.69it/s]2025-05-25 21:46:07,258 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 2053.4185 | mean log_px -0.0083 | KL -1817.16 + 151it [00:32, 4.70it/s] 152it [00:32, 4.70it/s] 153it [00:32, 4.70it/s] 154it [00:33, 4.70it/s] 155it [00:33, 4.71it/s] 156it [00:33, 4.71it/s] 157it [00:33, 4.71it/s] 158it [00:33, 4.71it/s] 159it [00:34, 4.71it/s] 160it [00:34, 4.71it/s] 161it [00:34, 4.72it/s] 162it [00:34, 4.72it/s] 163it [00:35, 4.72it/s] 164it [00:35, 4.71it/s] 165it [00:35, 4.71it/s] 166it [00:35, 4.72it/s] 167it [00:35, 4.71it/s] 168it [00:36, 4.72it/s] 169it [00:36, 4.72it/s] 170it [00:36, 4.71it/s] 171it [00:36, 4.73it/s] 172it [00:36, 4.72it/s] 173it [00:37, 4.54it/s] 174it [00:37, 4.60it/s] 175it [00:37, 4.61it/s] 176it [00:37, 4.65it/s] 177it [00:38, 4.67it/s] 178it [00:38, 4.68it/s] 179it [00:38, 4.69it/s] 180it [00:38, 4.70it/s] 181it [00:38, 4.70it/s] 182it [00:39, 4.71it/s] 183it [00:39, 4.71it/s] 184it [00:39, 4.54it/s] 185it [00:39, 4.55it/s] 186it [00:39, 4.55it/s] 187it [00:40, 4.59it/s] 188it [00:40, 4.63it/s] 189it [00:40, 4.63it/s] 190it [00:40, 4.67it/s] 191it [00:41, 4.68it/s] 192it [00:41, 4.52it/s] 193it [00:41, 4.57it/s] 194it [00:41, 4.60it/s] 195it [00:41, 4.55it/s] 196it [00:42, 4.61it/s] 196it [00:42, 4.64it/s] +2025-05-25 21:46:17,041 - INFO - Epoch: 23, Objective: tensor([2333.9048], device='cuda:0', grad_fn=), Loss: 0.009835069067776203, KL/n: 36.8824462890625 + 0it [00:00, ?it/s]2025-05-25 21:46:17,416 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 2042.8802 | mean log_px -0.0088 | KL -1806.51 + 1it [00:00, 3.33it/s] 2it [00:00, 4.01it/s] 3it [00:00, 4.11it/s] 4it [00:00, 4.35it/s] 5it [00:01, 4.48it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.61it/s] 8it [00:02, 3.52it/s] 9it [00:02, 3.84it/s] 10it [00:02, 4.07it/s] 11it [00:02, 4.25it/s] 12it [00:02, 4.38it/s] 13it [00:03, 4.48it/s] 14it [00:03, 4.54it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.66it/s] 18it [00:04, 4.68it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.60it/s] 21it [00:04, 4.63it/s] 22it [00:05, 4.62it/s] 23it [00:05, 4.66it/s] 24it [00:05, 4.67it/s] 25it [00:05, 4.70it/s] 26it [00:05, 4.71it/s] 27it [00:06, 4.73it/s] 28it [00:06, 4.73it/s] 29it [00:06, 4.57it/s] 30it [00:06, 4.63it/s] 31it [00:06, 4.67it/s] 32it [00:07, 4.69it/s] 33it [00:07, 4.71it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.63it/s] 36it [00:08, 4.65it/s] 37it [00:08, 4.68it/s] 38it [00:08, 4.70it/s] 39it [00:08, 4.55it/s] 40it [00:08, 4.62it/s] 41it [00:09, 4.67it/s] 42it [00:09, 4.69it/s] 43it [00:09, 4.69it/s] 44it [00:09, 4.69it/s] 45it [00:09, 4.56it/s] 46it [00:10, 4.61it/s] 47it [00:10, 4.66it/s] 48it [00:10, 4.63it/s] 49it [00:10, 4.67it/s] 50it [00:11, 4.67it/s]2025-05-25 21:46:28,356 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 1896.7238 | mean log_px -0.0014 | KL -1796.85 + 51it [00:11, 4.52it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.64it/s] 54it [00:11, 4.67it/s] 55it [00:12, 4.53it/s] 56it [00:12, 4.61it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.67it/s] 59it [00:12, 4.70it/s] 60it [00:13, 4.54it/s] 61it [00:13, 4.62it/s] 62it [00:13, 4.65it/s] 63it [00:13, 4.67it/s] 64it [00:14, 4.69it/s] 65it [00:14, 4.54it/s] 66it [00:14, 4.62it/s] 67it [00:14, 4.65it/s] 68it [00:14, 4.68it/s] 69it [00:15, 4.70it/s] 70it [00:15, 4.71it/s] 71it [00:15, 4.72it/s] 72it [00:15, 4.72it/s] 73it [00:15, 4.73it/s] 74it [00:16, 4.74it/s] 75it [00:16, 4.74it/s] 76it [00:16, 4.57it/s] 77it [00:16, 4.65it/s] 78it [00:17, 4.67it/s] 79it [00:17, 4.69it/s] 80it [00:17, 4.71it/s] 81it [00:17, 4.72it/s] 82it [00:17, 4.73it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.66it/s] 86it [00:18, 4.68it/s] 87it [00:18, 4.70it/s] 88it [00:19, 4.54it/s] 89it [00:19, 4.62it/s] 90it [00:19, 4.65it/s] 91it [00:19, 4.68it/s] 92it [00:20, 4.69it/s] 93it [00:20, 4.71it/s] 94it [00:20, 4.73it/s] 95it [00:20, 4.73it/s] 96it [00:20, 4.73it/s] 97it [00:21, 4.74it/s] 98it [00:21, 4.74it/s] 99it [00:21, 4.75it/s] 100it [00:21, 4.74it/s]2025-05-25 21:46:39,070 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 2474.6335 | mean log_px -0.0208 | KL -1782.80 + 101it [00:21, 4.70it/s] 102it [00:22, 4.54it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.65it/s] 105it [00:22, 4.68it/s] 106it [00:23, 4.69it/s] 107it [00:23, 4.53it/s] 108it [00:23, 4.61it/s] 109it [00:23, 4.65it/s] 110it [00:23, 4.68it/s] 111it [00:24, 4.70it/s] 112it [00:24, 4.71it/s] 113it [00:24, 4.71it/s] 114it [00:24, 4.56it/s] 115it [00:24, 4.63it/s] 116it [00:25, 4.65it/s] 117it [00:25, 4.68it/s] 118it [00:25, 4.69it/s] 119it [00:25, 4.71it/s] 120it [00:26, 4.71it/s] 121it [00:26, 4.56it/s] 122it [00:26, 4.63it/s] 123it [00:26, 4.66it/s] 124it [00:26, 4.66it/s] 125it [00:27, 4.52it/s] 126it [00:27, 4.60it/s] 127it [00:27, 4.65it/s] 128it [00:27, 4.68it/s] 129it [00:27, 4.70it/s] 130it [00:28, 4.68it/s] 131it [00:28, 4.70it/s] 132it [00:28, 4.54it/s] 133it [00:28, 4.48it/s] 134it [00:29, 4.53it/s] 135it [00:29, 4.58it/s] 136it [00:29, 4.62it/s] 137it [00:29, 4.64it/s] 138it [00:29, 4.53it/s] 139it [00:30, 4.61it/s] 140it [00:30, 4.58it/s] 141it [00:30, 4.50it/s] 142it [00:30, 4.57it/s] 143it [00:31, 4.62it/s] 144it [00:31, 4.66it/s] 145it [00:31, 4.69it/s] 146it [00:31, 4.55it/s] 147it [00:31, 4.63it/s] 148it [00:32, 4.66it/s] 149it [00:32, 4.66it/s] 150it [00:32, 4.65it/s]2025-05-25 21:46:49,879 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 2033.4376 | mean log_px -0.0059 | KL -1774.52 + 151it [00:32, 4.68it/s] 152it [00:32, 4.70it/s] 153it [00:33, 4.69it/s] 154it [00:33, 4.70it/s] 155it [00:33, 4.72it/s] 156it [00:33, 4.72it/s] 157it [00:34, 4.56it/s] 158it [00:34, 4.63it/s] 159it [00:34, 4.66it/s] 160it [00:34, 4.68it/s] 161it [00:34, 4.70it/s] 162it [00:35, 4.54it/s] 163it [00:35, 4.62it/s] 164it [00:35, 4.64it/s] 165it [00:35, 4.67it/s] 166it [00:35, 4.69it/s] 167it [00:36, 4.71it/s] 168it [00:36, 4.71it/s] 169it [00:36, 4.72it/s] 170it [00:36, 4.72it/s] 171it [00:37, 4.73it/s] 172it [00:37, 4.56it/s] 173it [00:37, 4.63it/s] 174it [00:37, 4.66it/s] 175it [00:37, 4.68it/s] 176it [00:38, 4.69it/s] 177it [00:38, 4.71it/s] 178it [00:38, 4.72it/s] 179it [00:38, 4.73it/s] 180it [00:38, 4.56it/s] 181it [00:39, 4.63it/s] 182it [00:39, 4.66it/s] 183it [00:39, 4.68it/s] 184it [00:39, 4.70it/s] 185it [00:40, 4.54it/s] 186it [00:40, 4.60it/s] 187it [00:40, 4.65it/s] 188it [00:40, 4.68it/s] 189it [00:40, 4.70it/s] 190it [00:41, 4.54it/s] 191it [00:41, 4.62it/s] 192it [00:41, 4.65it/s] 193it [00:41, 4.68it/s] 194it [00:41, 4.70it/s] 195it [00:42, 4.62it/s] 196it [00:42, 4.66it/s] 196it [00:42, 4.61it/s] +2025-05-25 21:46:59,665 - INFO - Epoch: 24, Objective: tensor([2720.5593], device='cuda:0', grad_fn=), Loss: 0.01608070731163025, KL/n: 36.15454864501953 + 0it [00:00, ?it/s]2025-05-25 21:47:00,042 - INFO - [Epoch 025 | Batch 0000] IWAE-loss 2173.3323 | mean log_px -0.0057 | KL -1770.69 + 1it [00:00, 3.04it/s] 2it [00:00, 3.64it/s] 3it [00:00, 3.92it/s] 4it [00:01, 4.03it/s] 5it [00:01, 4.13it/s] 6it [00:01, 4.08it/s] 7it [00:01, 4.26it/s] 8it [00:01, 4.24it/s] 9it [00:02, 4.22it/s] 10it [00:02, 4.26it/s] 11it [00:02, 4.24it/s] 12it [00:02, 4.36it/s] 13it [00:03, 4.47it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.47it/s] 19it [00:04, 4.49it/s] 20it [00:04, 4.28it/s] 21it [00:04, 4.32it/s] 22it [00:05, 4.41it/s] 23it [00:05, 4.50it/s] 24it [00:05, 4.52it/s] 25it [00:05, 4.57it/s] 26it [00:06, 4.45it/s] 27it [00:06, 4.29it/s] 28it [00:06, 4.28it/s] 29it [00:06, 4.27it/s] 30it [00:06, 4.21it/s] 31it [00:07, 4.24it/s] 32it [00:07, 4.21it/s] 33it [00:07, 4.32it/s] 34it [00:07, 4.27it/s] 35it [00:08, 4.27it/s] 36it [00:08, 4.35it/s] 37it [00:08, 4.18it/s] 38it [00:08, 4.17it/s] 39it [00:09, 4.23it/s] 40it [00:09, 4.32it/s] 41it [00:09, 4.41it/s] 42it [00:09, 4.31it/s] 43it [00:09, 4.32it/s] 44it [00:10, 4.37it/s] 45it [00:10, 4.45it/s] 46it [00:10, 4.36it/s] 47it [00:10, 4.45it/s] 48it [00:11, 4.50it/s] 49it [00:11, 4.40it/s] 50it [00:11, 4.46it/s]2025-05-25 21:47:11,538 - INFO - [Epoch 025 | Batch 0050] IWAE-loss 1950.6661 | mean log_px -0.0028 | KL -1755.02 + 51it [00:11, 4.39it/s] 52it [00:12, 4.43it/s] 53it [00:12, 4.23it/s] 54it [00:12, 4.33it/s] 55it [00:12, 4.38it/s] 56it [00:12, 4.34it/s] 57it [00:13, 4.33it/s] 58it [00:13, 4.40it/s] 59it [00:13, 4.43it/s] 60it [00:13, 4.48it/s] 61it [00:14, 4.53it/s] 62it [00:14, 4.55it/s] 63it [00:14, 4.54it/s] 64it [00:14, 4.45it/s] 65it [00:14, 4.52it/s] 66it [00:15, 4.49it/s] 67it [00:15, 4.54it/s] 68it [00:15, 4.41it/s] 69it [00:15, 4.37it/s] 70it [00:16, 4.32it/s] 71it [00:16, 4.17it/s] 72it [00:16, 4.16it/s] 73it [00:16, 4.20it/s] 74it [00:17, 4.30it/s] 75it [00:17, 4.40it/s] 76it [00:17, 4.42it/s] 77it [00:17, 4.31it/s] 78it [00:17, 4.26it/s] 79it [00:18, 4.35it/s] 80it [00:18, 4.38it/s] 81it [00:18, 4.43it/s] 82it [00:18, 4.43it/s] 83it [00:19, 4.39it/s] 84it [00:19, 4.25it/s] 85it [00:19, 4.36it/s] 86it [00:19, 4.32it/s] 87it [00:20, 4.27it/s] 88it [00:20, 4.26it/s] 89it [00:20, 4.37it/s] 90it [00:20, 4.32it/s] 91it [00:20, 4.29it/s] 92it [00:21, 4.22it/s] 93it [00:21, 4.23it/s] 94it [00:21, 4.31it/s] 95it [00:21, 4.29it/s] 96it [00:22, 4.35it/s] 97it [00:22, 4.30it/s] 98it [00:22, 4.26it/s] 99it [00:22, 4.31it/s] 100it [00:23, 4.25it/s]2025-05-25 21:47:23,055 - INFO - [Epoch 025 | Batch 0100] IWAE-loss 1830.5348 | mean log_px -0.0022 | KL -1743.90 + 101it [00:23, 4.23it/s] 102it [00:23, 4.15it/s] 103it [00:23, 4.17it/s] 104it [00:24, 4.16it/s] 105it [00:24, 4.21it/s] 106it [00:24, 4.30it/s] 107it [00:24, 4.28it/s] 108it [00:25, 4.09it/s] 109it [00:25, 4.13it/s] 110it [00:25, 4.17it/s] 111it [00:25, 4.19it/s] 112it [00:25, 4.27it/s] 113it [00:26, 4.38it/s] 114it [00:26, 4.32it/s] 115it [00:26, 4.44it/s] 116it [00:26, 4.52it/s] 117it [00:27, 4.42it/s] 118it [00:27, 4.27it/s] 119it [00:27, 4.27it/s] 120it [00:27, 4.31it/s] 121it [00:28, 4.30it/s] 122it [00:28, 4.31it/s] 123it [00:28, 4.34it/s] 124it [00:28, 4.28it/s] 125it [00:28, 4.28it/s] 126it [00:29, 4.31it/s] 127it [00:29, 4.31it/s] 128it [00:29, 4.39it/s] 129it [00:29, 4.45it/s] 130it [00:30, 4.25it/s] 131it [00:30, 4.26it/s] 132it [00:30, 4.30it/s] 133it [00:30, 4.29it/s] 134it [00:31, 4.31it/s] 135it [00:31, 4.36it/s] 136it [00:31, 4.31it/s] 137it [00:31, 4.33it/s] 138it [00:31, 4.40it/s] 139it [00:32, 4.48it/s] 140it [00:32, 4.38it/s] 141it [00:32, 4.41it/s] 142it [00:32, 4.29it/s] 143it [00:33, 4.37it/s] 144it [00:33, 4.45it/s] 145it [00:33, 4.41it/s] 146it [00:33, 4.35it/s] 147it [00:33, 4.37it/s] 148it [00:34, 4.22it/s] 149it [00:34, 4.37it/s] 150it [00:34, 4.34it/s]2025-05-25 21:47:34,634 - INFO - [Epoch 025 | Batch 0150] IWAE-loss 2106.1345 | mean log_px -0.0053 | KL -1734.84 + 151it [00:34, 4.44it/s] 152it [00:35, 4.51it/s] 153it [00:35, 4.56it/s] 154it [00:35, 4.32it/s] 155it [00:35, 4.31it/s] 156it [00:36, 4.34it/s] 157it [00:36, 4.33it/s] 158it [00:36, 4.39it/s] 159it [00:36, 4.48it/s] 160it [00:36, 4.38it/s] 161it [00:37, 4.50it/s] 162it [00:37, 4.41it/s] 163it [00:37, 4.46it/s] 164it [00:37, 4.41it/s] 165it [00:38, 4.49it/s] 166it [00:38, 4.40it/s] 167it [00:38, 4.38it/s] 168it [00:38, 4.46it/s] 169it [00:38, 4.53it/s] 170it [00:39, 4.45it/s] 171it [00:39, 4.40it/s] 172it [00:39, 4.24it/s] 173it [00:39, 4.37it/s] 174it [00:40, 4.45it/s] 175it [00:40, 4.38it/s] 176it [00:40, 4.39it/s] 177it [00:40, 4.48it/s] 178it [00:41, 4.39it/s] 179it [00:41, 4.38it/s] 180it [00:41, 4.39it/s] 181it [00:41, 4.37it/s] 182it [00:41, 4.44it/s] 183it [00:42, 4.40it/s] 184it [00:42, 4.48it/s] 185it [00:42, 4.55it/s] 186it [00:42, 4.59it/s] 187it [00:43, 4.63it/s] 188it [00:43, 4.49it/s] 189it [00:43, 4.43it/s] 190it [00:43, 4.51it/s] 191it [00:43, 4.48it/s] 192it [00:44, 4.42it/s] 193it [00:44, 4.49it/s] 194it [00:44, 4.28it/s] 195it [00:44, 4.28it/s] 196it [00:45, 4.40it/s] 196it [00:45, 4.34it/s] +2025-05-25 21:47:44,925 - INFO - Epoch: 25, Objective: tensor([2120.1199], device='cuda:0', grad_fn=), Loss: 0.009839070029556751, KL/n: 35.31795120239258 + 0it [00:00, ?it/s]2025-05-25 21:47:45,503 - INFO - [Epoch 026 | Batch 0000] IWAE-loss 2901.0183 | mean log_px -0.0300 | KL -1724.86 + 1it [00:00, 3.04it/s] 2it [00:00, 3.69it/s] 3it [00:00, 4.08it/s] 4it [00:01, 4.12it/s] 5it [00:01, 4.30it/s] 6it [00:01, 4.41it/s] 7it [00:01, 4.50it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.38it/s] 11it [00:02, 4.44it/s] 12it [00:02, 4.43it/s] 13it [00:03, 4.49it/s] 14it [00:03, 4.54it/s] 15it [00:03, 4.50it/s] 16it [00:03, 4.29it/s] 17it [00:03, 4.31it/s] 18it [00:04, 4.31it/s] 19it [00:04, 4.34it/s] 20it [00:04, 4.41it/s] 21it [00:04, 4.42it/s] 22it [00:05, 4.23it/s] 23it [00:05, 4.21it/s] 24it [00:05, 4.28it/s] 25it [00:05, 4.38it/s] 26it [00:05, 4.43it/s] 27it [00:06, 4.38it/s] 28it [00:06, 4.35it/s] 29it [00:06, 4.26it/s] 30it [00:06, 4.36it/s] 31it [00:07, 4.43it/s] 32it [00:07, 4.47it/s] 33it [00:07, 4.48it/s] 34it [00:07, 4.49it/s] 35it [00:08, 4.49it/s] 36it [00:08, 4.42it/s] 37it [00:08, 4.45it/s] 38it [00:08, 4.40it/s] 39it [00:08, 4.49it/s] 40it [00:09, 4.54it/s] 41it [00:09, 4.49it/s] 42it [00:09, 4.47it/s] 43it [00:09, 4.43it/s] 44it [00:10, 4.25it/s] 45it [00:10, 4.33it/s] 46it [00:10, 4.42it/s] 47it [00:10, 4.47it/s] 48it [00:10, 4.52it/s] 49it [00:11, 4.55it/s] 50it [00:11, 4.58it/s]2025-05-25 21:47:56,781 - INFO - [Epoch 026 | Batch 0050] IWAE-loss 2016.3051 | mean log_px -0.0103 | KL -1714.56 + 51it [00:11, 4.43it/s] 52it [00:11, 4.49it/s] 53it [00:12, 4.49it/s] 54it [00:12, 4.52it/s] 55it [00:12, 4.49it/s] 56it [00:12, 4.53it/s] 57it [00:12, 4.54it/s] 58it [00:13, 4.57it/s] 59it [00:13, 4.47it/s] 60it [00:13, 4.51it/s] 61it [00:13, 4.37it/s] 62it [00:14, 4.37it/s] 63it [00:14, 4.41it/s] 64it [00:14, 4.38it/s] 65it [00:14, 4.41it/s] 66it [00:14, 4.48it/s] 67it [00:15, 4.31it/s] 68it [00:15, 4.32it/s] 69it [00:15, 4.37it/s] 70it [00:15, 4.44it/s] 71it [00:16, 4.51it/s] 72it [00:16, 4.52it/s] 73it [00:16, 4.50it/s] 74it [00:16, 4.53it/s] 75it [00:16, 4.58it/s] 76it [00:17, 4.49it/s] 77it [00:17, 4.49it/s] 78it [00:17, 4.45it/s] 79it [00:17, 4.46it/s] 80it [00:18, 4.41it/s] 81it [00:18, 4.37it/s] 82it [00:18, 4.31it/s] 83it [00:18, 4.31it/s] 84it [00:19, 4.40it/s] 85it [00:19, 4.45it/s] 86it [00:19, 4.48it/s] 87it [00:19, 4.52it/s] 88it [00:19, 4.49it/s] 89it [00:20, 4.49it/s] 90it [00:20, 4.26it/s] 91it [00:20, 4.26it/s] 92it [00:20, 4.36it/s] 93it [00:21, 4.33it/s] 94it [00:21, 4.42it/s] 95it [00:21, 4.47it/s] 96it [00:21, 4.37it/s] 97it [00:21, 4.45it/s] 98it [00:22, 4.41it/s] 99it [00:22, 4.35it/s] 100it [00:22, 4.43it/s]2025-05-25 21:48:08,074 - INFO - [Epoch 026 | Batch 0100] IWAE-loss 2671.4316 | mean log_px -0.0232 | KL -1705.30 + 101it [00:22, 4.34it/s] 102it [00:23, 4.43it/s] 103it [00:23, 4.49it/s] 104it [00:23, 4.44it/s] 105it [00:23, 4.44it/s] 106it [00:24, 4.50it/s] 107it [00:24, 4.43it/s] 108it [00:24, 4.35it/s] 109it [00:24, 4.32it/s] 110it [00:24, 4.40it/s] 111it [00:25, 4.32it/s] 112it [00:25, 4.32it/s] 113it [00:25, 4.37it/s] 114it [00:25, 4.25it/s] 115it [00:26, 4.33it/s] 116it [00:26, 4.31it/s] 117it [00:26, 4.31it/s] 118it [00:26, 4.30it/s] 119it [00:27, 4.32it/s] 120it [00:27, 4.32it/s] 121it [00:27, 4.20it/s] 122it [00:27, 4.35it/s] 123it [00:27, 4.44it/s] 124it [00:28, 4.50it/s] 125it [00:28, 4.43it/s] 126it [00:28, 4.42it/s] 127it [00:28, 4.46it/s] 128it [00:29, 4.52it/s] 129it [00:29, 4.57it/s] 130it [00:29, 4.50it/s] 131it [00:29, 4.52it/s] 132it [00:29, 4.48it/s] 133it [00:30, 4.43it/s] 134it [00:30, 4.39it/s] 135it [00:30, 4.38it/s] 136it [00:30, 4.38it/s] 137it [00:31, 4.36it/s] 138it [00:31, 4.46it/s] 139it [00:31, 4.37it/s] 140it [00:31, 4.41it/s] 141it [00:32, 4.38it/s] 142it [00:32, 4.47it/s] 143it [00:32, 4.43it/s] 144it [00:32, 4.50it/s] 145it [00:32, 4.55it/s] 146it [00:33, 4.45it/s] 147it [00:33, 4.42it/s] 148it [00:33, 4.41it/s] 149it [00:33, 4.46it/s] 150it [00:34, 4.52it/s]2025-05-25 21:48:19,407 - INFO - [Epoch 026 | Batch 0150] IWAE-loss 3300.8362 | mean log_px -0.0360 | KL -1700.18 + 151it [00:34, 4.41it/s] 152it [00:34, 4.51it/s] 153it [00:34, 4.37it/s] 154it [00:34, 4.32it/s] 155it [00:35, 4.32it/s] 156it [00:35, 4.34it/s] 157it [00:35, 4.26it/s] 158it [00:35, 4.40it/s] 159it [00:36, 4.45it/s] 160it [00:36, 4.43it/s] 161it [00:36, 4.37it/s] 162it [00:36, 4.40it/s] 163it [00:37, 4.38it/s] 164it [00:37, 4.32it/s] 165it [00:37, 4.42it/s] 166it [00:37, 4.42it/s] 167it [00:37, 4.36it/s] 168it [00:38, 4.43it/s] 169it [00:38, 4.48it/s] 170it [00:38, 4.54it/s] 171it [00:38, 4.59it/s] 172it [00:38, 4.62it/s] 173it [00:39, 4.47it/s] 174it [00:39, 4.55it/s] 175it [00:39, 4.54it/s] 176it [00:39, 4.59it/s] 177it [00:40, 4.62it/s] 178it [00:40, 4.64it/s] 179it [00:40, 4.51it/s] 180it [00:40, 4.48it/s] 181it [00:40, 4.50it/s] 182it [00:41, 4.46it/s] 183it [00:41, 4.41it/s] 184it [00:41, 4.49it/s] 185it [00:41, 4.43it/s] 186it [00:42, 4.27it/s] 187it [00:42, 4.37it/s] 188it [00:42, 4.46it/s] 189it [00:42, 4.54it/s] 190it [00:43, 4.48it/s] 191it [00:43, 4.42it/s] 192it [00:43, 4.41it/s] 193it [00:43, 4.38it/s] 194it [00:43, 4.23it/s] 195it [00:44, 4.26it/s] 196it [00:44, 4.31it/s] 196it [00:44, 4.40it/s] +2025-05-25 21:48:29,732 - INFO - Epoch: 26, Objective: tensor([2170.3135], device='cuda:0', grad_fn=), Loss: 0.008433881215751171, KL/n: 34.64965057373047 + 0it [00:00, ?it/s]2025-05-25 21:48:30,134 - INFO - [Epoch 027 | Batch 0000] IWAE-loss 1838.5685 | mean log_px -0.0048 | KL -1699.11 + 1it [00:00, 3.00it/s] 2it [00:00, 3.78it/s] 3it [00:00, 4.16it/s] 4it [00:00, 4.29it/s] 5it [00:01, 4.29it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.53it/s] 8it [00:01, 4.57it/s] 9it [00:02, 4.62it/s] 10it [00:02, 4.64it/s] 11it [00:02, 4.52it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.64it/s] 15it [00:03, 4.39it/s] 16it [00:03, 4.49it/s] 17it [00:03, 4.53it/s] 18it [00:04, 4.40it/s] 19it [00:04, 4.40it/s] 20it [00:04, 4.44it/s] 21it [00:04, 4.51it/s] 22it [00:04, 4.57it/s] 23it [00:05, 4.61it/s] 24it [00:05, 4.63it/s] 25it [00:05, 4.65it/s] 26it [00:05, 4.50it/s] 27it [00:06, 4.56it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.57it/s] 30it [00:06, 4.61it/s] 31it [00:06, 4.64it/s] 32it [00:07, 4.65it/s] 33it [00:07, 4.66it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.46it/s] 36it [00:07, 4.54it/s] 37it [00:08, 4.60it/s] 38it [00:08, 4.63it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.68it/s] 41it [00:09, 4.70it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.62it/s] 45it [00:09, 4.65it/s] 46it [00:10, 4.67it/s] 47it [00:10, 4.69it/s] 48it [00:10, 4.69it/s] 49it [00:10, 4.70it/s] 50it [00:10, 4.70it/s]2025-05-25 21:48:41,009 - INFO - [Epoch 027 | Batch 0050] IWAE-loss 2172.3386 | mean log_px -0.0069 | KL -1685.88 + 51it [00:11, 4.54it/s] 52it [00:11, 4.59it/s] 53it [00:11, 4.63it/s] 54it [00:11, 4.63it/s] 55it [00:12, 4.65it/s] 56it [00:12, 4.51it/s] 57it [00:12, 4.57it/s] 58it [00:12, 4.60it/s] 59it [00:12, 4.64it/s] 60it [00:13, 4.66it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.58it/s] 63it [00:13, 4.62it/s] 64it [00:14, 4.65it/s] 65it [00:14, 4.67it/s] 66it [00:14, 4.52it/s] 67it [00:14, 4.56it/s] 68it [00:14, 4.60it/s] 69it [00:15, 4.63it/s] 70it [00:15, 4.66it/s] 71it [00:15, 4.68it/s] 72it [00:15, 4.69it/s] 73it [00:15, 4.57it/s] 74it [00:16, 4.62it/s] 75it [00:16, 4.65it/s] 76it [00:16, 4.66it/s] 77it [00:17, 3.71it/s] 78it [00:17, 3.96it/s] 79it [00:17, 4.16it/s] 80it [00:17, 4.32it/s] 81it [00:17, 4.42it/s] 82it [00:18, 4.51it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.45it/s] 85it [00:18, 4.54it/s] 86it [00:18, 4.59it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.66it/s] 89it [00:19, 4.68it/s] 90it [00:19, 4.69it/s] 91it [00:20, 4.71it/s] 92it [00:20, 4.71it/s] 93it [00:20, 4.54it/s] 94it [00:20, 4.61it/s] 95it [00:20, 4.65it/s] 96it [00:21, 4.68it/s] 97it [00:21, 4.70it/s] 98it [00:21, 4.70it/s] 99it [00:21, 4.48it/s] 100it [00:21, 4.53it/s]2025-05-25 21:48:52,010 - INFO - [Epoch 027 | Batch 0100] IWAE-loss 2017.5281 | mean log_px -0.0098 | KL -1670.65 + 101it [00:22, 4.55it/s] 102it [00:22, 4.58it/s] 103it [00:22, 4.61it/s] 104it [00:22, 4.62it/s] 105it [00:23, 4.64it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.67it/s] 108it [00:23, 4.69it/s] 109it [00:23, 4.70it/s] 110it [00:24, 4.71it/s] 111it [00:24, 4.72it/s] 112it [00:24, 4.72it/s] 113it [00:24, 4.69it/s] 114it [00:24, 4.70it/s] 115it [00:25, 4.71it/s] 116it [00:25, 4.71it/s] 117it [00:25, 4.71it/s] 118it [00:25, 4.72it/s] 119it [00:26, 4.57it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.66it/s] 122it [00:26, 4.66it/s] 123it [00:26, 4.67it/s] 124it [00:27, 4.68it/s] 125it [00:27, 4.70it/s] 126it [00:27, 4.70it/s] 127it [00:27, 4.54it/s] 128it [00:27, 4.60it/s] 129it [00:28, 4.64it/s] 130it [00:28, 4.66it/s] 131it [00:28, 4.68it/s] 132it [00:28, 4.70it/s] 133it [00:29, 4.71it/s] 134it [00:29, 4.71it/s] 135it [00:29, 4.71it/s] 136it [00:29, 4.54it/s] 137it [00:29, 4.61it/s] 138it [00:30, 4.64it/s] 139it [00:30, 4.66it/s] 140it [00:30, 4.68it/s] 141it [00:30, 4.69it/s] 142it [00:31, 4.53it/s] 143it [00:31, 4.60it/s] 144it [00:31, 4.64it/s] 145it [00:31, 4.67it/s] 146it [00:31, 4.67it/s] 147it [00:32, 4.69it/s] 148it [00:32, 4.70it/s] 149it [00:32, 4.70it/s] 150it [00:32, 4.71it/s]2025-05-25 21:49:02,718 - INFO - [Epoch 027 | Batch 0150] IWAE-loss 2334.5696 | mean log_px -0.0127 | KL -1661.62 + 151it [00:32, 4.54it/s] 152it [00:33, 4.61it/s] 153it [00:33, 4.65it/s] 154it [00:33, 4.65it/s] 155it [00:33, 4.68it/s] 156it [00:33, 4.68it/s] 157it [00:34, 4.70it/s] 158it [00:34, 4.70it/s] 159it [00:34, 4.70it/s] 160it [00:34, 4.70it/s] 161it [00:35, 4.54it/s] 162it [00:35, 4.61it/s] 163it [00:35, 4.64it/s] 164it [00:35, 4.67it/s] 165it [00:35, 4.69it/s] 166it [00:36, 4.69it/s] 167it [00:36, 4.71it/s] 168it [00:36, 4.71it/s] 169it [00:36, 4.72it/s] 170it [00:36, 4.72it/s] 171it [00:37, 4.72it/s] 172it [00:37, 4.71it/s] 173it [00:37, 4.72it/s] 174it [00:37, 4.72it/s] 175it [00:38, 4.72it/s] 176it [00:38, 4.72it/s] 177it [00:38, 4.73it/s] 178it [00:38, 4.72it/s] 179it [00:38, 4.73it/s] 180it [00:39, 4.73it/s] 181it [00:39, 4.53it/s] 182it [00:39, 4.60it/s] 183it [00:39, 4.64it/s] 184it [00:39, 4.65it/s] 185it [00:40, 4.68it/s] 186it [00:40, 4.52it/s] 187it [00:40, 4.60it/s] 188it [00:40, 4.60it/s] 189it [00:41, 4.64it/s] 190it [00:41, 4.65it/s] 191it [00:41, 4.67it/s] 192it [00:41, 4.69it/s] 193it [00:41, 4.52it/s] 194it [00:42, 4.59it/s] 195it [00:42, 4.43it/s] 196it [00:42, 4.49it/s] 196it [00:42, 4.59it/s] +2025-05-25 21:49:12,547 - INFO - Epoch: 27, Objective: tensor([2400.2996], device='cuda:0', grad_fn=), Loss: 0.009168989956378937, KL/n: 33.872135162353516 + 0it [00:00, ?it/s]2025-05-25 21:49:12,978 - INFO - [Epoch 028 | Batch 0000] IWAE-loss 1821.6100 | mean log_px -0.0041 | KL -1660.52 + 1it [00:00, 2.80it/s] 2it [00:00, 3.69it/s] 3it [00:00, 4.07it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.46it/s] 6it [00:01, 4.55it/s] 7it [00:01, 4.61it/s] 8it [00:01, 4.64it/s] 9it [00:02, 4.68it/s] 10it [00:02, 4.69it/s] 11it [00:02, 4.72it/s] 12it [00:02, 4.73it/s] 13it [00:02, 4.74it/s] 14it [00:03, 4.56it/s] 15it [00:03, 4.64it/s] 16it [00:03, 4.66it/s] 17it [00:03, 4.69it/s] 18it [00:03, 4.70it/s] 19it [00:04, 4.72it/s] 20it [00:04, 4.72it/s] 21it [00:04, 4.73it/s] 22it [00:04, 4.74it/s] 23it [00:05, 4.75it/s] 24it [00:05, 4.74it/s] 25it [00:05, 4.73it/s] 26it [00:05, 4.52it/s] 27it [00:05, 4.59it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.67it/s] 30it [00:06, 4.68it/s] 31it [00:06, 4.71it/s] 32it [00:06, 4.65it/s] 33it [00:07, 4.67it/s] 34it [00:07, 4.68it/s] 35it [00:07, 4.71it/s] 36it [00:07, 4.72it/s] 37it [00:08, 4.73it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.62it/s] 40it [00:08, 4.65it/s] 41it [00:08, 4.68it/s] 42it [00:09, 4.69it/s] 43it [00:09, 4.69it/s] 44it [00:09, 4.67it/s] 45it [00:09, 4.53it/s] 46it [00:09, 4.59it/s] 47it [00:10, 4.61it/s] 48it [00:10, 4.51it/s] 49it [00:10, 4.55it/s] 50it [00:10, 4.57it/s]2025-05-25 21:49:23,699 - INFO - [Epoch 028 | Batch 0050] IWAE-loss 1886.0216 | mean log_px -0.0034 | KL -1643.58 + 51it [00:11, 4.44it/s] 52it [00:11, 4.50it/s] 53it [00:11, 4.53it/s] 54it [00:11, 4.57it/s] 55it [00:11, 4.62it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.49it/s] 58it [00:12, 4.56it/s] 59it [00:12, 4.60it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.65it/s] 63it [00:13, 4.50it/s] 64it [00:13, 4.57it/s] 65it [00:14, 4.61it/s] 66it [00:14, 4.62it/s] 67it [00:14, 4.64it/s] 68it [00:14, 4.65it/s] 69it [00:15, 4.50it/s] 70it [00:15, 4.57it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.63it/s] 73it [00:15, 4.65it/s] 74it [00:16, 4.66it/s] 75it [00:16, 4.51it/s] 76it [00:16, 4.57it/s] 77it [00:16, 4.61it/s] 78it [00:16, 4.63it/s] 79it [00:17, 4.64it/s] 80it [00:17, 4.63it/s] 81it [00:17, 4.49it/s] 82it [00:17, 4.56it/s] 83it [00:18, 4.60it/s] 84it [00:18, 4.62it/s] 85it [00:18, 4.64it/s] 86it [00:18, 4.65it/s] 87it [00:18, 4.51it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.60it/s] 90it [00:19, 4.62it/s] 91it [00:19, 4.65it/s] 92it [00:20, 4.65it/s] 93it [00:20, 4.51it/s] 94it [00:20, 4.57it/s] 95it [00:20, 4.61it/s] 96it [00:20, 4.62it/s] 97it [00:21, 4.65it/s] 98it [00:21, 4.65it/s] 99it [00:21, 4.50it/s] 100it [00:21, 4.57it/s]2025-05-25 21:49:34,593 - INFO - [Epoch 028 | Batch 0100] IWAE-loss 1992.9895 | mean log_px -0.0080 | KL -1643.61 + 101it [00:21, 4.60it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.64it/s] 104it [00:22, 4.65it/s] 105it [00:22, 4.50it/s] 106it [00:23, 4.56it/s] 107it [00:23, 4.60it/s] 108it [00:23, 4.62it/s] 109it [00:23, 4.64it/s] 110it [00:23, 4.65it/s] 111it [00:24, 4.51it/s] 112it [00:24, 4.57it/s] 113it [00:24, 4.60it/s] 114it [00:24, 4.63it/s] 115it [00:25, 4.65it/s] 116it [00:25, 4.65it/s] 117it [00:25, 4.50it/s] 118it [00:25, 4.56it/s] 119it [00:25, 4.60it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.65it/s] 122it [00:26, 4.65it/s] 123it [00:26, 4.51it/s] 124it [00:26, 4.57it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.63it/s] 127it [00:27, 4.64it/s] 128it [00:27, 4.65it/s] 129it [00:28, 4.52it/s] 130it [00:28, 4.54it/s] 131it [00:28, 4.48it/s] 132it [00:28, 4.56it/s] 133it [00:28, 4.60it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.49it/s] 136it [00:29, 4.55it/s] 137it [00:29, 4.55it/s] 138it [00:30, 4.58it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.64it/s] 141it [00:30, 4.50it/s] 142it [00:30, 4.57it/s] 143it [00:31, 4.61it/s] 144it [00:31, 4.64it/s] 145it [00:31, 4.66it/s] 146it [00:31, 4.66it/s] 147it [00:31, 4.55it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.64it/s] 150it [00:32, 4.65it/s]2025-05-25 21:49:45,469 - INFO - [Epoch 028 | Batch 0150] IWAE-loss 1948.8407 | mean log_px -0.0090 | KL -1636.46 + 151it [00:32, 4.67it/s] 152it [00:33, 4.67it/s] 153it [00:33, 4.68it/s] 154it [00:33, 4.69it/s] 155it [00:33, 4.69it/s] 156it [00:33, 4.69it/s] 157it [00:34, 4.70it/s] 158it [00:34, 4.70it/s] 159it [00:34, 4.70it/s] 160it [00:34, 4.70it/s] 161it [00:34, 4.53it/s] 162it [00:35, 4.59it/s] 163it [00:35, 4.63it/s] 164it [00:35, 4.65it/s] 165it [00:35, 4.67it/s] 166it [00:36, 4.67it/s] 167it [00:36, 4.52it/s] 168it [00:36, 4.58it/s] 169it [00:36, 4.62it/s] 170it [00:36, 4.64it/s] 171it [00:37, 4.66it/s] 172it [00:37, 4.67it/s] 173it [00:37, 4.68it/s] 174it [00:37, 4.68it/s] 175it [00:37, 4.69it/s] 176it [00:38, 4.69it/s] 177it [00:38, 4.70it/s] 178it [00:38, 4.70it/s] 179it [00:38, 4.70it/s] 180it [00:39, 4.69it/s] 181it [00:39, 4.70it/s] 182it [00:39, 4.70it/s] 183it [00:39, 4.70it/s] 184it [00:39, 4.70it/s] 185it [00:40, 4.70it/s] 186it [00:40, 4.70it/s] 187it [00:40, 4.70it/s] 188it [00:40, 4.70it/s] 189it [00:40, 4.70it/s] 190it [00:41, 4.67it/s] 191it [00:41, 4.69it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.44it/s] 194it [00:42, 4.48it/s] 195it [00:42, 4.30it/s] 196it [00:42, 4.26it/s] 196it [00:42, 4.60it/s] +2025-05-25 21:49:55,340 - INFO - Epoch: 28, Objective: tensor([2206.5891], device='cuda:0', grad_fn=), Loss: 0.015577034093439579, KL/n: 33.273502349853516 + 0it [00:00, ?it/s]2025-05-25 21:49:55,926 - INFO - [Epoch 029 | Batch 0000] IWAE-loss 1807.6621 | mean log_px -0.0057 | KL -1630.16 + 1it [00:00, 2.96it/s] 2it [00:00, 3.60it/s] 3it [00:00, 3.90it/s] 4it [00:01, 4.00it/s] 5it [00:01, 4.02it/s] 6it [00:01, 4.08it/s] 7it [00:01, 4.16it/s] 8it [00:01, 4.21it/s] 9it [00:02, 4.26it/s] 10it [00:02, 4.29it/s] 11it [00:02, 4.31it/s] 12it [00:02, 4.19it/s] 13it [00:03, 4.32it/s] 14it [00:03, 4.29it/s] 15it [00:03, 4.33it/s] 16it [00:03, 4.33it/s] 17it [00:04, 4.37it/s] 18it [00:04, 4.19it/s] 19it [00:04, 4.30it/s] 20it [00:04, 4.27it/s] 21it [00:05, 4.32it/s] 22it [00:05, 4.27it/s] 23it [00:05, 4.18it/s] 24it [00:05, 4.21it/s] 25it [00:05, 4.20it/s] 26it [00:06, 4.05it/s] 27it [00:06, 4.08it/s] 28it [00:06, 4.14it/s] 29it [00:06, 4.25it/s] 30it [00:07, 4.23it/s] 31it [00:07, 4.22it/s] 32it [00:07, 4.19it/s] 33it [00:07, 4.22it/s] 34it [00:08, 4.06it/s] 35it [00:08, 4.12it/s] 36it [00:08, 4.16it/s] 37it [00:08, 4.16it/s] 38it [00:09, 4.18it/s] 39it [00:09, 4.11it/s] 40it [00:09, 4.11it/s] 41it [00:09, 4.07it/s] 42it [00:10, 4.08it/s] 43it [00:10, 4.13it/s] 44it [00:10, 4.15it/s] 45it [00:10, 4.18it/s] 46it [00:11, 4.18it/s] 47it [00:11, 4.10it/s] 48it [00:11, 4.13it/s] 49it [00:11, 4.15it/s] 50it [00:12, 4.16it/s]2025-05-25 21:50:07,845 - INFO - [Epoch 029 | Batch 0050] IWAE-loss 1674.5372 | mean log_px -0.0011 | KL -1614.30 + 51it [00:12, 4.13it/s] 52it [00:12, 4.19it/s] 53it [00:12, 4.22it/s] 54it [00:12, 4.31it/s] 55it [00:13, 4.33it/s] 56it [00:13, 4.30it/s] 57it [00:13, 4.26it/s] 58it [00:13, 4.22it/s] 59it [00:14, 4.22it/s] 60it [00:14, 4.21it/s] 61it [00:14, 4.14it/s] 62it [00:14, 4.20it/s] 63it [00:15, 4.25it/s] 64it [00:15, 4.22it/s] 65it [00:15, 4.19it/s] 66it [00:15, 4.19it/s] 67it [00:16, 4.17it/s] 68it [00:16, 4.18it/s] 69it [00:16, 4.17it/s] 70it [00:16, 4.17it/s] 71it [00:17, 4.14it/s] 72it [00:17, 4.27it/s] 73it [00:17, 4.29it/s] 74it [00:17, 4.28it/s] 75it [00:17, 4.30it/s] 76it [00:18, 4.28it/s] 77it [00:18, 4.26it/s] 78it [00:18, 4.39it/s] 79it [00:18, 4.23it/s] 80it [00:19, 4.24it/s] 81it [00:19, 4.21it/s] 82it [00:19, 4.23it/s] 83it [00:19, 4.27it/s] 84it [00:20, 4.26it/s] 85it [00:20, 4.17it/s] 86it [00:20, 4.23it/s] 87it [00:20, 4.24it/s] 88it [00:20, 4.24it/s] 89it [00:21, 4.25it/s] 90it [00:21, 4.36it/s] 91it [00:21, 4.44it/s] 92it [00:21, 4.34it/s] 93it [00:22, 4.43it/s] 94it [00:22, 4.43it/s] 95it [00:22, 4.42it/s] 96it [00:22, 4.36it/s] 97it [00:23, 4.32it/s] 98it [00:23, 4.39it/s] 99it [00:23, 4.37it/s] 100it [00:23, 4.34it/s]2025-05-25 21:50:19,532 - INFO - [Epoch 029 | Batch 0100] IWAE-loss 1752.5222 | mean log_px -0.0047 | KL -1603.06 + 101it [00:23, 4.37it/s] 102it [00:24, 4.20it/s] 103it [00:24, 4.20it/s] 104it [00:24, 4.23it/s] 105it [00:24, 4.19it/s] 106it [00:25, 4.21it/s] 107it [00:25, 4.26it/s] 108it [00:25, 4.34it/s] 109it [00:25, 4.28it/s] 110it [00:26, 4.38it/s] 111it [00:26, 4.44it/s] 112it [00:26, 4.47it/s] 113it [00:26, 4.44it/s] 114it [00:26, 4.47it/s] 115it [00:27, 4.52it/s] 116it [00:27, 4.40it/s] 117it [00:27, 4.38it/s] 118it [00:27, 4.31it/s] 119it [00:28, 4.36it/s] 120it [00:28, 4.40it/s] 121it [00:28, 4.31it/s] 122it [00:28, 4.27it/s] 123it [00:29, 4.30it/s] 124it [00:29, 4.17it/s] 125it [00:29, 4.21it/s] 126it [00:29, 4.33it/s] 127it [00:29, 4.29it/s] 128it [00:30, 4.25it/s] 129it [00:30, 4.26it/s] 130it [00:30, 4.37it/s] 131it [00:30, 4.37it/s] 132it [00:31, 4.32it/s] 133it [00:31, 4.17it/s] 134it [00:31, 4.21it/s] 135it [00:31, 4.24it/s] 136it [00:32, 4.27it/s] 137it [00:32, 4.39it/s] 138it [00:32, 4.17it/s] 139it [00:32, 4.31it/s] 140it [00:33, 4.28it/s] 141it [00:33, 4.25it/s] 142it [00:33, 4.32it/s] 143it [00:33, 4.34it/s] 144it [00:33, 4.31it/s] 145it [00:34, 4.40it/s] 146it [00:34, 4.35it/s] 147it [00:34, 4.30it/s] 148it [00:34, 4.30it/s] 149it [00:35, 4.38it/s] 150it [00:35, 4.33it/s]2025-05-25 21:50:31,131 - INFO - [Epoch 029 | Batch 0150] IWAE-loss 1698.8661 | mean log_px -0.0024 | KL -1595.82 + 151it [00:35, 4.37it/s] 152it [00:35, 4.33it/s] 153it [00:35, 4.42it/s] 154it [00:36, 4.50it/s] 155it [00:36, 4.41it/s] 156it [00:36, 4.41it/s] 157it [00:36, 4.45it/s] 158it [00:37, 4.42it/s] 159it [00:37, 4.49it/s] 160it [00:37, 4.44it/s] 161it [00:37, 4.38it/s] 162it [00:38, 4.38it/s] 163it [00:38, 4.32it/s] 164it [00:38, 4.32it/s] 165it [00:38, 4.28it/s] 166it [00:38, 4.31it/s] 167it [00:39, 4.27it/s] 168it [00:39, 4.27it/s] 169it [00:39, 4.24it/s] 170it [00:39, 4.26it/s] 171it [00:40, 4.24it/s] 172it [00:40, 4.27it/s] 173it [00:40, 4.38it/s] 174it [00:40, 4.36it/s] 175it [00:41, 4.41it/s] 176it [00:41, 4.40it/s] 177it [00:41, 4.36it/s] 178it [00:41, 4.34it/s] 179it [00:41, 4.32it/s] 180it [00:42, 4.31it/s] 181it [00:42, 4.34it/s] 182it [00:42, 4.44it/s] 183it [00:42, 4.36it/s] 184it [00:43, 4.36it/s] 185it [00:43, 4.30it/s] 186it [00:43, 4.32it/s] 187it [00:43, 4.27it/s] 188it [00:44, 4.36it/s] 189it [00:44, 4.39it/s] 190it [00:44, 4.34it/s] 191it [00:44, 4.18it/s] 192it [00:44, 4.22it/s] 193it [00:45, 4.28it/s] 194it [00:45, 4.38it/s] 195it [00:45, 4.24it/s] 196it [00:45, 4.23it/s] 196it [00:46, 4.26it/s] +2025-05-25 21:50:41,656 - INFO - Epoch: 29, Objective: tensor([2066.5352], device='cuda:0', grad_fn=), Loss: 0.007869544439017773, KL/n: 32.472476959228516 + 0it [00:00, ?it/s]2025-05-25 21:50:42,050 - INFO - [Epoch 030 | Batch 0000] IWAE-loss 1742.8804 | mean log_px -0.0048 | KL -1591.28 + 1it [00:00, 2.85it/s] 2it [00:00, 3.64it/s] 3it [00:00, 4.00it/s] 4it [00:01, 4.22it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.30it/s] 7it [00:01, 4.33it/s] 8it [00:01, 4.32it/s] 9it [00:02, 4.31it/s] 10it [00:02, 4.27it/s] 11it [00:02, 4.12it/s] 12it [00:02, 4.17it/s] 13it [00:03, 4.25it/s] 14it [00:03, 4.25it/s] 15it [00:03, 4.34it/s] 16it [00:03, 4.17it/s] 17it [00:04, 4.19it/s] 18it [00:04, 4.24it/s] 19it [00:04, 4.33it/s] 20it [00:04, 4.21it/s] 21it [00:04, 4.35it/s] 22it [00:05, 4.42it/s] 23it [00:05, 4.50it/s] 24it [00:05, 4.56it/s] 25it [00:05, 4.33it/s] 26it [00:06, 3.50it/s] 27it [00:06, 3.73it/s] 28it [00:06, 3.91it/s] 29it [00:06, 4.12it/s] 30it [00:07, 4.26it/s] 31it [00:07, 4.25it/s] 32it [00:07, 4.23it/s] 33it [00:07, 4.23it/s] 34it [00:08, 4.24it/s] 35it [00:08, 4.39it/s] 36it [00:08, 4.48it/s] 37it [00:08, 4.51it/s] 38it [00:08, 4.56it/s] 39it [00:09, 4.48it/s] 40it [00:09, 4.56it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.62it/s] 43it [00:10, 4.51it/s] 44it [00:10, 4.38it/s] 45it [00:10, 4.38it/s] 46it [00:10, 4.32it/s] 47it [00:11, 4.33it/s] 48it [00:11, 4.29it/s] 49it [00:11, 4.41it/s] 50it [00:11, 4.49it/s]2025-05-25 21:50:53,641 - INFO - [Epoch 030 | Batch 0050] IWAE-loss 1974.8240 | mean log_px -0.0085 | KL -1577.82 + 51it [00:11, 4.46it/s] 52it [00:12, 4.45it/s] 53it [00:12, 4.39it/s] 54it [00:12, 4.36it/s] 55it [00:12, 4.34it/s] 56it [00:13, 4.35it/s] 57it [00:13, 4.32it/s] 58it [00:13, 4.40it/s] 59it [00:13, 4.50it/s] 60it [00:13, 4.54it/s] 61it [00:14, 4.59it/s] 62it [00:14, 4.48it/s] 63it [00:14, 4.33it/s] 64it [00:14, 4.36it/s] 65it [00:15, 4.32it/s] 66it [00:15, 4.27it/s] 67it [00:15, 4.24it/s] 68it [00:15, 4.26it/s] 69it [00:16, 4.38it/s] 70it [00:16, 4.37it/s] 71it [00:16, 4.35it/s] 72it [00:16, 4.23it/s] 73it [00:16, 4.24it/s] 74it [00:17, 4.25it/s] 75it [00:17, 4.39it/s] 76it [00:17, 4.32it/s] 77it [00:17, 4.16it/s] 78it [00:18, 4.16it/s] 79it [00:18, 4.21it/s] 80it [00:18, 4.20it/s] 81it [00:18, 4.25it/s] 82it [00:19, 4.34it/s] 83it [00:19, 4.30it/s] 84it [00:19, 4.30it/s] 85it [00:19, 4.28it/s] 86it [00:20, 4.29it/s] 87it [00:20, 4.38it/s] 88it [00:20, 4.38it/s] 89it [00:20, 4.23it/s] 90it [00:20, 4.29it/s] 91it [00:21, 4.29it/s] 92it [00:21, 4.36it/s] 93it [00:21, 4.43it/s] 94it [00:21, 4.43it/s] 95it [00:22, 4.32it/s] 96it [00:22, 4.42it/s] 97it [00:22, 4.48it/s] 98it [00:22, 4.45it/s] 99it [00:22, 4.43it/s] 100it [00:23, 4.26it/s]2025-05-25 21:51:05,194 - INFO - [Epoch 030 | Batch 0100] IWAE-loss 1863.1838 | mean log_px -0.0062 | KL -1573.59 + 101it [00:23, 4.26it/s] 102it [00:23, 4.25it/s] 103it [00:23, 4.23it/s] 104it [00:24, 4.23it/s] 105it [00:24, 4.10it/s] 106it [00:24, 4.25it/s] 107it [00:24, 4.33it/s] 108it [00:25, 4.10it/s] 109it [00:25, 4.17it/s] 110it [00:25, 4.17it/s] 111it [00:25, 4.13it/s] 112it [00:26, 4.27it/s] 113it [00:26, 4.26it/s] 114it [00:26, 4.36it/s] 115it [00:26, 4.47it/s] 116it [00:26, 4.54it/s] 117it [00:27, 4.35it/s] 118it [00:27, 4.34it/s] 119it [00:27, 4.46it/s] 120it [00:27, 4.37it/s] 121it [00:28, 4.38it/s] 122it [00:28, 4.36it/s] 123it [00:28, 4.23it/s] 124it [00:28, 4.18it/s] 125it [00:29, 4.31it/s] 126it [00:29, 4.31it/s] 127it [00:29, 4.43it/s] 128it [00:29, 4.51it/s] 129it [00:29, 4.57it/s] 130it [00:30, 4.50it/s] 131it [00:30, 4.49it/s] 132it [00:30, 4.56it/s] 133it [00:30, 4.59it/s] 134it [00:31, 4.60it/s] 135it [00:31, 4.52it/s] 136it [00:31, 4.34it/s] 137it [00:31, 4.47it/s] 138it [00:31, 4.50it/s] 139it [00:32, 4.45it/s] 140it [00:32, 4.49it/s] 141it [00:32, 4.40it/s] 142it [00:32, 4.49it/s] 143it [00:33, 4.57it/s] 144it [00:33, 4.60it/s] 145it [00:33, 4.63it/s] 146it [00:33, 4.46it/s] 147it [00:33, 4.43it/s] 148it [00:34, 4.47it/s] 149it [00:34, 4.39it/s] 150it [00:34, 4.18it/s]2025-05-25 21:51:16,627 - INFO - [Epoch 030 | Batch 0150] IWAE-loss 2044.0123 | mean log_px -0.0121 | KL -1569.41 + 151it [00:34, 4.21it/s] 152it [00:35, 4.19it/s] 153it [00:35, 4.29it/s] 154it [00:35, 4.29it/s] 155it [00:35, 4.35it/s] 156it [00:36, 4.39it/s] 157it [00:36, 4.34it/s] 158it [00:36, 4.41it/s] 159it [00:36, 4.37it/s] 160it [00:36, 4.28it/s] 161it [00:37, 4.14it/s] 162it [00:37, 4.19it/s] 163it [00:37, 4.19it/s] 164it [00:37, 4.23it/s] 165it [00:38, 4.25it/s] 166it [00:38, 4.39it/s] 167it [00:38, 4.32it/s] 168it [00:38, 4.43it/s] 169it [00:39, 4.43it/s] 170it [00:39, 4.50it/s] 171it [00:39, 4.44it/s] 172it [00:39, 4.41it/s] 173it [00:39, 4.48it/s] 174it [00:40, 4.43it/s] 175it [00:40, 4.53it/s] 176it [00:40, 4.40it/s] 177it [00:40, 4.47it/s] 178it [00:41, 4.38it/s] 179it [00:41, 4.37it/s] 180it [00:41, 4.44it/s] 181it [00:41, 4.43it/s] 182it [00:42, 4.23it/s] 183it [00:42, 4.31it/s] 184it [00:42, 4.32it/s] 185it [00:42, 4.39it/s] 186it [00:42, 4.44it/s] 187it [00:43, 4.37it/s] 188it [00:43, 4.18it/s] 189it [00:43, 4.21it/s] 190it [00:43, 4.31it/s] 191it [00:44, 4.42it/s] 192it [00:44, 4.50it/s] 193it [00:44, 4.51it/s] 194it [00:44, 4.54it/s] 195it [00:44, 4.44it/s] 196it [00:45, 4.38it/s] 196it [00:45, 4.33it/s] +2025-05-25 21:51:27,060 - INFO - Epoch: 30, Objective: tensor([1660.5792], device='cuda:0', grad_fn=), Loss: 0.002282704459503293, KL/n: 31.856414794921875 + 0it [00:00, ?it/s]2025-05-25 21:51:27,468 - INFO - [Epoch 031 | Batch 0000] IWAE-loss 1722.8004 | mean log_px -0.0030 | KL -1562.43 + 1it [00:00, 2.77it/s] 2it [00:00, 3.65it/s] 3it [00:00, 4.10it/s] 4it [00:00, 4.31it/s] 5it [00:01, 4.28it/s] 6it [00:01, 4.34it/s] 7it [00:01, 4.45it/s] 8it [00:01, 4.34it/s] 9it [00:02, 4.36it/s] 10it [00:02, 4.32it/s] 11it [00:02, 4.17it/s] 12it [00:02, 4.18it/s] 13it [00:03, 4.19it/s] 14it [00:03, 4.20it/s] 15it [00:03, 4.23it/s] 16it [00:03, 4.32it/s] 17it [00:04, 4.38it/s] 18it [00:04, 4.31it/s] 19it [00:04, 4.37it/s] 20it [00:04, 4.19it/s] 21it [00:04, 4.27it/s] 22it [00:05, 4.39it/s] 23it [00:05, 4.47it/s] 24it [00:05, 4.41it/s] 25it [00:05, 4.37it/s] 26it [00:06, 4.23it/s] 27it [00:06, 4.25it/s] 28it [00:06, 4.24it/s] 29it [00:06, 4.30it/s] 30it [00:07, 4.28it/s] 31it [00:07, 4.40it/s] 32it [00:07, 4.34it/s] 33it [00:07, 4.47it/s] 34it [00:07, 4.54it/s] 35it [00:08, 4.48it/s] 36it [00:08, 4.43it/s] 37it [00:08, 4.44it/s] 38it [00:08, 4.50it/s] 39it [00:09, 4.32it/s] 40it [00:09, 4.33it/s] 41it [00:09, 4.37it/s] 42it [00:09, 4.49it/s] 43it [00:09, 4.46it/s] 44it [00:10, 4.30it/s] 45it [00:10, 4.30it/s] 46it [00:10, 4.40it/s] 47it [00:10, 4.48it/s] 48it [00:11, 4.41it/s] 49it [00:11, 4.39it/s] 50it [00:11, 4.45it/s]2025-05-25 21:51:38,923 - INFO - [Epoch 031 | Batch 0050] IWAE-loss 1696.5232 | mean log_px -0.0034 | KL -1540.58 + 51it [00:11, 4.43it/s] 52it [00:12, 4.38it/s] 53it [00:12, 4.37it/s] 54it [00:12, 4.47it/s] 55it [00:12, 4.27it/s] 56it [00:12, 4.29it/s] 57it [00:13, 4.38it/s] 58it [00:13, 4.39it/s] 59it [00:13, 4.47it/s] 60it [00:13, 4.44it/s] 61it [00:14, 4.37it/s] 62it [00:14, 4.20it/s] 63it [00:14, 4.23it/s] 64it [00:14, 4.25it/s] 65it [00:15, 4.31it/s] 66it [00:15, 4.41it/s] 67it [00:15, 4.36it/s] 68it [00:15, 4.46it/s] 69it [00:15, 4.40it/s] 70it [00:16, 4.23it/s] 71it [00:16, 4.23it/s] 72it [00:16, 4.39it/s] 73it [00:16, 4.36it/s] 74it [00:17, 4.36it/s] 75it [00:17, 4.47it/s] 76it [00:17, 4.40it/s] 77it [00:17, 4.36it/s] 78it [00:17, 4.37it/s] 79it [00:18, 4.33it/s] 80it [00:18, 4.46it/s] 81it [00:18, 4.38it/s] 82it [00:18, 4.34it/s] 83it [00:19, 4.33it/s] 84it [00:19, 4.43it/s] 85it [00:19, 4.49it/s] 86it [00:19, 4.41it/s] 87it [00:20, 4.39it/s] 88it [00:20, 4.38it/s] 89it [00:20, 4.23it/s] 90it [00:20, 4.21it/s] 91it [00:20, 4.23it/s] 92it [00:21, 4.27it/s] 93it [00:21, 4.40it/s] 94it [00:21, 4.34it/s] 95it [00:21, 4.43it/s] 96it [00:22, 4.27it/s] 97it [00:22, 4.29it/s] 98it [00:22, 4.27it/s] 99it [00:22, 4.27it/s] 100it [00:23, 4.28it/s]2025-05-25 21:51:50,435 - INFO - [Epoch 031 | Batch 0100] IWAE-loss 1671.5338 | mean log_px -0.0022 | KL -1533.55 + 101it [00:23, 4.23it/s] 102it [00:23, 4.21it/s] 103it [00:23, 4.27it/s] 104it [00:24, 4.23it/s] 105it [00:24, 4.30it/s] 106it [00:24, 4.31it/s] 107it [00:24, 4.43it/s] 108it [00:24, 4.45it/s] 109it [00:25, 4.52it/s] 110it [00:25, 4.48it/s] 111it [00:25, 4.54it/s] 112it [00:25, 4.58it/s] 113it [00:26, 4.35it/s] 114it [00:26, 4.39it/s] 115it [00:26, 4.48it/s] 116it [00:26, 4.43it/s] 117it [00:26, 4.54it/s] 118it [00:27, 4.48it/s] 119it [00:27, 4.41it/s] 120it [00:27, 4.39it/s] 121it [00:27, 4.50it/s] 122it [00:28, 4.44it/s] 123it [00:28, 4.25it/s] 124it [00:28, 4.28it/s] 125it [00:28, 4.28it/s] 126it [00:29, 4.27it/s] 127it [00:29, 4.30it/s] 128it [00:29, 4.30it/s] 129it [00:29, 4.29it/s] 130it [00:29, 4.19it/s] 131it [00:30, 4.19it/s] 132it [00:30, 4.23it/s] 133it [00:30, 4.22it/s] 134it [00:30, 4.36it/s] 135it [00:31, 4.36it/s] 136it [00:31, 4.39it/s] 137it [00:31, 4.40it/s] 138it [00:31, 4.27it/s] 139it [00:32, 4.28it/s] 140it [00:32, 4.40it/s] 141it [00:32, 4.50it/s] 142it [00:32, 4.47it/s] 143it [00:32, 4.16it/s] 144it [00:33, 4.21it/s] 145it [00:33, 4.20it/s] 146it [00:33, 4.20it/s] 147it [00:33, 4.26it/s] 148it [00:34, 4.26it/s] 149it [00:34, 4.26it/s] 150it [00:34, 4.33it/s]2025-05-25 21:52:01,972 - INFO - [Epoch 031 | Batch 0150] IWAE-loss 1709.1289 | mean log_px -0.0036 | KL -1533.10 + 151it [00:34, 4.28it/s] 152it [00:35, 4.30it/s] 153it [00:35, 4.31it/s] 154it [00:35, 4.17it/s] 155it [00:35, 4.26it/s] 156it [00:36, 4.32it/s] 157it [00:36, 4.43it/s] 158it [00:36, 4.43it/s] 159it [00:36, 4.52it/s] 160it [00:36, 4.43it/s] 161it [00:37, 4.28it/s] 162it [00:37, 4.28it/s] 163it [00:37, 4.35it/s] 164it [00:37, 4.32it/s] 165it [00:38, 4.43it/s] 166it [00:38, 4.20it/s] 167it [00:38, 4.29it/s] 168it [00:38, 4.31it/s] 169it [00:38, 4.31it/s] 170it [00:39, 4.32it/s] 171it [00:39, 4.33it/s] 172it [00:39, 4.34it/s] 173it [00:39, 4.34it/s] 174it [00:40, 4.29it/s] 175it [00:40, 4.31it/s] 176it [00:40, 4.41it/s] 177it [00:40, 4.49it/s] 178it [00:41, 4.56it/s] 179it [00:41, 4.55it/s] 180it [00:41, 4.38it/s] 181it [00:41, 4.36it/s] 182it [00:41, 4.37it/s] 183it [00:42, 4.35it/s] 184it [00:42, 4.35it/s] 185it [00:42, 4.32it/s] 186it [00:42, 4.24it/s] 187it [00:43, 4.25it/s] 188it [00:43, 4.27it/s] 189it [00:43, 4.24it/s] 190it [00:43, 4.10it/s] 191it [00:44, 4.16it/s] 192it [00:44, 4.26it/s] 193it [00:44, 4.28it/s] 194it [00:44, 4.33it/s] 195it [00:44, 4.34it/s] 196it [00:45, 4.32it/s] 196it [00:45, 4.33it/s] +2025-05-25 21:52:12,498 - INFO - Epoch: 31, Objective: tensor([1998.8662], device='cuda:0', grad_fn=), Loss: 0.011031880974769592, KL/n: 31.218055725097656 + 0it [00:00, ?it/s]2025-05-25 21:52:13,095 - INFO - [Epoch 032 | Batch 0000] IWAE-loss 1605.7083 | mean log_px -0.0011 | KL -1530.47 + 1it [00:00, 2.73it/s] 2it [00:00, 3.45it/s] 3it [00:00, 3.85it/s] 4it [00:01, 4.00it/s] 5it [00:01, 4.20it/s] 6it [00:01, 4.26it/s] 7it [00:01, 4.08it/s] 8it [00:02, 4.10it/s] 9it [00:02, 4.20it/s] 10it [00:02, 4.27it/s] 11it [00:02, 4.30it/s] 12it [00:02, 4.31it/s] 13it [00:03, 4.43it/s] 14it [00:03, 4.31it/s] 15it [00:03, 4.29it/s] 16it [00:03, 4.27it/s] 17it [00:04, 4.29it/s] 18it [00:04, 4.38it/s] 19it [00:04, 4.48it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.60it/s] 22it [00:05, 4.46it/s] 23it [00:05, 4.44it/s] 24it [00:05, 4.42it/s] 25it [00:05, 4.40it/s] 26it [00:06, 4.34it/s] 27it [00:06, 4.44it/s] 28it [00:06, 4.51it/s] 29it [00:06, 4.50it/s] 30it [00:06, 4.53it/s] 31it [00:07, 4.59it/s] 32it [00:07, 4.50it/s] 33it [00:07, 4.46it/s] 34it [00:07, 4.23it/s] 35it [00:08, 4.27it/s] 36it [00:08, 4.25it/s] 37it [00:08, 4.39it/s] 38it [00:08, 4.32it/s] 39it [00:09, 4.37it/s] 40it [00:09, 4.13it/s] 41it [00:09, 4.22it/s] 42it [00:09, 4.23it/s] 43it [00:09, 4.34it/s] 44it [00:10, 4.30it/s] 45it [00:10, 4.42it/s] 46it [00:10, 4.34it/s] 47it [00:10, 4.44it/s] 48it [00:11, 4.36it/s] 49it [00:11, 4.35it/s] 50it [00:11, 4.38it/s]2025-05-25 21:52:24,568 - INFO - [Epoch 032 | Batch 0050] IWAE-loss 1871.9933 | mean log_px -0.0139 | KL -1516.54 + 51it [00:11, 4.31it/s] 52it [00:12, 4.34it/s] 53it [00:12, 4.44it/s] 54it [00:12, 4.46it/s] 55it [00:12, 4.45it/s] 56it [00:12, 4.38it/s] 57it [00:13, 4.37it/s] 58it [00:13, 4.36it/s] 59it [00:13, 4.37it/s] 60it [00:13, 4.24it/s] 61it [00:14, 4.28it/s] 62it [00:14, 4.28it/s] 63it [00:14, 4.29it/s] 64it [00:14, 4.31it/s] 65it [00:15, 4.43it/s] 66it [00:15, 4.48it/s] 67it [00:15, 4.41it/s] 68it [00:15, 4.47it/s] 69it [00:15, 4.39it/s] 70it [00:16, 4.41it/s] 71it [00:16, 4.50it/s] 72it [00:16, 4.49it/s] 73it [00:16, 4.54it/s] 74it [00:17, 4.42it/s] 75it [00:17, 4.41it/s] 76it [00:17, 4.35it/s] 77it [00:17, 4.35it/s] 78it [00:17, 4.41it/s] 79it [00:18, 4.50it/s] 80it [00:18, 4.21it/s] 81it [00:18, 4.32it/s] 82it [00:18, 4.26it/s] 83it [00:19, 4.26it/s] 84it [00:19, 4.25it/s] 85it [00:19, 4.30it/s] 86it [00:19, 4.38it/s] 87it [00:20, 4.48it/s] 88it [00:20, 4.44it/s] 89it [00:20, 4.26it/s] 90it [00:20, 4.19it/s] 91it [00:21, 4.24it/s] 92it [00:21, 4.35it/s] 93it [00:21, 4.45it/s] 94it [00:21, 4.28it/s] 95it [00:21, 4.37it/s] 96it [00:22, 4.39it/s] 97it [00:22, 4.35it/s] 98it [00:22, 4.29it/s] 99it [00:22, 4.15it/s] 100it [00:23, 4.18it/s]2025-05-25 21:52:36,082 - INFO - [Epoch 032 | Batch 0100] IWAE-loss 2199.9558 | mean log_px -0.0137 | KL -1505.77 + 101it [00:23, 4.23it/s] 102it [00:23, 4.27it/s] 103it [00:23, 4.33it/s] 104it [00:24, 4.32it/s] 105it [00:24, 4.31it/s] 106it [00:24, 4.30it/s] 107it [00:24, 4.30it/s] 108it [00:24, 4.41it/s] 109it [00:25, 4.35it/s] 110it [00:25, 4.29it/s] 111it [00:25, 4.19it/s] 112it [00:25, 4.21it/s] 113it [00:26, 4.34it/s] 114it [00:26, 4.31it/s] 115it [00:26, 4.31it/s] 116it [00:26, 4.22it/s] 117it [00:27, 4.24it/s] 118it [00:27, 4.26it/s] 119it [00:27, 4.28it/s] 120it [00:27, 4.29it/s] 121it [00:27, 4.28it/s] 122it [00:28, 4.29it/s] 123it [00:28, 4.41it/s] 124it [00:28, 4.49it/s] 125it [00:28, 4.55it/s] 126it [00:29, 4.56it/s] 127it [00:29, 4.48it/s] 128it [00:29, 4.41it/s] 129it [00:29, 4.46it/s] 130it [00:29, 4.45it/s] 131it [00:30, 4.47it/s] 132it [00:30, 4.29it/s] 133it [00:30, 4.35it/s] 134it [00:30, 4.32it/s] 135it [00:31, 4.40it/s] 136it [00:31, 4.41it/s] 137it [00:31, 4.50it/s] 138it [00:31, 4.37it/s] 139it [00:32, 4.21it/s] 140it [00:32, 4.19it/s] 141it [00:32, 4.22it/s] 142it [00:32, 4.33it/s] 143it [00:32, 4.35it/s] 144it [00:33, 4.39it/s] 145it [00:33, 4.36it/s] 146it [00:33, 4.21it/s] 147it [00:33, 4.25it/s] 148it [00:34, 4.23it/s] 149it [00:34, 4.36it/s] 150it [00:34, 4.33it/s]2025-05-25 21:52:47,615 - INFO - [Epoch 032 | Batch 0150] IWAE-loss 1934.8878 | mean log_px -0.0096 | KL -1507.10 + 151it [00:34, 4.29it/s] 152it [00:35, 4.37it/s] 153it [00:35, 4.31it/s] 154it [00:35, 4.25it/s] 155it [00:35, 4.25it/s] 156it [00:36, 4.21it/s] 157it [00:36, 4.31it/s] 158it [00:36, 4.40it/s] 159it [00:36, 4.33it/s] 160it [00:36, 4.21it/s] 161it [00:37, 4.25it/s] 162it [00:37, 4.32it/s] 163it [00:37, 4.34it/s] 164it [00:37, 4.39it/s] 165it [00:38, 4.46it/s] 166it [00:38, 4.48it/s] 167it [00:38, 4.37it/s] 168it [00:38, 4.43it/s] 169it [00:39, 4.36it/s] 170it [00:39, 4.42it/s] 171it [00:39, 4.35it/s] 172it [00:39, 4.20it/s] 173it [00:39, 4.22it/s] 174it [00:40, 4.30it/s] 175it [00:40, 4.40it/s] 176it [00:40, 4.41it/s] 177it [00:40, 4.50it/s] 178it [00:41, 4.47it/s] 179it [00:41, 4.42it/s] 180it [00:41, 4.38it/s] 181it [00:41, 4.47it/s] 182it [00:41, 4.35it/s] 183it [00:42, 4.30it/s] 184it [00:42, 4.27it/s] 185it [00:42, 4.24it/s] 186it [00:42, 4.23it/s] 187it [00:43, 4.27it/s] 188it [00:43, 4.20it/s] 189it [00:43, 4.21it/s] 190it [00:43, 4.29it/s] 191it [00:44, 4.38it/s] 192it [00:44, 4.38it/s] 193it [00:44, 4.33it/s] 194it [00:44, 4.17it/s] 195it [00:45, 4.16it/s] 196it [00:45, 4.29it/s] 196it [00:45, 4.32it/s] +2025-05-25 21:52:58,159 - INFO - Epoch: 32, Objective: tensor([1967.3446], device='cuda:0', grad_fn=), Loss: 0.012947743758559227, KL/n: 30.607524871826172 + 0it [00:00, ?it/s]2025-05-25 21:52:58,553 - INFO - [Epoch 033 | Batch 0000] IWAE-loss 1662.4415 | mean log_px -0.0023 | KL -1498.38 + 1it [00:00, 3.10it/s] 2it [00:00, 3.75it/s] 3it [00:00, 3.93it/s] 4it [00:01, 3.99it/s] 5it [00:01, 4.10it/s] 6it [00:01, 3.98it/s] 7it [00:01, 4.06it/s] 8it [00:02, 4.09it/s] 9it [00:02, 4.18it/s] 10it [00:02, 4.13it/s] 11it [00:02, 4.18it/s] 12it [00:03, 3.38it/s] 13it [00:03, 3.60it/s] 14it [00:03, 3.73it/s] 15it [00:03, 3.96it/s] 16it [00:04, 4.02it/s] 17it [00:04, 3.86it/s] 18it [00:04, 3.94it/s] 19it [00:04, 4.06it/s] 20it [00:05, 4.19it/s] 21it [00:05, 4.24it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.38it/s] 24it [00:05, 4.41it/s] 25it [00:06, 4.43it/s] 26it [00:06, 4.33it/s] 27it [00:06, 4.30it/s] 28it [00:06, 4.38it/s] 29it [00:07, 4.32it/s] 30it [00:07, 4.26it/s] 31it [00:07, 4.27it/s] 32it [00:07, 4.25it/s] 33it [00:08, 4.23it/s] 34it [00:08, 4.22it/s] 35it [00:08, 4.32it/s] 36it [00:08, 4.32it/s] 37it [00:08, 4.29it/s] 38it [00:09, 4.22it/s] 39it [00:09, 4.24it/s] 40it [00:09, 4.19it/s] 41it [00:09, 4.32it/s] 42it [00:10, 4.30it/s] 43it [00:10, 4.39it/s] 44it [00:10, 4.35it/s] 45it [00:10, 4.41it/s] 46it [00:11, 4.34it/s] 47it [00:11, 4.31it/s] 48it [00:11, 4.36it/s] 49it [00:11, 4.31it/s] 50it [00:12, 4.31it/s]2025-05-25 21:53:10,469 - INFO - [Epoch 033 | Batch 0050] IWAE-loss 1766.8324 | mean log_px -0.0126 | KL -1488.90 + 51it [00:12, 4.27it/s] 52it [00:12, 4.22it/s] 53it [00:12, 4.26it/s] 54it [00:12, 4.32it/s] 55it [00:13, 4.31it/s] 56it [00:13, 4.34it/s] 57it [00:13, 4.43it/s] 58it [00:13, 4.44it/s] 59it [00:14, 4.32it/s] 60it [00:14, 4.21it/s] 61it [00:14, 4.22it/s] 62it [00:14, 4.20it/s] 63it [00:15, 4.23it/s] 64it [00:15, 4.28it/s] 65it [00:15, 4.38it/s] 66it [00:15, 4.41it/s] 67it [00:15, 4.47it/s] 68it [00:16, 4.37it/s] 69it [00:16, 4.19it/s] 70it [00:16, 4.31it/s] 71it [00:16, 4.34it/s] 72it [00:17, 4.42it/s] 73it [00:17, 4.34it/s] 74it [00:17, 4.28it/s] 75it [00:17, 4.26it/s] 76it [00:18, 4.35it/s] 77it [00:18, 4.27it/s] 78it [00:18, 4.36it/s] 79it [00:18, 4.32it/s] 80it [00:18, 4.37it/s] 81it [00:19, 4.37it/s] 82it [00:19, 4.28it/s] 83it [00:19, 4.29it/s] 84it [00:19, 4.33it/s] 85it [00:20, 4.29it/s] 86it [00:20, 4.27it/s] 87it [00:20, 4.19it/s] 88it [00:20, 4.18it/s] 89it [00:21, 4.22it/s] 90it [00:21, 4.30it/s] 91it [00:21, 4.31it/s] 92it [00:21, 4.29it/s] 93it [00:21, 4.26it/s] 94it [00:22, 4.25it/s] 95it [00:22, 4.36it/s] 96it [00:22, 4.28it/s] 97it [00:22, 4.28it/s] 98it [00:23, 4.39it/s] 99it [00:23, 4.39it/s] 100it [00:23, 4.31it/s]2025-05-25 21:53:22,076 - INFO - [Epoch 033 | Batch 0100] IWAE-loss 1801.3687 | mean log_px -0.0054 | KL -1479.41 + 101it [00:23, 4.30it/s] 102it [00:24, 4.33it/s] 103it [00:24, 4.27it/s] 104it [00:24, 4.26it/s] 105it [00:24, 4.26it/s] 106it [00:25, 4.23it/s] 107it [00:25, 4.27it/s] 108it [00:25, 4.20it/s] 109it [00:25, 4.27it/s] 110it [00:25, 4.08it/s] 111it [00:26, 4.26it/s] 112it [00:26, 4.32it/s] 113it [00:26, 4.41it/s] 114it [00:26, 4.33it/s] 115it [00:27, 4.33it/s] 116it [00:27, 4.32it/s] 117it [00:27, 4.32it/s] 118it [00:27, 4.35it/s] 119it [00:28, 4.44it/s] 120it [00:28, 4.35it/s] 121it [00:28, 4.33it/s] 122it [00:28, 4.37it/s] 123it [00:28, 4.45it/s] 124it [00:29, 4.48it/s] 125it [00:29, 4.43it/s] 126it [00:29, 4.40it/s] 127it [00:29, 4.40it/s] 128it [00:30, 4.38it/s] 129it [00:30, 4.47it/s] 130it [00:30, 4.37it/s] 131it [00:30, 4.36it/s] 132it [00:30, 4.31it/s] 133it [00:31, 4.29it/s] 134it [00:31, 4.35it/s] 135it [00:31, 4.43it/s] 136it [00:31, 4.30it/s] 137it [00:32, 4.34it/s] 138it [00:32, 4.28it/s] 139it [00:32, 4.27it/s] 140it [00:32, 4.29it/s] 141it [00:33, 4.37it/s] 142it [00:33, 4.44it/s] 143it [00:33, 4.51it/s] 144it [00:33, 4.52it/s] 145it [00:33, 4.40it/s] 146it [00:34, 4.46it/s] 147it [00:34, 4.44it/s] 148it [00:34, 4.49it/s] 149it [00:34, 4.38it/s] 150it [00:35, 4.33it/s]2025-05-25 21:53:33,567 - INFO - [Epoch 033 | Batch 0150] IWAE-loss 1976.7753 | mean log_px -0.0103 | KL -1475.10 + 151it [00:35, 4.32it/s] 152it [00:35, 4.10it/s] 153it [00:35, 4.14it/s] 154it [00:36, 4.20it/s] 155it [00:36, 4.23it/s] 156it [00:36, 4.23it/s] 157it [00:36, 4.26it/s] 158it [00:36, 4.36it/s] 159it [00:37, 4.32it/s] 160it [00:37, 4.17it/s] 161it [00:37, 4.31it/s] 162it [00:37, 4.31it/s] 163it [00:38, 4.31it/s] 164it [00:38, 4.32it/s] 165it [00:38, 4.35it/s] 166it [00:38, 4.34it/s] 167it [00:39, 4.37it/s] 168it [00:39, 4.33it/s] 169it [00:39, 4.34it/s] 170it [00:39, 4.22it/s] 171it [00:40, 4.27it/s] 172it [00:40, 4.29it/s] 173it [00:40, 4.28it/s] 174it [00:40, 4.27it/s] 175it [00:40, 4.29it/s] 176it [00:41, 4.29it/s] 177it [00:41, 4.25it/s] 178it [00:41, 4.24it/s] 179it [00:41, 4.33it/s] 180it [00:42, 4.41it/s] 181it [00:42, 4.47it/s] 182it [00:42, 4.52it/s] 183it [00:42, 4.48it/s] 184it [00:42, 4.52it/s] 185it [00:43, 4.50it/s] 186it [00:43, 4.36it/s] 187it [00:43, 4.32it/s] 188it [00:43, 4.28it/s] 189it [00:44, 4.25it/s] 190it [00:44, 4.24it/s] 191it [00:44, 4.36it/s] 192it [00:44, 4.45it/s] 193it [00:45, 4.35it/s] 194it [00:45, 4.46it/s] 195it [00:45, 4.26it/s] 196it [00:45, 4.28it/s] 196it [00:45, 4.27it/s] +2025-05-25 21:53:44,142 - INFO - Epoch: 33, Objective: tensor([2188.4385], device='cuda:0', grad_fn=), Loss: 0.011592795141041279, KL/n: 29.990604400634766 + 0it [00:00, ?it/s]2025-05-25 21:53:44,545 - INFO - [Epoch 034 | Batch 0000] IWAE-loss 1666.0902 | mean log_px -0.0050 | KL -1469.55 + 1it [00:00, 2.98it/s] 2it [00:00, 3.81it/s] 3it [00:00, 4.03it/s] 4it [00:00, 4.28it/s] 5it [00:01, 4.43it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.59it/s] 8it [00:01, 4.62it/s] 9it [00:02, 4.66it/s] 10it [00:02, 4.65it/s] 11it [00:02, 4.68it/s] 12it [00:02, 4.69it/s] 13it [00:02, 4.70it/s] 14it [00:03, 4.71it/s] 15it [00:03, 4.71it/s] 16it [00:03, 4.54it/s] 17it [00:03, 4.62it/s] 18it [00:03, 4.64it/s] 19it [00:04, 4.67it/s] 20it [00:04, 4.66it/s] 21it [00:04, 4.69it/s] 22it [00:04, 4.70it/s] 23it [00:05, 4.71it/s] 24it [00:05, 4.70it/s] 25it [00:05, 4.72it/s] 26it [00:05, 4.71it/s] 27it [00:05, 4.72it/s] 28it [00:06, 4.71it/s] 29it [00:06, 4.73it/s] 30it [00:06, 4.72it/s] 31it [00:06, 4.72it/s] 32it [00:06, 4.71it/s] 33it [00:07, 4.71it/s] 34it [00:07, 4.70it/s] 35it [00:07, 4.71it/s] 36it [00:07, 4.70it/s] 37it [00:08, 4.70it/s] 38it [00:08, 4.71it/s] 39it [00:08, 4.71it/s] 40it [00:08, 4.66it/s] 41it [00:08, 4.67it/s] 42it [00:09, 4.51it/s] 43it [00:09, 4.59it/s] 44it [00:09, 4.62it/s] 45it [00:09, 4.65it/s] 46it [00:09, 4.67it/s] 47it [00:10, 4.69it/s] 48it [00:10, 4.64it/s] 49it [00:10, 4.68it/s] 50it [00:10, 4.69it/s]2025-05-25 21:53:55,240 - INFO - [Epoch 034 | Batch 0050] IWAE-loss 1685.5781 | mean log_px -0.0031 | KL -1466.24 + 51it [00:11, 4.70it/s] 52it [00:11, 4.70it/s] 53it [00:11, 4.71it/s] 54it [00:11, 4.71it/s] 55it [00:11, 4.71it/s] 56it [00:12, 4.71it/s] 57it [00:12, 4.72it/s] 58it [00:12, 4.72it/s] 59it [00:12, 4.70it/s] 60it [00:12, 4.71it/s] 61it [00:13, 4.71it/s] 62it [00:13, 4.69it/s] 63it [00:13, 4.69it/s] 64it [00:13, 4.69it/s] 65it [00:13, 4.71it/s] 66it [00:14, 4.71it/s] 67it [00:14, 4.71it/s] 68it [00:14, 4.71it/s] 69it [00:14, 4.71it/s] 70it [00:15, 4.71it/s] 71it [00:15, 4.71it/s] 72it [00:15, 4.71it/s] 73it [00:15, 4.71it/s] 74it [00:15, 4.71it/s] 75it [00:16, 4.71it/s] 76it [00:16, 4.71it/s] 77it [00:16, 4.71it/s] 78it [00:16, 4.70it/s] 79it [00:16, 4.70it/s] 80it [00:17, 4.71it/s] 81it [00:17, 4.71it/s] 82it [00:17, 4.71it/s] 83it [00:17, 4.68it/s] 84it [00:18, 4.69it/s] 85it [00:18, 4.70it/s] 86it [00:18, 4.69it/s] 87it [00:18, 4.70it/s] 88it [00:18, 4.70it/s] 89it [00:19, 4.55it/s] 90it [00:19, 4.60it/s] 91it [00:19, 4.65it/s] 92it [00:19, 4.67it/s] 93it [00:19, 4.63it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.50it/s] 96it [00:20, 4.56it/s] 97it [00:20, 4.53it/s] 98it [00:21, 4.46it/s] 99it [00:21, 4.51it/s] 100it [00:21, 4.54it/s]2025-05-25 21:54:05,961 - INFO - [Epoch 034 | Batch 0100] IWAE-loss 4595.9902 | mean log_px -0.0572 | KL -1454.45 + 101it [00:21, 4.56it/s] 102it [00:21, 4.55it/s] 103it [00:22, 4.61it/s] 104it [00:22, 4.63it/s] 105it [00:22, 4.53it/s] 106it [00:22, 4.60it/s] 107it [00:23, 4.64it/s] 108it [00:23, 4.66it/s] 109it [00:23, 4.67it/s] 110it [00:23, 4.51it/s] 111it [00:23, 4.58it/s] 112it [00:24, 4.62it/s] 113it [00:24, 4.65it/s] 114it [00:24, 4.67it/s] 115it [00:24, 4.69it/s] 116it [00:24, 4.70it/s] 117it [00:25, 4.70it/s] 118it [00:25, 4.70it/s] 119it [00:25, 4.71it/s] 120it [00:25, 4.71it/s] 121it [00:26, 4.71it/s] 122it [00:26, 4.71it/s] 123it [00:26, 4.71it/s] 124it [00:26, 4.71it/s] 125it [00:26, 4.72it/s] 126it [00:27, 4.72it/s] 127it [00:27, 4.56it/s] 128it [00:27, 4.62it/s] 129it [00:27, 4.64it/s] 130it [00:27, 4.66it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.55it/s] 133it [00:28, 4.59it/s] 134it [00:28, 4.51it/s] 135it [00:29, 4.59it/s] 136it [00:29, 4.62it/s] 137it [00:29, 4.63it/s] 138it [00:29, 4.65it/s] 139it [00:29, 4.68it/s] 140it [00:30, 4.69it/s] 141it [00:30, 4.70it/s] 142it [00:30, 4.69it/s] 143it [00:30, 4.70it/s] 144it [00:30, 4.71it/s] 145it [00:31, 4.72it/s] 146it [00:31, 4.66it/s] 147it [00:31, 4.69it/s] 148it [00:31, 4.69it/s] 149it [00:32, 4.71it/s] 150it [00:32, 4.70it/s]2025-05-25 21:54:16,695 - INFO - [Epoch 034 | Batch 0150] IWAE-loss 1796.6715 | mean log_px -0.0049 | KL -1448.83 + 151it [00:32, 4.70it/s] 152it [00:32, 4.71it/s] 153it [00:32, 4.71it/s] 154it [00:33, 4.55it/s] 155it [00:33, 4.61it/s] 156it [00:33, 4.64it/s] 157it [00:33, 4.67it/s] 158it [00:33, 4.68it/s] 159it [00:34, 4.70it/s] 160it [00:34, 4.53it/s] 161it [00:34, 4.59it/s] 162it [00:34, 4.63it/s] 163it [00:35, 4.65it/s] 164it [00:35, 4.67it/s] 165it [00:35, 4.65it/s] 166it [00:35, 4.67it/s] 167it [00:35, 4.68it/s] 168it [00:36, 4.68it/s] 169it [00:36, 4.70it/s] 170it [00:36, 4.70it/s] 171it [00:36, 4.71it/s] 172it [00:36, 4.71it/s] 173it [00:37, 4.72it/s] 174it [00:37, 4.71it/s] 175it [00:37, 4.71it/s] 176it [00:37, 4.70it/s] 177it [00:38, 4.71it/s] 178it [00:38, 4.71it/s] 179it [00:38, 4.72it/s] 180it [00:38, 4.71it/s] 181it [00:38, 4.72it/s] 182it [00:39, 4.55it/s] 183it [00:39, 4.61it/s] 184it [00:39, 4.64it/s] 185it [00:39, 4.67it/s] 186it [00:39, 4.68it/s] 187it [00:40, 4.60it/s] 188it [00:40, 4.63it/s] 189it [00:40, 4.65it/s] 190it [00:40, 4.67it/s] 191it [00:41, 4.68it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.54it/s] 194it [00:41, 4.60it/s] 195it [00:41, 4.42it/s] 196it [00:42, 4.51it/s] 196it [00:42, 4.64it/s] +2025-05-25 21:54:26,514 - INFO - Epoch: 34, Objective: tensor([1598.8741], device='cuda:0', grad_fn=), Loss: 0.003922741860151291, KL/n: 29.56195640563965 + 0it [00:00, ?it/s]2025-05-25 21:54:27,071 - INFO - [Epoch 035 | Batch 0000] IWAE-loss 1601.3729 | mean log_px -0.0040 | KL -1447.12 + 1it [00:00, 3.31it/s] 2it [00:00, 3.83it/s] 3it [00:00, 3.91it/s] 4it [00:01, 4.07it/s] 5it [00:01, 4.20it/s] 6it [00:01, 4.21it/s] 7it [00:01, 4.27it/s] 8it [00:01, 4.24it/s] 9it [00:02, 4.34it/s] 10it [00:02, 4.34it/s] 11it [00:02, 4.32it/s] 12it [00:02, 4.29it/s] 13it [00:03, 4.42it/s] 14it [00:03, 4.36it/s] 15it [00:03, 4.40it/s] 16it [00:03, 4.28it/s] 17it [00:03, 4.36it/s] 18it [00:04, 4.34it/s] 19it [00:04, 4.32it/s] 20it [00:04, 4.21it/s] 21it [00:04, 4.29it/s] 22it [00:05, 4.42it/s] 23it [00:05, 4.43it/s] 24it [00:05, 4.48it/s] 25it [00:05, 4.46it/s] 26it [00:06, 4.53it/s] 27it [00:06, 4.44it/s] 28it [00:06, 4.31it/s] 29it [00:06, 4.31it/s] 30it [00:06, 4.32it/s] 31it [00:07, 4.31it/s] 32it [00:07, 4.40it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.30it/s] 35it [00:08, 4.44it/s] 36it [00:08, 4.37it/s] 37it [00:08, 4.45it/s] 38it [00:08, 4.38it/s] 39it [00:09, 4.48it/s] 40it [00:09, 4.47it/s] 41it [00:09, 4.44it/s] 42it [00:09, 4.26it/s] 43it [00:09, 4.18it/s] 44it [00:10, 4.19it/s] 45it [00:10, 4.25it/s] 46it [00:10, 4.36it/s] 47it [00:10, 4.30it/s] 48it [00:11, 4.44it/s] 49it [00:11, 4.48it/s] 50it [00:11, 4.41it/s]2025-05-25 21:54:38,547 - INFO - [Epoch 035 | Batch 0050] IWAE-loss 1802.3173 | mean log_px -0.0079 | KL -1440.26 + 51it [00:11, 4.36it/s] 52it [00:12, 4.35it/s] 53it [00:12, 4.46it/s] 54it [00:12, 4.51it/s] 55it [00:12, 4.45it/s] 56it [00:12, 4.45it/s] 57it [00:13, 4.38it/s] 58it [00:13, 4.34it/s] 59it [00:13, 4.32it/s] 60it [00:13, 4.30it/s] 61it [00:14, 4.38it/s] 62it [00:14, 4.33it/s] 63it [00:14, 4.45it/s] 64it [00:14, 4.22it/s] 65it [00:14, 4.28it/s] 66it [00:15, 4.35it/s] 67it [00:15, 4.46it/s] 68it [00:15, 4.48it/s] 69it [00:15, 4.55it/s] 70it [00:16, 4.44it/s] 71it [00:16, 4.44it/s] 72it [00:16, 4.48it/s] 73it [00:16, 4.43it/s] 74it [00:17, 4.36it/s] 75it [00:17, 4.22it/s] 76it [00:17, 4.24it/s] 77it [00:17, 4.32it/s] 78it [00:17, 4.27it/s] 79it [00:18, 4.32it/s] 80it [00:18, 4.33it/s] 81it [00:18, 4.17it/s] 82it [00:18, 4.29it/s] 83it [00:19, 4.41it/s] 84it [00:19, 4.36it/s] 85it [00:19, 4.32it/s] 86it [00:19, 4.32it/s] 87it [00:20, 4.30it/s] 88it [00:20, 4.41it/s] 89it [00:20, 4.47it/s] 90it [00:20, 4.38it/s] 91it [00:20, 4.37it/s] 92it [00:21, 4.35it/s] 93it [00:21, 4.37it/s] 94it [00:21, 4.42it/s] 95it [00:21, 4.38it/s] 96it [00:22, 4.19it/s] 97it [00:22, 4.34it/s] 98it [00:22, 4.37it/s] 99it [00:22, 4.36it/s] 100it [00:23, 4.28it/s]2025-05-25 21:54:50,022 - INFO - [Epoch 035 | Batch 0100] IWAE-loss 1988.3760 | mean log_px -0.0165 | KL -1428.70 + 101it [00:23, 4.18it/s] 102it [00:23, 4.23it/s] 103it [00:23, 4.27it/s] 104it [00:23, 4.25it/s] 105it [00:24, 4.29it/s] 106it [00:24, 4.38it/s] 107it [00:24, 4.49it/s] 108it [00:24, 4.53it/s] 109it [00:25, 4.46it/s] 110it [00:25, 4.31it/s] 111it [00:25, 4.31it/s] 112it [00:25, 4.33it/s] 113it [00:26, 4.31it/s] 114it [00:26, 4.33it/s] 115it [00:26, 4.25it/s] 116it [00:26, 4.25it/s] 117it [00:26, 4.26it/s] 118it [00:27, 4.37it/s] 119it [00:27, 4.48it/s] 120it [00:27, 4.55it/s] 121it [00:27, 4.34it/s] 122it [00:28, 4.35it/s] 123it [00:28, 4.32it/s] 124it [00:28, 4.33it/s] 125it [00:28, 4.45it/s] 126it [00:28, 4.46it/s] 127it [00:29, 4.32it/s] 128it [00:29, 4.31it/s] 129it [00:29, 4.29it/s] 130it [00:29, 4.41it/s] 131it [00:30, 4.40it/s] 132it [00:30, 4.45it/s] 133it [00:30, 4.31it/s] 134it [00:30, 4.41it/s] 135it [00:31, 4.51it/s] 136it [00:31, 4.41it/s] 137it [00:31, 4.50it/s] 138it [00:31, 4.41it/s] 139it [00:31, 4.48it/s] 140it [00:32, 4.52it/s] 141it [00:32, 4.58it/s] 142it [00:32, 4.58it/s] 143it [00:32, 4.50it/s] 144it [00:33, 4.48it/s] 145it [00:33, 4.39it/s] 146it [00:33, 4.48it/s] 147it [00:33, 4.41it/s] 148it [00:33, 4.49it/s] 149it [00:34, 4.48it/s] 150it [00:34, 4.30it/s]2025-05-25 21:55:01,412 - INFO - [Epoch 035 | Batch 0150] IWAE-loss 1613.8336 | mean log_px -0.0041 | KL -1433.86 + 151it [00:34, 4.36it/s] 152it [00:34, 4.44it/s] 153it [00:35, 4.49it/s] 154it [00:35, 4.39it/s] 155it [00:35, 4.48it/s] 156it [00:35, 4.31it/s] 157it [00:36, 4.19it/s] 158it [00:36, 4.19it/s] 159it [00:36, 4.24it/s] 160it [00:36, 4.37it/s] 161it [00:36, 4.46it/s] 162it [00:37, 4.47it/s] 163it [00:37, 4.51it/s] 164it [00:37, 4.55it/s] 165it [00:37, 4.45it/s] 166it [00:38, 4.38it/s] 167it [00:38, 4.44it/s] 168it [00:38, 4.50it/s] 169it [00:38, 4.51it/s] 170it [00:38, 4.56it/s] 171it [00:39, 4.47it/s] 172it [00:39, 4.49it/s] 173it [00:39, 4.43it/s] 174it [00:39, 4.35it/s] 175it [00:40, 4.36it/s] 176it [00:40, 4.38it/s] 177it [00:40, 4.46it/s] 178it [00:40, 4.51it/s] 179it [00:40, 4.42it/s] 180it [00:41, 4.24it/s] 181it [00:41, 4.28it/s] 182it [00:41, 4.25it/s] 183it [00:41, 4.25it/s] 184it [00:42, 4.26it/s] 185it [00:42, 4.22it/s] 186it [00:42, 4.24it/s] 187it [00:42, 4.31it/s] 188it [00:43, 4.27it/s] 189it [00:43, 4.27it/s] 190it [00:43, 4.29it/s] 191it [00:43, 4.41it/s] 192it [00:44, 4.37it/s] 193it [00:44, 4.44it/s] 194it [00:44, 4.24it/s] 195it [00:44, 4.25it/s] 196it [00:44, 4.28it/s] 196it [00:45, 4.35it/s] +2025-05-25 21:55:11,853 - INFO - Epoch: 35, Objective: tensor([2143.9568], device='cuda:0', grad_fn=), Loss: 0.021683480590581894, KL/n: 29.22657012939453 + 0it [00:00, ?it/s]2025-05-25 21:55:12,247 - INFO - [Epoch 036 | Batch 0000] IWAE-loss 1631.0413 | mean log_px -0.0034 | KL -1429.53 + 1it [00:00, 3.06it/s] 2it [00:00, 3.69it/s] 3it [00:00, 3.93it/s] 4it [00:01, 4.11it/s] 5it [00:01, 4.21it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.38it/s] 8it [00:01, 4.48it/s] 9it [00:02, 3.57it/s] 10it [00:02, 3.83it/s] 11it [00:02, 3.99it/s] 12it [00:02, 4.17it/s] 13it [00:03, 4.27it/s] 14it [00:03, 4.27it/s] 15it [00:03, 4.27it/s] 16it [00:03, 4.26it/s] 17it [00:04, 4.36it/s] 18it [00:04, 4.35it/s] 19it [00:04, 4.39it/s] 20it [00:04, 4.26it/s] 21it [00:05, 4.36it/s] 22it [00:05, 4.37it/s] 23it [00:05, 4.24it/s] 24it [00:05, 4.27it/s] 25it [00:05, 4.38it/s] 26it [00:06, 4.47it/s] 27it [00:06, 4.46it/s] 28it [00:06, 4.39it/s] 29it [00:06, 4.38it/s] 30it [00:07, 4.47it/s] 31it [00:07, 4.55it/s] 32it [00:07, 4.58it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.50it/s] 35it [00:08, 4.32it/s] 36it [00:08, 4.29it/s] 37it [00:08, 4.32it/s] 38it [00:08, 4.41it/s] 39it [00:09, 4.48it/s] 40it [00:09, 4.40it/s] 41it [00:09, 4.33it/s] 42it [00:09, 4.36it/s] 43it [00:10, 4.47it/s] 44it [00:10, 4.39it/s] 45it [00:10, 4.47it/s] 46it [00:10, 4.53it/s] 47it [00:10, 4.50it/s] 48it [00:11, 4.54it/s] 49it [00:11, 4.46it/s] 50it [00:11, 4.39it/s]2025-05-25 21:55:23,723 - INFO - [Epoch 036 | Batch 0050] IWAE-loss 1841.2819 | mean log_px -0.0059 | KL -1423.28 + 51it [00:11, 4.33it/s] 52it [00:12, 4.35it/s] 53it [00:12, 4.45it/s] 54it [00:12, 4.38it/s] 55it [00:12, 4.20it/s] 56it [00:12, 4.22it/s] 57it [00:13, 4.25it/s] 58it [00:13, 4.29it/s] 59it [00:13, 4.28it/s] 60it [00:13, 4.26it/s] 61it [00:14, 4.18it/s] 62it [00:14, 4.31it/s] 63it [00:14, 4.42it/s] 64it [00:14, 4.35it/s] 65it [00:15, 4.36it/s] 66it [00:15, 4.32it/s] 67it [00:15, 4.32it/s] 68it [00:15, 4.32it/s] 69it [00:16, 4.23it/s] 70it [00:16, 4.07it/s] 71it [00:16, 4.22it/s] 72it [00:16, 4.35it/s] 73it [00:16, 4.34it/s] 74it [00:17, 4.29it/s] 75it [00:17, 4.40it/s] 76it [00:17, 4.34it/s] 77it [00:17, 4.29it/s] 78it [00:18, 4.31it/s] 79it [00:18, 4.31it/s] 80it [00:18, 4.43it/s] 81it [00:18, 4.46it/s] 82it [00:18, 4.53it/s] 83it [00:19, 4.55it/s] 84it [00:19, 4.41it/s] 85it [00:19, 4.29it/s] 86it [00:19, 4.36it/s] 87it [00:20, 4.46it/s] 88it [00:20, 4.37it/s] 89it [00:20, 4.37it/s] 90it [00:20, 4.32it/s] 91it [00:21, 4.43it/s] 92it [00:21, 4.35it/s] 93it [00:21, 4.40it/s] 94it [00:21, 4.49it/s] 95it [00:21, 4.40it/s] 96it [00:22, 4.28it/s] 97it [00:22, 4.38it/s] 98it [00:22, 4.43it/s] 99it [00:22, 4.48it/s] 100it [00:23, 4.55it/s]2025-05-25 21:55:35,207 - INFO - [Epoch 036 | Batch 0100] IWAE-loss 1601.9835 | mean log_px -0.0026 | KL -1416.70 + 101it [00:23, 4.43it/s] 102it [00:23, 4.49it/s] 103it [00:23, 4.56it/s] 104it [00:23, 4.43it/s] 105it [00:24, 4.49it/s] 106it [00:24, 4.50it/s] 107it [00:24, 4.49it/s] 108it [00:24, 4.54it/s] 109it [00:25, 4.44it/s] 110it [00:25, 4.50it/s] 111it [00:25, 4.43it/s] 112it [00:25, 4.44it/s] 113it [00:25, 4.52it/s] 114it [00:26, 4.55it/s] 115it [00:26, 4.45it/s] 116it [00:26, 4.51it/s] 117it [00:26, 4.57it/s] 118it [00:27, 4.61it/s] 119it [00:27, 4.59it/s] 120it [00:27, 4.39it/s] 121it [00:27, 4.49it/s] 122it [00:27, 4.54it/s] 123it [00:28, 4.58it/s] 124it [00:28, 4.55it/s] 125it [00:28, 4.58it/s] 126it [00:28, 4.48it/s] 127it [00:29, 4.56it/s] 128it [00:29, 4.43it/s] 129it [00:29, 4.41it/s] 130it [00:29, 4.34it/s] 131it [00:30, 4.23it/s] 132it [00:30, 4.24it/s] 133it [00:30, 4.27it/s] 134it [00:30, 4.38it/s] 135it [00:30, 4.34it/s] 136it [00:31, 4.43it/s] 137it [00:31, 4.50it/s] 138it [00:31, 4.54it/s] 139it [00:31, 4.59it/s] 140it [00:31, 4.62it/s] 141it [00:32, 4.64it/s] 142it [00:32, 4.52it/s] 143it [00:32, 4.43it/s] 144it [00:32, 4.30it/s] 145it [00:33, 4.35it/s] 146it [00:33, 4.34it/s] 147it [00:33, 4.31it/s] 148it [00:33, 4.32it/s] 149it [00:34, 4.42it/s] 150it [00:34, 4.36it/s]2025-05-25 21:55:46,465 - INFO - [Epoch 036 | Batch 0150] IWAE-loss 1938.5652 | mean log_px -0.0120 | KL -1410.55 + 151it [00:34, 4.19it/s] 152it [00:34, 4.20it/s] 153it [00:35, 4.26it/s] 154it [00:35, 4.35it/s] 155it [00:35, 4.45it/s] 156it [00:35, 4.37it/s] 157it [00:35, 4.24it/s] 158it [00:36, 4.21it/s] 159it [00:36, 4.23it/s] 160it [00:36, 4.24it/s] 161it [00:36, 4.28it/s] 162it [00:37, 4.42it/s] 163it [00:37, 4.35it/s] 164it [00:37, 4.33it/s] 165it [00:37, 4.39it/s] 166it [00:38, 4.45it/s] 167it [00:38, 4.40it/s] 168it [00:38, 4.41it/s] 169it [00:38, 4.47it/s] 170it [00:38, 4.46it/s] 171it [00:39, 4.53it/s] 172it [00:39, 4.53it/s] 173it [00:39, 4.39it/s] 174it [00:39, 4.18it/s] 175it [00:40, 4.23it/s] 176it [00:40, 4.20it/s] 177it [00:40, 4.26it/s] 178it [00:40, 4.26it/s] 179it [00:41, 4.28it/s] 180it [00:41, 4.14it/s] 181it [00:41, 4.24it/s] 182it [00:41, 4.33it/s] 183it [00:41, 4.36it/s] 184it [00:42, 4.34it/s] 185it [00:42, 4.37it/s] 186it [00:42, 4.34it/s] 187it [00:42, 4.34it/s] 188it [00:43, 4.43it/s] 189it [00:43, 4.51it/s] 190it [00:43, 4.42it/s] 191it [00:43, 4.37it/s] 192it [00:43, 4.36it/s] 193it [00:44, 4.32it/s] 194it [00:44, 4.34it/s] 195it [00:44, 4.14it/s] 196it [00:44, 4.19it/s] 196it [00:45, 4.35it/s] +2025-05-25 21:55:57,012 - INFO - Epoch: 36, Objective: tensor([1572.9171], device='cuda:0', grad_fn=), Loss: 0.004463386721909046, KL/n: 28.696121215820312 + 0it [00:00, ?it/s]2025-05-25 21:55:57,392 - INFO - [Epoch 037 | Batch 0000] IWAE-loss 1712.1151 | mean log_px -0.0071 | KL -1405.82 + 1it [00:00, 3.02it/s] 2it [00:00, 3.61it/s] 3it [00:00, 3.99it/s] 4it [00:01, 4.23it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.53it/s] 8it [00:01, 4.30it/s] 9it [00:02, 4.32it/s] 10it [00:02, 4.43it/s] 11it [00:02, 4.34it/s] 12it [00:02, 4.34it/s] 13it [00:03, 4.41it/s] 14it [00:03, 4.36it/s] 15it [00:03, 4.30it/s] 16it [00:03, 4.33it/s] 17it [00:03, 4.36it/s] 18it [00:04, 4.34it/s] 19it [00:04, 4.35it/s] 20it [00:04, 4.35it/s] 21it [00:04, 4.20it/s] 22it [00:05, 4.21it/s] 23it [00:05, 4.28it/s] 24it [00:05, 4.25it/s] 25it [00:05, 4.36it/s] 26it [00:06, 4.40it/s] 27it [00:06, 4.34it/s] 28it [00:06, 4.34it/s] 29it [00:06, 4.30it/s] 30it [00:07, 4.25it/s] 31it [00:07, 4.27it/s] 32it [00:07, 4.24it/s] 33it [00:07, 4.26it/s] 34it [00:07, 4.34it/s] 35it [00:08, 4.29it/s] 36it [00:08, 4.38it/s] 37it [00:08, 4.45it/s] 38it [00:08, 4.36it/s] 39it [00:09, 4.44it/s] 40it [00:09, 4.47it/s] 41it [00:09, 4.51it/s] 42it [00:09, 4.53it/s] 43it [00:09, 4.42it/s] 44it [00:10, 4.38it/s] 45it [00:10, 4.47it/s] 46it [00:10, 4.39it/s] 47it [00:10, 4.34it/s] 48it [00:11, 4.38it/s] 49it [00:11, 4.33it/s] 50it [00:11, 4.39it/s]2025-05-25 21:56:08,852 - INFO - [Epoch 037 | Batch 0050] IWAE-loss 1829.0848 | mean log_px -0.0077 | KL -1399.44 + 51it [00:11, 4.45it/s] 52it [00:11, 4.44it/s] 53it [00:12, 4.52it/s] 54it [00:12, 4.56it/s] 55it [00:12, 4.42it/s] 56it [00:12, 4.35it/s] 57it [00:13, 4.31it/s] 58it [00:13, 4.29it/s] 59it [00:13, 4.18it/s] 60it [00:13, 4.32it/s] 61it [00:14, 4.29it/s] 62it [00:14, 4.39it/s] 63it [00:14, 4.23it/s] 64it [00:14, 4.14it/s] 65it [00:15, 4.23it/s] 66it [00:15, 4.33it/s] 67it [00:15, 4.33it/s] 68it [00:15, 4.42it/s] 69it [00:15, 4.42it/s] 70it [00:16, 4.24it/s] 71it [00:16, 4.23it/s] 72it [00:16, 4.29it/s] 73it [00:16, 4.25it/s] 74it [00:17, 4.27it/s] 75it [00:17, 4.19it/s] 76it [00:17, 4.27it/s] 77it [00:17, 4.27it/s] 78it [00:18, 4.27it/s] 79it [00:18, 4.33it/s] 80it [00:18, 4.37it/s] 81it [00:18, 4.45it/s] 82it [00:18, 4.34it/s] 83it [00:19, 4.31it/s] 84it [00:19, 4.31it/s] 85it [00:19, 4.33it/s] 86it [00:19, 4.17it/s] 87it [00:20, 4.31it/s] 88it [00:20, 4.38it/s] 89it [00:20, 4.45it/s] 90it [00:20, 4.50it/s] 91it [00:21, 4.52it/s] 92it [00:21, 4.54it/s] 93it [00:21, 4.46it/s] 94it [00:21, 4.41it/s] 95it [00:21, 4.41it/s] 96it [00:22, 4.35it/s] 97it [00:22, 4.38it/s] 98it [00:22, 4.42it/s] 99it [00:22, 4.24it/s] 100it [00:23, 4.21it/s]2025-05-25 21:56:20,409 - INFO - [Epoch 037 | Batch 0100] IWAE-loss 1828.0680 | mean log_px -0.0090 | KL -1395.64 + 101it [00:23, 4.25it/s] 102it [00:23, 4.30it/s] 103it [00:23, 4.35it/s] 104it [00:24, 4.35it/s] 105it [00:24, 4.34it/s] 106it [00:24, 4.44it/s] 107it [00:24, 4.40it/s] 108it [00:24, 4.44it/s] 109it [00:25, 4.28it/s] 110it [00:25, 4.30it/s] 111it [00:25, 4.35it/s] 112it [00:25, 4.44it/s] 113it [00:26, 4.46it/s] 114it [00:26, 4.50it/s] 115it [00:26, 4.55it/s] 116it [00:26, 4.45it/s] 117it [00:26, 4.41it/s] 118it [00:27, 4.38it/s] 119it [00:27, 4.41it/s] 120it [00:27, 4.45it/s] 121it [00:27, 4.53it/s] 122it [00:28, 4.42it/s] 123it [00:28, 4.41it/s] 124it [00:28, 4.34it/s] 125it [00:28, 4.38it/s] 126it [00:28, 4.35it/s] 127it [00:29, 4.39it/s] 128it [00:29, 4.37it/s] 129it [00:29, 4.43it/s] 130it [00:29, 4.29it/s] 131it [00:30, 4.28it/s] 132it [00:30, 4.30it/s] 133it [00:30, 4.40it/s] 134it [00:30, 4.49it/s] 135it [00:31, 4.40it/s] 136it [00:31, 4.44it/s] 137it [00:31, 4.53it/s] 138it [00:31, 4.55it/s] 139it [00:31, 4.45it/s] 140it [00:32, 4.51it/s] 141it [00:32, 4.57it/s] 142it [00:32, 4.61it/s] 143it [00:32, 4.48it/s] 144it [00:33, 4.42it/s] 145it [00:33, 4.42it/s] 146it [00:33, 4.36it/s] 147it [00:33, 4.23it/s] 148it [00:33, 4.23it/s] 149it [00:34, 4.28it/s] 150it [00:34, 4.32it/s]2025-05-25 21:56:31,765 - INFO - [Epoch 037 | Batch 0150] IWAE-loss 2035.0342 | mean log_px -0.0140 | KL -1391.93 + 151it [00:34, 4.30it/s] 152it [00:34, 4.40it/s] 153it [00:35, 4.37it/s] 154it [00:35, 4.17it/s] 155it [00:35, 4.24it/s] 156it [00:35, 4.23it/s] 157it [00:36, 4.28it/s] 158it [00:36, 4.36it/s] 159it [00:36, 4.33it/s] 160it [00:36, 4.33it/s] 161it [00:36, 4.33it/s] 162it [00:37, 4.42it/s] 163it [00:37, 4.51it/s] 164it [00:37, 4.56it/s] 165it [00:37, 4.53it/s] 166it [00:38, 4.57it/s] 167it [00:38, 4.62it/s] 168it [00:38, 4.63it/s] 169it [00:38, 4.65it/s] 170it [00:38, 4.51it/s] 171it [00:39, 4.46it/s] 172it [00:39, 4.54it/s] 173it [00:39, 4.50it/s] 174it [00:39, 4.43it/s] 175it [00:40, 4.44it/s] 176it [00:40, 4.51it/s] 177it [00:40, 4.54it/s] 178it [00:40, 4.59it/s] 179it [00:40, 4.46it/s] 180it [00:41, 4.31it/s] 181it [00:41, 4.44it/s] 182it [00:41, 4.41it/s] 183it [00:41, 4.51it/s] 184it [00:42, 4.54it/s] 185it [00:42, 4.60it/s] 186it [00:42, 4.47it/s] 187it [00:42, 4.32it/s] 188it [00:42, 4.43it/s] 189it [00:43, 4.39it/s] 190it [00:43, 4.51it/s] 191it [00:43, 4.42it/s] 192it [00:43, 4.30it/s] 193it [00:44, 4.32it/s] 194it [00:44, 4.33it/s] 195it [00:44, 4.34it/s] 196it [00:44, 4.40it/s] 196it [00:44, 4.37it/s] +2025-05-25 21:56:42,037 - INFO - Epoch: 37, Objective: tensor([1723.5656], device='cuda:0', grad_fn=), Loss: 0.004755986854434013, KL/n: 28.372997283935547 + 0it [00:00, ?it/s]2025-05-25 21:56:42,621 - INFO - [Epoch 038 | Batch 0000] IWAE-loss 1650.8577 | mean log_px -0.0084 | KL -1389.24 + 1it [00:00, 3.11it/s] 2it [00:00, 3.52it/s] 3it [00:00, 4.00it/s] 4it [00:01, 4.22it/s] 5it [00:01, 4.24it/s] 6it [00:01, 4.23it/s] 7it [00:01, 4.24it/s] 8it [00:01, 4.14it/s] 9it [00:02, 4.19it/s] 10it [00:02, 4.21it/s] 11it [00:02, 4.21it/s] 12it [00:02, 4.26it/s] 13it [00:03, 4.23it/s] 14it [00:03, 4.36it/s] 15it [00:03, 4.34it/s] 16it [00:03, 4.37it/s] 17it [00:04, 4.36it/s] 18it [00:04, 4.33it/s] 19it [00:04, 4.24it/s] 20it [00:04, 4.38it/s] 21it [00:04, 4.41it/s] 22it [00:05, 4.38it/s] 23it [00:05, 4.40it/s] 24it [00:05, 4.35it/s] 25it [00:05, 4.22it/s] 26it [00:06, 4.37it/s] 27it [00:06, 4.37it/s] 28it [00:06, 4.38it/s] 29it [00:06, 4.40it/s] 30it [00:07, 4.25it/s] 31it [00:07, 4.29it/s] 32it [00:07, 4.28it/s] 33it [00:07, 4.28it/s] 34it [00:07, 4.28it/s] 35it [00:08, 4.36it/s] 36it [00:08, 4.30it/s] 37it [00:08, 4.28it/s] 38it [00:08, 4.28it/s] 39it [00:09, 4.39it/s] 40it [00:09, 4.46it/s] 41it [00:09, 4.39it/s] 42it [00:09, 4.38it/s] 43it [00:10, 4.47it/s] 44it [00:10, 4.44it/s] 45it [00:10, 4.41it/s] 46it [00:10, 4.48it/s] 47it [00:10, 4.40it/s] 48it [00:11, 4.28it/s] 49it [00:11, 4.35it/s] 50it [00:11, 4.45it/s]2025-05-25 21:56:54,134 - INFO - [Epoch 038 | Batch 0050] IWAE-loss 1416.7461 | mean log_px -0.0029 | KL -1381.36 + 51it [00:11, 4.48it/s] 52it [00:12, 4.40it/s] 53it [00:12, 4.45it/s] 54it [00:12, 4.52it/s] 55it [00:12, 4.40it/s] 56it [00:12, 4.33it/s] 57it [00:13, 4.35it/s] 58it [00:13, 4.40it/s] 59it [00:13, 4.47it/s] 60it [00:13, 4.53it/s] 61it [00:14, 4.42it/s] 62it [00:14, 4.28it/s] 63it [00:14, 4.27it/s] 64it [00:14, 4.36it/s] 65it [00:15, 4.45it/s] 66it [00:15, 4.49it/s] 67it [00:15, 4.41it/s] 68it [00:15, 4.37it/s] 69it [00:15, 4.37it/s] 70it [00:16, 4.36it/s] 71it [00:16, 4.36it/s] 72it [00:16, 4.45it/s] 73it [00:16, 4.37it/s] 74it [00:17, 4.33it/s] 75it [00:17, 4.37it/s] 76it [00:17, 4.44it/s] 77it [00:17, 4.35it/s] 78it [00:17, 4.35it/s] 79it [00:18, 4.36it/s] 80it [00:18, 4.31it/s] 81it [00:18, 4.31it/s] 82it [00:18, 4.30it/s] 83it [00:19, 4.35it/s] 84it [00:19, 4.42it/s] 85it [00:19, 4.37it/s] 86it [00:19, 4.32it/s] 87it [00:20, 4.34it/s] 88it [00:20, 4.39it/s] 89it [00:20, 4.35it/s] 90it [00:20, 4.20it/s] 91it [00:21, 4.25it/s] 92it [00:21, 4.23it/s] 93it [00:21, 4.34it/s] 94it [00:21, 4.42it/s] 95it [00:21, 4.35it/s] 96it [00:22, 4.24it/s] 97it [00:22, 4.34it/s] 98it [00:22, 4.31it/s] 99it [00:22, 4.28it/s] 100it [00:23, 4.29it/s]2025-05-25 21:57:05,608 - INFO - [Epoch 038 | Batch 0100] IWAE-loss 1494.8090 | mean log_px -0.0030 | KL -1374.98 + 101it [00:23, 4.23it/s] 102it [00:23, 4.36it/s] 103it [00:23, 4.33it/s] 104it [00:23, 4.40it/s] 105it [00:24, 4.36it/s] 106it [00:24, 4.38it/s] 107it [00:24, 4.46it/s] 108it [00:24, 4.45it/s] 109it [00:25, 4.41it/s] 110it [00:25, 4.45it/s] 111it [00:25, 4.52it/s] 112it [00:25, 4.41it/s] 113it [00:26, 4.40it/s] 114it [00:26, 4.34it/s] 115it [00:26, 4.22it/s] 116it [00:26, 4.35it/s] 117it [00:26, 4.44it/s] 118it [00:27, 4.48it/s] 119it [00:27, 4.40it/s] 120it [00:27, 4.47it/s] 121it [00:27, 4.48it/s] 122it [00:28, 4.41it/s] 123it [00:28, 4.46it/s] 124it [00:28, 4.51it/s] 125it [00:28, 4.56it/s] 126it [00:28, 4.56it/s] 127it [00:29, 4.47it/s] 128it [00:29, 4.43it/s] 129it [00:29, 4.26it/s] 130it [00:29, 4.35it/s] 131it [00:30, 4.44it/s] 132it [00:30, 4.36it/s] 133it [00:30, 4.36it/s] 134it [00:30, 4.21it/s] 135it [00:31, 4.22it/s] 136it [00:31, 4.16it/s] 137it [00:31, 4.24it/s] 138it [00:31, 4.23it/s] 139it [00:31, 4.31it/s] 140it [00:32, 4.36it/s] 141it [00:32, 4.41it/s] 142it [00:32, 4.47it/s] 143it [00:32, 4.48it/s] 144it [00:33, 4.41it/s] 145it [00:33, 4.41it/s] 146it [00:33, 4.43it/s] 147it [00:33, 4.36it/s] 148it [00:34, 4.34it/s] 149it [00:34, 4.30it/s] 150it [00:34, 4.29it/s]2025-05-25 21:57:17,037 - INFO - [Epoch 038 | Batch 0150] IWAE-loss 2008.2279 | mean log_px -0.0121 | KL -1368.49 + 151it [00:34, 4.26it/s] 152it [00:34, 4.30it/s] 153it [00:35, 4.31it/s] 154it [00:35, 4.29it/s] 155it [00:35, 4.28it/s] 156it [00:35, 4.28it/s] 157it [00:36, 4.27it/s] 158it [00:36, 4.29it/s] 159it [00:36, 4.32it/s] 160it [00:36, 4.37it/s] 161it [00:37, 4.34it/s] 162it [00:37, 4.35it/s] 163it [00:37, 4.41it/s] 164it [00:37, 4.36it/s] 165it [00:37, 4.34it/s] 166it [00:38, 4.35it/s] 167it [00:38, 4.28it/s] 168it [00:38, 4.30it/s] 169it [00:38, 4.28it/s] 170it [00:39, 4.30it/s] 171it [00:39, 4.28it/s] 172it [00:39, 4.27it/s] 173it [00:39, 4.38it/s] 174it [00:40, 4.42it/s] 175it [00:40, 4.33it/s] 176it [00:40, 4.37it/s] 177it [00:40, 4.33it/s] 178it [00:40, 4.39it/s] 179it [00:41, 4.47it/s] 180it [00:41, 4.50it/s] 181it [00:41, 4.36it/s] 182it [00:41, 4.34it/s] 183it [00:42, 4.44it/s] 184it [00:42, 4.44it/s] 185it [00:42, 4.42it/s] 186it [00:42, 4.39it/s] 187it [00:43, 4.35it/s] 188it [00:43, 4.36it/s] 189it [00:43, 4.46it/s] 190it [00:43, 4.41it/s] 191it [00:43, 4.30it/s] 192it [00:44, 4.29it/s] 193it [00:44, 4.32it/s] 194it [00:44, 4.35it/s] 195it [00:44, 4.32it/s] 196it [00:45, 4.36it/s] 196it [00:45, 4.34it/s] +2025-05-25 21:57:27,508 - INFO - Epoch: 38, Objective: tensor([1541.9781], device='cuda:0', grad_fn=), Loss: 0.006994233466684818, KL/n: 27.92793846130371 + 0it [00:00, ?it/s]2025-05-25 21:57:27,907 - INFO - [Epoch 039 | Batch 0000] IWAE-loss 2019.2355 | mean log_px -0.0157 | KL -1369.24 + 1it [00:00, 2.82it/s] 2it [00:00, 3.63it/s] 3it [00:00, 4.04it/s] 4it [00:01, 4.09it/s] 5it [00:01, 4.15it/s] 6it [00:01, 4.15it/s] 7it [00:01, 4.31it/s] 8it [00:02, 3.40it/s] 9it [00:02, 3.58it/s] 10it [00:02, 3.75it/s] 11it [00:02, 3.93it/s] 12it [00:03, 4.10it/s] 13it [00:03, 4.27it/s] 14it [00:03, 4.36it/s] 15it [00:03, 4.45it/s] 16it [00:03, 4.38it/s] 17it [00:04, 4.41it/s] 18it [00:04, 4.22it/s] 19it [00:04, 4.24it/s] 20it [00:04, 4.23it/s] 21it [00:05, 4.27it/s] 22it [00:05, 4.38it/s] 23it [00:05, 4.38it/s] 24it [00:05, 4.35it/s] 25it [00:06, 4.40it/s] 26it [00:06, 4.36it/s] 27it [00:06, 4.43it/s] 28it [00:06, 4.50it/s] 29it [00:06, 4.55it/s] 30it [00:07, 4.43it/s] 31it [00:07, 4.49it/s] 32it [00:07, 4.53it/s] 33it [00:07, 4.58it/s] 34it [00:08, 4.61it/s] 35it [00:08, 4.64it/s] 36it [00:08, 4.41it/s] 37it [00:08, 4.39it/s] 38it [00:08, 4.45it/s] 39it [00:09, 4.51it/s] 40it [00:09, 4.56it/s] 41it [00:09, 4.60it/s] 42it [00:09, 4.47it/s] 43it [00:10, 4.49it/s] 44it [00:10, 4.56it/s] 45it [00:10, 4.54it/s] 46it [00:10, 4.57it/s] 47it [00:10, 4.41it/s] 48it [00:11, 4.50it/s] 49it [00:11, 4.41it/s] 50it [00:11, 4.41it/s]2025-05-25 21:57:39,417 - INFO - [Epoch 039 | Batch 0050] IWAE-loss 1660.3208 | mean log_px -0.0043 | KL -1355.90 + 51it [00:11, 4.36it/s] 52it [00:12, 4.38it/s] 53it [00:12, 4.48it/s] 54it [00:12, 4.50it/s] 55it [00:12, 4.43it/s] 56it [00:12, 4.49it/s] 57it [00:13, 4.38it/s] 58it [00:13, 4.44it/s] 59it [00:13, 4.38it/s] 60it [00:13, 4.35it/s] 61it [00:14, 4.31it/s] 62it [00:14, 4.18it/s] 63it [00:14, 4.31it/s] 64it [00:14, 4.42it/s] 65it [00:15, 4.49it/s] 66it [00:15, 4.55it/s] 67it [00:15, 4.53it/s] 68it [00:15, 4.43it/s] 69it [00:15, 4.30it/s] 70it [00:16, 4.31it/s] 71it [00:16, 4.42it/s] 72it [00:16, 4.41it/s] 73it [00:16, 4.51it/s] 74it [00:17, 4.41it/s] 75it [00:17, 4.47it/s] 76it [00:17, 4.33it/s] 77it [00:17, 4.41it/s] 78it [00:17, 4.49it/s] 79it [00:18, 4.52it/s] 80it [00:18, 4.56it/s] 81it [00:18, 4.58it/s] 82it [00:18, 4.49it/s] 83it [00:19, 4.57it/s] 84it [00:19, 4.60it/s] 85it [00:19, 4.63it/s] 86it [00:19, 4.59it/s] 87it [00:19, 4.62it/s] 88it [00:20, 4.64it/s] 89it [00:20, 4.66it/s] 90it [00:20, 4.67it/s] 91it [00:20, 4.51it/s] 92it [00:21, 4.36it/s] 93it [00:21, 4.38it/s] 94it [00:21, 4.31it/s] 95it [00:21, 4.29it/s] 96it [00:21, 4.27it/s] 97it [00:22, 4.27it/s] 98it [00:22, 4.28it/s] 99it [00:22, 4.41it/s] 100it [00:22, 4.31it/s]2025-05-25 21:57:50,678 - INFO - [Epoch 039 | Batch 0100] IWAE-loss 2246.3765 | mean log_px -0.0212 | KL -1355.14 + 101it [00:23, 4.43it/s] 102it [00:23, 4.49it/s] 103it [00:23, 4.51it/s] 104it [00:23, 4.56it/s] 105it [00:23, 4.61it/s] 106it [00:24, 4.63it/s] 107it [00:24, 4.44it/s] 108it [00:24, 4.38it/s] 109it [00:24, 4.34it/s] 110it [00:25, 4.32it/s] 111it [00:25, 4.44it/s] 112it [00:25, 4.46it/s] 113it [00:25, 4.51it/s] 114it [00:26, 4.43it/s] 115it [00:26, 4.42it/s] 116it [00:26, 4.34it/s] 117it [00:26, 4.34it/s] 118it [00:26, 4.37it/s] 119it [00:27, 4.45it/s] 120it [00:27, 4.52it/s] 121it [00:27, 4.34it/s] 122it [00:27, 4.32it/s] 123it [00:28, 4.38it/s] 124it [00:28, 4.35it/s] 125it [00:28, 4.37it/s] 126it [00:28, 4.32it/s] 127it [00:28, 4.35it/s] 128it [00:29, 4.37it/s] 129it [00:29, 4.41it/s] 130it [00:29, 4.34it/s] 131it [00:29, 4.32it/s] 132it [00:30, 4.34it/s] 133it [00:30, 4.34it/s] 134it [00:30, 4.34it/s] 135it [00:30, 4.24it/s] 136it [00:31, 4.35it/s] 137it [00:31, 4.45it/s] 138it [00:31, 4.52it/s] 139it [00:31, 4.57it/s] 140it [00:31, 4.46it/s] 141it [00:32, 4.35it/s] 142it [00:32, 4.31it/s] 143it [00:32, 4.34it/s] 144it [00:32, 4.31it/s] 145it [00:33, 4.42it/s] 146it [00:33, 4.48it/s] 147it [00:33, 4.42it/s] 148it [00:33, 4.35it/s] 149it [00:34, 4.24it/s] 150it [00:34, 4.37it/s]2025-05-25 21:58:02,062 - INFO - [Epoch 039 | Batch 0150] IWAE-loss 1432.8291 | mean log_px -0.0022 | KL -1358.02 + 151it [00:34, 4.31it/s] 152it [00:34, 4.41it/s] 153it [00:34, 4.41it/s] 154it [00:35, 4.29it/s] 155it [00:35, 4.40it/s] 156it [00:35, 4.34it/s] 157it [00:35, 4.31it/s] 158it [00:36, 4.36it/s] 159it [00:36, 4.45it/s] 160it [00:36, 4.41it/s] 161it [00:36, 4.23it/s] 162it [00:37, 4.27it/s] 163it [00:37, 4.37it/s] 164it [00:37, 4.43it/s] 165it [00:37, 4.41it/s] 166it [00:37, 4.37it/s] 167it [00:38, 4.37it/s] 168it [00:38, 4.34it/s] 169it [00:38, 4.32it/s] 170it [00:38, 4.39it/s] 171it [00:39, 4.48it/s] 172it [00:39, 4.55it/s] 173it [00:39, 4.34it/s] 174it [00:39, 4.39it/s] 175it [00:39, 4.37it/s] 176it [00:40, 4.31it/s] 177it [00:40, 4.34it/s] 178it [00:40, 4.39it/s] 179it [00:40, 4.42it/s] 180it [00:41, 4.45it/s] 181it [00:41, 4.45it/s] 182it [00:41, 4.42it/s] 183it [00:41, 4.29it/s] 184it [00:42, 4.36it/s] 185it [00:42, 4.43it/s] 186it [00:42, 4.50it/s] 187it [00:42, 4.53it/s] 188it [00:42, 4.47it/s] 189it [00:43, 4.47it/s] 190it [00:43, 4.52it/s] 191it [00:43, 4.58it/s] 192it [00:43, 4.61it/s] 193it [00:43, 4.64it/s] 194it [00:44, 4.49it/s] 195it [00:44, 4.21it/s] 196it [00:44, 4.37it/s] 196it [00:44, 4.38it/s] +2025-05-25 21:58:12,405 - INFO - Epoch: 39, Objective: tensor([1496.1766], device='cuda:0', grad_fn=), Loss: 0.00248352880589664, KL/n: 27.671977996826172 + 0it [00:00, ?it/s]2025-05-25 21:58:12,802 - INFO - [Epoch 040 | Batch 0000] IWAE-loss 1431.6737 | mean log_px -0.0017 | KL -1354.64 + 1it [00:00, 3.04it/s] 2it [00:00, 3.77it/s] 3it [00:00, 4.14it/s] 4it [00:00, 4.25it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.42it/s] 7it [00:01, 4.51it/s] 8it [00:01, 4.43it/s] 9it [00:02, 4.42it/s] 10it [00:02, 4.39it/s] 11it [00:02, 4.39it/s] 12it [00:02, 4.18it/s] 13it [00:03, 4.33it/s] 14it [00:03, 4.29it/s] 15it [00:03, 4.28it/s] 16it [00:03, 4.17it/s] 17it [00:03, 4.20it/s] 18it [00:04, 4.32it/s] 19it [00:04, 4.41it/s] 20it [00:04, 4.41it/s] 21it [00:04, 4.36it/s] 22it [00:05, 4.46it/s] 23it [00:05, 4.44it/s] 24it [00:05, 4.39it/s] 25it [00:05, 4.38it/s] 26it [00:06, 4.47it/s] 27it [00:06, 4.43it/s] 28it [00:06, 4.40it/s] 29it [00:06, 4.50it/s] 30it [00:06, 4.45it/s] 31it [00:07, 4.46it/s] 32it [00:07, 4.30it/s] 33it [00:07, 4.34it/s] 34it [00:07, 4.30it/s] 35it [00:08, 4.32it/s] 36it [00:08, 4.33it/s] 37it [00:08, 4.40it/s] 38it [00:08, 4.22it/s] 39it [00:09, 4.32it/s] 40it [00:09, 4.40it/s] 41it [00:09, 4.46it/s] 42it [00:09, 4.34it/s] 43it [00:09, 4.44it/s] 44it [00:10, 4.47it/s] 45it [00:10, 4.36it/s] 46it [00:10, 4.33it/s] 47it [00:10, 4.37it/s] 48it [00:11, 4.42it/s] 49it [00:11, 4.38it/s] 50it [00:11, 4.03it/s]2025-05-25 21:58:24,258 - INFO - [Epoch 040 | Batch 0050] IWAE-loss 1473.0669 | mean log_px -0.0033 | KL -1345.21 + 51it [00:11, 4.17it/s] 52it [00:12, 4.16it/s] 53it [00:12, 4.11it/s] 54it [00:12, 4.09it/s] 55it [00:12, 4.12it/s] 56it [00:12, 4.27it/s] 57it [00:13, 4.37it/s] 58it [00:13, 4.38it/s] 59it [00:13, 4.25it/s] 60it [00:13, 4.25it/s] 61it [00:14, 4.38it/s] 62it [00:14, 4.35it/s] 63it [00:14, 4.28it/s] 64it [00:14, 4.27it/s] 65it [00:15, 4.27it/s] 66it [00:15, 4.26it/s] 67it [00:15, 4.22it/s] 68it [00:15, 4.24it/s] 69it [00:16, 4.27it/s] 70it [00:16, 4.29it/s] 71it [00:16, 4.39it/s] 72it [00:16, 4.34it/s] 73it [00:16, 4.31it/s] 74it [00:17, 4.16it/s] 75it [00:17, 4.21it/s] 76it [00:17, 4.24it/s] 77it [00:17, 4.26it/s] 78it [00:18, 4.25it/s] 79it [00:18, 4.28it/s] 80it [00:18, 4.22it/s] 81it [00:18, 4.26it/s] 82it [00:19, 4.28it/s] 83it [00:19, 4.29it/s] 84it [00:19, 4.21it/s] 85it [00:19, 4.26it/s] 86it [00:19, 4.25it/s] 87it [00:20, 4.27it/s] 88it [00:20, 4.23it/s] 89it [00:20, 4.22it/s] 90it [00:20, 4.25it/s] 91it [00:21, 4.35it/s] 92it [00:21, 4.34it/s] 93it [00:21, 4.34it/s] 94it [00:21, 4.22it/s] 95it [00:22, 4.23it/s] 96it [00:22, 4.29it/s] 97it [00:22, 4.33it/s] 98it [00:22, 4.40it/s] 99it [00:22, 4.46it/s] 100it [00:23, 4.40it/s]2025-05-25 21:58:35,927 - INFO - [Epoch 040 | Batch 0100] IWAE-loss 1605.0006 | mean log_px -0.0037 | KL -1343.43 + 101it [00:23, 4.42it/s] 102it [00:23, 4.41it/s] 103it [00:23, 4.49it/s] 104it [00:24, 4.31it/s] 105it [00:24, 4.32it/s] 106it [00:24, 4.29it/s] 107it [00:24, 4.34it/s] 108it [00:25, 4.31it/s] 109it [00:25, 4.24it/s] 110it [00:25, 4.38it/s] 111it [00:25, 4.47it/s] 112it [00:25, 4.53it/s] 113it [00:26, 4.44it/s] 114it [00:26, 4.39it/s] 115it [00:26, 4.51it/s] 116it [00:26, 4.56it/s] 117it [00:27, 4.60it/s] 118it [00:27, 4.50it/s] 119it [00:27, 4.43it/s] 120it [00:27, 4.35it/s] 121it [00:27, 4.34it/s] 122it [00:28, 4.34it/s] 123it [00:28, 4.31it/s] 124it [00:28, 4.30it/s] 125it [00:28, 4.20it/s] 126it [00:29, 4.21it/s] 127it [00:29, 4.25it/s] 128it [00:29, 4.11it/s] 129it [00:29, 4.20it/s] 130it [00:30, 4.32it/s] 131it [00:30, 4.30it/s] 132it [00:30, 4.30it/s] 133it [00:30, 4.33it/s] 134it [00:31, 4.26it/s] 135it [00:31, 4.27it/s] 136it [00:31, 4.38it/s] 137it [00:31, 4.39it/s] 138it [00:31, 4.40it/s] 139it [00:32, 4.40it/s] 140it [00:32, 4.38it/s] 141it [00:32, 4.47it/s] 142it [00:32, 4.25it/s] 143it [00:33, 4.29it/s] 144it [00:33, 4.28it/s] 145it [00:33, 4.37it/s] 146it [00:33, 4.45it/s] 147it [00:34, 4.37it/s] 148it [00:34, 4.36it/s] 149it [00:34, 4.38it/s] 150it [00:34, 4.45it/s]2025-05-25 21:58:47,410 - INFO - [Epoch 040 | Batch 0150] IWAE-loss 1694.4125 | mean log_px -0.0137 | KL -1343.96 + 151it [00:34, 4.25it/s] 152it [00:35, 4.18it/s] 153it [00:35, 4.18it/s] 154it [00:35, 4.30it/s] 155it [00:35, 4.32it/s] 156it [00:36, 4.39it/s] 157it [00:36, 4.47it/s] 158it [00:36, 4.39it/s] 159it [00:36, 4.20it/s] 160it [00:37, 4.22it/s] 161it [00:37, 4.31it/s] 162it [00:37, 4.28it/s] 163it [00:37, 4.40it/s] 164it [00:37, 4.46it/s] 165it [00:38, 4.44it/s] 166it [00:38, 4.36it/s] 167it [00:38, 4.36it/s] 168it [00:38, 4.41it/s] 169it [00:39, 4.48it/s] 170it [00:39, 4.44it/s] 171it [00:39, 4.37it/s] 172it [00:39, 4.44it/s] 173it [00:39, 4.40it/s] 174it [00:40, 4.45it/s] 175it [00:40, 4.40it/s] 176it [00:40, 4.47it/s] 177it [00:40, 4.41it/s] 178it [00:41, 4.43it/s] 179it [00:41, 4.50it/s] 180it [00:41, 4.53it/s] 181it [00:41, 4.43it/s] 182it [00:42, 4.33it/s] 183it [00:42, 4.33it/s] 184it [00:42, 4.29it/s] 185it [00:42, 4.33it/s] 186it [00:42, 4.31it/s] 187it [00:43, 4.28it/s] 188it [00:43, 4.25it/s] 189it [00:43, 4.27it/s] 190it [00:43, 4.29it/s] 191it [00:44, 4.28it/s] 192it [00:44, 4.28it/s] 193it [00:44, 4.39it/s] 194it [00:44, 4.28it/s] 195it [00:45, 4.14it/s] 196it [00:45, 4.30it/s] 196it [00:45, 4.32it/s] +2025-05-25 21:58:57,885 - INFO - Epoch: 40, Objective: tensor([1448.3232], device='cuda:0', grad_fn=), Loss: 0.0037635706830769777, KL/n: 27.25246238708496 + 0it [00:00, ?it/s]2025-05-25 21:58:58,468 - INFO - [Epoch 041 | Batch 0000] IWAE-loss 1551.8910 | mean log_px -0.0058 | KL -1334.23 + 1it [00:00, 2.97it/s] 2it [00:00, 3.79it/s] 3it [00:00, 4.11it/s] 4it [00:00, 4.24it/s] 5it [00:01, 4.27it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.31it/s] 8it [00:01, 4.32it/s] 9it [00:02, 4.34it/s] 10it [00:02, 4.17it/s] 11it [00:02, 4.16it/s] 12it [00:02, 4.21it/s] 13it [00:03, 4.21it/s] 14it [00:03, 4.32it/s] 15it [00:03, 4.33it/s] 16it [00:03, 4.31it/s] 17it [00:04, 4.39it/s] 18it [00:04, 4.18it/s] 19it [00:04, 4.20it/s] 20it [00:04, 4.18it/s] 21it [00:04, 4.21it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.28it/s] 24it [00:05, 4.25it/s] 25it [00:05, 4.27it/s] 26it [00:06, 4.14it/s] 27it [00:06, 4.26it/s] 28it [00:06, 4.29it/s] 29it [00:06, 4.40it/s] 30it [00:07, 4.31it/s] 31it [00:07, 4.31it/s] 32it [00:07, 4.14it/s] 33it [00:07, 4.18it/s] 34it [00:08, 4.28it/s] 35it [00:08, 4.34it/s] 36it [00:08, 4.31it/s] 37it [00:08, 4.41it/s] 38it [00:08, 4.47it/s] 39it [00:09, 4.39it/s] 40it [00:09, 4.33it/s] 41it [00:09, 4.18it/s] 42it [00:09, 4.20it/s] 43it [00:10, 4.24it/s] 44it [00:10, 4.27it/s] 45it [00:10, 4.27it/s] 46it [00:10, 4.27it/s] 47it [00:11, 4.34it/s] 48it [00:11, 4.28it/s] 49it [00:11, 4.27it/s] 50it [00:11, 4.31it/s]2025-05-25 21:59:10,111 - INFO - [Epoch 041 | Batch 0050] IWAE-loss 1382.9540 | mean log_px -0.0018 | KL -1326.47 + 51it [00:11, 4.29it/s] 52it [00:12, 4.27it/s] 53it [00:12, 4.26it/s] 54it [00:12, 4.36it/s] 55it [00:12, 4.39it/s] 56it [00:13, 4.31it/s] 57it [00:13, 4.32it/s] 58it [00:13, 4.39it/s] 59it [00:13, 4.40it/s] 60it [00:14, 4.46it/s] 61it [00:14, 4.50it/s] 62it [00:14, 4.45it/s] 63it [00:14, 4.49it/s] 64it [00:14, 4.47it/s] 65it [00:15, 4.34it/s] 66it [00:15, 4.40it/s] 67it [00:15, 4.34it/s] 68it [00:15, 4.34it/s] 69it [00:16, 4.44it/s] 70it [00:16, 4.37it/s] 71it [00:16, 4.43it/s] 72it [00:16, 4.34it/s] 73it [00:16, 4.33it/s] 74it [00:17, 4.17it/s] 75it [00:17, 4.18it/s] 76it [00:17, 4.29it/s] 77it [00:17, 4.39it/s] 78it [00:18, 4.30it/s] 79it [00:18, 4.32it/s] 80it [00:18, 4.32it/s] 81it [00:18, 4.42it/s] 82it [00:19, 4.38it/s] 83it [00:19, 4.45it/s] 84it [00:19, 4.49it/s] 85it [00:19, 4.53it/s] 86it [00:19, 4.39it/s] 87it [00:20, 4.38it/s] 88it [00:20, 4.30it/s] 89it [00:20, 4.39it/s] 90it [00:20, 4.14it/s] 91it [00:21, 4.23it/s] 92it [00:21, 4.20it/s] 93it [00:21, 4.22it/s] 94it [00:21, 4.18it/s] 95it [00:22, 4.19it/s] 96it [00:22, 4.27it/s] 97it [00:22, 4.25it/s] 98it [00:22, 4.29it/s] 99it [00:23, 4.29it/s] 100it [00:23, 4.21it/s]2025-05-25 21:59:21,660 - INFO - [Epoch 041 | Batch 0100] IWAE-loss 1411.5579 | mean log_px -0.0019 | KL -1321.44 + 101it [00:23, 4.21it/s] 102it [00:23, 4.31it/s] 103it [00:23, 4.36it/s] 104it [00:24, 4.18it/s] 105it [00:24, 4.20it/s] 106it [00:24, 4.32it/s] 107it [00:24, 4.34it/s] 108it [00:25, 4.41it/s] 109it [00:25, 4.47it/s] 110it [00:25, 4.36it/s] 111it [00:25, 4.45it/s] 112it [00:26, 4.46it/s] 113it [00:26, 4.29it/s] 114it [00:26, 4.33it/s] 115it [00:26, 4.41it/s] 116it [00:26, 4.27it/s] 117it [00:27, 4.26it/s] 118it [00:27, 4.23it/s] 119it [00:27, 4.30it/s] 120it [00:27, 4.35it/s] 121it [00:28, 4.36it/s] 122it [00:28, 4.30it/s] 123it [00:28, 4.37it/s] 124it [00:28, 4.34it/s] 125it [00:29, 4.45it/s] 126it [00:29, 4.52it/s] 127it [00:29, 4.53it/s] 128it [00:29, 4.36it/s] 129it [00:29, 4.39it/s] 130it [00:30, 4.33it/s] 131it [00:30, 4.35it/s] 132it [00:30, 4.45it/s] 133it [00:30, 4.39it/s] 134it [00:31, 4.38it/s] 135it [00:31, 4.44it/s] 136it [00:31, 4.24it/s] 137it [00:31, 4.30it/s] 138it [00:31, 4.42it/s] 139it [00:32, 4.49it/s] 140it [00:32, 4.37it/s] 141it [00:32, 4.26it/s] 142it [00:32, 4.38it/s] 143it [00:33, 4.48it/s] 144it [00:33, 4.48it/s] 145it [00:33, 4.56it/s] 146it [00:33, 4.59it/s] 147it [00:34, 4.50it/s] 148it [00:34, 4.40it/s] 149it [00:34, 4.28it/s] 150it [00:34, 4.41it/s]2025-05-25 21:59:33,073 - INFO - [Epoch 041 | Batch 0150] IWAE-loss 1899.3881 | mean log_px -0.0105 | KL -1315.73 + 151it [00:34, 4.35it/s] 152it [00:35, 4.34it/s] 153it [00:35, 4.31it/s] 154it [00:35, 4.22it/s] 155it [00:35, 4.32it/s] 156it [00:36, 4.30it/s] 157it [00:36, 4.28it/s] 158it [00:36, 4.30it/s] 159it [00:36, 4.35it/s] 160it [00:37, 4.31it/s] 161it [00:37, 4.43it/s] 162it [00:37, 4.36it/s] 163it [00:37, 4.47it/s] 164it [00:37, 4.39it/s] 165it [00:38, 4.30it/s] 166it [00:38, 4.35it/s] 167it [00:38, 4.45it/s] 168it [00:38, 4.50it/s] 169it [00:39, 4.56it/s] 170it [00:39, 4.61it/s] 171it [00:39, 4.44it/s] 172it [00:39, 4.40it/s] 173it [00:39, 4.43it/s] 174it [00:40, 4.38it/s] 175it [00:40, 4.45it/s] 176it [00:40, 4.37it/s] 177it [00:40, 4.48it/s] 178it [00:41, 4.41it/s] 179it [00:41, 4.42it/s] 180it [00:41, 4.51it/s] 181it [00:41, 4.51it/s] 182it [00:41, 4.58it/s] 183it [00:42, 4.42it/s] 184it [00:42, 4.53it/s] 185it [00:42, 4.51it/s] 186it [00:42, 4.47it/s] 187it [00:43, 4.39it/s] 188it [00:43, 4.24it/s] 189it [00:43, 4.26it/s] 190it [00:43, 4.24it/s] 191it [00:44, 4.26it/s] 192it [00:44, 4.24it/s] 193it [00:44, 4.26it/s] 194it [00:44, 4.36it/s] 195it [00:44, 4.37it/s] 196it [00:45, 4.48it/s] 196it [00:45, 4.33it/s] +2025-05-25 21:59:43,450 - INFO - Epoch: 41, Objective: tensor([1496.4008], device='cuda:0', grad_fn=), Loss: 0.004434915725141764, KL/n: 26.789295196533203 + 0it [00:00, ?it/s]2025-05-25 21:59:43,851 - INFO - [Epoch 042 | Batch 0000] IWAE-loss 1575.5166 | mean log_px -0.0100 | KL -1312.57 + 1it [00:00, 2.81it/s] 2it [00:00, 3.58it/s] 3it [00:00, 3.88it/s] 4it [00:01, 4.00it/s] 5it [00:01, 4.19it/s] 6it [00:01, 4.19it/s] 7it [00:01, 4.15it/s] 8it [00:01, 4.25it/s] 9it [00:02, 4.39it/s] 10it [00:02, 4.48it/s] 11it [00:02, 4.56it/s] 12it [00:02, 4.57it/s] 13it [00:03, 4.59it/s] 14it [00:03, 4.59it/s] 15it [00:03, 4.48it/s] 16it [00:03, 4.51it/s] 17it [00:03, 4.59it/s] 18it [00:04, 4.50it/s] 19it [00:04, 4.37it/s] 20it [00:04, 4.42it/s] 21it [00:04, 4.40it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.43it/s] 24it [00:05, 4.36it/s] 25it [00:05, 4.35it/s] 26it [00:05, 4.39it/s] 27it [00:06, 4.37it/s] 28it [00:06, 4.34it/s] 29it [00:06, 4.41it/s] 30it [00:06, 4.12it/s] 31it [00:07, 4.29it/s] 32it [00:07, 4.31it/s] 33it [00:07, 4.43it/s] 34it [00:07, 4.50it/s] 35it [00:08, 4.56it/s] 36it [00:08, 4.61it/s] 37it [00:08, 4.48it/s] 38it [00:08, 4.31it/s] 39it [00:08, 4.45it/s] 40it [00:09, 4.39it/s] 41it [00:09, 4.34it/s] 42it [00:09, 4.34it/s] 43it [00:09, 4.33it/s] 44it [00:10, 4.20it/s] 45it [00:10, 4.28it/s] 46it [00:10, 4.38it/s] 47it [00:10, 4.43it/s] 48it [00:11, 4.52it/s] 49it [00:11, 4.55it/s] 50it [00:11, 4.37it/s]2025-05-25 21:59:55,230 - INFO - [Epoch 042 | Batch 0050] IWAE-loss 1876.5878 | mean log_px -0.0155 | KL -1306.35 + 51it [00:11, 4.35it/s] 52it [00:11, 4.34it/s] 53it [00:12, 4.42it/s] 54it [00:12, 4.37it/s] 55it [00:12, 4.32it/s] 56it [00:12, 4.19it/s] 57it [00:13, 4.23it/s] 58it [00:13, 4.25it/s] 59it [00:13, 4.39it/s] 60it [00:13, 4.25it/s] 61it [00:14, 4.40it/s] 62it [00:14, 4.44it/s] 63it [00:14, 4.55it/s] 64it [00:14, 4.56it/s] 65it [00:14, 4.42it/s] 66it [00:15, 3.56it/s] 67it [00:15, 3.83it/s] 68it [00:15, 4.05it/s] 69it [00:15, 4.24it/s] 70it [00:16, 4.25it/s] 71it [00:16, 4.35it/s] 72it [00:16, 4.46it/s] 73it [00:16, 4.38it/s] 74it [00:17, 4.32it/s] 75it [00:17, 4.36it/s] 76it [00:17, 4.41it/s] 77it [00:17, 4.34it/s] 78it [00:18, 4.31it/s] 79it [00:18, 4.37it/s] 80it [00:18, 4.33it/s] 81it [00:18, 4.42it/s] 82it [00:18, 4.35it/s] 83it [00:19, 4.26it/s] 84it [00:19, 4.37it/s] 85it [00:19, 4.48it/s] 86it [00:19, 4.52it/s] 87it [00:20, 4.48it/s] 88it [00:20, 4.40it/s] 89it [00:20, 4.50it/s] 90it [00:20, 4.56it/s] 91it [00:20, 4.48it/s] 92it [00:21, 4.31it/s] 93it [00:21, 4.43it/s] 94it [00:21, 4.45it/s] 95it [00:21, 4.54it/s] 96it [00:22, 4.52it/s] 97it [00:22, 4.36it/s] 98it [00:22, 4.32it/s] 99it [00:22, 4.35it/s] 100it [00:22, 4.37it/s]2025-05-25 22:00:06,724 - INFO - [Epoch 042 | Batch 0100] IWAE-loss 1476.0132 | mean log_px -0.0030 | KL -1307.70 + 101it [00:23, 4.46it/s] 102it [00:23, 4.54it/s] 103it [00:23, 4.53it/s] 104it [00:23, 4.56it/s] 105it [00:24, 4.61it/s] 106it [00:24, 4.64it/s] 107it [00:24, 4.65it/s] 108it [00:24, 4.42it/s] 109it [00:24, 4.40it/s] 110it [00:25, 4.41it/s] 111it [00:25, 4.44it/s] 112it [00:25, 4.49it/s] 113it [00:25, 4.37it/s] 114it [00:26, 4.31it/s] 115it [00:26, 4.31it/s] 116it [00:26, 4.30it/s] 117it [00:26, 4.16it/s] 118it [00:27, 4.32it/s] 119it [00:27, 4.27it/s] 120it [00:27, 4.29it/s] 121it [00:27, 4.29it/s] 122it [00:27, 4.24it/s] 123it [00:28, 4.25it/s] 124it [00:28, 4.26it/s] 125it [00:28, 4.26it/s] 126it [00:28, 4.35it/s] 127it [00:29, 4.45it/s] 128it [00:29, 4.54it/s] 129it [00:29, 4.52it/s] 130it [00:29, 4.55it/s] 131it [00:30, 4.53it/s] 132it [00:30, 4.52it/s] 133it [00:30, 4.34it/s] 134it [00:30, 4.45it/s] 135it [00:30, 4.53it/s] 136it [00:31, 4.42it/s] 137it [00:31, 4.39it/s] 138it [00:31, 4.25it/s] 139it [00:31, 4.27it/s] 140it [00:32, 4.26it/s] 141it [00:32, 4.34it/s] 142it [00:32, 4.32it/s] 143it [00:32, 4.16it/s] 144it [00:33, 4.23it/s] 145it [00:33, 4.23it/s] 146it [00:33, 4.21it/s] 147it [00:33, 4.15it/s] 148it [00:33, 4.18it/s] 149it [00:34, 4.34it/s] 150it [00:34, 4.28it/s]2025-05-25 22:00:18,195 - INFO - [Epoch 042 | Batch 0150] IWAE-loss 1960.0638 | mean log_px -0.0210 | KL -1302.23 + 151it [00:34, 4.32it/s] 152it [00:34, 4.28it/s] 153it [00:35, 4.20it/s] 154it [00:35, 4.23it/s] 155it [00:35, 4.27it/s] 156it [00:35, 4.28it/s] 157it [00:36, 4.39it/s] 158it [00:36, 4.49it/s] 159it [00:36, 4.43it/s] 160it [00:36, 4.25it/s] 161it [00:36, 4.39it/s] 162it [00:37, 4.29it/s] 163it [00:37, 4.32it/s] 164it [00:37, 4.42it/s] 165it [00:37, 4.48it/s] 166it [00:38, 4.24it/s] 167it [00:38, 4.29it/s] 168it [00:38, 4.13it/s] 169it [00:38, 4.31it/s] 170it [00:39, 4.28it/s] 171it [00:39, 4.40it/s] 172it [00:39, 4.49it/s] 173it [00:39, 4.40it/s] 174it [00:39, 4.44it/s] 175it [00:40, 4.43it/s] 176it [00:40, 4.37it/s] 177it [00:40, 4.43it/s] 178it [00:40, 4.23it/s] 179it [00:41, 4.25it/s] 180it [00:41, 4.28it/s] 181it [00:41, 4.27it/s] 182it [00:41, 4.30it/s] 183it [00:42, 4.31it/s] 184it [00:42, 4.43it/s] 185it [00:42, 4.32it/s] 186it [00:42, 4.43it/s] 187it [00:42, 4.40it/s] 188it [00:43, 4.35it/s] 189it [00:43, 4.32it/s] 190it [00:43, 4.32it/s] 191it [00:43, 4.43it/s] 192it [00:44, 4.50it/s] 193it [00:44, 4.44it/s] 194it [00:44, 4.38it/s] 195it [00:44, 4.33it/s] 196it [00:45, 4.44it/s] 196it [00:45, 4.35it/s] +2025-05-25 22:00:28,669 - INFO - Epoch: 42, Objective: tensor([1482.2252], device='cuda:0', grad_fn=), Loss: 0.007103536278009415, KL/n: 26.547670364379883 + 0it [00:00, ?it/s]2025-05-25 22:00:29,058 - INFO - [Epoch 043 | Batch 0000] IWAE-loss 1369.3737 | mean log_px -0.0017 | KL -1301.93 + 1it [00:00, 3.18it/s] 2it [00:00, 3.89it/s] 3it [00:00, 4.13it/s] 4it [00:00, 4.16it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.34it/s] 7it [00:01, 4.19it/s] 8it [00:01, 4.26it/s] 9it [00:02, 4.30it/s] 10it [00:02, 4.33it/s] 11it [00:02, 4.45it/s] 12it [00:02, 4.22it/s] 13it [00:03, 4.37it/s] 14it [00:03, 4.29it/s] 15it [00:03, 4.30it/s] 16it [00:03, 4.29it/s] 17it [00:04, 4.26it/s] 18it [00:04, 4.37it/s] 19it [00:04, 4.47it/s] 20it [00:04, 4.39it/s] 21it [00:04, 4.47it/s] 22it [00:05, 4.54it/s] 23it [00:05, 4.35it/s] 24it [00:05, 4.34it/s] 25it [00:05, 4.38it/s] 26it [00:06, 4.43it/s] 27it [00:06, 4.50it/s] 28it [00:06, 4.54it/s] 29it [00:06, 4.42it/s] 30it [00:06, 4.43it/s] 31it [00:07, 4.34it/s] 32it [00:07, 4.39it/s] 33it [00:07, 4.47it/s] 34it [00:07, 4.38it/s] 35it [00:08, 4.31it/s] 36it [00:08, 4.36it/s] 37it [00:08, 4.43it/s] 38it [00:08, 4.46it/s] 39it [00:08, 4.36it/s] 40it [00:09, 4.21it/s] 41it [00:09, 4.26it/s] 42it [00:09, 4.33it/s] 43it [00:09, 4.30it/s] 44it [00:10, 4.30it/s] 45it [00:10, 4.30it/s] 46it [00:10, 4.30it/s] 47it [00:10, 4.39it/s] 48it [00:11, 4.38it/s] 49it [00:11, 4.32it/s] 50it [00:11, 4.25it/s]2025-05-25 22:00:40,525 - INFO - [Epoch 043 | Batch 0050] IWAE-loss 1440.7559 | mean log_px -0.0027 | KL -1296.14 + 51it [00:11, 4.25it/s] 52it [00:12, 4.23it/s] 53it [00:12, 4.20it/s] 54it [00:12, 4.20it/s] 55it [00:12, 4.18it/s] 56it [00:12, 4.15it/s] 57it [00:13, 4.28it/s] 58it [00:13, 4.10it/s] 59it [00:13, 4.22it/s] 60it [00:13, 4.29it/s] 61it [00:14, 4.31it/s] 62it [00:14, 4.31it/s] 63it [00:14, 4.37it/s] 64it [00:14, 4.40it/s] 65it [00:15, 4.42it/s] 66it [00:15, 4.39it/s] 67it [00:15, 4.33it/s] 68it [00:15, 4.29it/s] 69it [00:15, 4.24it/s] 70it [00:16, 4.25it/s] 71it [00:16, 4.23it/s] 72it [00:16, 4.16it/s] 73it [00:16, 4.28it/s] 74it [00:17, 4.36it/s] 75it [00:17, 4.28it/s] 76it [00:17, 4.27it/s] 77it [00:17, 4.19it/s] 78it [00:18, 4.05it/s] 79it [00:18, 4.08it/s] 80it [00:18, 4.24it/s] 81it [00:18, 4.37it/s] 82it [00:19, 4.46it/s] 83it [00:19, 4.54it/s] 84it [00:19, 4.56it/s] 85it [00:19, 4.48it/s] 86it [00:19, 4.52it/s] 87it [00:20, 4.50it/s] 88it [00:20, 4.56it/s] 89it [00:20, 4.57it/s] 90it [00:20, 4.59it/s] 91it [00:20, 4.59it/s] 92it [00:21, 4.45it/s] 93it [00:21, 4.40it/s] 94it [00:21, 4.44it/s] 95it [00:21, 4.44it/s] 96it [00:22, 4.50it/s] 97it [00:22, 4.56it/s] 98it [00:22, 4.56it/s] 99it [00:22, 4.50it/s] 100it [00:23, 4.50it/s]2025-05-25 22:00:51,977 - INFO - [Epoch 043 | Batch 0100] IWAE-loss 1553.6163 | mean log_px -0.0052 | KL -1291.85 + 101it [00:23, 4.55it/s] 102it [00:23, 4.43it/s] 103it [00:23, 4.46it/s] 104it [00:23, 4.52it/s] 105it [00:24, 4.48it/s] 106it [00:24, 4.44it/s] 107it [00:24, 4.16it/s] 108it [00:24, 4.20it/s] 109it [00:25, 4.20it/s] 110it [00:25, 4.10it/s] 111it [00:25, 4.12it/s] 112it [00:25, 4.17it/s] 113it [00:26, 4.15it/s] 114it [00:26, 4.15it/s] 115it [00:26, 4.18it/s] 116it [00:26, 4.15it/s] 117it [00:27, 4.19it/s] 118it [00:27, 4.27it/s] 119it [00:27, 4.38it/s] 120it [00:27, 4.32it/s] 121it [00:27, 4.28it/s] 122it [00:28, 4.24it/s] 123it [00:28, 4.29it/s] 124it [00:28, 4.27it/s] 125it [00:28, 4.31it/s] 126it [00:29, 4.30it/s] 127it [00:29, 4.16it/s] 128it [00:29, 4.17it/s] 129it [00:29, 4.24it/s] 130it [00:30, 4.21it/s] 131it [00:30, 4.36it/s] 132it [00:30, 4.33it/s] 133it [00:30, 4.45it/s] 134it [00:31, 4.18it/s] 135it [00:31, 4.21it/s] 136it [00:31, 4.21it/s] 137it [00:31, 4.25it/s] 138it [00:31, 4.34it/s] 139it [00:32, 4.26it/s] 140it [00:32, 4.26it/s] 141it [00:32, 4.23it/s] 142it [00:32, 4.26it/s] 143it [00:33, 4.26it/s] 144it [00:33, 4.12it/s] 145it [00:33, 4.17it/s] 146it [00:33, 4.22it/s] 147it [00:34, 4.21it/s] 148it [00:34, 4.25it/s] 149it [00:34, 4.31it/s] 150it [00:34, 4.25it/s]2025-05-25 22:01:03,757 - INFO - [Epoch 043 | Batch 0150] IWAE-loss 2060.3196 | mean log_px -0.0110 | KL -1286.15 + 151it [00:35, 4.24it/s] 152it [00:35, 4.24it/s] 153it [00:35, 4.27it/s] 154it [00:35, 4.31it/s] 155it [00:35, 4.20it/s] 156it [00:36, 4.32it/s] 157it [00:36, 4.30it/s] 158it [00:36, 4.39it/s] 159it [00:36, 4.36it/s] 160it [00:37, 4.16it/s] 161it [00:37, 4.19it/s] 162it [00:37, 4.19it/s] 163it [00:37, 4.21it/s] 164it [00:38, 4.22it/s] 165it [00:38, 4.08it/s] 166it [00:38, 4.14it/s] 167it [00:38, 4.30it/s] 168it [00:38, 4.38it/s] 169it [00:39, 4.46it/s] 170it [00:39, 4.36it/s] 171it [00:39, 4.33it/s] 172it [00:39, 4.33it/s] 173it [00:40, 4.43it/s] 174it [00:40, 4.42it/s] 175it [00:40, 4.25it/s] 176it [00:40, 4.31it/s] 177it [00:41, 4.42it/s] 178it [00:41, 4.34it/s] 179it [00:41, 4.34it/s] 180it [00:41, 4.15it/s] 181it [00:42, 4.19it/s] 182it [00:42, 4.31it/s] 183it [00:42, 4.38it/s] 184it [00:42, 4.46it/s] 185it [00:42, 4.24it/s] 186it [00:43, 4.33it/s] 187it [00:43, 4.37it/s] 188it [00:43, 4.37it/s] 189it [00:43, 4.32it/s] 190it [00:44, 4.44it/s] 191it [00:44, 4.46it/s] 192it [00:44, 4.39it/s] 193it [00:44, 4.37it/s] 194it [00:44, 4.25it/s] 195it [00:45, 4.28it/s] 196it [00:45, 4.41it/s] 196it [00:45, 4.31it/s] +2025-05-25 22:01:14,315 - INFO - Epoch: 43, Objective: tensor([1422.8802], device='cuda:0', grad_fn=), Loss: 0.004217221401631832, KL/n: 26.26324462890625 + 0it [00:00, ?it/s]2025-05-25 22:01:14,890 - INFO - [Epoch 044 | Batch 0000] IWAE-loss 1640.3896 | mean log_px -0.0097 | KL -1284.26 + 1it [00:00, 3.17it/s] 2it [00:00, 3.88it/s] 3it [00:00, 3.88it/s] 4it [00:01, 4.10it/s] 5it [00:01, 4.31it/s] 6it [00:01, 4.30it/s] 7it [00:01, 4.43it/s] 8it [00:01, 4.36it/s] 9it [00:02, 4.26it/s] 10it [00:02, 4.29it/s] 11it [00:02, 4.35it/s] 12it [00:02, 4.30it/s] 13it [00:03, 4.34it/s] 14it [00:03, 4.45it/s] 15it [00:03, 4.51it/s] 16it [00:03, 4.43it/s] 17it [00:03, 4.38it/s] 18it [00:04, 4.26it/s] 19it [00:04, 4.37it/s] 20it [00:04, 4.32it/s] 21it [00:04, 4.30it/s] 22it [00:05, 4.33it/s] 23it [00:05, 4.40it/s] 24it [00:05, 4.24it/s] 25it [00:05, 4.39it/s] 26it [00:06, 4.35it/s] 27it [00:06, 4.39it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.47it/s] 30it [00:06, 4.54it/s] 31it [00:07, 4.60it/s] 32it [00:07, 4.46it/s] 33it [00:07, 4.31it/s] 34it [00:07, 4.30it/s] 35it [00:08, 4.42it/s] 36it [00:08, 4.39it/s] 37it [00:08, 4.41it/s] 38it [00:08, 4.38it/s] 39it [00:09, 4.27it/s] 40it [00:09, 4.27it/s] 41it [00:09, 4.29it/s] 42it [00:09, 4.28it/s] 43it [00:09, 4.36it/s] 44it [00:10, 4.18it/s] 45it [00:10, 4.13it/s] 46it [00:10, 4.12it/s] 47it [00:10, 4.18it/s] 48it [00:11, 4.16it/s] 49it [00:11, 4.20it/s] 50it [00:11, 4.06it/s]2025-05-25 22:01:26,459 - INFO - [Epoch 044 | Batch 0050] IWAE-loss 1426.9062 | mean log_px -0.0024 | KL -1280.41 + 51it [00:11, 4.12it/s] 52it [00:12, 4.18it/s] 53it [00:12, 4.29it/s] 54it [00:12, 4.33it/s] 55it [00:12, 4.44it/s] 56it [00:12, 4.49it/s] 57it [00:13, 4.56it/s] 58it [00:13, 4.56it/s] 59it [00:13, 4.60it/s] 60it [00:13, 4.51it/s] 61it [00:14, 4.56it/s] 62it [00:14, 4.51it/s] 63it [00:14, 4.46it/s] 64it [00:14, 4.49it/s] 65it [00:14, 4.56it/s] 66it [00:15, 4.46it/s] 67it [00:15, 4.47it/s] 68it [00:15, 4.26it/s] 69it [00:15, 4.34it/s] 70it [00:16, 4.43it/s] 71it [00:16, 4.36it/s] 72it [00:16, 4.35it/s] 73it [00:16, 4.45it/s] 74it [00:17, 4.40it/s] 75it [00:17, 4.51it/s] 76it [00:17, 4.52it/s] 77it [00:17, 4.56it/s] 78it [00:17, 4.59it/s] 79it [00:18, 4.62it/s] 80it [00:18, 4.52it/s] 81it [00:18, 4.57it/s] 82it [00:18, 4.45it/s] 83it [00:19, 4.52it/s] 84it [00:19, 4.57it/s] 85it [00:19, 4.58it/s] 86it [00:19, 4.62it/s] 87it [00:19, 4.65it/s] 88it [00:20, 4.63it/s] 89it [00:20, 4.63it/s] 90it [00:20, 4.63it/s] 91it [00:20, 4.66it/s] 92it [00:20, 4.64it/s] 93it [00:21, 4.50it/s] 94it [00:21, 4.55it/s] 95it [00:21, 4.53it/s] 96it [00:21, 4.42it/s] 97it [00:22, 4.51it/s] 98it [00:22, 4.55it/s] 99it [00:22, 4.45it/s] 100it [00:22, 4.39it/s]2025-05-25 22:01:37,555 - INFO - [Epoch 044 | Batch 0100] IWAE-loss 1384.5699 | mean log_px -0.0015 | KL -1274.65 + 101it [00:23, 4.21it/s] 102it [00:23, 4.26it/s] 103it [00:23, 4.25it/s] 104it [00:23, 4.28it/s] 105it [00:23, 4.33it/s] 106it [00:24, 4.42it/s] 107it [00:24, 4.43it/s] 108it [00:24, 4.49it/s] 109it [00:24, 4.55it/s] 110it [00:25, 4.59it/s] 111it [00:25, 4.49it/s] 112it [00:25, 4.47it/s] 113it [00:25, 4.37it/s] 114it [00:25, 4.32it/s] 115it [00:26, 4.34it/s] 116it [00:26, 4.38it/s] 117it [00:26, 4.44it/s] 118it [00:26, 4.41it/s] 119it [00:27, 4.48it/s] 120it [00:27, 4.27it/s] 121it [00:27, 4.26it/s] 122it [00:27, 4.26it/s] 123it [00:28, 4.33it/s] 124it [00:28, 4.42it/s] 125it [00:28, 4.44it/s] 126it [00:28, 4.47it/s] 127it [00:28, 4.39it/s] 128it [00:29, 4.40it/s] 129it [00:29, 4.22it/s] 130it [00:29, 4.33it/s] 131it [00:29, 4.32it/s] 132it [00:30, 4.26it/s] 133it [00:30, 4.26it/s] 134it [00:30, 4.23it/s] 135it [00:30, 4.15it/s] 136it [00:31, 4.18it/s] 137it [00:31, 4.19it/s] 138it [00:31, 4.24it/s] 139it [00:31, 4.22it/s] 140it [00:32, 4.14it/s] 141it [00:32, 4.32it/s] 142it [00:32, 4.40it/s] 143it [00:32, 4.49it/s] 144it [00:32, 4.39it/s] 145it [00:33, 4.44it/s] 146it [00:33, 4.43it/s] 147it [00:33, 4.51it/s] 148it [00:33, 4.51it/s] 149it [00:33, 4.57it/s] 150it [00:34, 4.48it/s]2025-05-25 22:01:49,016 - INFO - [Epoch 044 | Batch 0150] IWAE-loss 1477.1619 | mean log_px -0.0045 | KL -1270.62 + 151it [00:34, 4.29it/s] 152it [00:34, 4.39it/s] 153it [00:34, 4.48it/s] 154it [00:35, 4.43it/s] 155it [00:35, 4.42it/s] 156it [00:35, 4.44it/s] 157it [00:35, 4.40it/s] 158it [00:36, 4.42it/s] 159it [00:36, 4.49it/s] 160it [00:36, 4.54it/s] 161it [00:36, 4.46it/s] 162it [00:36, 4.46it/s] 163it [00:37, 4.41it/s] 164it [00:37, 4.48it/s] 165it [00:37, 4.45it/s] 166it [00:37, 4.44it/s] 167it [00:38, 4.49it/s] 168it [00:38, 4.41it/s] 169it [00:38, 4.44it/s] 170it [00:38, 4.38it/s] 171it [00:38, 4.34it/s] 172it [00:39, 4.41it/s] 173it [00:39, 4.50it/s] 174it [00:39, 4.40it/s] 175it [00:39, 4.41it/s] 176it [00:40, 4.43it/s] 177it [00:40, 4.41it/s] 178it [00:40, 4.40it/s] 179it [00:40, 4.49it/s] 180it [00:40, 4.42it/s] 181it [00:41, 4.36it/s] 182it [00:41, 4.46it/s] 183it [00:41, 4.41it/s] 184it [00:41, 4.19it/s] 185it [00:42, 4.21it/s] 186it [00:42, 4.23it/s] 187it [00:42, 4.21it/s] 188it [00:42, 4.27it/s] 189it [00:43, 4.37it/s] 190it [00:43, 4.33it/s] 191it [00:43, 4.32it/s] 192it [00:43, 4.43it/s] 193it [00:43, 4.43it/s] 194it [00:44, 4.51it/s] 195it [00:44, 4.48it/s] 196it [00:44, 4.26it/s] 196it [00:44, 4.38it/s] +2025-05-25 22:01:59,403 - INFO - Epoch: 44, Objective: tensor([1421.5844], device='cuda:0', grad_fn=), Loss: 0.0031296706292778254, KL/n: 25.87446403503418 + 0it [00:00, ?it/s]2025-05-25 22:01:59,801 - INFO - [Epoch 045 | Batch 0000] IWAE-loss 1360.7262 | mean log_px -0.0022 | KL -1263.72 + 1it [00:00, 3.05it/s] 2it [00:00, 3.62it/s] 3it [00:00, 3.89it/s] 4it [00:01, 4.13it/s] 5it [00:01, 4.33it/s] 6it [00:01, 4.40it/s] 7it [00:01, 4.52it/s] 8it [00:01, 4.32it/s] 9it [00:02, 4.46it/s] 10it [00:02, 4.44it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.45it/s] 13it [00:03, 4.40it/s] 14it [00:03, 4.33it/s] 15it [00:03, 4.39it/s] 16it [00:03, 4.25it/s] 17it [00:03, 4.25it/s] 18it [00:04, 4.28it/s] 19it [00:04, 4.32it/s] 20it [00:04, 4.41it/s] 21it [00:04, 4.40it/s] 22it [00:05, 4.50it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.43it/s] 25it [00:05, 4.52it/s] 26it [00:05, 4.52it/s] 27it [00:06, 4.56it/s] 28it [00:06, 4.43it/s] 29it [00:06, 4.45it/s] 30it [00:06, 4.50it/s] 31it [00:07, 4.42it/s] 32it [00:07, 4.47it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.49it/s] 35it [00:07, 4.43it/s] 36it [00:08, 4.41it/s] 37it [00:08, 4.47it/s] 38it [00:08, 4.41it/s] 39it [00:09, 3.60it/s] 40it [00:09, 3.87it/s] 41it [00:09, 3.95it/s] 42it [00:09, 4.16it/s] 43it [00:09, 4.18it/s] 44it [00:10, 4.22it/s] 45it [00:10, 4.21it/s] 46it [00:10, 4.11it/s] 47it [00:10, 4.19it/s] 48it [00:11, 4.19it/s] 49it [00:11, 4.32it/s] 50it [00:11, 4.37it/s]2025-05-25 22:02:11,307 - INFO - [Epoch 045 | Batch 0050] IWAE-loss 1378.6949 | mean log_px -0.0038 | KL -1256.42 + 51it [00:11, 4.22it/s] 52it [00:12, 4.24it/s] 53it [00:12, 4.29it/s] 54it [00:12, 4.26it/s] 55it [00:12, 4.35it/s] 56it [00:13, 4.34it/s] 57it [00:13, 4.34it/s] 58it [00:13, 4.44it/s] 59it [00:13, 4.46it/s] 60it [00:13, 4.49it/s] 61it [00:14, 4.37it/s] 62it [00:14, 4.35it/s] 63it [00:14, 4.30it/s] 64it [00:14, 4.33it/s] 65it [00:15, 4.39it/s] 66it [00:15, 4.47it/s] 67it [00:15, 4.42it/s] 68it [00:15, 4.48it/s] 69it [00:15, 4.46it/s] 70it [00:16, 4.46it/s] 71it [00:16, 4.43it/s] 72it [00:16, 4.37it/s] 73it [00:16, 4.37it/s] 74it [00:17, 4.34it/s] 75it [00:17, 4.42it/s] 76it [00:17, 4.35it/s] 77it [00:17, 4.36it/s] 78it [00:18, 4.33it/s] 79it [00:18, 4.34it/s] 80it [00:18, 4.37it/s] 81it [00:18, 4.43it/s] 82it [00:18, 4.36it/s] 83it [00:19, 4.36it/s] 84it [00:19, 4.44it/s] 85it [00:19, 4.40it/s] 86it [00:19, 4.49it/s] 87it [00:20, 4.50it/s] 88it [00:20, 4.48it/s] 89it [00:20, 4.43it/s] 90it [00:20, 4.39it/s] 91it [00:20, 4.46it/s] 92it [00:21, 4.53it/s] 93it [00:21, 4.59it/s] 94it [00:21, 4.52it/s] 95it [00:21, 4.42it/s] 96it [00:22, 4.51it/s] 97it [00:22, 4.43it/s] 98it [00:22, 4.37it/s] 99it [00:22, 4.37it/s] 100it [00:22, 4.31it/s]2025-05-25 22:02:22,686 - INFO - [Epoch 045 | Batch 0100] IWAE-loss 1430.3690 | mean log_px -0.0046 | KL -1253.53 + 101it [00:23, 4.32it/s] 102it [00:23, 4.35it/s] 103it [00:23, 4.46it/s] 104it [00:23, 4.39it/s] 105it [00:24, 4.33it/s] 106it [00:24, 4.34it/s] 107it [00:24, 4.30it/s] 108it [00:24, 4.17it/s] 109it [00:25, 4.23it/s] 110it [00:25, 4.35it/s] 111it [00:25, 4.30it/s] 112it [00:25, 4.41it/s] 113it [00:25, 4.36it/s] 114it [00:26, 4.43it/s] 115it [00:26, 4.46it/s] 116it [00:26, 4.37it/s] 117it [00:26, 4.48it/s] 118it [00:27, 4.53it/s] 119it [00:27, 4.39it/s] 120it [00:27, 4.35it/s] 121it [00:27, 4.36it/s] 122it [00:28, 4.34it/s] 123it [00:28, 4.39it/s] 124it [00:28, 4.27it/s] 125it [00:28, 4.26it/s] 126it [00:28, 4.24it/s] 127it [00:29, 4.27it/s] 128it [00:29, 4.38it/s] 129it [00:29, 4.27it/s] 130it [00:29, 4.27it/s] 131it [00:30, 4.36it/s] 132it [00:30, 4.33it/s] 133it [00:30, 4.32it/s] 134it [00:30, 4.34it/s] 135it [00:31, 4.22it/s] 136it [00:31, 4.34it/s] 137it [00:31, 4.31it/s] 138it [00:31, 4.32it/s] 139it [00:31, 4.39it/s] 140it [00:32, 4.47it/s] 141it [00:32, 4.45it/s] 142it [00:32, 4.39it/s] 143it [00:32, 4.37it/s] 144it [00:33, 4.46it/s] 145it [00:33, 4.53it/s] 146it [00:33, 4.42it/s] 147it [00:33, 4.24it/s] 148it [00:34, 4.37it/s] 149it [00:34, 4.31it/s] 150it [00:34, 4.41it/s]2025-05-25 22:02:34,156 - INFO - [Epoch 045 | Batch 0150] IWAE-loss 1851.1366 | mean log_px -0.0243 | KL -1258.04 + 151it [00:34, 4.41it/s] 152it [00:34, 4.48it/s] 153it [00:35, 4.53it/s] 154it [00:35, 4.43it/s] 155it [00:35, 4.46it/s] 156it [00:35, 4.35it/s] 157it [00:36, 4.31it/s] 158it [00:36, 4.32it/s] 159it [00:36, 4.31it/s] 160it [00:36, 4.35it/s] 161it [00:36, 4.23it/s] 162it [00:37, 4.31it/s] 163it [00:37, 4.31it/s] 164it [00:37, 4.31it/s] 165it [00:37, 4.25it/s] 166it [00:38, 4.30it/s] 167it [00:38, 4.40it/s] 168it [00:38, 4.19it/s] 169it [00:38, 4.25it/s] 170it [00:39, 4.23it/s] 171it [00:39, 4.27it/s] 172it [00:39, 4.26it/s] 173it [00:39, 4.11it/s] 174it [00:40, 4.23it/s] 175it [00:40, 4.21it/s] 176it [00:40, 4.21it/s] 177it [00:40, 4.21it/s] 178it [00:41, 4.16it/s] 179it [00:41, 4.26it/s] 180it [00:41, 4.26it/s] 181it [00:41, 4.23it/s] 182it [00:41, 4.28it/s] 183it [00:42, 4.34it/s] 184it [00:42, 4.23it/s] 185it [00:42, 4.28it/s] 186it [00:42, 4.29it/s] 187it [00:43, 4.25it/s] 188it [00:43, 4.18it/s] 189it [00:43, 4.19it/s] 190it [00:43, 4.11it/s] 191it [00:44, 4.28it/s] 192it [00:44, 4.39it/s] 193it [00:44, 4.49it/s] 194it [00:44, 4.52it/s] 195it [00:44, 4.36it/s] 196it [00:45, 4.19it/s] 196it [00:45, 4.33it/s] +2025-05-25 22:02:44,809 - INFO - Epoch: 45, Objective: tensor([1544.8090], device='cuda:0', grad_fn=), Loss: 0.005014732480049133, KL/n: 25.61770248413086 + 0it [00:00, ?it/s]2025-05-25 22:02:45,190 - INFO - [Epoch 046 | Batch 0000] IWAE-loss 1496.1056 | mean log_px -0.0046 | KL -1254.61 + 1it [00:00, 3.19it/s] 2it [00:00, 3.75it/s] 3it [00:00, 4.10it/s] 4it [00:00, 4.16it/s] 5it [00:01, 4.17it/s] 6it [00:01, 4.11it/s] 7it [00:01, 4.18it/s] 8it [00:01, 4.35it/s] 9it [00:02, 4.33it/s] 10it [00:02, 4.43it/s] 11it [00:02, 4.40it/s] 12it [00:02, 4.49it/s] 13it [00:03, 4.51it/s] 14it [00:03, 4.54it/s] 15it [00:03, 4.53it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.27it/s] 18it [00:04, 4.27it/s] 19it [00:04, 4.25it/s] 20it [00:04, 4.29it/s] 21it [00:04, 4.31it/s] 22it [00:05, 4.27it/s] 23it [00:05, 4.38it/s] 24it [00:05, 4.40it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.53it/s] 27it [00:06, 4.57it/s] 28it [00:06, 4.45it/s] 29it [00:06, 4.36it/s] 30it [00:06, 4.32it/s] 31it [00:07, 4.33it/s] 32it [00:07, 4.42it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.57it/s] 35it [00:08, 4.43it/s] 36it [00:08, 4.23it/s] 37it [00:08, 4.22it/s] 38it [00:08, 4.27it/s] 39it [00:08, 4.28it/s] 40it [00:09, 4.28it/s] 41it [00:09, 4.31it/s] 42it [00:09, 4.26it/s] 43it [00:09, 4.29it/s] 44it [00:10, 4.33it/s] 45it [00:10, 4.34it/s] 46it [00:10, 4.43it/s] 47it [00:10, 4.51it/s] 48it [00:11, 4.44it/s] 49it [00:11, 4.33it/s] 50it [00:11, 4.31it/s]2025-05-25 22:02:56,625 - INFO - [Epoch 046 | Batch 0050] IWAE-loss 1504.4362 | mean log_px -0.0047 | KL -1249.88 + 51it [00:11, 4.39it/s] 52it [00:11, 4.35it/s] 53it [00:12, 4.25it/s] 54it [00:12, 4.26it/s] 55it [00:12, 4.37it/s] 56it [00:12, 4.45it/s] 57it [00:13, 4.50it/s] 58it [00:13, 4.31it/s] 59it [00:13, 4.32it/s] 60it [00:13, 4.34it/s] 61it [00:14, 4.30it/s] 62it [00:14, 4.36it/s] 63it [00:14, 4.35it/s] 64it [00:14, 4.45it/s] 65it [00:14, 4.40it/s] 66it [00:15, 4.39it/s] 67it [00:15, 4.22it/s] 68it [00:15, 4.28it/s] 69it [00:15, 4.36it/s] 70it [00:16, 4.37it/s] 71it [00:16, 4.40it/s] 72it [00:16, 4.47it/s] 73it [00:16, 4.41it/s] 74it [00:17, 4.46it/s] 75it [00:17, 4.19it/s] 76it [00:17, 4.11it/s] 77it [00:17, 4.22it/s] 78it [00:17, 4.22it/s] 79it [00:18, 4.26it/s] 80it [00:18, 4.30it/s] 81it [00:18, 4.42it/s] 82it [00:18, 4.32it/s] 83it [00:19, 4.21it/s] 84it [00:19, 4.32it/s] 85it [00:19, 4.43it/s] 86it [00:19, 4.33it/s] 87it [00:20, 4.41it/s] 88it [00:20, 4.49it/s] 89it [00:20, 4.52it/s] 90it [00:20, 4.34it/s] 91it [00:20, 4.45it/s] 92it [00:21, 4.53it/s] 93it [00:21, 4.59it/s] 94it [00:21, 4.50it/s] 95it [00:21, 4.57it/s] 96it [00:22, 4.49it/s] 97it [00:22, 4.41it/s] 98it [00:22, 4.37it/s] 99it [00:22, 4.33it/s] 100it [00:22, 4.29it/s]2025-05-25 22:03:08,090 - INFO - [Epoch 046 | Batch 0100] IWAE-loss 2131.2534 | mean log_px -0.0194 | KL -1246.14 + 101it [00:23, 4.20it/s] 102it [00:23, 4.33it/s] 103it [00:23, 4.44it/s] 104it [00:23, 4.48it/s] 105it [00:24, 4.44it/s] 106it [00:24, 4.49it/s] 107it [00:24, 4.56it/s] 108it [00:24, 4.46it/s] 109it [00:24, 4.49it/s] 110it [00:25, 4.56it/s] 111it [00:25, 4.48it/s] 112it [00:25, 4.31it/s] 113it [00:25, 4.39it/s] 114it [00:26, 4.32it/s] 115it [00:26, 4.28it/s] 116it [00:26, 4.38it/s] 117it [00:26, 4.32it/s] 118it [00:27, 4.20it/s] 119it [00:27, 4.20it/s] 120it [00:27, 4.19it/s] 121it [00:27, 4.20it/s] 122it [00:28, 4.24it/s] 123it [00:28, 4.25it/s] 124it [00:28, 4.25it/s] 125it [00:28, 4.27it/s] 126it [00:28, 4.25it/s] 127it [00:29, 4.35it/s] 128it [00:29, 4.42it/s] 129it [00:29, 4.50it/s] 130it [00:29, 4.44it/s] 131it [00:30, 4.37it/s] 132it [00:30, 4.40it/s] 133it [00:30, 4.43it/s] 134it [00:30, 4.47it/s] 135it [00:30, 4.42it/s] 136it [00:31, 4.46it/s] 137it [00:31, 4.53it/s] 138it [00:31, 4.43it/s] 139it [00:31, 4.51it/s] 140it [00:32, 4.56it/s] 141it [00:32, 4.46it/s] 142it [00:32, 4.37it/s] 143it [00:32, 4.21it/s] 144it [00:33, 4.24it/s] 145it [00:33, 4.29it/s] 146it [00:33, 4.38it/s] 147it [00:33, 4.45it/s] 148it [00:33, 4.50it/s] 149it [00:34, 4.53it/s] 150it [00:34, 4.38it/s]2025-05-25 22:03:19,491 - INFO - [Epoch 046 | Batch 0150] IWAE-loss 1519.1067 | mean log_px -0.0050 | KL -1243.51 + 151it [00:34, 4.45it/s] 152it [00:34, 4.49it/s] 153it [00:35, 4.53it/s] 154it [00:35, 4.55it/s] 155it [00:35, 4.40it/s] 156it [00:35, 4.34it/s] 157it [00:35, 4.33it/s] 158it [00:36, 4.29it/s] 159it [00:36, 4.24it/s] 160it [00:36, 4.37it/s] 161it [00:36, 4.35it/s] 162it [00:37, 4.23it/s] 163it [00:37, 4.23it/s] 164it [00:37, 4.37it/s] 165it [00:37, 4.46it/s] 166it [00:38, 4.53it/s] 167it [00:38, 4.58it/s] 168it [00:38, 4.31it/s] 169it [00:38, 4.26it/s] 170it [00:38, 4.35it/s] 171it [00:39, 4.45it/s] 172it [00:39, 4.45it/s] 173it [00:39, 4.54it/s] 174it [00:39, 4.59it/s] 175it [00:40, 4.54it/s] 176it [00:40, 4.56it/s] 177it [00:40, 4.46it/s] 178it [00:40, 4.37it/s] 179it [00:40, 4.21it/s] 180it [00:41, 4.23it/s] 181it [00:41, 4.27it/s] 182it [00:41, 4.25it/s] 183it [00:41, 4.26it/s] 184it [00:42, 4.26it/s] 185it [00:42, 4.16it/s] 186it [00:42, 4.22it/s] 187it [00:42, 4.20it/s] 188it [00:43, 4.28it/s] 189it [00:43, 4.27it/s] 190it [00:43, 4.35it/s] 191it [00:43, 4.31it/s] 192it [00:44, 4.16it/s] 193it [00:44, 4.20it/s] 194it [00:44, 4.20it/s] 195it [00:44, 4.12it/s] 196it [00:45, 4.16it/s] 196it [00:45, 4.35it/s] +2025-05-25 22:03:30,032 - INFO - Epoch: 46, Objective: tensor([1405.0212], device='cuda:0', grad_fn=), Loss: 0.008077585138380527, KL/n: 25.350950241088867 + 0it [00:00, ?it/s]2025-05-25 22:03:30,608 - INFO - [Epoch 047 | Batch 0000] IWAE-loss 1908.2433 | mean log_px -0.0132 | KL -1241.40 + 1it [00:00, 3.05it/s] 2it [00:00, 3.76it/s] 3it [00:00, 4.14it/s] 4it [00:00, 4.34it/s] 5it [00:01, 4.33it/s] 6it [00:01, 4.42it/s] 7it [00:01, 4.20it/s] 8it [00:01, 4.23it/s] 9it [00:02, 4.25it/s] 10it [00:02, 4.24it/s] 11it [00:02, 4.28it/s] 12it [00:02, 4.41it/s] 13it [00:03, 4.37it/s] 14it [00:03, 4.48it/s] 15it [00:03, 4.52it/s] 16it [00:03, 4.47it/s] 17it [00:03, 4.44it/s] 18it [00:04, 4.52it/s] 19it [00:04, 4.56it/s] 20it [00:04, 4.48it/s] 21it [00:04, 4.41it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.42it/s] 24it [00:05, 4.50it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.41it/s] 27it [00:06, 4.36it/s] 28it [00:06, 4.46it/s] 29it [00:06, 4.54it/s] 30it [00:06, 4.55it/s] 31it [00:07, 4.46it/s] 32it [00:07, 4.39it/s] 33it [00:07, 4.36it/s] 34it [00:07, 4.45it/s] 35it [00:07, 4.53it/s] 36it [00:08, 4.45it/s] 37it [00:08, 4.52it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.46it/s] 40it [00:09, 4.53it/s] 41it [00:09, 4.43it/s] 42it [00:09, 4.51it/s] 43it [00:09, 4.52it/s] 44it [00:09, 4.56it/s] 45it [00:10, 4.47it/s] 46it [00:10, 4.40it/s] 47it [00:10, 4.45it/s] 48it [00:10, 4.52it/s] 49it [00:11, 4.54it/s] 50it [00:11, 4.46it/s]2025-05-25 22:03:41,826 - INFO - [Epoch 047 | Batch 0050] IWAE-loss 1597.2115 | mean log_px -0.0160 | KL -1236.86 + 51it [00:11, 4.37it/s] 52it [00:11, 4.34it/s] 53it [00:12, 4.35it/s] 54it [00:12, 4.34it/s] 55it [00:12, 4.32it/s] 56it [00:12, 4.43it/s] 57it [00:12, 4.41it/s] 58it [00:13, 4.28it/s] 59it [00:13, 4.27it/s] 60it [00:13, 4.30it/s] 61it [00:13, 4.28it/s] 62it [00:14, 4.27it/s] 63it [00:14, 4.27it/s] 64it [00:14, 4.38it/s] 65it [00:14, 4.48it/s] 66it [00:15, 4.52it/s] 67it [00:15, 4.42it/s] 68it [00:15, 4.22it/s] 69it [00:15, 4.35it/s] 70it [00:15, 4.45it/s] 71it [00:16, 4.42it/s] 72it [00:16, 4.49it/s] 73it [00:16, 4.50it/s] 74it [00:16, 4.57it/s] 75it [00:17, 4.54it/s] 76it [00:17, 4.50it/s] 77it [00:17, 4.29it/s] 78it [00:17, 4.31it/s] 79it [00:17, 4.32it/s] 80it [00:18, 4.42it/s] 81it [00:18, 4.36it/s] 82it [00:18, 4.32it/s] 83it [00:18, 4.28it/s] 84it [00:19, 4.26it/s] 85it [00:19, 4.29it/s] 86it [00:19, 4.30it/s] 87it [00:19, 4.41it/s] 88it [00:20, 4.49it/s] 89it [00:20, 4.40it/s] 90it [00:20, 4.25it/s] 91it [00:20, 4.27it/s] 92it [00:20, 4.39it/s] 93it [00:21, 4.35it/s] 94it [00:21, 4.35it/s] 95it [00:21, 4.32it/s] 96it [00:21, 4.29it/s] 97it [00:22, 4.32it/s] 98it [00:22, 4.39it/s] 99it [00:22, 4.40it/s] 100it [00:22, 4.36it/s]2025-05-25 22:03:53,328 - INFO - [Epoch 047 | Batch 0100] IWAE-loss 2198.4983 | mean log_px -0.0194 | KL -1234.72 + 101it [00:23, 4.15it/s] 102it [00:23, 4.18it/s] 103it [00:23, 4.19it/s] 104it [00:23, 4.26it/s] 105it [00:23, 4.40it/s] 106it [00:24, 4.48it/s] 107it [00:24, 4.51it/s] 108it [00:24, 4.48it/s] 109it [00:24, 4.42it/s] 110it [00:25, 4.40it/s] 111it [00:25, 4.50it/s] 112it [00:25, 4.28it/s] 113it [00:25, 4.31it/s] 114it [00:26, 4.33it/s] 115it [00:26, 4.45it/s] 116it [00:26, 4.40it/s] 117it [00:26, 4.26it/s] 118it [00:26, 4.41it/s] 119it [00:27, 4.34it/s] 120it [00:27, 4.37it/s] 121it [00:27, 4.34it/s] 122it [00:27, 4.32it/s] 123it [00:28, 4.30it/s] 124it [00:28, 4.41it/s] 125it [00:28, 4.35it/s] 126it [00:28, 4.36it/s] 127it [00:29, 4.33it/s] 128it [00:29, 4.44it/s] 129it [00:29, 4.50it/s] 130it [00:29, 4.56it/s] 131it [00:29, 4.44it/s] 132it [00:30, 4.31it/s] 133it [00:30, 4.32it/s] 134it [00:30, 4.29it/s] 135it [00:30, 4.31it/s] 136it [00:31, 4.42it/s] 137it [00:31, 4.45it/s] 138it [00:31, 4.41it/s] 139it [00:31, 4.43it/s] 140it [00:31, 4.30it/s] 141it [00:32, 4.30it/s] 142it [00:32, 4.39it/s] 143it [00:32, 4.45it/s] 144it [00:32, 4.49it/s] 145it [00:33, 4.49it/s] 146it [00:33, 4.42it/s] 147it [00:33, 4.37it/s] 148it [00:33, 4.46it/s] 149it [00:33, 4.39it/s] 150it [00:34, 4.27it/s]2025-05-25 22:04:04,767 - INFO - [Epoch 047 | Batch 0150] IWAE-loss 1541.9181 | mean log_px -0.0085 | KL -1228.83 + 151it [00:34, 4.27it/s] 152it [00:34, 4.28it/s] 153it [00:34, 4.26it/s] 154it [00:35, 4.31it/s] 155it [00:35, 4.37it/s] 156it [00:35, 4.45it/s] 157it [00:35, 4.42it/s] 158it [00:36, 4.51it/s] 159it [00:36, 4.49it/s] 160it [00:36, 4.40it/s] 161it [00:36, 4.42it/s] 162it [00:36, 4.39it/s] 163it [00:37, 4.34it/s] 164it [00:37, 4.44it/s] 165it [00:37, 4.31it/s] 166it [00:37, 4.30it/s] 167it [00:38, 4.31it/s] 168it [00:38, 4.27it/s] 169it [00:38, 4.34it/s] 170it [00:38, 4.43it/s] 171it [00:39, 4.46it/s] 172it [00:39, 4.40it/s] 173it [00:39, 4.40it/s] 174it [00:39, 4.48it/s] 175it [00:39, 4.39it/s] 176it [00:40, 4.49it/s] 177it [00:40, 4.57it/s] 178it [00:40, 4.46it/s] 179it [00:40, 4.49it/s] 180it [00:41, 4.55it/s] 181it [00:41, 4.50it/s] 182it [00:41, 4.55it/s] 183it [00:41, 4.47it/s] 184it [00:41, 4.47it/s] 185it [00:42, 4.39it/s] 186it [00:42, 4.47it/s] 187it [00:42, 4.53it/s] 188it [00:42, 4.58it/s] 189it [00:43, 4.52it/s] 190it [00:43, 4.59it/s] 191it [00:43, 4.60it/s] 192it [00:43, 4.63it/s] 193it [00:43, 4.60it/s] 194it [00:44, 4.52it/s] 195it [00:44, 4.33it/s] 196it [00:44, 4.44it/s] 196it [00:44, 4.39it/s] +2025-05-25 22:04:15,010 - INFO - Epoch: 47, Objective: tensor([1696.6771], device='cuda:0', grad_fn=), Loss: 0.011943808756768703, KL/n: 25.065183639526367 + 0it [00:00, ?it/s]2025-05-25 22:04:15,420 - INFO - [Epoch 048 | Batch 0000] IWAE-loss 2080.8501 | mean log_px -0.0122 | KL -1227.69 + 1it [00:00, 2.74it/s] 2it [00:00, 3.46it/s] 3it [00:00, 3.81it/s] 4it [00:01, 4.11it/s] 5it [00:01, 4.31it/s] 6it [00:01, 4.37it/s] 7it [00:01, 4.36it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.52it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.56it/s] 12it [00:02, 4.61it/s] 13it [00:03, 4.47it/s] 14it [00:03, 4.44it/s] 15it [00:03, 4.46it/s] 16it [00:03, 4.52it/s] 17it [00:03, 4.54it/s] 18it [00:04, 4.57it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.47it/s] 21it [00:04, 4.30it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.30it/s] 24it [00:05, 4.26it/s] 25it [00:05, 3.45it/s] 26it [00:06, 3.58it/s] 27it [00:06, 3.77it/s] 28it [00:06, 3.94it/s] 29it [00:06, 4.14it/s] 30it [00:07, 4.17it/s] 31it [00:07, 4.27it/s] 32it [00:07, 4.38it/s] 33it [00:07, 4.48it/s] 34it [00:07, 4.40it/s] 35it [00:08, 4.38it/s] 36it [00:08, 4.47it/s] 37it [00:08, 4.41it/s] 38it [00:08, 4.36it/s] 39it [00:09, 4.44it/s] 40it [00:09, 4.40it/s] 41it [00:09, 4.48it/s] 42it [00:09, 4.54it/s] 43it [00:10, 4.42it/s] 44it [00:10, 4.39it/s] 45it [00:10, 4.44it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.42it/s] 48it [00:11, 4.36it/s] 49it [00:11, 4.21it/s] 50it [00:11, 4.33it/s]2025-05-25 22:04:26,934 - INFO - [Epoch 048 | Batch 0050] IWAE-loss 1285.0804 | mean log_px -0.0012 | KL -1222.04 + 51it [00:11, 4.40it/s] 52it [00:12, 4.45it/s] 53it [00:12, 4.37it/s] 54it [00:12, 4.43it/s] 55it [00:12, 4.45it/s] 56it [00:12, 4.50it/s] 57it [00:13, 4.39it/s] 58it [00:13, 4.35it/s] 59it [00:13, 4.35it/s] 60it [00:13, 4.37it/s] 61it [00:14, 4.30it/s] 62it [00:14, 4.39it/s] 63it [00:14, 4.37it/s] 64it [00:14, 4.44it/s] 65it [00:15, 4.37it/s] 66it [00:15, 4.43it/s] 67it [00:15, 4.34it/s] 68it [00:15, 4.29it/s] 69it [00:15, 4.37it/s] 70it [00:16, 4.43it/s] 71it [00:16, 4.36it/s] 72it [00:16, 4.42it/s] 73it [00:16, 4.35it/s] 74it [00:17, 4.29it/s] 75it [00:17, 4.24it/s] 76it [00:17, 4.28it/s] 77it [00:17, 4.30it/s] 78it [00:18, 4.30it/s] 79it [00:18, 4.30it/s] 80it [00:18, 4.21it/s] 81it [00:18, 4.31it/s] 82it [00:18, 4.38it/s] 83it [00:19, 4.43it/s] 84it [00:19, 4.49it/s] 85it [00:19, 4.44it/s] 86it [00:19, 4.37it/s] 87it [00:20, 4.43it/s] 88it [00:20, 4.39it/s] 89it [00:20, 4.46it/s] 90it [00:20, 4.52it/s] 91it [00:20, 4.54it/s] 92it [00:21, 4.53it/s] 93it [00:21, 4.42it/s] 94it [00:21, 4.35it/s] 95it [00:21, 4.31it/s] 96it [00:22, 4.25it/s] 97it [00:22, 4.36it/s] 98it [00:22, 4.43it/s] 99it [00:22, 4.36it/s] 100it [00:23, 4.30it/s]2025-05-25 22:04:38,377 - INFO - [Epoch 048 | Batch 0100] IWAE-loss 1300.4762 | mean log_px -0.0050 | KL -1212.15 + 101it [00:23, 4.28it/s] 102it [00:23, 4.35it/s] 103it [00:23, 4.31it/s] 104it [00:23, 4.28it/s] 105it [00:24, 4.29it/s] 106it [00:24, 4.28it/s] 107it [00:24, 4.34it/s] 108it [00:24, 4.42it/s] 109it [00:25, 4.43it/s] 110it [00:25, 4.30it/s] 111it [00:25, 4.32it/s] 112it [00:25, 4.24it/s] 113it [00:26, 4.25it/s] 114it [00:26, 4.28it/s] 115it [00:26, 4.37it/s] 116it [00:26, 4.43it/s] 117it [00:26, 4.36it/s] 118it [00:27, 4.39it/s] 119it [00:27, 4.32it/s] 120it [00:27, 4.29it/s] 121it [00:27, 4.26it/s] 122it [00:28, 4.27it/s] 123it [00:28, 4.27it/s] 124it [00:28, 4.37it/s] 125it [00:28, 4.31it/s] 126it [00:29, 4.31it/s] 127it [00:29, 4.41it/s] 128it [00:29, 4.45it/s] 129it [00:29, 4.50it/s] 130it [00:29, 4.54it/s] 131it [00:30, 4.48it/s] 132it [00:30, 4.39it/s] 133it [00:30, 4.47it/s] 134it [00:30, 4.44it/s] 135it [00:31, 4.40it/s] 136it [00:31, 4.31it/s] 137it [00:31, 4.31it/s] 138it [00:31, 4.26it/s] 139it [00:32, 4.36it/s] 140it [00:32, 4.42it/s] 141it [00:32, 4.40it/s] 142it [00:32, 4.46it/s] 143it [00:32, 4.43it/s] 144it [00:33, 4.49it/s] 145it [00:33, 4.46it/s] 146it [00:33, 4.39it/s] 147it [00:33, 4.29it/s] 148it [00:34, 4.26it/s] 149it [00:34, 4.25it/s] 150it [00:34, 4.22it/s]2025-05-25 22:04:49,874 - INFO - [Epoch 048 | Batch 0150] IWAE-loss 1771.9763 | mean log_px -0.0080 | KL -1212.38 + 151it [00:34, 4.25it/s] 152it [00:35, 4.25it/s] 153it [00:35, 4.38it/s] 154it [00:35, 4.28it/s] 155it [00:35, 4.28it/s] 156it [00:35, 4.29it/s] 157it [00:36, 4.39it/s] 158it [00:36, 4.36it/s] 159it [00:36, 4.34it/s] 160it [00:36, 4.25it/s] 161it [00:37, 4.26it/s] 162it [00:37, 4.34it/s] 163it [00:37, 4.36it/s] 164it [00:37, 4.41it/s] 165it [00:38, 4.43it/s] 166it [00:38, 4.45it/s] 167it [00:38, 4.38it/s] 168it [00:38, 4.40it/s] 169it [00:38, 4.36it/s] 170it [00:39, 4.33it/s] 171it [00:39, 4.19it/s] 172it [00:39, 4.30it/s] 173it [00:39, 4.31it/s] 174it [00:40, 4.28it/s] 175it [00:40, 4.39it/s] 176it [00:40, 4.45it/s] 177it [00:40, 4.50it/s] 178it [00:40, 4.55it/s] 179it [00:41, 4.44it/s] 180it [00:41, 4.50it/s] 181it [00:41, 4.56it/s] 182it [00:41, 4.46it/s] 183it [00:42, 4.43it/s] 184it [00:42, 4.32it/s] 185it [00:42, 4.23it/s] 186it [00:42, 4.23it/s] 187it [00:43, 4.28it/s] 188it [00:43, 4.35it/s] 189it [00:43, 4.32it/s] 190it [00:43, 4.28it/s] 191it [00:43, 4.27it/s] 192it [00:44, 4.34it/s] 193it [00:44, 4.30it/s] 194it [00:44, 4.36it/s] 195it [00:44, 4.32it/s] 196it [00:45, 4.41it/s] 196it [00:45, 4.34it/s] +2025-05-25 22:05:00,328 - INFO - Epoch: 48, Objective: tensor([1534.0585], device='cuda:0', grad_fn=), Loss: 0.016182228922843933, KL/n: 24.804851531982422 + 0it [00:00, ?it/s]2025-05-25 22:05:00,720 - INFO - [Epoch 049 | Batch 0000] IWAE-loss 1611.0990 | mean log_px -0.0056 | KL -1216.53 + 1it [00:00, 2.87it/s] 2it [00:00, 3.52it/s] 3it [00:00, 3.81it/s] 4it [00:01, 3.90it/s] 5it [00:01, 4.01it/s] 6it [00:01, 4.04it/s] 7it [00:01, 4.13it/s] 8it [00:02, 4.15it/s] 9it [00:02, 4.19it/s] 10it [00:02, 4.16it/s] 11it [00:02, 4.29it/s] 12it [00:02, 4.32it/s] 13it [00:03, 4.40it/s] 14it [00:03, 4.31it/s] 15it [00:03, 4.36it/s] 16it [00:03, 4.28it/s] 17it [00:04, 4.28it/s] 18it [00:04, 4.30it/s] 19it [00:04, 4.26it/s] 20it [00:04, 4.08it/s] 21it [00:05, 4.13it/s] 22it [00:05, 4.10it/s] 23it [00:05, 4.15it/s] 24it [00:05, 4.11it/s] 25it [00:06, 4.16it/s] 26it [00:06, 4.18it/s] 27it [00:06, 4.30it/s] 28it [00:06, 4.35it/s] 29it [00:06, 4.33it/s] 30it [00:07, 4.25it/s] 31it [00:07, 4.27it/s] 32it [00:07, 4.33it/s] 33it [00:07, 4.28it/s] 34it [00:08, 4.29it/s] 35it [00:08, 4.37it/s] 36it [00:08, 4.32it/s] 37it [00:08, 4.29it/s] 38it [00:09, 4.26it/s] 39it [00:09, 4.23it/s] 40it [00:09, 4.21it/s] 41it [00:09, 4.32it/s] 42it [00:09, 4.41it/s] 43it [00:10, 4.46it/s] 44it [00:10, 4.36it/s] 45it [00:10, 4.31it/s] 46it [00:10, 4.26it/s] 47it [00:11, 4.37it/s] 48it [00:11, 4.42it/s] 49it [00:11, 4.36it/s] 50it [00:11, 4.39it/s]2025-05-25 22:05:12,425 - INFO - [Epoch 049 | Batch 0050] IWAE-loss 1382.5945 | mean log_px -0.0030 | KL -1212.96 + 51it [00:12, 4.47it/s] 52it [00:12, 4.24it/s] 53it [00:12, 4.27it/s] 54it [00:12, 4.29it/s] 55it [00:12, 4.39it/s] 56it [00:13, 4.40it/s] 57it [00:13, 4.44it/s] 58it [00:13, 4.36it/s] 59it [00:13, 4.43it/s] 60it [00:14, 4.34it/s] 61it [00:14, 4.29it/s] 62it [00:14, 4.25it/s] 63it [00:14, 4.25it/s] 64it [00:15, 4.23it/s] 65it [00:15, 4.15it/s] 66it [00:15, 4.28it/s] 67it [00:15, 4.38it/s] 68it [00:15, 4.28it/s] 69it [00:16, 4.29it/s] 70it [00:16, 4.24it/s] 71it [00:16, 4.35it/s] 72it [00:16, 4.40it/s] 73it [00:17, 4.47it/s] 74it [00:17, 4.35it/s] 75it [00:17, 4.43it/s] 76it [00:17, 4.44it/s] 77it [00:18, 4.31it/s] 78it [00:18, 4.27it/s] 79it [00:18, 4.25it/s] 80it [00:18, 4.23it/s] 81it [00:18, 4.29it/s] 82it [00:19, 4.40it/s] 83it [00:19, 4.42it/s] 84it [00:19, 4.49it/s] 85it [00:19, 4.39it/s] 86it [00:20, 4.48it/s] 87it [00:20, 4.53it/s] 88it [00:20, 4.48it/s] 89it [00:20, 4.44it/s] 90it [00:21, 4.36it/s] 91it [00:21, 4.46it/s] 92it [00:21, 4.51it/s] 93it [00:21, 4.48it/s] 94it [00:21, 4.36it/s] 95it [00:22, 4.42it/s] 96it [00:22, 4.45it/s] 97it [00:22, 4.52it/s] 98it [00:22, 4.55it/s] 99it [00:22, 4.59it/s] 100it [00:23, 4.62it/s]2025-05-25 22:05:23,819 - INFO - [Epoch 049 | Batch 0100] IWAE-loss 1519.3214 | mean log_px -0.0086 | KL -1206.96 + 101it [00:23, 4.64it/s] 102it [00:23, 4.64it/s] 103it [00:23, 4.37it/s] 104it [00:24, 4.31it/s] 105it [00:24, 4.30it/s] 106it [00:24, 4.25it/s] 107it [00:24, 4.29it/s] 108it [00:25, 4.26it/s] 109it [00:25, 4.34it/s] 110it [00:25, 4.42it/s] 111it [00:25, 4.22it/s] 112it [00:26, 4.22it/s] 113it [00:26, 4.24it/s] 114it [00:26, 4.33it/s] 115it [00:26, 4.42it/s] 116it [00:26, 4.36it/s] 117it [00:27, 4.28it/s] 118it [00:27, 4.32it/s] 119it [00:27, 4.31it/s] 120it [00:27, 4.28it/s] 121it [00:28, 4.28it/s] 122it [00:28, 4.38it/s] 123it [00:28, 4.48it/s] 124it [00:28, 4.38it/s] 125it [00:28, 4.43it/s] 126it [00:29, 4.46it/s] 127it [00:29, 4.51it/s] 128it [00:29, 4.41it/s] 129it [00:29, 4.34it/s] 130it [00:30, 4.39it/s] 131it [00:30, 4.34it/s] 132it [00:30, 4.34it/s] 133it [00:30, 4.43it/s] 134it [00:31, 4.48it/s] 135it [00:31, 4.55it/s] 136it [00:31, 4.56it/s] 137it [00:31, 4.58it/s] 138it [00:31, 4.32it/s] 139it [00:32, 4.31it/s] 140it [00:32, 4.26it/s] 141it [00:32, 4.30it/s] 142it [00:32, 4.26it/s] 143it [00:33, 4.29it/s] 144it [00:33, 4.27it/s] 145it [00:33, 4.27it/s] 146it [00:33, 4.28it/s] 147it [00:34, 4.28it/s] 148it [00:34, 4.12it/s] 149it [00:34, 4.16it/s] 150it [00:34, 4.28it/s]2025-05-25 22:05:35,374 - INFO - [Epoch 049 | Batch 0150] IWAE-loss 1296.9624 | mean log_px -0.0015 | KL -1203.38 + 151it [00:34, 4.30it/s] 152it [00:35, 4.42it/s] 153it [00:35, 4.48it/s] 154it [00:35, 4.51it/s] 155it [00:35, 4.32it/s] 156it [00:36, 4.15it/s] 157it [00:36, 4.16it/s] 158it [00:36, 4.20it/s] 159it [00:36, 4.34it/s] 160it [00:37, 4.43it/s] 161it [00:37, 4.35it/s] 162it [00:37, 4.34it/s] 163it [00:37, 4.32it/s] 164it [00:37, 4.40it/s] 165it [00:38, 4.34it/s] 166it [00:38, 4.42it/s] 167it [00:38, 4.39it/s] 168it [00:38, 4.36it/s] 169it [00:39, 4.46it/s] 170it [00:39, 4.50it/s] 171it [00:39, 4.42it/s] 172it [00:39, 4.22it/s] 173it [00:40, 4.24it/s] 174it [00:40, 4.34it/s] 175it [00:40, 4.30it/s] 176it [00:40, 4.32it/s] 177it [00:40, 4.32it/s] 178it [00:41, 4.14it/s] 179it [00:41, 4.20it/s] 180it [00:41, 4.18it/s] 181it [00:41, 4.32it/s] 182it [00:42, 4.41it/s] 183it [00:42, 4.40it/s] 184it [00:42, 4.47it/s] 185it [00:42, 4.51it/s] 186it [00:42, 4.53it/s] 187it [00:43, 4.30it/s] 188it [00:43, 4.35it/s] 189it [00:43, 4.32it/s] 190it [00:43, 4.40it/s] 191it [00:44, 4.49it/s] 192it [00:44, 4.55it/s] 193it [00:44, 4.46it/s] 194it [00:44, 4.41it/s] 195it [00:45, 4.15it/s] 196it [00:45, 4.19it/s] 196it [00:45, 4.32it/s] +2025-05-25 22:05:45,865 - INFO - Epoch: 49, Objective: tensor([1426.3483], device='cuda:0', grad_fn=), Loss: 0.002869151998311281, KL/n: 24.51639175415039 + 0it [00:00, ?it/s]2025-05-25 22:05:46,436 - INFO - [Epoch 050 | Batch 0000] IWAE-loss 1417.0724 | mean log_px -0.0090 | KL -1203.12 + 1it [00:00, 3.09it/s] 2it [00:00, 3.71it/s] 3it [00:00, 4.11it/s] 4it [00:00, 4.23it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.25it/s] 7it [00:01, 4.29it/s] 8it [00:01, 4.29it/s] 9it [00:02, 4.30it/s] 10it [00:02, 4.28it/s] 11it [00:02, 4.30it/s] 12it [00:02, 4.30it/s] 13it [00:03, 4.42it/s] 14it [00:03, 4.50it/s] 15it [00:03, 4.32it/s] 16it [00:03, 4.44it/s] 17it [00:03, 4.38it/s] 18it [00:04, 4.37it/s] 19it [00:04, 4.34it/s] 20it [00:04, 4.31it/s] 21it [00:04, 4.42it/s] 22it [00:05, 4.43it/s] 23it [00:05, 4.40it/s] 24it [00:05, 4.47it/s] 25it [00:05, 4.29it/s] 26it [00:06, 4.29it/s] 27it [00:06, 4.30it/s] 28it [00:06, 4.30it/s] 29it [00:06, 4.35it/s] 30it [00:06, 4.44it/s] 31it [00:07, 4.50it/s] 32it [00:07, 4.41it/s] 33it [00:07, 4.40it/s] 34it [00:07, 4.49it/s] 35it [00:08, 4.33it/s] 36it [00:08, 4.42it/s] 37it [00:08, 4.43it/s] 38it [00:08, 4.46it/s] 39it [00:08, 4.54it/s] 40it [00:09, 4.55it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.48it/s] 43it [00:09, 4.56it/s] 44it [00:10, 4.42it/s] 45it [00:10, 4.37it/s] 46it [00:10, 4.32it/s] 47it [00:10, 4.35it/s] 48it [00:10, 4.45it/s] 49it [00:11, 4.40it/s] 50it [00:11, 4.21it/s]2025-05-25 22:05:57,829 - INFO - [Epoch 050 | Batch 0050] IWAE-loss 1422.3885 | mean log_px -0.0056 | KL -1198.54 + 51it [00:11, 4.28it/s] 52it [00:11, 4.25it/s] 53it [00:12, 4.25it/s] 54it [00:12, 4.23it/s] 55it [00:12, 4.25it/s] 56it [00:12, 4.38it/s] 57it [00:13, 4.34it/s] 58it [00:13, 4.41it/s] 59it [00:13, 4.46it/s] 60it [00:13, 4.49it/s] 61it [00:13, 4.44it/s] 62it [00:14, 4.32it/s] 63it [00:14, 4.38it/s] 64it [00:14, 4.44it/s] 65it [00:14, 4.35it/s] 66it [00:15, 4.32it/s] 67it [00:15, 4.37it/s] 68it [00:15, 4.47it/s] 69it [00:15, 4.44it/s] 70it [00:16, 4.26it/s] 71it [00:16, 4.27it/s] 72it [00:16, 4.35it/s] 73it [00:16, 4.43it/s] 74it [00:16, 4.40it/s] 75it [00:17, 4.38it/s] 76it [00:17, 4.16it/s] 77it [00:17, 4.22it/s] 78it [00:17, 4.32it/s] 79it [00:18, 4.34it/s] 80it [00:18, 4.44it/s] 81it [00:18, 4.48it/s] 82it [00:18, 4.39it/s] 83it [00:19, 4.48it/s] 84it [00:19, 4.53it/s] 85it [00:19, 4.30it/s] 86it [00:19, 4.35it/s] 87it [00:19, 4.43it/s] 88it [00:20, 4.39it/s] 89it [00:20, 4.48it/s] 90it [00:20, 4.54it/s] 91it [00:20, 4.58it/s] 92it [00:21, 4.61it/s] 93it [00:21, 4.50it/s] 94it [00:21, 4.29it/s] 95it [00:21, 4.25it/s] 96it [00:21, 4.39it/s] 97it [00:22, 4.34it/s] 98it [00:22, 4.32it/s] 99it [00:22, 4.42it/s] 100it [00:22, 4.49it/s]2025-05-25 22:06:09,207 - INFO - [Epoch 050 | Batch 0100] IWAE-loss 1353.2869 | mean log_px -0.0037 | KL -1194.16 + 101it [00:23, 4.55it/s] 102it [00:23, 4.53it/s] 103it [00:23, 4.44it/s] 104it [00:23, 4.52it/s] 105it [00:23, 4.53it/s] 106it [00:24, 4.43it/s] 107it [00:24, 4.37it/s] 108it [00:24, 4.46it/s] 109it [00:24, 4.49it/s] 110it [00:25, 4.44it/s] 111it [00:25, 4.45it/s] 112it [00:25, 4.33it/s] 113it [00:25, 4.42it/s] 114it [00:26, 4.46it/s] 115it [00:26, 4.50it/s] 116it [00:26, 4.55it/s] 117it [00:26, 4.60it/s] 118it [00:26, 4.57it/s] 119it [00:27, 4.62it/s] 120it [00:27, 4.63it/s] 121it [00:27, 4.45it/s] 122it [00:27, 4.38it/s] 123it [00:28, 4.47it/s] 124it [00:28, 4.47it/s] 125it [00:28, 4.44it/s] 126it [00:28, 4.48it/s] 127it [00:28, 4.53it/s] 128it [00:29, 4.58it/s] 129it [00:29, 4.43it/s] 130it [00:29, 4.39it/s] 131it [00:29, 4.35it/s] 132it [00:30, 4.41it/s] 133it [00:30, 4.50it/s] 134it [00:30, 4.52it/s] 135it [00:30, 4.46it/s] 136it [00:30, 4.37it/s] 137it [00:31, 4.35it/s] 138it [00:31, 4.33it/s] 139it [00:31, 4.30it/s] 140it [00:31, 4.31it/s] 141it [00:32, 4.27it/s] 142it [00:32, 4.38it/s] 143it [00:32, 4.34it/s] 144it [00:32, 4.33it/s] 145it [00:33, 4.42it/s] 146it [00:33, 4.35it/s] 147it [00:33, 4.20it/s] 148it [00:33, 4.23it/s] 149it [00:33, 4.23it/s] 150it [00:34, 4.25it/s]2025-05-25 22:06:20,549 - INFO - [Epoch 050 | Batch 0150] IWAE-loss 1559.9613 | mean log_px -0.0173 | KL -1188.04 + 151it [00:34, 4.27it/s] 152it [00:34, 4.15it/s] 153it [00:34, 4.24it/s] 154it [00:35, 4.30it/s] 155it [00:35, 4.38it/s] 156it [00:35, 4.46it/s] 157it [00:35, 4.41it/s] 158it [00:36, 4.40it/s] 159it [00:36, 4.30it/s] 160it [00:36, 4.28it/s] 161it [00:36, 4.27it/s] 162it [00:36, 4.30it/s] 163it [00:37, 4.27it/s] 164it [00:37, 4.15it/s] 165it [00:37, 4.18it/s] 166it [00:37, 4.19it/s] 167it [00:38, 4.33it/s] 168it [00:38, 4.32it/s] 169it [00:38, 4.39it/s] 170it [00:38, 4.46it/s] 171it [00:39, 4.54it/s] 172it [00:39, 4.59it/s] 173it [00:39, 4.39it/s] 174it [00:39, 4.40it/s] 175it [00:39, 4.46it/s] 176it [00:40, 4.47it/s] 177it [00:40, 4.41it/s] 178it [00:40, 4.35it/s] 179it [00:40, 4.32it/s] 180it [00:41, 4.29it/s] 181it [00:41, 4.33it/s] 182it [00:41, 4.26it/s] 183it [00:41, 4.24it/s] 184it [00:42, 4.33it/s] 185it [00:42, 4.37it/s] 186it [00:42, 4.44it/s] 187it [00:42, 4.41it/s] 188it [00:42, 4.35it/s] 189it [00:43, 4.43it/s] 190it [00:43, 4.46it/s] 191it [00:43, 4.51it/s] 192it [00:43, 4.55it/s] 193it [00:44, 4.58it/s] 194it [00:44, 4.43it/s] 195it [00:44, 4.36it/s] 196it [00:44, 4.30it/s] 196it [00:44, 4.37it/s] +2025-05-25 22:06:31,000 - INFO - Epoch: 50, Objective: tensor([1407.9646], device='cuda:0', grad_fn=), Loss: 0.00830838456749916, KL/n: 24.236207962036133 + 0it [00:00, ?it/s]2025-05-25 22:06:31,380 - INFO - [Epoch 051 | Batch 0000] IWAE-loss 1334.0294 | mean log_px -0.0045 | KL -1185.92 + 1it [00:00, 2.98it/s] 2it [00:00, 3.75it/s] 3it [00:00, 4.09it/s] 4it [00:00, 4.28it/s] 5it [00:01, 4.23it/s] 6it [00:01, 4.25it/s] 7it [00:01, 4.28it/s] 8it [00:01, 4.22it/s] 9it [00:02, 3.43it/s] 10it [00:02, 3.64it/s] 11it [00:02, 3.83it/s] 12it [00:03, 4.03it/s] 13it [00:03, 4.19it/s] 14it [00:03, 4.25it/s] 15it [00:03, 4.26it/s] 16it [00:03, 4.22it/s] 17it [00:04, 4.25it/s] 18it [00:04, 4.21it/s] 19it [00:04, 4.28it/s] 20it [00:04, 4.23it/s] 21it [00:05, 4.26it/s] 22it [00:05, 4.24it/s] 23it [00:05, 4.34it/s] 24it [00:05, 4.28it/s] 25it [00:06, 4.36it/s] 26it [00:06, 4.30it/s] 27it [00:06, 4.27it/s] 28it [00:06, 4.25it/s] 29it [00:06, 4.28it/s] 30it [00:07, 4.24it/s] 31it [00:07, 4.36it/s] 32it [00:07, 4.18it/s] 33it [00:07, 4.32it/s] 34it [00:08, 4.29it/s] 35it [00:08, 4.33it/s] 36it [00:08, 4.24it/s] 37it [00:08, 4.25it/s] 38it [00:09, 4.27it/s] 39it [00:09, 4.21it/s] 40it [00:09, 4.05it/s] 41it [00:09, 4.11it/s] 42it [00:10, 4.21it/s] 43it [00:10, 4.26it/s] 44it [00:10, 4.36it/s] 45it [00:10, 4.25it/s] 46it [00:10, 4.35it/s] 47it [00:11, 4.28it/s] 48it [00:11, 4.34it/s] 49it [00:11, 4.42it/s] 50it [00:11, 4.34it/s]2025-05-25 22:06:43,194 - INFO - [Epoch 051 | Batch 0050] IWAE-loss 1236.7412 | mean log_px -0.0013 | KL -1183.91 + 51it [00:12, 4.41it/s] 52it [00:12, 4.45it/s] 53it [00:12, 4.35it/s] 54it [00:12, 4.33it/s] 55it [00:13, 4.28it/s] 56it [00:13, 4.34it/s] 57it [00:13, 4.32it/s] 58it [00:13, 4.24it/s] 59it [00:13, 4.23it/s] 60it [00:14, 4.36it/s] 61it [00:14, 4.16it/s] 62it [00:14, 4.19it/s] 63it [00:14, 4.29it/s] 64it [00:15, 4.23it/s] 65it [00:15, 4.23it/s] 66it [00:15, 4.22it/s] 67it [00:15, 4.10it/s] 68it [00:16, 4.23it/s] 69it [00:16, 4.28it/s] 70it [00:16, 4.33it/s] 71it [00:16, 4.38it/s] 72it [00:17, 4.43it/s] 73it [00:17, 4.45it/s] 74it [00:17, 4.36it/s] 75it [00:17, 4.44it/s] 76it [00:17, 4.29it/s] 77it [00:18, 4.32it/s] 78it [00:18, 4.24it/s] 79it [00:18, 4.24it/s] 80it [00:18, 4.22it/s] 81it [00:19, 4.24it/s] 82it [00:19, 4.20it/s] 83it [00:19, 4.21it/s] 84it [00:19, 4.24it/s] 85it [00:20, 4.35it/s] 86it [00:20, 4.25it/s] 87it [00:20, 4.36it/s] 88it [00:20, 4.35it/s] 89it [00:20, 4.30it/s] 90it [00:21, 4.23it/s] 91it [00:21, 4.26it/s] 92it [00:21, 4.26it/s] 93it [00:21, 4.12it/s] 94it [00:22, 4.24it/s] 95it [00:22, 4.21it/s] 96it [00:22, 4.30it/s] 97it [00:22, 4.38it/s] 98it [00:23, 4.44it/s] 99it [00:23, 4.33it/s] 100it [00:23, 4.17it/s]2025-05-25 22:06:54,900 - INFO - [Epoch 051 | Batch 0100] IWAE-loss 1498.0203 | mean log_px -0.0071 | KL -1184.13 + 101it [00:23, 4.17it/s] 102it [00:24, 4.27it/s] 103it [00:24, 4.31it/s] 104it [00:24, 4.34it/s] 105it [00:24, 4.30it/s] 106it [00:24, 4.35it/s] 107it [00:25, 4.19it/s] 108it [00:25, 4.23it/s] 109it [00:25, 4.31it/s] 110it [00:25, 4.38it/s] 111it [00:26, 4.45it/s] 112it [00:26, 4.39it/s] 113it [00:26, 4.44it/s] 114it [00:26, 4.47it/s] 115it [00:27, 4.26it/s] 116it [00:27, 4.23it/s] 117it [00:27, 4.32it/s] 118it [00:27, 4.35it/s] 119it [00:27, 4.39it/s] 120it [00:28, 4.32it/s] 121it [00:28, 4.28it/s] 122it [00:28, 4.36it/s] 123it [00:28, 4.39it/s] 124it [00:29, 4.43it/s] 125it [00:29, 4.27it/s] 126it [00:29, 4.34it/s] 127it [00:29, 4.28it/s] 128it [00:30, 4.22it/s] 129it [00:30, 4.16it/s] 130it [00:30, 4.18it/s] 131it [00:30, 4.26it/s] 132it [00:30, 4.34it/s] 133it [00:31, 4.28it/s] 134it [00:31, 4.38it/s] 135it [00:31, 4.32it/s] 136it [00:31, 4.35it/s] 137it [00:32, 4.43it/s] 138it [00:32, 4.38it/s] 139it [00:32, 4.44it/s] 140it [00:32, 4.34it/s] 141it [00:33, 4.42it/s] 142it [00:33, 4.34it/s] 143it [00:33, 4.32it/s] 144it [00:33, 4.42it/s] 145it [00:33, 4.47it/s] 146it [00:34, 4.35it/s] 147it [00:34, 4.27it/s] 148it [00:34, 4.22it/s] 149it [00:34, 4.29it/s] 150it [00:35, 4.25it/s]2025-05-25 22:07:06,436 - INFO - [Epoch 051 | Batch 0150] IWAE-loss 1679.6946 | mean log_px -0.0117 | KL -1184.98 + 151it [00:35, 4.33it/s] 152it [00:35, 4.26it/s] 153it [00:35, 4.24it/s] 154it [00:36, 4.12it/s] 155it [00:36, 4.25it/s] 156it [00:36, 4.35it/s] 157it [00:36, 4.28it/s] 158it [00:37, 4.27it/s] 159it [00:37, 4.36it/s] 160it [00:37, 4.35it/s] 161it [00:37, 4.33it/s] 162it [00:37, 4.27it/s] 163it [00:38, 4.31it/s] 164it [00:38, 4.26it/s] 165it [00:38, 4.15it/s] 166it [00:38, 4.21it/s] 167it [00:39, 4.32it/s] 168it [00:39, 4.26it/s] 169it [00:39, 4.21it/s] 170it [00:39, 4.28it/s] 171it [00:40, 4.28it/s] 172it [00:40, 4.27it/s] 173it [00:40, 4.17it/s] 174it [00:40, 4.29it/s] 175it [00:40, 4.37it/s] 176it [00:41, 4.40it/s] 177it [00:41, 4.34it/s] 178it [00:41, 4.35it/s] 179it [00:41, 4.41it/s] 180it [00:42, 4.32it/s] 181it [00:42, 4.41it/s] 182it [00:42, 4.47it/s] 183it [00:42, 4.46it/s] 184it [00:43, 4.37it/s] 185it [00:43, 4.34it/s] 186it [00:43, 4.34it/s] 187it [00:43, 4.33it/s] 188it [00:43, 4.37it/s] 189it [00:44, 4.44it/s] 190it [00:44, 4.43it/s] 191it [00:44, 4.42it/s] 192it [00:44, 4.37it/s] 193it [00:45, 4.36it/s] 194it [00:45, 4.30it/s] 195it [00:45, 4.14it/s] 196it [00:45, 4.16it/s] 196it [00:45, 4.27it/s] +2025-05-25 22:07:17,036 - INFO - Epoch: 51, Objective: tensor([1720.4115], device='cuda:0', grad_fn=), Loss: 0.011251946911215782, KL/n: 24.17317771911621 + 0it [00:00, ?it/s]2025-05-25 22:07:17,444 - INFO - [Epoch 052 | Batch 0000] IWAE-loss 1308.6581 | mean log_px -0.0024 | KL -1183.32 + 1it [00:00, 2.75it/s] 2it [00:00, 3.56it/s] 3it [00:00, 3.99it/s] 4it [00:01, 4.04it/s] 5it [00:01, 4.16it/s] 6it [00:01, 4.17it/s] 7it [00:01, 4.21it/s] 8it [00:01, 4.21it/s] 9it [00:02, 4.28it/s] 10it [00:02, 4.37it/s] 11it [00:02, 4.42it/s] 12it [00:02, 4.39it/s] 13it [00:03, 4.38it/s] 14it [00:03, 4.32it/s] 15it [00:03, 4.31it/s] 16it [00:03, 4.32it/s] 17it [00:04, 4.30it/s] 18it [00:04, 4.26it/s] 19it [00:04, 4.24it/s] 20it [00:04, 4.19it/s] 21it [00:04, 4.32it/s] 22it [00:05, 4.27it/s] 23it [00:05, 4.32it/s] 24it [00:05, 4.28it/s] 25it [00:05, 4.28it/s] 26it [00:06, 4.36it/s] 27it [00:06, 4.33it/s] 28it [00:06, 4.27it/s] 29it [00:06, 4.29it/s] 30it [00:07, 4.29it/s] 31it [00:07, 4.26it/s] 32it [00:07, 4.11it/s] 33it [00:07, 4.27it/s] 34it [00:08, 4.26it/s] 35it [00:08, 4.24it/s] 36it [00:08, 4.21it/s] 37it [00:08, 4.25it/s] 38it [00:08, 4.18it/s] 39it [00:09, 4.10it/s] 40it [00:09, 4.11it/s] 41it [00:09, 4.06it/s] 42it [00:09, 4.17it/s] 43it [00:10, 4.29it/s] 44it [00:10, 4.34it/s] 45it [00:10, 4.27it/s] 46it [00:10, 4.26it/s] 47it [00:11, 4.36it/s] 48it [00:11, 4.44it/s] 49it [00:11, 4.49it/s] 50it [00:11, 4.53it/s]2025-05-25 22:07:29,096 - INFO - [Epoch 052 | Batch 0050] IWAE-loss 1253.5378 | mean log_px -0.0022 | KL -1182.44 + 51it [00:11, 4.37it/s] 52it [00:12, 4.35it/s] 53it [00:12, 4.21it/s] 54it [00:12, 4.30it/s] 55it [00:12, 4.35it/s] 56it [00:13, 4.43it/s] 57it [00:13, 4.36it/s] 58it [00:13, 4.31it/s] 59it [00:13, 4.31it/s] 60it [00:14, 4.28it/s] 61it [00:14, 4.27it/s] 62it [00:14, 4.15it/s] 63it [00:14, 4.16it/s] 64it [00:15, 4.18it/s] 65it [00:15, 4.23it/s] 66it [00:15, 4.34it/s] 67it [00:15, 4.28it/s] 68it [00:15, 4.28it/s] 69it [00:16, 4.28it/s] 70it [00:16, 4.29it/s] 71it [00:16, 4.33it/s] 72it [00:16, 4.32it/s] 73it [00:17, 4.28it/s] 74it [00:17, 4.28it/s] 75it [00:17, 4.21it/s] 76it [00:17, 4.21it/s] 77it [00:18, 4.34it/s] 78it [00:18, 4.35it/s] 79it [00:18, 4.33it/s] 80it [00:18, 4.37it/s] 81it [00:18, 4.33it/s] 82it [00:19, 4.28it/s] 83it [00:19, 4.39it/s] 84it [00:19, 4.45it/s] 85it [00:19, 4.47it/s] 86it [00:20, 4.42it/s] 87it [00:20, 4.49it/s] 88it [00:20, 4.39it/s] 89it [00:20, 4.44it/s] 90it [00:21, 4.46it/s] 91it [00:21, 4.51it/s] 92it [00:21, 4.46it/s] 93it [00:21, 4.41it/s] 94it [00:21, 4.49it/s] 95it [00:22, 4.46it/s] 96it [00:22, 4.38it/s] 97it [00:22, 4.38it/s] 98it [00:22, 4.39it/s] 99it [00:23, 4.39it/s] 100it [00:23, 4.36it/s]2025-05-25 22:07:40,627 - INFO - [Epoch 052 | Batch 0100] IWAE-loss 1299.2296 | mean log_px -0.0027 | KL -1181.27 + 101it [00:23, 4.35it/s] 102it [00:23, 4.42it/s] 103it [00:23, 4.48it/s] 104it [00:24, 4.52it/s] 105it [00:24, 4.50it/s] 106it [00:24, 4.30it/s] 107it [00:24, 4.20it/s] 108it [00:25, 4.31it/s] 109it [00:25, 4.39it/s] 110it [00:25, 4.44it/s] 111it [00:25, 4.33it/s] 112it [00:26, 4.33it/s] 113it [00:26, 4.30it/s] 114it [00:26, 4.27it/s] 115it [00:26, 4.40it/s] 116it [00:26, 4.34it/s] 117it [00:27, 4.33it/s] 118it [00:27, 4.30it/s] 119it [00:27, 4.30it/s] 120it [00:27, 4.27it/s] 121it [00:28, 4.31it/s] 122it [00:28, 4.31it/s] 123it [00:28, 4.37it/s] 124it [00:28, 4.21it/s] 125it [00:29, 4.22it/s] 126it [00:29, 4.26it/s] 127it [00:29, 4.26it/s] 128it [00:29, 4.35it/s] 129it [00:29, 4.35it/s] 130it [00:30, 4.44it/s] 131it [00:30, 4.49it/s] 132it [00:30, 4.52it/s] 133it [00:30, 4.47it/s] 134it [00:31, 4.53it/s] 135it [00:31, 4.34it/s] 136it [00:31, 4.32it/s] 137it [00:31, 4.34it/s] 138it [00:32, 4.41it/s] 139it [00:32, 4.49it/s] 140it [00:32, 4.55it/s] 141it [00:32, 4.56it/s] 142it [00:32, 4.59it/s] 143it [00:33, 4.51it/s] 144it [00:33, 4.41it/s] 145it [00:33, 4.47it/s] 146it [00:33, 4.53it/s] 147it [00:33, 4.58it/s] 148it [00:34, 4.60it/s] 149it [00:34, 4.53it/s] 150it [00:34, 4.45it/s]2025-05-25 22:07:52,001 - INFO - [Epoch 052 | Batch 0150] IWAE-loss 1224.5007 | mean log_px -0.0009 | KL -1180.44 + 151it [00:34, 4.37it/s] 152it [00:35, 4.36it/s] 153it [00:35, 4.44it/s] 154it [00:35, 4.44it/s] 155it [00:35, 4.37it/s] 156it [00:36, 4.32it/s] 157it [00:36, 4.31it/s] 158it [00:36, 4.27it/s] 159it [00:36, 4.30it/s] 160it [00:36, 4.34it/s] 161it [00:37, 4.31it/s] 162it [00:37, 4.29it/s] 163it [00:37, 4.30it/s] 164it [00:37, 4.27it/s] 165it [00:38, 4.32it/s] 166it [00:38, 4.41it/s] 167it [00:38, 4.42it/s] 168it [00:38, 4.45it/s] 169it [00:39, 4.48it/s] 170it [00:39, 4.51it/s] 171it [00:39, 4.47it/s] 172it [00:39, 4.48it/s] 173it [00:39, 4.52it/s] 174it [00:40, 4.47it/s] 175it [00:40, 4.50it/s] 176it [00:40, 4.23it/s] 177it [00:40, 4.28it/s] 178it [00:41, 4.31it/s] 179it [00:41, 4.30it/s] 180it [00:41, 4.29it/s] 181it [00:41, 4.40it/s] 182it [00:41, 4.50it/s] 183it [00:42, 4.49it/s] 184it [00:42, 4.40it/s] 185it [00:42, 4.40it/s] 186it [00:42, 4.40it/s] 187it [00:43, 4.34it/s] 188it [00:43, 4.44it/s] 189it [00:43, 4.50it/s] 190it [00:43, 4.55it/s] 191it [00:43, 4.48it/s] 192it [00:44, 4.41it/s] 193it [00:44, 4.39it/s] 194it [00:44, 4.48it/s] 195it [00:44, 4.29it/s] 196it [00:45, 4.29it/s] 196it [00:45, 4.33it/s] +2025-05-25 22:08:02,399 - INFO - Epoch: 52, Objective: tensor([1489.6241], device='cuda:0', grad_fn=), Loss: 0.0029403548687696457, KL/n: 23.974336624145508 + 0it [00:00, ?it/s]2025-05-25 22:08:02,963 - INFO - [Epoch 053 | Batch 0000] IWAE-loss 1426.3737 | mean log_px -0.0070 | KL -1176.55 + 1it [00:00, 2.98it/s] 2it [00:00, 3.81it/s] 3it [00:00, 4.17it/s] 4it [00:00, 4.36it/s] 5it [00:01, 4.47it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.59it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.60it/s] 12it [00:02, 4.62it/s] 13it [00:02, 4.66it/s] 14it [00:03, 4.66it/s] 15it [00:03, 4.67it/s] 16it [00:03, 4.67it/s] 17it [00:03, 4.67it/s] 18it [00:03, 4.68it/s] 19it [00:04, 4.69it/s] 20it [00:04, 4.69it/s] 21it [00:04, 4.68it/s] 22it [00:04, 4.68it/s] 23it [00:05, 4.70it/s] 24it [00:05, 4.68it/s] 25it [00:05, 4.69it/s] 26it [00:05, 4.67it/s] 27it [00:05, 4.69it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.68it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.64it/s] 32it [00:06, 4.65it/s] 33it [00:07, 4.66it/s] 34it [00:07, 4.51it/s] 35it [00:07, 4.57it/s] 36it [00:07, 4.59it/s] 37it [00:08, 4.60it/s] 38it [00:08, 4.58it/s] 39it [00:08, 4.60it/s] 40it [00:08, 4.59it/s] 41it [00:08, 4.60it/s] 42it [00:09, 4.51it/s] 43it [00:09, 4.48it/s] 44it [00:09, 4.53it/s] 45it [00:09, 4.56it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.45it/s] 49it [00:10, 4.47it/s] 50it [00:10, 4.52it/s]2025-05-25 22:08:13,822 - INFO - [Epoch 053 | Batch 0050] IWAE-loss 1257.6678 | mean log_px -0.0016 | KL -1169.34 + 51it [00:11, 4.57it/s] 52it [00:11, 4.59it/s] 53it [00:11, 4.62it/s] 54it [00:11, 4.49it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.57it/s] 57it [00:12, 4.59it/s] 58it [00:12, 4.60it/s] 59it [00:12, 4.61it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.61it/s] 62it [00:13, 4.62it/s] 63it [00:13, 4.63it/s] 64it [00:13, 4.63it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.64it/s] 68it [00:14, 4.63it/s] 69it [00:15, 4.64it/s] 70it [00:15, 4.64it/s] 71it [00:15, 4.64it/s] 72it [00:15, 4.50it/s] 73it [00:15, 4.55it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.58it/s] 76it [00:16, 4.61it/s] 77it [00:16, 4.62it/s] 78it [00:17, 4.62it/s] 79it [00:17, 4.62it/s] 80it [00:17, 4.62it/s] 81it [00:17, 4.63it/s] 82it [00:17, 4.46it/s] 83it [00:18, 4.50it/s] 84it [00:18, 4.52it/s] 85it [00:18, 4.56it/s] 86it [00:18, 4.57it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.47it/s] 89it [00:19, 4.53it/s] 90it [00:19, 4.55it/s] 91it [00:19, 4.58it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.48it/s] 94it [00:20, 4.53it/s] 95it [00:20, 4.57it/s] 96it [00:20, 4.58it/s] 97it [00:21, 4.60it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.62it/s] 100it [00:21, 4.62it/s]2025-05-25 22:08:24,720 - INFO - [Epoch 053 | Batch 0100] IWAE-loss 1240.2892 | mean log_px -0.0014 | KL -1168.91 + 101it [00:22, 4.61it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.62it/s] 105it [00:22, 4.62it/s] 106it [00:23, 4.64it/s] 107it [00:23, 4.64it/s] 108it [00:23, 4.49it/s] 109it [00:23, 4.55it/s] 110it [00:24, 4.53it/s] 111it [00:24, 4.55it/s] 112it [00:24, 4.43it/s] 113it [00:24, 4.47it/s] 114it [00:24, 4.51it/s] 115it [00:25, 4.55it/s] 116it [00:25, 4.57it/s] 117it [00:25, 4.59it/s] 118it [00:25, 4.47it/s] 119it [00:26, 4.53it/s] 120it [00:26, 4.56it/s] 121it [00:26, 4.58it/s] 122it [00:26, 4.57it/s] 123it [00:26, 4.57it/s] 124it [00:27, 4.58it/s] 125it [00:27, 4.59it/s] 126it [00:27, 4.59it/s] 127it [00:27, 4.61it/s] 128it [00:27, 4.61it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.61it/s] 131it [00:28, 4.63it/s] 132it [00:28, 4.63it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.61it/s] 137it [00:29, 4.62it/s] 138it [00:30, 4.63it/s] 139it [00:30, 4.64it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.63it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.63it/s] 144it [00:31, 4.62it/s] 145it [00:31, 4.63it/s] 146it [00:31, 4.63it/s] 147it [00:32, 4.49it/s] 148it [00:32, 4.53it/s] 149it [00:32, 4.56it/s] 150it [00:32, 4.58it/s]2025-05-25 22:08:35,631 - INFO - [Epoch 053 | Batch 0150] IWAE-loss 1517.0568 | mean log_px -0.0129 | KL -1162.64 + 151it [00:32, 4.60it/s] 152it [00:33, 4.62it/s] 153it [00:33, 4.48it/s] 154it [00:33, 4.53it/s] 155it [00:33, 4.56it/s] 156it [00:34, 4.59it/s] 157it [00:34, 4.60it/s] 158it [00:34, 4.60it/s] 159it [00:34, 4.62it/s] 160it [00:34, 4.62it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.62it/s] 163it [00:35, 4.64it/s] 164it [00:35, 4.64it/s] 165it [00:36, 4.64it/s] 166it [00:36, 4.64it/s] 167it [00:36, 4.64it/s] 168it [00:36, 4.63it/s] 169it [00:36, 4.64it/s] 170it [00:37, 4.64it/s] 171it [00:37, 4.64it/s] 172it [00:37, 4.63it/s] 173it [00:37, 4.64it/s] 174it [00:37, 4.64it/s] 175it [00:38, 4.64it/s] 176it [00:38, 4.64it/s] 177it [00:38, 4.61it/s] 178it [00:38, 4.61it/s] 179it [00:39, 4.60it/s] 180it [00:39, 4.52it/s] 181it [00:39, 4.55it/s] 182it [00:39, 4.57it/s] 183it [00:39, 4.58it/s] 184it [00:40, 4.60it/s] 185it [00:40, 4.62it/s] 186it [00:40, 4.61it/s] 187it [00:40, 4.60it/s] 188it [00:41, 4.47it/s] 189it [00:41, 4.53it/s] 190it [00:41, 4.55it/s] 191it [00:41, 4.58it/s] 192it [00:41, 4.48it/s] 193it [00:42, 4.50it/s] 194it [00:42, 4.53it/s] 195it [00:42, 4.29it/s] 196it [00:42, 4.37it/s] 196it [00:42, 4.57it/s] +2025-05-25 22:08:45,614 - INFO - Epoch: 53, Objective: tensor([1300.9849], device='cuda:0', grad_fn=), Loss: 0.0023734073620289564, KL/n: 23.757631301879883 + 0it [00:00, ?it/s]2025-05-25 22:08:45,989 - INFO - [Epoch 054 | Batch 0000] IWAE-loss 1428.1246 | mean log_px -0.0070 | KL -1163.56 + 1it [00:00, 3.00it/s] 2it [00:00, 3.66it/s] 3it [00:00, 3.87it/s] 4it [00:01, 4.04it/s] 5it [00:01, 4.12it/s] 6it [00:01, 4.27it/s] 7it [00:01, 3.47it/s] 8it [00:02, 3.77it/s] 9it [00:02, 4.00it/s] 10it [00:02, 4.17it/s] 11it [00:02, 4.19it/s] 12it [00:02, 4.32it/s] 13it [00:03, 4.17it/s] 14it [00:03, 4.31it/s] 15it [00:03, 4.24it/s] 16it [00:03, 4.29it/s] 17it [00:04, 4.39it/s] 18it [00:04, 4.45it/s] 19it [00:04, 4.44it/s] 20it [00:04, 4.46it/s] 21it [00:05, 4.45it/s] 22it [00:05, 4.38it/s] 23it [00:05, 4.37it/s] 24it [00:05, 4.36it/s] 25it [00:05, 4.46it/s] 26it [00:06, 4.26it/s] 27it [00:06, 4.30it/s] 28it [00:06, 4.33it/s] 29it [00:06, 4.33it/s] 30it [00:07, 4.35it/s] 31it [00:07, 4.37it/s] 32it [00:07, 4.31it/s] 33it [00:07, 4.34it/s] 34it [00:08, 4.32it/s] 35it [00:08, 4.32it/s] 36it [00:08, 4.31it/s] 37it [00:08, 4.19it/s] 38it [00:09, 4.19it/s] 39it [00:09, 4.27it/s] 40it [00:09, 4.24it/s] 41it [00:09, 4.29it/s] 42it [00:09, 4.31it/s] 43it [00:10, 4.31it/s] 44it [00:10, 4.29it/s] 45it [00:10, 4.18it/s] 46it [00:10, 4.21it/s] 47it [00:11, 4.33it/s] 48it [00:11, 4.41it/s] 49it [00:11, 4.33it/s] 50it [00:11, 4.39it/s]2025-05-25 22:08:57,698 - INFO - [Epoch 054 | Batch 0050] IWAE-loss 1222.4982 | mean log_px -0.0012 | KL -1156.77 + 51it [00:12, 4.31it/s] 52it [00:12, 4.34it/s] 53it [00:12, 4.22it/s] 54it [00:12, 4.25it/s] 55it [00:12, 4.25it/s] 56it [00:13, 4.27it/s] 57it [00:13, 4.36it/s] 58it [00:13, 4.43it/s] 59it [00:13, 4.43it/s] 60it [00:14, 4.37it/s] 61it [00:14, 4.34it/s] 62it [00:14, 4.29it/s] 63it [00:14, 4.31it/s] 64it [00:15, 4.29it/s] 65it [00:15, 4.40it/s] 66it [00:15, 4.33it/s] 67it [00:15, 4.35it/s] 68it [00:15, 4.39it/s] 69it [00:16, 4.36it/s] 70it [00:16, 4.31it/s] 71it [00:16, 4.27it/s] 72it [00:16, 4.36it/s] 73it [00:17, 4.45it/s] 74it [00:17, 4.40it/s] 75it [00:17, 4.37it/s] 76it [00:17, 4.34it/s] 77it [00:17, 4.43it/s] 78it [00:18, 4.46it/s] 79it [00:18, 4.29it/s] 80it [00:18, 4.40it/s] 81it [00:18, 4.41it/s] 82it [00:19, 4.35it/s] 83it [00:19, 4.36it/s] 84it [00:19, 4.44it/s] 85it [00:19, 4.42it/s] 86it [00:20, 4.44it/s] 87it [00:20, 4.42it/s] 88it [00:20, 4.45it/s] 89it [00:20, 4.30it/s] 90it [00:20, 4.30it/s] 91it [00:21, 4.40it/s] 92it [00:21, 4.44it/s] 93it [00:21, 4.40it/s] 94it [00:21, 4.36it/s] 95it [00:22, 4.35it/s] 96it [00:22, 4.33it/s] 97it [00:22, 4.30it/s] 98it [00:22, 4.19it/s] 99it [00:23, 4.27it/s] 100it [00:23, 4.35it/s]2025-05-25 22:09:09,185 - INFO - [Epoch 054 | Batch 0100] IWAE-loss 1336.7174 | mean log_px -0.0042 | KL -1150.52 + 101it [00:23, 4.34it/s] 102it [00:23, 4.38it/s] 103it [00:23, 4.36it/s] 104it [00:24, 4.35it/s] 105it [00:24, 4.36it/s] 106it [00:24, 4.35it/s] 107it [00:24, 4.31it/s] 108it [00:25, 4.32it/s] 109it [00:25, 4.30it/s] 110it [00:25, 4.31it/s] 111it [00:25, 4.28it/s] 112it [00:26, 4.23it/s] 113it [00:26, 4.26it/s] 114it [00:26, 4.27it/s] 115it [00:26, 4.31it/s] 116it [00:26, 4.33it/s] 117it [00:27, 4.39it/s] 118it [00:27, 4.30it/s] 119it [00:27, 4.39it/s] 120it [00:27, 4.32it/s] 121it [00:28, 4.29it/s] 122it [00:28, 4.26it/s] 123it [00:28, 4.21it/s] 124it [00:28, 4.25it/s] 125it [00:29, 4.31it/s] 126it [00:29, 4.32it/s] 127it [00:29, 4.30it/s] 128it [00:29, 4.31it/s] 129it [00:30, 4.23it/s] 130it [00:30, 4.15it/s] 131it [00:30, 4.19it/s] 132it [00:30, 4.20it/s] 133it [00:30, 4.28it/s] 134it [00:31, 4.21it/s] 135it [00:31, 4.24it/s] 136it [00:31, 4.24it/s] 137it [00:31, 4.21it/s] 138it [00:32, 4.22it/s] 139it [00:32, 4.30it/s] 140it [00:32, 4.31it/s] 141it [00:32, 4.27it/s] 142it [00:33, 4.25it/s] 143it [00:33, 4.25it/s] 144it [00:33, 4.32it/s] 145it [00:33, 4.33it/s] 146it [00:34, 4.07it/s] 147it [00:34, 4.17it/s] 148it [00:34, 4.19it/s] 149it [00:34, 4.25it/s] 150it [00:34, 4.31it/s]2025-05-25 22:09:20,878 - INFO - [Epoch 054 | Batch 0150] IWAE-loss 1233.8479 | mean log_px -0.0012 | KL -1151.34 + 151it [00:35, 4.33it/s] 152it [00:35, 4.35it/s] 153it [00:35, 4.41it/s] 154it [00:35, 4.46it/s] 155it [00:36, 4.32it/s] 156it [00:36, 4.31it/s] 157it [00:36, 4.27it/s] 158it [00:36, 4.27it/s] 159it [00:37, 4.25it/s] 160it [00:37, 4.27it/s] 161it [00:37, 4.23it/s] 162it [00:37, 4.22it/s] 163it [00:38, 4.18it/s] 164it [00:38, 4.22it/s] 165it [00:38, 4.25it/s] 166it [00:38, 4.24it/s] 167it [00:38, 4.36it/s] 168it [00:39, 4.36it/s] 169it [00:39, 4.44it/s] 170it [00:39, 4.37it/s] 171it [00:39, 4.37it/s] 172it [00:40, 4.23it/s] 173it [00:40, 4.25it/s] 174it [00:40, 4.32it/s] 175it [00:40, 4.32it/s] 176it [00:40, 4.34it/s] 177it [00:41, 4.33it/s] 178it [00:41, 4.22it/s] 179it [00:41, 4.25it/s] 180it [00:41, 4.33it/s] 181it [00:42, 4.32it/s] 182it [00:42, 4.31it/s] 183it [00:42, 4.33it/s] 184it [00:42, 4.40it/s] 185it [00:43, 4.34it/s] 186it [00:43, 4.38it/s] 187it [00:43, 4.23it/s] 188it [00:43, 4.24it/s] 189it [00:44, 4.29it/s] 190it [00:44, 4.33it/s] 191it [00:44, 4.38it/s] 192it [00:44, 4.39it/s] 193it [00:44, 4.34it/s] 194it [00:45, 4.20it/s] 195it [00:45, 4.12it/s] 196it [00:45, 4.27it/s] 196it [00:45, 4.29it/s] +2025-05-25 22:09:31,482 - INFO - Epoch: 54, Objective: tensor([1524.9691], device='cuda:0', grad_fn=), Loss: 0.006559988018125296, KL/n: 23.41026496887207 + 0it [00:00, ?it/s]2025-05-25 22:09:31,873 - INFO - [Epoch 055 | Batch 0000] IWAE-loss 1968.7968 | mean log_px -0.0207 | KL -1144.99 + 1it [00:00, 3.06it/s] 2it [00:00, 3.66it/s] 3it [00:00, 3.93it/s] 4it [00:01, 4.04it/s] 5it [00:01, 4.23it/s] 6it [00:01, 4.33it/s] 7it [00:01, 4.42it/s] 8it [00:01, 4.48it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.61it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.49it/s] 15it [00:03, 4.56it/s] 16it [00:03, 4.58it/s] 17it [00:03, 4.61it/s] 18it [00:04, 4.61it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.64it/s] 22it [00:04, 4.64it/s] 23it [00:05, 4.65it/s] 24it [00:05, 4.63it/s] 25it [00:05, 4.63it/s] 26it [00:05, 4.62it/s] 27it [00:06, 4.64it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.63it/s] 31it [00:06, 4.65it/s] 32it [00:07, 4.64it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.64it/s] 35it [00:07, 4.65it/s] 36it [00:07, 4.64it/s] 37it [00:08, 4.65it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.62it/s] 41it [00:09, 4.65it/s] 42it [00:09, 4.66it/s] 43it [00:09, 4.67it/s] 44it [00:09, 4.65it/s] 45it [00:09, 4.64it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.56it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.62it/s] 50it [00:10, 4.63it/s]2025-05-25 22:09:42,742 - INFO - [Epoch 055 | Batch 0050] IWAE-loss 1384.5171 | mean log_px -0.0034 | KL -1144.44 + 51it [00:11, 4.63it/s] 52it [00:11, 4.48it/s] 53it [00:11, 4.54it/s] 54it [00:11, 4.58it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.66it/s] 59it [00:12, 4.67it/s] 60it [00:13, 4.63it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.62it/s] 63it [00:13, 4.64it/s] 64it [00:14, 4.63it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.64it/s] 67it [00:14, 4.49it/s] 68it [00:14, 4.55it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.62it/s] 72it [00:15, 4.58it/s] 73it [00:15, 4.54it/s] 74it [00:16, 4.52it/s] 75it [00:16, 4.52it/s] 76it [00:16, 4.51it/s] 77it [00:16, 4.51it/s] 78it [00:17, 4.49it/s] 79it [00:17, 4.53it/s] 80it [00:17, 4.57it/s] 81it [00:17, 4.59it/s] 82it [00:17, 4.60it/s] 83it [00:18, 4.62it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.63it/s] 86it [00:18, 4.63it/s] 87it [00:19, 4.64it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.64it/s] 91it [00:19, 4.65it/s] 92it [00:20, 4.63it/s] 93it [00:20, 4.45it/s] 94it [00:20, 4.50it/s] 95it [00:20, 4.55it/s] 96it [00:21, 4.56it/s] 97it [00:21, 4.58it/s] 98it [00:21, 4.59it/s] 99it [00:21, 4.60it/s] 100it [00:21, 4.60it/s]2025-05-25 22:09:53,643 - INFO - [Epoch 055 | Batch 0100] IWAE-loss 1683.7357 | mean log_px -0.0097 | KL -1142.95 + 101it [00:22, 4.59it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.63it/s] 105it [00:22, 4.63it/s] 106it [00:23, 4.39it/s] 107it [00:23, 4.45it/s] 108it [00:23, 4.49it/s] 109it [00:23, 4.52it/s] 110it [00:24, 4.51it/s] 111it [00:24, 4.47it/s] 112it [00:24, 4.52it/s] 113it [00:24, 4.53it/s] 114it [00:24, 4.55it/s] 115it [00:25, 4.56it/s] 116it [00:25, 4.56it/s] 117it [00:25, 4.44it/s] 118it [00:25, 4.47it/s] 119it [00:26, 4.49it/s] 120it [00:26, 4.52it/s] 121it [00:26, 4.55it/s] 122it [00:26, 4.56it/s] 123it [00:26, 4.57it/s] 124it [00:27, 4.59it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.61it/s] 128it [00:28, 4.61it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.61it/s] 131it [00:28, 4.60it/s] 132it [00:28, 4.59it/s] 133it [00:29, 4.54it/s] 134it [00:29, 4.56it/s] 135it [00:29, 4.56it/s] 136it [00:29, 4.58it/s] 137it [00:29, 4.60it/s] 138it [00:30, 4.59it/s] 139it [00:30, 4.59it/s] 140it [00:30, 4.40it/s] 141it [00:30, 4.47it/s] 142it [00:31, 4.51it/s] 143it [00:31, 4.52it/s] 144it [00:31, 4.40it/s] 145it [00:31, 4.43it/s] 146it [00:32, 4.47it/s] 147it [00:32, 4.51it/s] 148it [00:32, 4.50it/s] 149it [00:32, 4.53it/s] 150it [00:32, 4.54it/s]2025-05-25 22:10:04,665 - INFO - [Epoch 055 | Batch 0150] IWAE-loss 1441.7352 | mean log_px -0.0088 | KL -1140.60 + 151it [00:33, 4.42it/s] 152it [00:33, 4.49it/s] 153it [00:33, 4.53it/s] 154it [00:33, 4.55it/s] 155it [00:34, 4.58it/s] 156it [00:34, 4.55it/s] 157it [00:34, 4.57it/s] 158it [00:34, 4.57it/s] 159it [00:34, 4.45it/s] 160it [00:35, 4.50it/s] 161it [00:35, 4.54it/s] 162it [00:35, 4.56it/s] 163it [00:35, 4.56it/s] 164it [00:35, 4.56it/s] 165it [00:36, 4.59it/s] 166it [00:36, 4.57it/s] 167it [00:36, 4.59it/s] 168it [00:36, 4.45it/s] 169it [00:37, 4.52it/s] 170it [00:37, 4.54it/s] 171it [00:37, 4.56it/s] 172it [00:37, 4.55it/s] 173it [00:37, 4.57it/s] 174it [00:38, 4.39it/s] 175it [00:38, 4.45it/s] 176it [00:38, 4.49it/s] 177it [00:38, 4.53it/s] 178it [00:39, 4.55it/s] 179it [00:39, 4.58it/s] 180it [00:39, 4.56it/s] 181it [00:39, 4.58it/s] 182it [00:39, 4.58it/s] 183it [00:40, 4.58it/s] 184it [00:40, 4.57it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.43it/s] 187it [00:41, 4.49it/s] 188it [00:41, 4.52it/s] 189it [00:41, 4.55it/s] 190it [00:41, 4.55it/s] 191it [00:41, 4.58it/s] 192it [00:42, 4.58it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.57it/s] 195it [00:42, 4.33it/s] 196it [00:43, 4.27it/s] 196it [00:43, 4.54it/s] +2025-05-25 22:10:14,770 - INFO - Epoch: 55, Objective: tensor([2532.4099], device='cuda:0', grad_fn=), Loss: 0.026845891028642654, KL/n: 23.29350471496582 + 0it [00:00, ?it/s]2025-05-25 22:10:15,335 - INFO - [Epoch 056 | Batch 0000] IWAE-loss 1829.8907 | mean log_px -0.0137 | KL -1141.24 + 1it [00:00, 3.18it/s] 2it [00:00, 3.55it/s] 3it [00:00, 3.87it/s] 4it [00:01, 4.06it/s] 5it [00:01, 4.10it/s] 6it [00:01, 4.20it/s] 7it [00:01, 4.24it/s] 8it [00:01, 4.28it/s] 9it [00:02, 4.24it/s] 10it [00:02, 4.28it/s] 11it [00:02, 4.16it/s] 12it [00:02, 4.13it/s] 13it [00:03, 4.17it/s] 14it [00:03, 4.22it/s] 15it [00:03, 4.30it/s] 16it [00:03, 4.25it/s] 17it [00:04, 4.36it/s] 18it [00:04, 4.31it/s] 19it [00:04, 4.34it/s] 20it [00:04, 4.35it/s] 21it [00:04, 4.40it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.37it/s] 24it [00:05, 4.32it/s] 25it [00:05, 4.31it/s] 26it [00:06, 4.39it/s] 27it [00:06, 4.42it/s] 28it [00:06, 4.35it/s] 29it [00:06, 4.33it/s] 30it [00:07, 4.39it/s] 31it [00:07, 4.33it/s] 32it [00:07, 4.41it/s] 33it [00:07, 4.47it/s] 34it [00:07, 4.52it/s] 35it [00:08, 4.44it/s] 36it [00:08, 4.36it/s] 37it [00:08, 4.41it/s] 38it [00:08, 4.43it/s] 39it [00:09, 4.47it/s] 40it [00:09, 4.48it/s] 41it [00:09, 4.44it/s] 42it [00:09, 4.35it/s] 43it [00:09, 4.38it/s] 44it [00:10, 4.39it/s] 45it [00:10, 4.35it/s] 46it [00:10, 4.26it/s] 47it [00:10, 4.27it/s] 48it [00:11, 4.32it/s] 49it [00:11, 4.38it/s] 50it [00:11, 4.37it/s]2025-05-25 22:10:26,882 - INFO - [Epoch 056 | Batch 0050] IWAE-loss 1205.6969 | mean log_px -0.0039 | KL -1133.87 + 51it [00:11, 4.20it/s] 52it [00:12, 4.29it/s] 53it [00:12, 4.37it/s] 54it [00:12, 4.44it/s] 55it [00:12, 4.50it/s] 56it [00:12, 4.40it/s] 57it [00:13, 4.36it/s] 58it [00:13, 4.33it/s] 59it [00:13, 4.31it/s] 60it [00:13, 4.38it/s] 61it [00:14, 4.32it/s] 62it [00:14, 4.32it/s] 63it [00:14, 4.34it/s] 64it [00:14, 4.27it/s] 65it [00:15, 4.28it/s] 66it [00:15, 4.27it/s] 67it [00:15, 4.26it/s] 68it [00:15, 4.17it/s] 69it [00:16, 4.18it/s] 70it [00:16, 4.15it/s] 71it [00:16, 4.19it/s] 72it [00:16, 4.23it/s] 73it [00:16, 4.23it/s] 74it [00:17, 4.20it/s] 75it [00:17, 4.22it/s] 76it [00:17, 4.21it/s] 77it [00:17, 4.30it/s] 78it [00:18, 4.37it/s] 79it [00:18, 4.31it/s] 80it [00:18, 4.26it/s] 81it [00:18, 4.31it/s] 82it [00:19, 4.29it/s] 83it [00:19, 4.31it/s] 84it [00:19, 4.31it/s] 85it [00:19, 4.30it/s] 86it [00:20, 4.26it/s] 87it [00:20, 4.30it/s] 88it [00:20, 4.26it/s] 89it [00:20, 4.31it/s] 90it [00:20, 4.37it/s] 91it [00:21, 4.34it/s] 92it [00:21, 4.42it/s] 93it [00:21, 4.36it/s] 94it [00:21, 4.32it/s] 95it [00:22, 4.35it/s] 96it [00:22, 4.29it/s] 97it [00:22, 4.27it/s] 98it [00:22, 4.35it/s] 99it [00:22, 4.42it/s] 100it [00:23, 4.36it/s]2025-05-25 22:10:38,488 - INFO - [Epoch 056 | Batch 0100] IWAE-loss 1527.7909 | mean log_px -0.0108 | KL -1131.17 + 101it [00:23, 4.34it/s] 102it [00:23, 4.30it/s] 103it [00:23, 4.14it/s] 104it [00:24, 4.25it/s] 105it [00:24, 4.36it/s] 106it [00:24, 4.32it/s] 107it [00:24, 4.32it/s] 108it [00:25, 4.30it/s] 109it [00:25, 4.34it/s] 110it [00:25, 4.38it/s] 111it [00:25, 4.46it/s] 112it [00:25, 4.48it/s] 113it [00:26, 4.53it/s] 114it [00:26, 4.55it/s] 115it [00:26, 4.46it/s] 116it [00:26, 4.49it/s] 117it [00:27, 4.41it/s] 118it [00:27, 4.33it/s] 119it [00:27, 4.24it/s] 120it [00:27, 4.35it/s] 121it [00:28, 4.37it/s] 122it [00:28, 4.30it/s] 123it [00:28, 4.27it/s] 124it [00:28, 4.27it/s] 125it [00:28, 4.31it/s] 126it [00:29, 4.27it/s] 127it [00:29, 4.31it/s] 128it [00:29, 4.36it/s] 129it [00:29, 4.31it/s] 130it [00:30, 4.28it/s] 131it [00:30, 4.32it/s] 132it [00:30, 4.37it/s] 133it [00:30, 4.34it/s] 134it [00:31, 4.39it/s] 135it [00:31, 4.32it/s] 136it [00:31, 4.30it/s] 137it [00:31, 4.36it/s] 138it [00:31, 4.44it/s] 139it [00:32, 4.33it/s] 140it [00:32, 4.27it/s] 141it [00:32, 4.28it/s] 142it [00:32, 4.30it/s] 143it [00:33, 4.36it/s] 144it [00:33, 4.40it/s] 145it [00:33, 4.48it/s] 146it [00:33, 4.50it/s] 147it [00:34, 4.43it/s] 148it [00:34, 4.32it/s] 149it [00:34, 4.41it/s] 150it [00:34, 4.45it/s]2025-05-25 22:10:49,954 - INFO - [Epoch 056 | Batch 0150] IWAE-loss 1384.1519 | mean log_px -0.0041 | KL -1127.91 + 151it [00:34, 4.45it/s] 152it [00:35, 4.37it/s] 153it [00:35, 4.30it/s] 154it [00:35, 4.38it/s] 155it [00:35, 4.35it/s] 156it [00:36, 4.31it/s] 157it [00:36, 4.20it/s] 158it [00:36, 4.31it/s] 159it [00:36, 4.40it/s] 160it [00:37, 4.33it/s] 161it [00:37, 4.34it/s] 162it [00:37, 4.28it/s] 163it [00:37, 4.28it/s] 164it [00:37, 4.27it/s] 165it [00:38, 4.36it/s] 166it [00:38, 4.29it/s] 167it [00:38, 4.34it/s] 168it [00:38, 4.28it/s] 169it [00:39, 4.31it/s] 170it [00:39, 4.13it/s] 171it [00:39, 4.21it/s] 172it [00:39, 4.28it/s] 173it [00:40, 4.29it/s] 174it [00:40, 4.24it/s] 175it [00:40, 4.28it/s] 176it [00:40, 4.34it/s] 177it [00:40, 4.42it/s] 178it [00:41, 4.34it/s] 179it [00:41, 4.23it/s] 180it [00:41, 4.21it/s] 181it [00:41, 4.26it/s] 182it [00:42, 4.34it/s] 183it [00:42, 4.36it/s] 184it [00:42, 4.31it/s] 185it [00:42, 4.30it/s] 186it [00:43, 4.25it/s] 187it [00:43, 4.23it/s] 188it [00:43, 4.28it/s] 189it [00:43, 4.25it/s] 190it [00:44, 4.25it/s] 191it [00:44, 4.25it/s] 192it [00:44, 4.23it/s] 193it [00:44, 4.23it/s] 194it [00:44, 4.25it/s] 195it [00:45, 4.05it/s] 196it [00:45, 4.15it/s] 196it [00:45, 4.30it/s] +2025-05-25 22:11:00,634 - INFO - Epoch: 56, Objective: tensor([1635.1464], device='cuda:0', grad_fn=), Loss: 0.0118552902713418, KL/n: 23.14141273498535 + 0it [00:00, ?it/s]2025-05-25 22:11:01,039 - INFO - [Epoch 057 | Batch 0000] IWAE-loss 1257.1718 | mean log_px -0.0018 | KL -1129.48 + 1it [00:00, 3.00it/s] 2it [00:00, 3.78it/s] 3it [00:00, 4.03it/s] 4it [00:00, 4.21it/s] 5it [00:01, 4.31it/s] 6it [00:01, 4.23it/s] 7it [00:01, 4.38it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.55it/s] 13it [00:03, 4.36it/s] 14it [00:03, 4.39it/s] 15it [00:03, 4.46it/s] 16it [00:03, 4.50it/s] 17it [00:03, 4.49it/s] 18it [00:04, 4.47it/s] 19it [00:04, 4.36it/s] 20it [00:04, 4.37it/s] 21it [00:04, 4.43it/s] 22it [00:05, 4.45it/s] 23it [00:05, 4.50it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.56it/s] 26it [00:05, 4.56it/s] 27it [00:06, 4.50it/s] 28it [00:06, 4.51it/s] 29it [00:06, 4.55it/s] 30it [00:06, 4.58it/s] 31it [00:06, 4.60it/s] 32it [00:07, 4.56it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.53it/s] 35it [00:07, 4.58it/s] 36it [00:08, 4.58it/s] 37it [00:08, 4.60it/s] 38it [00:08, 4.51it/s] 39it [00:08, 4.56it/s] 40it [00:08, 4.53it/s] 41it [00:09, 4.59it/s] 42it [00:09, 4.55it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.59it/s] 45it [00:10, 4.60it/s] 46it [00:10, 4.60it/s] 47it [00:10, 4.55it/s] 48it [00:10, 4.57it/s] 49it [00:10, 4.58it/s] 50it [00:11, 4.49it/s]2025-05-25 22:11:12,101 - INFO - [Epoch 057 | Batch 0050] IWAE-loss 1460.0142 | mean log_px -0.0058 | KL -1131.17 + 51it [00:11, 4.54it/s] 52it [00:11, 3.63it/s] 53it [00:12, 3.88it/s] 54it [00:12, 4.06it/s] 55it [00:12, 4.06it/s] 56it [00:12, 4.24it/s] 57it [00:12, 4.32it/s] 58it [00:13, 4.41it/s] 59it [00:13, 4.43it/s] 60it [00:13, 4.48it/s] 61it [00:13, 4.35it/s] 62it [00:14, 4.34it/s] 63it [00:14, 4.43it/s] 64it [00:14, 4.43it/s] 65it [00:14, 4.50it/s] 66it [00:14, 4.51it/s] 67it [00:15, 4.54it/s] 68it [00:15, 4.43it/s] 69it [00:15, 4.50it/s] 70it [00:15, 4.46it/s] 71it [00:16, 4.46it/s] 72it [00:16, 4.46it/s] 73it [00:16, 4.47it/s] 74it [00:16, 4.51it/s] 75it [00:16, 4.42it/s] 76it [00:17, 4.47it/s] 77it [00:17, 4.49it/s] 78it [00:17, 4.42it/s] 79it [00:17, 4.48it/s] 80it [00:18, 4.43it/s] 81it [00:18, 4.49it/s] 82it [00:18, 4.39it/s] 83it [00:18, 4.47it/s] 84it [00:18, 4.47it/s] 85it [00:19, 4.49it/s] 86it [00:19, 4.51it/s] 87it [00:19, 4.54it/s] 88it [00:19, 4.56it/s] 89it [00:20, 4.57it/s] 90it [00:20, 4.48it/s] 91it [00:20, 4.51it/s] 92it [00:20, 4.44it/s] 93it [00:20, 4.31it/s] 94it [00:21, 4.34it/s] 95it [00:21, 4.42it/s] 96it [00:21, 4.43it/s] 97it [00:21, 4.37it/s] 98it [00:22, 4.42it/s] 99it [00:22, 4.48it/s] 100it [00:22, 4.49it/s]2025-05-25 22:11:23,471 - INFO - [Epoch 057 | Batch 0100] IWAE-loss 1242.8251 | mean log_px -0.0040 | KL -1129.03 + 101it [00:22, 4.49it/s] 102it [00:22, 4.54it/s] 103it [00:23, 4.58it/s] 104it [00:23, 4.58it/s] 105it [00:23, 4.60it/s] 106it [00:23, 4.57it/s] 107it [00:24, 4.53it/s] 108it [00:24, 4.52it/s] 109it [00:24, 4.46it/s] 110it [00:24, 4.51it/s] 111it [00:24, 4.50it/s] 112it [00:25, 4.53it/s] 113it [00:25, 4.51it/s] 114it [00:25, 4.53it/s] 115it [00:25, 4.53it/s] 116it [00:26, 4.53it/s] 117it [00:26, 4.52it/s] 118it [00:26, 4.54it/s] 119it [00:26, 4.55it/s] 120it [00:26, 4.55it/s] 121it [00:27, 4.56it/s] 122it [00:27, 4.53it/s] 123it [00:27, 4.57it/s] 124it [00:27, 4.58it/s] 125it [00:28, 4.58it/s] 126it [00:28, 4.49it/s] 127it [00:28, 4.47it/s] 128it [00:28, 4.48it/s] 129it [00:28, 4.46it/s] 130it [00:29, 4.43it/s] 131it [00:29, 4.28it/s] 132it [00:29, 4.39it/s] 133it [00:29, 4.38it/s] 134it [00:30, 4.38it/s] 135it [00:30, 4.44it/s] 136it [00:30, 4.42it/s] 137it [00:30, 4.46it/s] 138it [00:31, 4.37it/s] 139it [00:31, 4.37it/s] 140it [00:31, 4.41it/s] 141it [00:31, 4.47it/s] 142it [00:31, 4.51it/s] 143it [00:32, 4.48it/s] 144it [00:32, 4.33it/s] 145it [00:32, 4.35it/s] 146it [00:32, 4.41it/s] 147it [00:33, 4.46it/s] 148it [00:33, 4.51it/s] 149it [00:33, 4.54it/s] 150it [00:33, 4.40it/s]2025-05-25 22:11:34,652 - INFO - [Epoch 057 | Batch 0150] IWAE-loss 1292.4027 | mean log_px -0.0033 | KL -1125.85 + 151it [00:33, 4.36it/s] 152it [00:34, 4.37it/s] 153it [00:34, 4.37it/s] 154it [00:34, 4.42it/s] 155it [00:34, 4.42it/s] 156it [00:35, 4.49it/s] 157it [00:35, 4.53it/s] 158it [00:35, 4.51it/s] 159it [00:35, 4.54it/s] 160it [00:35, 4.51it/s] 161it [00:36, 4.49it/s] 162it [00:36, 4.54it/s] 163it [00:36, 4.51it/s] 164it [00:36, 4.56it/s] 165it [00:37, 4.60it/s] 166it [00:37, 4.59it/s] 167it [00:37, 4.60it/s] 168it [00:37, 4.55it/s] 169it [00:37, 4.53it/s] 170it [00:38, 4.54it/s] 171it [00:38, 4.53it/s] 172it [00:38, 4.50it/s] 173it [00:38, 4.45it/s] 174it [00:39, 4.46it/s] 175it [00:39, 4.41it/s] 176it [00:39, 4.43it/s] 177it [00:39, 4.44it/s] 178it [00:39, 4.50it/s] 179it [00:40, 4.50it/s] 180it [00:40, 4.49it/s] 181it [00:40, 4.51it/s] 182it [00:40, 4.51it/s] 183it [00:41, 4.52it/s] 184it [00:41, 4.49it/s] 185it [00:41, 4.51it/s] 186it [00:41, 4.48it/s] 187it [00:41, 4.50it/s] 188it [00:42, 4.53it/s] 189it [00:42, 4.55it/s] 190it [00:42, 4.51it/s] 191it [00:42, 4.54it/s] 192it [00:43, 4.50it/s] 193it [00:43, 4.53it/s] 194it [00:43, 4.45it/s] 195it [00:43, 4.36it/s] 196it [00:43, 4.45it/s] 196it [00:44, 4.45it/s] +2025-05-25 22:11:44,780 - INFO - Epoch: 57, Objective: tensor([1774.2374], device='cuda:0', grad_fn=), Loss: 0.010805794037878513, KL/n: 22.974790573120117 + 0it [00:00, ?it/s]2025-05-25 22:11:45,184 - INFO - [Epoch 058 | Batch 0000] IWAE-loss 1154.4401 | mean log_px -0.0014 | KL -1126.00 + 1it [00:00, 2.76it/s] 2it [00:00, 3.64it/s] 3it [00:00, 4.05it/s] 4it [00:01, 4.22it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.50it/s] 8it [00:01, 4.39it/s] 9it [00:02, 4.48it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.56it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.61it/s] 15it [00:03, 4.62it/s] 16it [00:03, 4.47it/s] 17it [00:03, 4.54it/s] 18it [00:04, 4.57it/s] 19it [00:04, 4.59it/s] 20it [00:04, 4.60it/s] 21it [00:04, 4.59it/s] 22it [00:04, 4.63it/s] 23it [00:05, 4.49it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.57it/s] 26it [00:05, 4.58it/s] 27it [00:06, 4.61it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.62it/s] 30it [00:06, 4.48it/s] 31it [00:06, 4.54it/s] 32it [00:07, 4.57it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.61it/s] 35it [00:07, 4.62it/s] 36it [00:08, 4.58it/s] 37it [00:08, 4.39it/s] 38it [00:08, 4.48it/s] 39it [00:08, 4.54it/s] 40it [00:08, 4.58it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.53it/s] 44it [00:09, 4.57it/s] 45it [00:09, 4.59it/s] 46it [00:10, 4.60it/s] 47it [00:10, 4.61it/s] 48it [00:10, 4.48it/s] 49it [00:10, 4.56it/s] 50it [00:11, 4.57it/s]2025-05-25 22:11:56,149 - INFO - [Epoch 058 | Batch 0050] IWAE-loss 1403.6750 | mean log_px -0.0124 | KL -1118.93 + 51it [00:11, 4.59it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.61it/s] 54it [00:11, 4.48it/s] 55it [00:12, 4.53it/s] 56it [00:12, 4.53it/s] 57it [00:12, 4.56it/s] 58it [00:12, 4.58it/s] 59it [00:13, 4.60it/s] 60it [00:13, 4.47it/s] 61it [00:13, 4.53it/s] 62it [00:13, 4.55it/s] 63it [00:13, 4.59it/s] 64it [00:14, 4.60it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.49it/s] 67it [00:14, 4.54it/s] 68it [00:15, 4.57it/s] 69it [00:15, 4.59it/s] 70it [00:15, 4.52it/s] 71it [00:15, 4.52it/s] 72it [00:15, 4.53it/s] 73it [00:16, 4.48it/s] 74it [00:16, 4.54it/s] 75it [00:16, 4.55it/s] 76it [00:16, 4.57it/s] 77it [00:17, 4.56it/s] 78it [00:17, 4.58it/s] 79it [00:17, 4.47it/s] 80it [00:17, 4.52it/s] 81it [00:17, 4.56it/s] 82it [00:18, 4.58it/s] 83it [00:18, 4.60it/s] 84it [00:18, 4.60it/s] 85it [00:18, 4.62it/s] 86it [00:18, 4.49it/s] 87it [00:19, 4.52it/s] 88it [00:19, 4.55it/s] 89it [00:19, 4.57it/s] 90it [00:19, 4.59it/s] 91it [00:20, 4.60it/s] 92it [00:20, 4.51it/s] 93it [00:20, 4.55it/s] 94it [00:20, 4.57it/s] 95it [00:20, 4.60it/s] 96it [00:21, 4.60it/s] 97it [00:21, 4.48it/s] 98it [00:21, 4.53it/s] 99it [00:21, 4.57it/s] 100it [00:22, 4.59it/s]2025-05-25 22:12:07,131 - INFO - [Epoch 058 | Batch 0100] IWAE-loss 1223.3649 | mean log_px -0.0015 | KL -1114.54 + 101it [00:22, 4.43it/s] 102it [00:22, 4.50it/s] 103it [00:22, 4.56it/s] 104it [00:22, 4.58it/s] 105it [00:23, 4.60it/s] 106it [00:23, 4.60it/s] 107it [00:23, 4.62it/s] 108it [00:23, 4.45it/s] 109it [00:24, 4.51it/s] 110it [00:24, 4.54it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.58it/s] 113it [00:24, 4.60it/s] 114it [00:25, 4.61it/s] 115it [00:25, 4.47it/s] 116it [00:25, 4.52it/s] 117it [00:25, 4.56it/s] 118it [00:26, 4.57it/s] 119it [00:26, 4.45it/s] 120it [00:26, 4.51it/s] 121it [00:26, 4.54it/s] 122it [00:26, 4.55it/s] 123it [00:27, 4.57it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.45it/s] 126it [00:27, 4.51it/s] 127it [00:28, 4.55it/s] 128it [00:28, 4.56it/s] 129it [00:28, 4.45it/s] 130it [00:28, 4.52it/s] 131it [00:28, 4.56it/s] 132it [00:29, 4.58it/s] 133it [00:29, 4.61it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.44it/s] 136it [00:29, 4.51it/s] 137it [00:30, 4.56it/s] 138it [00:30, 4.57it/s] 139it [00:30, 4.60it/s] 140it [00:30, 4.60it/s] 141it [00:31, 4.60it/s] 142it [00:31, 4.46it/s] 143it [00:31, 4.52it/s] 144it [00:31, 4.55it/s] 145it [00:31, 4.58it/s] 146it [00:32, 4.60it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.47it/s] 150it [00:33, 4.53it/s]2025-05-25 22:12:18,133 - INFO - [Epoch 058 | Batch 0150] IWAE-loss 1539.7325 | mean log_px -0.0100 | KL -1111.33 + 151it [00:33, 4.56it/s] 152it [00:33, 4.58it/s] 153it [00:33, 4.60it/s] 154it [00:33, 4.59it/s] 155it [00:34, 4.45it/s] 156it [00:34, 4.50it/s] 157it [00:34, 4.55it/s] 158it [00:34, 4.56it/s] 159it [00:35, 4.55it/s] 160it [00:35, 4.56it/s] 161it [00:35, 4.58it/s] 162it [00:35, 4.45it/s] 163it [00:35, 4.49it/s] 164it [00:36, 4.53it/s] 165it [00:36, 4.56it/s] 166it [00:36, 4.57it/s] 167it [00:36, 4.58it/s] 168it [00:37, 4.58it/s] 169it [00:37, 4.44it/s] 170it [00:37, 4.50it/s] 171it [00:37, 4.53it/s] 172it [00:37, 4.55it/s] 173it [00:38, 4.57it/s] 174it [00:38, 4.56it/s] 175it [00:38, 4.58it/s] 176it [00:38, 4.44it/s] 177it [00:39, 4.50it/s] 178it [00:39, 4.51it/s] 179it [00:39, 4.52it/s] 180it [00:39, 4.37it/s] 181it [00:39, 4.44it/s] 182it [00:40, 4.48it/s] 183it [00:40, 4.35it/s] 184it [00:40, 4.40it/s] 185it [00:40, 4.48it/s] 186it [00:41, 4.41it/s] 187it [00:41, 4.47it/s] 188it [00:41, 4.50it/s] 189it [00:41, 4.53it/s] 190it [00:41, 4.39it/s] 191it [00:42, 4.46it/s] 192it [00:42, 4.50it/s] 193it [00:42, 4.51it/s] 194it [00:42, 4.41it/s] 195it [00:43, 4.35it/s] 196it [00:43, 4.35it/s] 196it [00:43, 4.52it/s] +2025-05-25 22:12:28,277 - INFO - Epoch: 58, Objective: tensor([1163.4995], device='cuda:0', grad_fn=), Loss: 0.0014143032021820545, KL/n: 22.712282180786133 + 0it [00:00, ?it/s]2025-05-25 22:12:28,850 - INFO - [Epoch 059 | Batch 0000] IWAE-loss 1306.7094 | mean log_px -0.0034 | KL -1115.00 + 1it [00:00, 3.06it/s] 2it [00:00, 3.64it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.21it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.28it/s] 7it [00:01, 4.30it/s] 8it [00:01, 4.35it/s] 9it [00:02, 4.30it/s] 10it [00:02, 4.29it/s] 11it [00:02, 4.38it/s] 12it [00:02, 4.28it/s] 13it [00:03, 4.34it/s] 14it [00:03, 4.33it/s] 15it [00:03, 4.28it/s] 16it [00:03, 4.28it/s] 17it [00:04, 4.30it/s] 18it [00:04, 4.25it/s] 19it [00:04, 4.33it/s] 20it [00:04, 4.41it/s] 21it [00:04, 4.43it/s] 22it [00:05, 4.26it/s] 23it [00:05, 4.36it/s] 24it [00:05, 4.42it/s] 25it [00:05, 4.44it/s] 26it [00:06, 4.40it/s] 27it [00:06, 4.45it/s] 28it [00:06, 4.45it/s] 29it [00:06, 4.39it/s] 30it [00:06, 4.33it/s] 31it [00:07, 4.29it/s] 32it [00:07, 4.39it/s] 33it [00:07, 4.32it/s] 34it [00:07, 4.32it/s] 35it [00:08, 4.31it/s] 36it [00:08, 4.38it/s] 37it [00:08, 4.35it/s] 38it [00:08, 4.33it/s] 39it [00:09, 4.40it/s] 40it [00:09, 4.32it/s] 41it [00:09, 4.35it/s] 42it [00:09, 4.42it/s] 43it [00:09, 4.35it/s] 44it [00:10, 4.41it/s] 45it [00:10, 4.45it/s] 46it [00:10, 4.49it/s] 47it [00:10, 4.54it/s] 48it [00:11, 4.52it/s] 49it [00:11, 4.55it/s] 50it [00:11, 4.57it/s]2025-05-25 22:12:40,254 - INFO - [Epoch 059 | Batch 0050] IWAE-loss 1501.0148 | mean log_px -0.0083 | KL -1108.41 + 51it [00:11, 4.32it/s] 52it [00:11, 4.26it/s] 53it [00:12, 4.28it/s] 54it [00:12, 4.34it/s] 55it [00:12, 4.30it/s] 56it [00:12, 4.27it/s] 57it [00:13, 4.36it/s] 58it [00:13, 4.37it/s] 59it [00:13, 4.44it/s] 60it [00:13, 4.49it/s] 61it [00:14, 4.24it/s] 62it [00:14, 4.34it/s] 63it [00:14, 4.27it/s] 64it [00:14, 4.27it/s] 65it [00:15, 4.26it/s] 66it [00:15, 4.26it/s] 67it [00:15, 4.25it/s] 68it [00:15, 4.17it/s] 69it [00:15, 4.19it/s] 70it [00:16, 4.17it/s] 71it [00:16, 4.22it/s] 72it [00:16, 4.18it/s] 73it [00:16, 4.24it/s] 74it [00:17, 4.32it/s] 75it [00:17, 4.29it/s] 76it [00:17, 4.35it/s] 77it [00:17, 4.28it/s] 78it [00:18, 4.26it/s] 79it [00:18, 4.30it/s] 80it [00:18, 4.39it/s] 81it [00:18, 4.29it/s] 82it [00:18, 4.27it/s] 83it [00:19, 4.29it/s] 84it [00:19, 4.24it/s] 85it [00:19, 4.05it/s] 86it [00:19, 4.11it/s] 87it [00:20, 4.23it/s] 88it [00:20, 4.32it/s] 89it [00:20, 4.27it/s] 90it [00:20, 4.37it/s] 91it [00:21, 4.30it/s] 92it [00:21, 4.30it/s] 93it [00:21, 4.35it/s] 94it [00:21, 4.30it/s] 95it [00:22, 4.37it/s] 96it [00:22, 4.35it/s] 97it [00:22, 4.42it/s] 98it [00:22, 4.47it/s] 99it [00:22, 4.52it/s] 100it [00:23, 4.36it/s]2025-05-25 22:12:51,916 - INFO - [Epoch 059 | Batch 0100] IWAE-loss 1170.6613 | mean log_px -0.0009 | KL -1106.82 + 101it [00:23, 4.32it/s] 102it [00:23, 4.38it/s] 103it [00:23, 4.34it/s] 104it [00:24, 4.27it/s] 105it [00:24, 4.27it/s] 106it [00:24, 4.27it/s] 107it [00:24, 4.29it/s] 108it [00:25, 4.39it/s] 109it [00:25, 4.40it/s] 110it [00:25, 4.24it/s] 111it [00:25, 4.27it/s] 112it [00:25, 4.22it/s] 113it [00:26, 4.24it/s] 114it [00:26, 4.29it/s] 115it [00:26, 4.28it/s] 116it [00:26, 4.28it/s] 117it [00:27, 4.37it/s] 118it [00:27, 4.11it/s] 119it [00:27, 4.15it/s] 120it [00:27, 4.26it/s] 121it [00:28, 4.33it/s] 122it [00:28, 4.34it/s] 123it [00:28, 4.27it/s] 124it [00:28, 4.38it/s] 125it [00:28, 4.33it/s] 126it [00:29, 4.34it/s] 127it [00:29, 4.41it/s] 128it [00:29, 4.32it/s] 129it [00:29, 4.33it/s] 130it [00:30, 4.40it/s] 131it [00:30, 4.37it/s] 132it [00:30, 4.36it/s] 133it [00:30, 4.33it/s] 134it [00:31, 4.32it/s] 135it [00:31, 4.30it/s] 136it [00:31, 4.32it/s] 137it [00:31, 4.28it/s] 138it [00:31, 4.26it/s] 139it [00:32, 4.29it/s] 140it [00:32, 4.37it/s] 141it [00:32, 4.36it/s] 142it [00:32, 4.32it/s] 143it [00:33, 4.25it/s] 144it [00:33, 4.28it/s] 145it [00:33, 4.17it/s] 146it [00:33, 4.21it/s] 147it [00:34, 4.29it/s] 148it [00:34, 4.27it/s] 149it [00:34, 4.27it/s] 150it [00:34, 4.24it/s]2025-05-25 22:13:03,561 - INFO - [Epoch 059 | Batch 0150] IWAE-loss 1656.5128 | mean log_px -0.0145 | KL -1106.05 + 151it [00:35, 4.22it/s] 152it [00:35, 4.22it/s] 153it [00:35, 4.23it/s] 154it [00:35, 4.34it/s] 155it [00:35, 4.39it/s] 156it [00:36, 4.44it/s] 157it [00:36, 4.35it/s] 158it [00:36, 4.18it/s] 159it [00:36, 4.21it/s] 160it [00:37, 4.23it/s] 161it [00:37, 4.23it/s] 162it [00:37, 4.33it/s] 163it [00:37, 4.28it/s] 164it [00:38, 4.28it/s] 165it [00:38, 4.25it/s] 166it [00:38, 4.26it/s] 167it [00:38, 4.37it/s] 168it [00:38, 4.44it/s] 169it [00:39, 4.49it/s] 170it [00:39, 4.38it/s] 171it [00:39, 4.37it/s] 172it [00:39, 4.44it/s] 173it [00:40, 4.49it/s] 174it [00:40, 4.53it/s] 175it [00:40, 4.56it/s] 176it [00:40, 4.58it/s] 177it [00:40, 4.60it/s] 178it [00:41, 4.49it/s] 179it [00:41, 4.53it/s] 180it [00:41, 4.44it/s] 181it [00:41, 4.37it/s] 182it [00:42, 4.43it/s] 183it [00:42, 4.47it/s] 184it [00:42, 4.41it/s] 185it [00:42, 4.35it/s] 186it [00:43, 4.41it/s] 187it [00:43, 4.42it/s] 188it [00:43, 4.38it/s] 189it [00:43, 4.45it/s] 190it [00:43, 4.49it/s] 191it [00:44, 4.51it/s] 192it [00:44, 4.55it/s] 193it [00:44, 4.42it/s] 194it [00:44, 4.38it/s] 195it [00:45, 4.34it/s] 196it [00:45, 4.45it/s] 196it [00:45, 4.32it/s] +2025-05-25 22:13:13,918 - INFO - Epoch: 59, Objective: tensor([1502.0814], device='cuda:0', grad_fn=), Loss: 0.015234545804560184, KL/n: 22.524457931518555 + 0it [00:00, ?it/s]2025-05-25 22:13:14,316 - INFO - [Epoch 060 | Batch 0000] IWAE-loss 1251.1169 | mean log_px -0.0041 | KL -1102.64 + 1it [00:00, 2.81it/s] 2it [00:00, 3.61it/s] 3it [00:00, 3.99it/s] 4it [00:01, 4.24it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.47it/s] 7it [00:01, 4.41it/s] 8it [00:01, 4.51it/s] 9it [00:02, 4.45it/s] 10it [00:02, 4.40it/s] 11it [00:02, 4.48it/s] 12it [00:02, 3.59it/s] 13it [00:03, 3.78it/s] 14it [00:03, 3.92it/s] 15it [00:03, 4.11it/s] 16it [00:03, 4.10it/s] 17it [00:04, 4.28it/s] 18it [00:04, 4.25it/s] 19it [00:04, 4.31it/s] 20it [00:04, 4.42it/s] 21it [00:05, 4.39it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.35it/s] 24it [00:05, 4.43it/s] 25it [00:05, 4.24it/s] 26it [00:06, 4.37it/s] 27it [00:06, 4.45it/s] 28it [00:06, 4.52it/s] 29it [00:06, 4.58it/s] 30it [00:07, 4.62it/s] 31it [00:07, 4.53it/s] 32it [00:07, 4.60it/s] 33it [00:07, 4.51it/s] 34it [00:07, 4.55it/s] 35it [00:08, 4.44it/s] 36it [00:08, 4.52it/s] 37it [00:08, 4.43it/s] 38it [00:08, 4.50it/s] 39it [00:09, 4.55it/s] 40it [00:09, 4.47it/s] 41it [00:09, 4.42it/s] 42it [00:09, 4.38it/s] 43it [00:09, 4.46it/s] 44it [00:10, 4.54it/s] 45it [00:10, 4.54it/s] 46it [00:10, 4.48it/s] 47it [00:10, 4.51it/s] 48it [00:11, 4.56it/s] 49it [00:11, 4.44it/s] 50it [00:11, 4.42it/s]2025-05-25 22:13:25,710 - INFO - [Epoch 060 | Batch 0050] IWAE-loss 1318.0186 | mean log_px -0.0060 | KL -1099.36 + 51it [00:11, 4.40it/s] 52it [00:11, 4.37it/s] 53it [00:12, 4.48it/s] 54it [00:12, 4.52it/s] 55it [00:12, 4.45it/s] 56it [00:12, 4.42it/s] 57it [00:13, 4.50it/s] 58it [00:13, 4.18it/s] 59it [00:13, 4.32it/s] 60it [00:13, 4.40it/s] 61it [00:13, 4.39it/s] 62it [00:14, 4.44it/s] 63it [00:14, 4.52it/s] 64it [00:14, 4.58it/s] 65it [00:14, 4.55it/s] 66it [00:15, 4.37it/s] 67it [00:15, 4.39it/s] 68it [00:15, 4.45it/s] 69it [00:15, 4.54it/s] 70it [00:15, 4.48it/s] 71it [00:16, 4.39it/s] 72it [00:16, 4.48it/s] 73it [00:16, 4.44it/s] 74it [00:16, 4.49it/s] 75it [00:17, 4.54it/s] 76it [00:17, 4.38it/s] 77it [00:17, 4.49it/s] 78it [00:17, 4.54it/s] 79it [00:18, 4.48it/s] 80it [00:18, 4.44it/s] 81it [00:18, 4.52it/s] 82it [00:18, 4.56it/s] 83it [00:18, 4.48it/s] 84it [00:19, 4.43it/s] 85it [00:19, 4.43it/s] 86it [00:19, 4.49it/s] 87it [00:19, 4.55it/s] 88it [00:20, 4.48it/s] 89it [00:20, 4.55it/s] 90it [00:20, 4.47it/s] 91it [00:20, 4.38it/s] 92it [00:20, 4.38it/s] 93it [00:21, 4.43it/s] 94it [00:21, 4.51it/s] 95it [00:21, 4.45it/s] 96it [00:21, 4.40it/s] 97it [00:22, 4.39it/s] 98it [00:22, 4.24it/s] 99it [00:22, 4.35it/s] 100it [00:22, 4.45it/s]2025-05-25 22:13:36,940 - INFO - [Epoch 060 | Batch 0100] IWAE-loss 1443.9005 | mean log_px -0.0049 | KL -1095.84 + 101it [00:22, 4.52it/s] 102it [00:23, 4.56it/s] 103it [00:23, 4.49it/s] 104it [00:23, 4.57it/s] 105it [00:23, 4.52it/s] 106it [00:24, 4.45it/s] 107it [00:24, 4.40it/s] 108it [00:24, 4.27it/s] 109it [00:24, 4.37it/s] 110it [00:24, 4.45it/s] 111it [00:25, 4.53it/s] 112it [00:25, 4.60it/s] 113it [00:25, 4.50it/s] 114it [00:25, 4.48it/s] 115it [00:26, 4.32it/s] 116it [00:26, 4.43it/s] 117it [00:26, 4.42it/s] 118it [00:26, 4.42it/s] 119it [00:27, 4.39it/s] 120it [00:27, 4.48it/s] 121it [00:27, 4.55it/s] 122it [00:27, 4.32it/s] 123it [00:27, 4.41it/s] 124it [00:28, 4.39it/s] 125it [00:28, 4.44it/s] 126it [00:28, 4.36it/s] 127it [00:28, 4.45it/s] 128it [00:29, 4.52it/s] 129it [00:29, 4.45it/s] 130it [00:29, 4.44it/s] 131it [00:29, 4.51it/s] 132it [00:29, 4.57it/s] 133it [00:30, 4.49it/s] 134it [00:30, 4.52it/s] 135it [00:30, 4.30it/s] 136it [00:30, 4.43it/s] 137it [00:31, 4.46it/s] 138it [00:31, 4.54it/s] 139it [00:31, 4.59it/s] 140it [00:31, 4.63it/s] 141it [00:31, 4.52it/s] 142it [00:32, 4.59it/s] 143it [00:32, 4.59it/s] 144it [00:32, 4.56it/s] 145it [00:32, 4.49it/s] 146it [00:33, 4.31it/s] 147it [00:33, 4.33it/s] 148it [00:33, 4.39it/s] 149it [00:33, 4.43it/s] 150it [00:33, 4.40it/s]2025-05-25 22:13:48,164 - INFO - [Epoch 060 | Batch 0150] IWAE-loss 1876.3032 | mean log_px -0.0125 | KL -1099.04 + 151it [00:34, 4.25it/s] 152it [00:34, 4.39it/s] 153it [00:34, 4.48it/s] 154it [00:34, 4.44it/s] 155it [00:35, 4.38it/s] 156it [00:35, 4.42it/s] 157it [00:35, 4.46it/s] 158it [00:35, 4.53it/s] 159it [00:35, 4.56it/s] 160it [00:36, 4.39it/s] 161it [00:36, 4.46it/s] 162it [00:36, 4.53it/s] 163it [00:36, 4.45it/s] 164it [00:37, 4.42it/s] 165it [00:37, 4.39it/s] 166it [00:37, 4.21it/s] 167it [00:37, 4.28it/s] 168it [00:38, 4.36it/s] 169it [00:38, 4.46it/s] 170it [00:38, 4.52it/s] 171it [00:38, 4.54it/s] 172it [00:38, 4.47it/s] 173it [00:39, 4.42it/s] 174it [00:39, 4.39it/s] 175it [00:39, 4.31it/s] 176it [00:39, 4.44it/s] 177it [00:40, 4.40it/s] 178it [00:40, 4.48it/s] 179it [00:40, 4.52it/s] 180it [00:40, 4.50it/s] 181it [00:40, 4.21it/s] 182it [00:41, 4.07it/s] 183it [00:41, 4.22it/s] 184it [00:41, 4.34it/s] 185it [00:41, 4.45it/s] 186it [00:42, 4.52it/s] 187it [00:42, 4.58it/s] 188it [00:42, 4.46it/s] 189it [00:42, 4.42it/s] 190it [00:42, 4.50it/s] 191it [00:43, 4.43it/s] 192it [00:43, 4.43it/s] 193it [00:43, 4.37it/s] 194it [00:43, 4.37it/s] 195it [00:44, 4.30it/s] 196it [00:44, 4.30it/s] 196it [00:44, 4.41it/s] +2025-05-25 22:13:58,522 - INFO - Epoch: 60, Objective: tensor([1335.1680], device='cuda:0', grad_fn=), Loss: 0.0030267671681940556, KL/n: 22.3603515625 + 0it [00:00, ?it/s]2025-05-25 22:13:58,954 - INFO - [Epoch 061 | Batch 0000] IWAE-loss 1409.4937 | mean log_px -0.0081 | KL -1098.50 + 1it [00:00, 2.71it/s] 2it [00:00, 3.56it/s] 3it [00:00, 3.98it/s] 4it [00:01, 4.21it/s] 5it [00:01, 4.23it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.33it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.58it/s] 11it [00:02, 4.48it/s] 12it [00:02, 4.48it/s] 13it [00:03, 4.52it/s] 14it [00:03, 4.42it/s] 15it [00:03, 4.50it/s] 16it [00:03, 4.56it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.62it/s] 19it [00:04, 4.61it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.38it/s] 22it [00:05, 4.40it/s] 23it [00:05, 4.36it/s] 24it [00:05, 4.46it/s] 25it [00:05, 4.53it/s] 26it [00:05, 4.42it/s] 27it [00:06, 4.52it/s] 28it [00:06, 4.57it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.63it/s] 31it [00:06, 4.65it/s] 32it [00:07, 4.54it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.48it/s] 36it [00:08, 4.56it/s] 37it [00:08, 4.60it/s] 38it [00:08, 4.63it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.67it/s] 41it [00:09, 4.51it/s] 42it [00:09, 4.36it/s] 43it [00:09, 4.46it/s] 44it [00:09, 4.51it/s] 45it [00:10, 4.55it/s] 46it [00:10, 4.48it/s] 47it [00:10, 4.51it/s] 48it [00:10, 4.40it/s] 49it [00:10, 4.36it/s] 50it [00:11, 4.45it/s]2025-05-25 22:14:10,037 - INFO - [Epoch 061 | Batch 0050] IWAE-loss 1398.4414 | mean log_px -0.0127 | KL -1090.44 + 51it [00:11, 4.51it/s] 52it [00:11, 4.57it/s] 53it [00:11, 4.62it/s] 54it [00:12, 4.64it/s] 55it [00:12, 4.40it/s] 56it [00:12, 4.38it/s] 57it [00:12, 4.36it/s] 58it [00:13, 4.34it/s] 59it [00:13, 4.43it/s] 60it [00:13, 4.50it/s] 61it [00:13, 4.54it/s] 62it [00:13, 4.46it/s] 63it [00:14, 4.41it/s] 64it [00:14, 4.45it/s] 65it [00:14, 4.53it/s] 66it [00:14, 4.58it/s] 67it [00:14, 4.61it/s] 68it [00:15, 4.37it/s] 69it [00:15, 4.34it/s] 70it [00:15, 4.30it/s] 71it [00:15, 4.29it/s] 72it [00:16, 4.41it/s] 73it [00:16, 4.37it/s] 74it [00:16, 4.37it/s] 75it [00:16, 4.44it/s] 76it [00:17, 4.37it/s] 77it [00:17, 4.22it/s] 78it [00:17, 4.27it/s] 79it [00:17, 4.27it/s] 80it [00:18, 4.36it/s] 81it [00:18, 4.32it/s] 82it [00:18, 4.17it/s] 83it [00:18, 4.23it/s] 84it [00:18, 4.22it/s] 85it [00:19, 4.30it/s] 86it [00:19, 4.29it/s] 87it [00:19, 4.24it/s] 88it [00:19, 4.26it/s] 89it [00:20, 4.36it/s] 90it [00:20, 4.32it/s] 91it [00:20, 4.29it/s] 92it [00:20, 4.31it/s] 93it [00:21, 4.23it/s] 94it [00:21, 4.37it/s] 95it [00:21, 4.42it/s] 96it [00:21, 4.49it/s] 97it [00:21, 4.56it/s] 98it [00:22, 4.60it/s] 99it [00:22, 4.61it/s] 100it [00:22, 4.50it/s]2025-05-25 22:14:21,429 - INFO - [Epoch 061 | Batch 0100] IWAE-loss 1398.7993 | mean log_px -0.0086 | KL -1086.49 + 101it [00:22, 4.31it/s] 102it [00:23, 4.44it/s] 103it [00:23, 4.37it/s] 104it [00:23, 4.39it/s] 105it [00:23, 4.47it/s] 106it [00:23, 4.53it/s] 107it [00:24, 4.59it/s] 108it [00:24, 4.48it/s] 109it [00:24, 4.54it/s] 110it [00:24, 4.46it/s] 111it [00:25, 4.52it/s] 112it [00:25, 4.45it/s] 113it [00:25, 4.48it/s] 114it [00:25, 4.55it/s] 115it [00:25, 4.58it/s] 116it [00:26, 4.45it/s] 117it [00:26, 4.54it/s] 118it [00:26, 4.58it/s] 119it [00:26, 4.48it/s] 120it [00:27, 4.41it/s] 121it [00:27, 4.36it/s] 122it [00:27, 4.48it/s] 123it [00:27, 4.50it/s] 124it [00:27, 4.53it/s] 125it [00:28, 4.47it/s] 126it [00:28, 4.43it/s] 127it [00:28, 4.33it/s] 128it [00:28, 4.45it/s] 129it [00:29, 4.37it/s] 130it [00:29, 4.46it/s] 131it [00:29, 4.54it/s] 132it [00:29, 4.58it/s] 133it [00:29, 4.62it/s] 134it [00:30, 4.64it/s] 135it [00:30, 4.52it/s] 136it [00:30, 4.57it/s] 137it [00:30, 4.60it/s] 138it [00:31, 4.63it/s] 139it [00:31, 4.52it/s] 140it [00:31, 4.20it/s] 141it [00:31, 4.27it/s] 142it [00:31, 4.37it/s] 143it [00:32, 4.43it/s] 144it [00:32, 4.40it/s] 145it [00:32, 4.26it/s] 146it [00:32, 4.25it/s] 147it [00:33, 4.25it/s] 148it [00:33, 4.37it/s] 149it [00:33, 4.48it/s] 150it [00:33, 4.54it/s]2025-05-25 22:14:32,628 - INFO - [Epoch 061 | Batch 0150] IWAE-loss 1164.0669 | mean log_px -0.0021 | KL -1089.75 + 151it [00:34, 4.42it/s] 152it [00:34, 4.38it/s] 153it [00:34, 4.35it/s] 154it [00:34, 4.43it/s] 155it [00:34, 4.39it/s] 156it [00:35, 4.34it/s] 157it [00:35, 4.43it/s] 158it [00:35, 4.35it/s] 159it [00:35, 4.45it/s] 160it [00:36, 4.52it/s] 161it [00:36, 4.44it/s] 162it [00:36, 4.52it/s] 163it [00:36, 4.56it/s] 164it [00:36, 4.59it/s] 165it [00:37, 4.37it/s] 166it [00:37, 4.48it/s] 167it [00:37, 4.53it/s] 168it [00:37, 4.57it/s] 169it [00:38, 4.51it/s] 170it [00:38, 4.53it/s] 171it [00:38, 4.55it/s] 172it [00:38, 4.45it/s] 173it [00:38, 4.40it/s] 174it [00:39, 4.20it/s] 175it [00:39, 4.27it/s] 176it [00:39, 4.38it/s] 177it [00:39, 4.43it/s] 178it [00:40, 4.41it/s] 179it [00:40, 4.48it/s] 180it [00:40, 4.54it/s] 181it [00:40, 4.45it/s] 182it [00:41, 4.52it/s] 183it [00:41, 4.56it/s] 184it [00:41, 4.59it/s] 185it [00:41, 4.64it/s] 186it [00:41, 4.50it/s] 187it [00:42, 4.57it/s] 188it [00:42, 4.47it/s] 189it [00:42, 4.43it/s] 190it [00:42, 4.44it/s] 191it [00:43, 4.47it/s] 192it [00:43, 4.41it/s] 193it [00:43, 4.26it/s] 194it [00:43, 4.32it/s] 195it [00:43, 4.31it/s] 196it [00:44, 4.40it/s] 196it [00:44, 4.43it/s] +2025-05-25 22:14:42,896 - INFO - Epoch: 61, Objective: tensor([2204.2148], device='cuda:0', grad_fn=), Loss: 0.01952478662133217, KL/n: 22.221717834472656 + 0it [00:00, ?it/s]2025-05-25 22:14:43,483 - INFO - [Epoch 062 | Batch 0000] IWAE-loss 1198.3219 | mean log_px -0.0081 | KL -1089.96 + 1it [00:00, 2.79it/s] 2it [00:00, 3.57it/s] 3it [00:00, 3.96it/s] 4it [00:01, 4.18it/s] 5it [00:01, 4.18it/s] 6it [00:01, 4.32it/s] 7it [00:01, 4.41it/s] 8it [00:01, 4.38it/s] 9it [00:02, 4.40it/s] 10it [00:02, 4.49it/s] 11it [00:02, 4.44it/s] 12it [00:02, 4.52it/s] 13it [00:03, 4.46it/s] 14it [00:03, 4.43it/s] 15it [00:03, 4.48it/s] 16it [00:03, 4.54it/s] 17it [00:03, 4.58it/s] 18it [00:04, 4.45it/s] 19it [00:04, 4.49it/s] 20it [00:04, 4.55it/s] 21it [00:04, 4.56it/s] 22it [00:05, 4.59it/s] 23it [00:05, 4.63it/s] 24it [00:05, 4.63it/s] 25it [00:05, 4.63it/s] 26it [00:05, 4.53it/s] 27it [00:06, 4.55it/s] 28it [00:06, 4.59it/s] 29it [00:06, 4.48it/s] 30it [00:06, 4.55it/s] 31it [00:06, 4.59it/s] 32it [00:07, 4.52it/s] 33it [00:07, 4.44it/s] 34it [00:07, 4.42it/s] 35it [00:07, 4.38it/s] 36it [00:08, 4.38it/s] 37it [00:08, 4.45it/s] 38it [00:08, 4.39it/s] 39it [00:08, 4.40it/s] 40it [00:09, 4.49it/s] 41it [00:09, 4.44it/s] 42it [00:09, 4.43it/s] 43it [00:09, 4.44it/s] 44it [00:09, 4.41it/s] 45it [00:10, 4.46it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.46it/s] 48it [00:10, 4.43it/s] 49it [00:11, 4.48it/s] 50it [00:11, 4.53it/s]2025-05-25 22:14:54,625 - INFO - [Epoch 062 | Batch 0050] IWAE-loss 1275.6980 | mean log_px -0.0043 | KL -1085.77 + 51it [00:11, 4.43it/s] 52it [00:11, 4.53it/s] 53it [00:11, 4.59it/s] 54it [00:12, 4.61it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.48it/s] 58it [00:13, 4.41it/s] 59it [00:13, 4.42it/s] 60it [00:13, 4.39it/s] 61it [00:13, 4.44it/s] 62it [00:13, 4.50it/s] 63it [00:14, 4.54it/s] 64it [00:14, 4.55it/s] 65it [00:14, 4.45it/s] 66it [00:14, 4.43it/s] 67it [00:15, 4.46it/s] 68it [00:15, 4.39it/s] 69it [00:15, 4.36it/s] 70it [00:15, 4.43it/s] 71it [00:15, 4.37it/s] 72it [00:16, 4.36it/s] 73it [00:16, 4.43it/s] 74it [00:16, 4.32it/s] 75it [00:16, 4.34it/s] 76it [00:17, 4.38it/s] 77it [00:17, 4.31it/s] 78it [00:17, 4.26it/s] 79it [00:17, 4.31it/s] 80it [00:18, 4.20it/s] 81it [00:18, 4.15it/s] 82it [00:18, 4.21it/s] 83it [00:18, 4.26it/s] 84it [00:19, 4.26it/s] 85it [00:19, 4.24it/s] 86it [00:19, 4.13it/s] 87it [00:19, 4.14it/s] 88it [00:19, 4.17it/s] 89it [00:20, 4.18it/s] 90it [00:20, 4.24it/s] 91it [00:20, 4.23it/s] 92it [00:20, 4.24it/s] 93it [00:21, 4.24it/s] 94it [00:21, 4.34it/s] 95it [00:21, 4.18it/s] 96it [00:21, 4.22it/s] 97it [00:22, 4.21it/s] 98it [00:22, 4.26it/s] 99it [00:22, 4.34it/s] 100it [00:22, 4.14it/s]2025-05-25 22:15:06,214 - INFO - [Epoch 062 | Batch 0100] IWAE-loss 1882.4122 | mean log_px -0.0167 | KL -1085.27 + 101it [00:23, 4.13it/s] 102it [00:23, 4.24it/s] 103it [00:23, 4.34it/s] 104it [00:23, 4.40it/s] 105it [00:23, 4.30it/s] 106it [00:24, 4.12it/s] 107it [00:24, 4.23it/s] 108it [00:24, 4.25it/s] 109it [00:24, 4.30it/s] 110it [00:25, 4.34it/s] 111it [00:25, 4.36it/s] 112it [00:25, 4.22it/s] 113it [00:25, 4.27it/s] 114it [00:26, 4.33it/s] 115it [00:26, 4.36it/s] 116it [00:26, 4.39it/s] 117it [00:26, 4.33it/s] 118it [00:26, 4.40it/s] 119it [00:27, 4.41it/s] 120it [00:27, 4.43it/s] 121it [00:27, 4.43it/s] 122it [00:27, 4.32it/s] 123it [00:28, 4.34it/s] 124it [00:28, 4.31it/s] 125it [00:28, 4.22it/s] 126it [00:28, 4.30it/s] 127it [00:29, 4.34it/s] 128it [00:29, 4.42it/s] 129it [00:29, 4.32it/s] 130it [00:29, 4.26it/s] 131it [00:30, 4.25it/s] 132it [00:30, 4.24it/s] 133it [00:30, 4.31it/s] 134it [00:30, 4.28it/s] 135it [00:30, 4.34it/s] 136it [00:31, 4.29it/s] 137it [00:31, 4.17it/s] 138it [00:31, 4.27it/s] 139it [00:31, 4.32it/s] 140it [00:32, 4.28it/s] 141it [00:32, 4.20it/s] 142it [00:32, 4.28it/s] 143it [00:32, 4.36it/s] 144it [00:33, 4.30it/s] 145it [00:33, 4.22it/s] 146it [00:33, 4.31it/s] 147it [00:33, 4.25it/s] 148it [00:33, 4.24it/s] 149it [00:34, 4.19it/s] 150it [00:34, 4.23it/s]2025-05-25 22:15:17,858 - INFO - [Epoch 062 | Batch 0150] IWAE-loss 1197.9325 | mean log_px -0.0030 | KL -1087.20 + 151it [00:34, 4.12it/s] 152it [00:34, 4.16it/s] 153it [00:35, 4.19it/s] 154it [00:35, 4.06it/s] 155it [00:35, 4.18it/s] 156it [00:35, 4.23it/s] 157it [00:36, 4.29it/s] 158it [00:36, 4.38it/s] 159it [00:36, 4.37it/s] 160it [00:36, 4.43it/s] 161it [00:37, 4.47it/s] 162it [00:37, 4.48it/s] 163it [00:37, 4.42it/s] 164it [00:37, 4.39it/s] 165it [00:37, 4.47it/s] 166it [00:38, 4.38it/s] 167it [00:38, 4.40it/s] 168it [00:38, 4.43it/s] 169it [00:38, 4.23it/s] 170it [00:39, 4.22it/s] 171it [00:39, 4.21it/s] 172it [00:39, 4.15it/s] 173it [00:39, 4.13it/s] 174it [00:40, 4.25it/s] 175it [00:40, 4.33it/s] 176it [00:40, 4.23it/s] 177it [00:40, 4.21it/s] 178it [00:40, 4.21it/s] 179it [00:41, 4.24it/s] 180it [00:41, 4.25it/s] 181it [00:41, 4.28it/s] 182it [00:41, 4.27it/s] 183it [00:42, 4.23it/s] 184it [00:42, 4.23it/s] 185it [00:42, 4.18it/s] 186it [00:42, 4.19it/s] 187it [00:43, 4.17it/s] 188it [00:43, 4.28it/s] 189it [00:43, 4.29it/s] 190it [00:43, 4.36it/s] 191it [00:44, 4.38it/s] 192it [00:44, 4.44it/s] 193it [00:44, 4.45it/s] 194it [00:44, 4.47it/s] 195it [00:44, 4.30it/s] 196it [00:45, 4.39it/s] 196it [00:45, 4.33it/s] +2025-05-25 22:15:28,446 - INFO - Epoch: 62, Objective: tensor([1330.0718], device='cuda:0', grad_fn=), Loss: 0.0047620623372495174, KL/n: 22.193544387817383 + 0it [00:00, ?it/s]2025-05-25 22:15:28,859 - INFO - [Epoch 063 | Batch 0000] IWAE-loss 1133.7760 | mean log_px -0.0013 | KL -1085.79 + 1it [00:00, 2.71it/s] 2it [00:00, 3.50it/s] 3it [00:00, 3.78it/s] 4it [00:01, 3.93it/s] 5it [00:01, 4.11it/s] 6it [00:01, 4.12it/s] 7it [00:01, 4.18it/s] 8it [00:02, 3.43it/s] 9it [00:02, 3.64it/s] 10it [00:02, 3.87it/s] 11it [00:02, 3.86it/s] 12it [00:03, 4.05it/s] 13it [00:03, 4.20it/s] 14it [00:03, 4.31it/s] 15it [00:03, 4.38it/s] 16it [00:03, 4.42it/s] 17it [00:04, 4.48it/s] 18it [00:04, 4.23it/s] 19it [00:04, 4.25it/s] 20it [00:04, 4.23it/s] 21it [00:05, 4.33it/s] 22it [00:05, 4.42it/s] 23it [00:05, 4.22it/s] 24it [00:05, 4.30it/s] 25it [00:06, 4.37it/s] 26it [00:06, 4.41it/s] 27it [00:06, 4.43it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.53it/s] 30it [00:07, 4.53it/s] 31it [00:07, 4.53it/s] 32it [00:07, 4.44it/s] 33it [00:07, 4.31it/s] 34it [00:08, 4.39it/s] 35it [00:08, 4.40it/s] 36it [00:08, 4.34it/s] 37it [00:08, 4.37it/s] 38it [00:09, 4.32it/s] 39it [00:09, 4.36it/s] 40it [00:09, 4.31it/s] 41it [00:09, 4.10it/s] 42it [00:10, 4.14it/s] 43it [00:10, 4.22it/s] 44it [00:10, 4.21it/s] 45it [00:10, 4.16it/s] 46it [00:10, 4.18it/s] 47it [00:11, 4.14it/s] 48it [00:11, 4.24it/s] 49it [00:11, 4.33it/s] 50it [00:11, 4.26it/s]2025-05-25 22:15:40,624 - INFO - [Epoch 063 | Batch 0050] IWAE-loss 1150.0118 | mean log_px -0.0013 | KL -1081.11 + 51it [00:12, 4.32it/s] 52it [00:12, 4.36it/s] 53it [00:12, 4.34it/s] 54it [00:12, 4.38it/s] 55it [00:13, 4.24it/s] 56it [00:13, 4.32it/s] 57it [00:13, 4.34it/s] 58it [00:13, 4.26it/s] 59it [00:13, 4.24it/s] 60it [00:14, 4.23it/s] 61it [00:14, 4.32it/s] 62it [00:14, 4.25it/s] 63it [00:14, 4.26it/s] 64it [00:15, 4.21it/s] 65it [00:15, 4.23it/s] 66it [00:15, 4.32it/s] 67it [00:15, 4.28it/s] 68it [00:16, 4.13it/s] 69it [00:16, 4.24it/s] 70it [00:16, 4.31it/s] 71it [00:16, 4.28it/s] 72it [00:17, 4.34it/s] 73it [00:17, 4.41it/s] 74it [00:17, 4.41it/s] 75it [00:17, 4.37it/s] 76it [00:17, 4.41it/s] 77it [00:18, 4.33it/s] 78it [00:18, 4.36it/s] 79it [00:18, 4.43it/s] 80it [00:18, 4.48it/s] 81it [00:19, 4.35it/s] 82it [00:19, 4.25it/s] 83it [00:19, 4.27it/s] 84it [00:19, 4.25it/s] 85it [00:19, 4.33it/s] 86it [00:20, 4.25it/s] 87it [00:20, 4.25it/s] 88it [00:20, 4.31it/s] 89it [00:20, 4.35it/s] 90it [00:21, 4.40it/s] 91it [00:21, 4.28it/s] 92it [00:21, 4.36it/s] 93it [00:21, 4.42it/s] 94it [00:22, 4.43it/s] 95it [00:22, 4.40it/s] 96it [00:22, 4.46it/s] 97it [00:22, 4.49it/s] 98it [00:22, 4.35it/s] 99it [00:23, 4.37it/s] 100it [00:23, 4.30it/s]2025-05-25 22:15:52,180 - INFO - [Epoch 063 | Batch 0100] IWAE-loss 1351.5203 | mean log_px -0.0092 | KL -1081.81 + 101it [00:23, 4.28it/s] 102it [00:23, 4.36it/s] 103it [00:24, 4.32it/s] 104it [00:24, 4.38it/s] 105it [00:24, 4.27it/s] 106it [00:24, 4.34it/s] 107it [00:25, 4.42it/s] 108it [00:25, 4.44it/s] 109it [00:25, 4.36it/s] 110it [00:25, 4.32it/s] 111it [00:25, 4.33it/s] 112it [00:26, 4.19it/s] 113it [00:26, 4.30it/s] 114it [00:26, 4.27it/s] 115it [00:26, 4.28it/s] 116it [00:27, 4.23it/s] 117it [00:27, 4.33it/s] 118it [00:27, 4.41it/s] 119it [00:27, 4.31it/s] 120it [00:28, 4.13it/s] 121it [00:28, 4.23it/s] 122it [00:28, 4.22it/s] 123it [00:28, 4.16it/s] 124it [00:29, 4.28it/s] 125it [00:29, 4.21it/s] 126it [00:29, 4.31it/s] 127it [00:29, 4.27it/s] 128it [00:29, 4.20it/s] 129it [00:30, 4.25it/s] 130it [00:30, 4.34it/s] 131it [00:30, 4.30it/s] 132it [00:30, 4.38it/s] 133it [00:31, 4.33it/s] 134it [00:31, 4.35it/s] 135it [00:31, 4.39it/s] 136it [00:31, 4.32it/s] 137it [00:32, 4.25it/s] 138it [00:32, 4.34it/s] 139it [00:32, 4.28it/s] 140it [00:32, 4.37it/s] 141it [00:32, 4.43it/s] 142it [00:33, 4.29it/s] 143it [00:33, 4.22it/s] 144it [00:33, 4.32it/s] 145it [00:33, 4.38it/s] 146it [00:34, 4.44it/s] 147it [00:34, 4.49it/s] 148it [00:34, 4.49it/s] 149it [00:34, 4.37it/s] 150it [00:35, 4.41it/s]2025-05-25 22:16:03,751 - INFO - [Epoch 063 | Batch 0150] IWAE-loss 1242.8817 | mean log_px -0.0063 | KL -1077.83 + 151it [00:35, 4.32it/s] 152it [00:35, 4.26it/s] 153it [00:35, 4.29it/s] 154it [00:35, 4.29it/s] 155it [00:36, 4.37it/s] 156it [00:36, 4.31it/s] 157it [00:36, 4.33it/s] 158it [00:36, 4.41it/s] 159it [00:37, 4.39it/s] 160it [00:37, 4.47it/s] 161it [00:37, 4.44it/s] 162it [00:37, 4.47it/s] 163it [00:37, 4.45it/s] 164it [00:38, 4.49it/s] 165it [00:38, 4.54it/s] 166it [00:38, 4.45it/s] 167it [00:38, 4.32it/s] 168it [00:39, 4.29it/s] 169it [00:39, 4.28it/s] 170it [00:39, 4.38it/s] 171it [00:39, 4.33it/s] 172it [00:40, 4.29it/s] 173it [00:40, 4.22it/s] 174it [00:40, 4.24it/s] 175it [00:40, 4.27it/s] 176it [00:40, 4.35it/s] 177it [00:41, 4.40it/s] 178it [00:41, 4.45it/s] 179it [00:41, 4.53it/s] 180it [00:41, 4.45it/s] 181it [00:42, 4.39it/s] 182it [00:42, 4.46it/s] 183it [00:42, 4.52it/s] 184it [00:42, 4.57it/s] 185it [00:42, 4.47it/s] 186it [00:43, 4.49it/s] 187it [00:43, 4.37it/s] 188it [00:43, 4.43it/s] 189it [00:43, 4.36it/s] 190it [00:44, 4.42it/s] 191it [00:44, 4.49it/s] 192it [00:44, 4.52it/s] 193it [00:44, 4.43it/s] 194it [00:45, 4.47it/s] 195it [00:45, 4.41it/s] 196it [00:45, 4.49it/s] 196it [00:45, 4.30it/s] +2025-05-25 22:16:14,120 - INFO - Epoch: 63, Objective: tensor([1271.1880], device='cuda:0', grad_fn=), Loss: 0.0068045128136873245, KL/n: 21.986188888549805 + 0it [00:00, ?it/s]2025-05-25 22:16:14,549 - INFO - [Epoch 064 | Batch 0000] IWAE-loss 1491.5543 | mean log_px -0.0086 | KL -1077.20 + 1it [00:00, 2.60it/s] 2it [00:00, 3.49it/s] 3it [00:00, 3.80it/s] 4it [00:01, 4.08it/s] 5it [00:01, 4.25it/s] 6it [00:01, 4.25it/s] 7it [00:01, 4.19it/s] 8it [00:01, 4.23it/s] 9it [00:02, 4.23it/s] 10it [00:02, 4.24it/s] 11it [00:02, 4.17it/s] 12it [00:02, 4.29it/s] 13it [00:03, 4.28it/s] 14it [00:03, 4.35it/s] 15it [00:03, 4.41it/s] 16it [00:03, 4.32it/s] 17it [00:04, 4.27it/s] 18it [00:04, 4.26it/s] 19it [00:04, 4.31it/s] 20it [00:04, 4.26it/s] 21it [00:05, 4.36it/s] 22it [00:05, 4.43it/s] 23it [00:05, 4.49it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.52it/s] 26it [00:06, 4.57it/s] 27it [00:06, 4.47it/s] 28it [00:06, 4.41it/s] 29it [00:06, 4.29it/s] 30it [00:07, 4.40it/s] 31it [00:07, 4.35it/s] 32it [00:07, 4.43it/s] 33it [00:07, 4.37it/s] 34it [00:07, 4.37it/s] 35it [00:08, 4.47it/s] 36it [00:08, 4.40it/s] 37it [00:08, 4.37it/s] 38it [00:08, 4.45it/s] 39it [00:09, 4.50it/s] 40it [00:09, 4.54it/s] 41it [00:09, 4.46it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.51it/s] 44it [00:10, 4.54it/s] 45it [00:10, 4.54it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.35it/s] 48it [00:11, 4.46it/s] 49it [00:11, 4.52it/s] 50it [00:11, 4.52it/s]2025-05-25 22:16:25,916 - INFO - [Epoch 064 | Batch 0050] IWAE-loss 1201.7369 | mean log_px -0.0023 | KL -1074.23 + 51it [00:11, 4.42it/s] 52it [00:11, 4.38it/s] 53it [00:12, 4.44it/s] 54it [00:12, 4.47it/s] 55it [00:12, 4.53it/s] 56it [00:12, 4.57it/s] 57it [00:13, 4.60it/s] 58it [00:13, 4.62it/s] 59it [00:13, 4.65it/s] 60it [00:13, 4.66it/s] 61it [00:13, 4.53it/s] 62it [00:14, 4.40it/s] 63it [00:14, 4.46it/s] 64it [00:14, 4.38it/s] 65it [00:14, 4.42it/s] 66it [00:15, 4.47it/s] 67it [00:15, 4.39it/s] 68it [00:15, 4.44it/s] 69it [00:15, 4.36it/s] 70it [00:15, 4.43it/s] 71it [00:16, 4.47it/s] 72it [00:16, 4.40it/s] 73it [00:16, 4.24it/s] 74it [00:16, 4.27it/s] 75it [00:17, 4.36it/s] 76it [00:17, 4.42it/s] 77it [00:17, 4.37it/s] 78it [00:17, 4.33it/s] 79it [00:18, 4.33it/s] 80it [00:18, 4.31it/s] 81it [00:18, 4.28it/s] 82it [00:18, 4.31it/s] 83it [00:18, 4.36it/s] 84it [00:19, 4.20it/s] 85it [00:19, 4.30it/s] 86it [00:19, 4.40it/s] 87it [00:19, 4.37it/s] 88it [00:20, 4.45it/s] 89it [00:20, 4.41it/s] 90it [00:20, 4.48it/s] 91it [00:20, 4.53it/s] 92it [00:21, 4.43it/s] 93it [00:21, 4.27it/s] 94it [00:21, 4.33it/s] 95it [00:21, 4.33it/s] 96it [00:21, 4.37it/s] 97it [00:22, 4.30it/s] 98it [00:22, 4.35it/s] 99it [00:22, 4.37it/s] 100it [00:22, 4.29it/s]2025-05-25 22:16:37,285 - INFO - [Epoch 064 | Batch 0100] IWAE-loss 1448.6731 | mean log_px -0.0105 | KL -1068.36 + 101it [00:23, 4.32it/s] 102it [00:23, 4.40it/s] 103it [00:23, 4.35it/s] 104it [00:23, 4.34it/s] 105it [00:24, 4.39it/s] 106it [00:24, 4.47it/s] 107it [00:24, 4.51it/s] 108it [00:24, 4.55it/s] 109it [00:24, 4.57it/s] 110it [00:25, 4.49it/s] 111it [00:25, 4.40it/s] 112it [00:25, 4.37it/s] 113it [00:25, 4.34it/s] 114it [00:26, 4.31it/s] 115it [00:26, 4.15it/s] 116it [00:26, 4.30it/s] 117it [00:26, 4.41it/s] 118it [00:26, 4.46it/s] 119it [00:27, 4.37it/s] 120it [00:27, 4.45it/s] 121it [00:27, 4.31it/s] 122it [00:27, 4.19it/s] 123it [00:28, 4.29it/s] 124it [00:28, 4.29it/s] 125it [00:28, 4.30it/s] 126it [00:28, 4.26it/s] 127it [00:29, 4.39it/s] 128it [00:29, 4.29it/s] 129it [00:29, 4.36it/s] 130it [00:29, 4.42it/s] 131it [00:29, 4.24it/s] 132it [00:30, 4.36it/s] 133it [00:30, 4.32it/s] 134it [00:30, 4.41it/s] 135it [00:30, 4.47it/s] 136it [00:31, 4.51it/s] 137it [00:31, 4.43it/s] 138it [00:31, 4.38it/s] 139it [00:31, 4.47it/s] 140it [00:32, 4.37it/s] 141it [00:32, 4.35it/s] 142it [00:32, 4.43it/s] 143it [00:32, 4.34it/s] 144it [00:32, 4.45it/s] 145it [00:33, 4.49it/s] 146it [00:33, 4.44it/s] 147it [00:33, 4.45it/s] 148it [00:33, 4.50it/s] 149it [00:34, 4.55it/s] 150it [00:34, 4.48it/s]2025-05-25 22:16:48,646 - INFO - [Epoch 064 | Batch 0150] IWAE-loss 1139.3844 | mean log_px -0.0025 | KL -1069.10 + 151it [00:34, 4.53it/s] 152it [00:34, 4.56it/s] 153it [00:34, 4.47it/s] 154it [00:35, 4.49it/s] 155it [00:35, 4.50it/s] 156it [00:35, 4.30it/s] 157it [00:35, 4.35it/s] 158it [00:36, 4.42it/s] 159it [00:36, 4.49it/s] 160it [00:36, 4.54it/s] 161it [00:36, 4.44it/s] 162it [00:36, 4.28it/s] 163it [00:37, 4.38it/s] 164it [00:37, 4.43it/s] 165it [00:37, 4.41it/s] 166it [00:37, 4.48it/s] 167it [00:38, 4.26it/s] 168it [00:38, 4.28it/s] 169it [00:38, 4.26it/s] 170it [00:38, 4.30it/s] 171it [00:39, 4.30it/s] 172it [00:39, 4.40it/s] 173it [00:39, 4.20it/s] 174it [00:39, 4.22it/s] 175it [00:39, 4.33it/s] 176it [00:40, 4.26it/s] 177it [00:40, 4.37it/s] 178it [00:40, 4.44it/s] 179it [00:40, 4.45it/s] 180it [00:41, 4.30it/s] 181it [00:41, 4.26it/s] 182it [00:41, 4.29it/s] 183it [00:41, 4.37it/s] 184it [00:42, 4.45it/s] 185it [00:42, 4.35it/s] 186it [00:42, 4.19it/s] 187it [00:42, 4.29it/s] 188it [00:42, 4.38it/s] 189it [00:43, 4.30it/s] 190it [00:43, 4.34it/s] 191it [00:43, 4.21it/s] 192it [00:43, 4.35it/s] 193it [00:44, 4.43it/s] 194it [00:44, 4.47it/s] 195it [00:44, 4.30it/s] 196it [00:44, 4.30it/s] 196it [00:44, 4.37it/s] +2025-05-25 22:16:59,132 - INFO - Epoch: 64, Objective: tensor([1219.0177], device='cuda:0', grad_fn=), Loss: 0.005087015684694052, KL/n: 21.777986526489258 + 0it [00:00, ?it/s]2025-05-25 22:16:59,731 - INFO - [Epoch 065 | Batch 0000] IWAE-loss 1199.1672 | mean log_px -0.0037 | KL -1066.61 + 1it [00:00, 2.98it/s] 2it [00:00, 3.64it/s] 3it [00:00, 3.93it/s] 4it [00:01, 4.18it/s] 5it [00:01, 4.34it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.52it/s] 8it [00:01, 4.56it/s] 9it [00:02, 4.38it/s] 10it [00:02, 4.47it/s] 11it [00:02, 4.43it/s] 12it [00:02, 4.40it/s] 13it [00:03, 4.40it/s] 14it [00:03, 4.34it/s] 15it [00:03, 4.38it/s] 16it [00:03, 4.33it/s] 17it [00:03, 4.36it/s] 18it [00:04, 4.27it/s] 19it [00:04, 4.40it/s] 20it [00:04, 4.47it/s] 21it [00:04, 4.51it/s] 22it [00:05, 4.55it/s] 23it [00:05, 4.49it/s] 24it [00:05, 4.45it/s] 25it [00:05, 4.28it/s] 26it [00:05, 4.27it/s] 27it [00:06, 4.31it/s] 28it [00:06, 4.29it/s] 29it [00:06, 4.38it/s] 30it [00:06, 4.36it/s] 31it [00:07, 4.42it/s] 32it [00:07, 4.42it/s] 33it [00:07, 4.38it/s] 34it [00:07, 4.26it/s] 35it [00:08, 4.26it/s] 36it [00:08, 4.38it/s] 37it [00:08, 4.44it/s] 38it [00:08, 4.51it/s] 39it [00:08, 4.56it/s] 40it [00:09, 4.46it/s] 41it [00:09, 4.43it/s] 42it [00:09, 4.39it/s] 43it [00:09, 4.40it/s] 44it [00:10, 4.46it/s] 45it [00:10, 4.43it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.50it/s] 48it [00:10, 4.42it/s] 49it [00:11, 4.41it/s] 50it [00:11, 4.41it/s]2025-05-25 22:17:11,042 - INFO - [Epoch 065 | Batch 0050] IWAE-loss 1212.4058 | mean log_px -0.0064 | KL -1062.44 + 51it [00:11, 4.46it/s] 52it [00:11, 4.44it/s] 53it [00:12, 4.47it/s] 54it [00:12, 4.51it/s] 55it [00:12, 4.47it/s] 56it [00:12, 4.47it/s] 57it [00:12, 4.45it/s] 58it [00:13, 4.41it/s] 59it [00:13, 4.40it/s] 60it [00:13, 4.37it/s] 61it [00:13, 4.42it/s] 62it [00:14, 4.48it/s] 63it [00:14, 4.39it/s] 64it [00:14, 4.39it/s] 65it [00:14, 4.40it/s] 66it [00:15, 4.40it/s] 67it [00:15, 4.32it/s] 68it [00:15, 4.35it/s] 69it [00:15, 4.37it/s] 70it [00:15, 4.34it/s] 71it [00:16, 4.43it/s] 72it [00:16, 4.27it/s] 73it [00:16, 4.34it/s] 74it [00:16, 4.34it/s] 75it [00:17, 4.36it/s] 76it [00:17, 4.38it/s] 77it [00:17, 4.43it/s] 78it [00:17, 4.37it/s] 79it [00:18, 4.43it/s] 80it [00:18, 4.36it/s] 81it [00:18, 4.47it/s] 82it [00:18, 4.53it/s] 83it [00:18, 4.56it/s] 84it [00:19, 4.46it/s] 85it [00:19, 4.50it/s] 86it [00:19, 4.51it/s] 87it [00:19, 4.56it/s] 88it [00:20, 4.56it/s] 89it [00:20, 4.51it/s] 90it [00:20, 4.52it/s] 91it [00:20, 4.52it/s] 92it [00:20, 4.32it/s] 93it [00:21, 4.38it/s] 94it [00:21, 4.41it/s] 95it [00:21, 4.36it/s] 96it [00:21, 4.37it/s] 97it [00:22, 4.45it/s] 98it [00:22, 4.38it/s] 99it [00:22, 4.38it/s] 100it [00:22, 4.33it/s]2025-05-25 22:17:22,370 - INFO - [Epoch 065 | Batch 0100] IWAE-loss 1217.0249 | mean log_px -0.0038 | KL -1067.40 + 101it [00:22, 4.36it/s] 102it [00:23, 4.35it/s] 103it [00:23, 4.44it/s] 104it [00:23, 4.47it/s] 105it [00:23, 4.52it/s] 106it [00:24, 4.51it/s] 107it [00:24, 4.46it/s] 108it [00:24, 4.37it/s] 109it [00:24, 4.34it/s] 110it [00:25, 4.36it/s] 111it [00:25, 4.34it/s] 112it [00:25, 4.32it/s] 113it [00:25, 4.31it/s] 114it [00:25, 4.32it/s] 115it [00:26, 4.29it/s] 116it [00:26, 4.32it/s] 117it [00:26, 4.33it/s] 118it [00:26, 4.19it/s] 119it [00:27, 4.35it/s] 120it [00:27, 4.39it/s] 121it [00:27, 4.43it/s] 122it [00:27, 4.47it/s] 123it [00:27, 4.53it/s] 124it [00:28, 4.45it/s] 125it [00:28, 4.48it/s] 126it [00:28, 4.45it/s] 127it [00:28, 4.46it/s] 128it [00:29, 4.49it/s] 129it [00:29, 4.51it/s] 130it [00:29, 4.42it/s] 131it [00:29, 4.41it/s] 132it [00:30, 4.22it/s] 133it [00:30, 4.37it/s] 134it [00:30, 4.33it/s] 135it [00:30, 4.37it/s] 136it [00:30, 4.44it/s] 137it [00:31, 4.51it/s] 138it [00:31, 4.44it/s] 139it [00:31, 4.45it/s] 140it [00:31, 4.44it/s] 141it [00:32, 4.51it/s] 142it [00:32, 4.46it/s] 143it [00:32, 4.41it/s] 144it [00:32, 4.24it/s] 145it [00:33, 4.19it/s] 146it [00:33, 4.31it/s] 147it [00:33, 4.35it/s] 148it [00:33, 4.37it/s] 149it [00:33, 4.38it/s] 150it [00:34, 4.24it/s]2025-05-25 22:17:33,772 - INFO - [Epoch 065 | Batch 0150] IWAE-loss 1168.8063 | mean log_px -0.0032 | KL -1064.15 + 151it [00:34, 4.34it/s] 152it [00:34, 4.32it/s] 153it [00:34, 4.41it/s] 154it [00:35, 4.45it/s] 155it [00:35, 4.42it/s] 156it [00:35, 4.38it/s] 157it [00:35, 4.46it/s] 158it [00:35, 4.41it/s] 159it [00:36, 4.43it/s] 160it [00:36, 4.23it/s] 161it [00:36, 4.27it/s] 162it [00:36, 4.29it/s] 163it [00:37, 4.32it/s] 164it [00:37, 4.38it/s] 165it [00:37, 4.47it/s] 166it [00:37, 4.32it/s] 167it [00:38, 4.39it/s] 168it [00:38, 4.47it/s] 169it [00:38, 4.49it/s] 170it [00:38, 4.53it/s] 171it [00:38, 4.57it/s] 172it [00:39, 4.55it/s] 173it [00:39, 4.26it/s] 174it [00:39, 4.28it/s] 175it [00:39, 4.29it/s] 176it [00:40, 4.32it/s] 177it [00:40, 4.39it/s] 178it [00:40, 4.43it/s] 179it [00:40, 4.43it/s] 180it [00:41, 4.22it/s] 181it [00:41, 4.21it/s] 182it [00:41, 4.24it/s] 183it [00:41, 4.25it/s] 184it [00:41, 4.27it/s] 185it [00:42, 4.30it/s] 186it [00:42, 4.19it/s] 187it [00:42, 4.24it/s] 188it [00:42, 4.25it/s] 189it [00:43, 4.29it/s] 190it [00:43, 4.26it/s] 191it [00:43, 4.31it/s] 192it [00:43, 4.32it/s] 193it [00:44, 4.33it/s] 194it [00:44, 4.32it/s] 195it [00:44, 4.29it/s] 196it [00:44, 4.26it/s] 196it [00:44, 4.37it/s] +2025-05-25 22:17:44,281 - INFO - Epoch: 65, Objective: tensor([1230.9609], device='cuda:0', grad_fn=), Loss: 0.005760730244219303, KL/n: 21.655872344970703 + 0it [00:00, ?it/s]2025-05-25 22:17:44,681 - INFO - [Epoch 066 | Batch 0000] IWAE-loss 1246.0516 | mean log_px -0.0045 | KL -1060.09 + 1it [00:00, 3.01it/s] 2it [00:00, 3.63it/s] 3it [00:00, 3.86it/s] 4it [00:01, 4.10it/s] 5it [00:01, 4.09it/s] 6it [00:01, 4.13it/s] 7it [00:01, 4.13it/s] 8it [00:01, 4.19it/s] 9it [00:02, 4.29it/s] 10it [00:02, 4.11it/s] 11it [00:02, 4.12it/s] 12it [00:02, 4.18it/s] 13it [00:03, 4.23it/s] 14it [00:03, 4.33it/s] 15it [00:03, 4.40it/s] 16it [00:03, 4.35it/s] 17it [00:04, 4.40it/s] 18it [00:04, 4.46it/s] 19it [00:04, 4.34it/s] 20it [00:04, 4.32it/s] 21it [00:05, 4.27it/s] 22it [00:05, 4.28it/s] 23it [00:05, 4.26it/s] 24it [00:05, 4.28it/s] 25it [00:05, 4.35it/s] 26it [00:06, 4.42it/s] 27it [00:06, 4.47it/s] 28it [00:06, 4.43it/s] 29it [00:06, 4.47it/s] 30it [00:07, 4.51it/s] 31it [00:07, 4.42it/s] 32it [00:07, 4.34it/s] 33it [00:07, 4.28it/s] 34it [00:07, 4.28it/s] 35it [00:08, 4.10it/s] 36it [00:08, 4.08it/s] 37it [00:08, 4.12it/s] 38it [00:08, 4.26it/s] 39it [00:09, 4.35it/s] 40it [00:09, 4.30it/s] 41it [00:09, 4.17it/s] 42it [00:09, 4.21it/s] 43it [00:10, 4.31it/s] 44it [00:10, 4.28it/s] 45it [00:10, 4.35it/s] 46it [00:10, 4.15it/s] 47it [00:11, 4.15it/s] 48it [00:11, 4.17it/s] 49it [00:11, 4.19it/s] 50it [00:11, 4.30it/s]2025-05-25 22:17:56,345 - INFO - [Epoch 066 | Batch 0050] IWAE-loss 1207.2434 | mean log_px -0.0082 | KL -1055.60 + 51it [00:11, 4.38it/s] 52it [00:12, 4.32it/s] 53it [00:12, 4.27it/s] 54it [00:12, 4.35it/s] 55it [00:12, 4.28it/s] 56it [00:13, 4.28it/s] 57it [00:13, 4.28it/s] 58it [00:13, 4.24it/s] 59it [00:13, 4.32it/s] 60it [00:14, 4.38it/s] 61it [00:14, 4.28it/s] 62it [00:14, 4.12it/s] 63it [00:14, 4.12it/s] 64it [00:15, 4.17it/s] 65it [00:15, 4.14it/s] 66it [00:15, 4.19it/s] 67it [00:15, 4.21it/s] 68it [00:16, 4.23it/s] 69it [00:16, 4.29it/s] 70it [00:16, 4.41it/s] 71it [00:16, 4.34it/s] 72it [00:16, 4.35it/s] 73it [00:17, 4.29it/s] 74it [00:17, 4.27it/s] 75it [00:17, 4.25it/s] 76it [00:17, 4.30it/s] 77it [00:18, 3.51it/s] 78it [00:18, 3.72it/s] 79it [00:18, 3.87it/s] 80it [00:18, 3.95it/s] 81it [00:19, 4.03it/s] 82it [00:19, 4.10it/s] 83it [00:19, 4.15it/s] 84it [00:19, 4.21it/s] 85it [00:20, 4.22it/s] 86it [00:20, 4.22it/s] 87it [00:20, 4.27it/s] 88it [00:20, 4.39it/s] 89it [00:21, 4.48it/s] 90it [00:21, 4.51it/s] 91it [00:21, 4.39it/s] 92it [00:21, 4.40it/s] 93it [00:21, 4.46it/s] 94it [00:22, 4.50it/s] 95it [00:22, 4.42it/s] 96it [00:22, 4.36it/s] 97it [00:22, 4.33it/s] 98it [00:23, 4.32it/s] 99it [00:23, 4.29it/s] 100it [00:23, 4.40it/s]2025-05-25 22:18:08,134 - INFO - [Epoch 066 | Batch 0100] IWAE-loss 1485.7710 | mean log_px -0.0174 | KL -1055.98 + 101it [00:23, 4.35it/s] 102it [00:24, 4.32it/s] 103it [00:24, 4.28it/s] 104it [00:24, 4.32it/s] 105it [00:24, 4.37it/s] 106it [00:24, 4.36it/s] 107it [00:25, 4.43it/s] 108it [00:25, 4.35it/s] 109it [00:25, 4.24it/s] 110it [00:25, 4.20it/s] 111it [00:26, 4.22it/s] 112it [00:26, 4.23it/s] 113it [00:26, 4.35it/s] 114it [00:26, 4.29it/s] 115it [00:27, 4.28it/s] 116it [00:27, 4.28it/s] 117it [00:27, 4.27it/s] 118it [00:27, 4.40it/s] 119it [00:27, 4.32it/s] 120it [00:28, 4.32it/s] 121it [00:28, 4.32it/s] 122it [00:28, 4.43it/s] 123it [00:28, 4.36it/s] 124it [00:29, 4.37it/s] 125it [00:29, 4.38it/s] 126it [00:29, 4.34it/s] 127it [00:29, 4.32it/s] 128it [00:30, 4.18it/s] 129it [00:30, 4.19it/s] 130it [00:30, 4.32it/s] 131it [00:30, 4.41it/s] 132it [00:30, 4.49it/s] 133it [00:31, 4.44it/s] 134it [00:31, 4.36it/s] 135it [00:31, 4.43it/s] 136it [00:31, 4.48it/s] 137it [00:32, 4.41it/s] 138it [00:32, 4.33it/s] 139it [00:32, 4.37it/s] 140it [00:32, 4.29it/s] 141it [00:33, 4.30it/s] 142it [00:33, 4.39it/s] 143it [00:33, 4.37it/s] 144it [00:33, 4.43it/s] 145it [00:33, 4.38it/s] 146it [00:34, 4.32it/s] 147it [00:34, 4.39it/s] 148it [00:34, 4.31it/s] 149it [00:34, 4.37it/s] 150it [00:35, 4.42it/s]2025-05-25 22:18:19,645 - INFO - [Epoch 066 | Batch 0150] IWAE-loss 1216.0743 | mean log_px -0.0039 | KL -1054.95 + 151it [00:35, 4.43it/s] 152it [00:35, 4.35it/s] 153it [00:35, 4.39it/s] 154it [00:35, 4.45it/s] 155it [00:36, 4.38it/s] 156it [00:36, 4.37it/s] 157it [00:36, 4.46it/s] 158it [00:36, 4.51it/s] 159it [00:37, 4.54it/s] 160it [00:37, 4.49it/s] 161it [00:37, 4.51it/s] 162it [00:37, 4.48it/s] 163it [00:37, 4.51it/s] 164it [00:38, 4.43it/s] 165it [00:38, 4.39it/s] 166it [00:38, 4.41it/s] 167it [00:38, 4.35it/s] 168it [00:39, 4.35it/s] 169it [00:39, 4.35it/s] 170it [00:39, 4.46it/s] 171it [00:39, 4.52it/s] 172it [00:40, 4.51it/s] 173it [00:40, 4.55it/s] 174it [00:40, 4.56it/s] 175it [00:40, 4.46it/s] 176it [00:40, 4.46it/s] 177it [00:41, 4.51it/s] 178it [00:41, 4.56it/s] 179it [00:41, 4.58it/s] 180it [00:41, 4.30it/s] 181it [00:42, 4.28it/s] 182it [00:42, 4.32it/s] 183it [00:42, 4.36it/s] 184it [00:42, 4.31it/s] 185it [00:42, 4.36it/s] 186it [00:43, 4.33it/s] 187it [00:43, 4.33it/s] 188it [00:43, 4.41it/s] 189it [00:43, 4.47it/s] 190it [00:44, 4.54it/s] 191it [00:44, 4.43it/s] 192it [00:44, 4.43it/s] 193it [00:44, 4.39it/s] 194it [00:44, 4.43it/s] 195it [00:45, 4.32it/s] 196it [00:45, 4.43it/s] 196it [00:45, 4.31it/s] +2025-05-25 22:18:29,936 - INFO - Epoch: 66, Objective: tensor([1588.1846], device='cuda:0', grad_fn=), Loss: 0.013912596739828587, KL/n: 21.540197372436523 + 0it [00:00, ?it/s]2025-05-25 22:18:30,343 - INFO - [Epoch 067 | Batch 0000] IWAE-loss 1198.7195 | mean log_px -0.0020 | KL -1053.46 + 1it [00:00, 2.81it/s] 2it [00:00, 3.59it/s] 3it [00:00, 3.98it/s] 4it [00:01, 4.24it/s] 5it [00:01, 4.24it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.32it/s] 8it [00:01, 4.32it/s] 9it [00:02, 4.42it/s] 10it [00:02, 4.49it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.57it/s] 13it [00:03, 4.59it/s] 14it [00:03, 4.62it/s] 15it [00:03, 4.62it/s] 16it [00:03, 4.64it/s] 17it [00:03, 4.50it/s] 18it [00:04, 4.52it/s] 19it [00:04, 4.51it/s] 20it [00:04, 4.41it/s] 21it [00:04, 4.30it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.42it/s] 24it [00:05, 4.45it/s] 25it [00:05, 4.52it/s] 26it [00:05, 4.54it/s] 27it [00:06, 4.49it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.38it/s] 30it [00:06, 4.34it/s] 31it [00:07, 4.42it/s] 32it [00:07, 4.51it/s] 33it [00:07, 4.41it/s] 34it [00:07, 4.48it/s] 35it [00:07, 4.53it/s] 36it [00:08, 4.56it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.60it/s] 39it [00:08, 4.64it/s] 40it [00:09, 4.51it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.58it/s] 43it [00:09, 4.62it/s] 44it [00:09, 4.64it/s] 45it [00:10, 4.66it/s] 46it [00:10, 4.66it/s] 47it [00:10, 4.67it/s] 48it [00:10, 4.67it/s] 49it [00:10, 4.69it/s] 50it [00:11, 4.66it/s]2025-05-25 22:18:41,408 - INFO - [Epoch 067 | Batch 0050] IWAE-loss 1289.7285 | mean log_px -0.0091 | KL -1050.17 + 51it [00:11, 4.57it/s] 52it [00:11, 4.56it/s] 53it [00:11, 4.44it/s] 54it [00:12, 4.47it/s] 55it [00:12, 4.50it/s] 56it [00:12, 4.52it/s] 57it [00:12, 4.43it/s] 58it [00:12, 4.49it/s] 59it [00:13, 4.53it/s] 60it [00:13, 4.56it/s] 61it [00:13, 4.34it/s] 62it [00:13, 4.41it/s] 63it [00:14, 4.49it/s] 64it [00:14, 4.41it/s] 65it [00:14, 4.48it/s] 66it [00:14, 4.54it/s] 67it [00:14, 4.49it/s] 68it [00:15, 4.56it/s] 69it [00:15, 4.45it/s] 70it [00:15, 4.51it/s] 71it [00:15, 4.58it/s] 72it [00:16, 4.60it/s] 73it [00:16, 4.62it/s] 74it [00:16, 4.48it/s] 75it [00:16, 4.52it/s] 76it [00:16, 4.58it/s] 77it [00:17, 4.59it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.52it/s] 80it [00:17, 4.53it/s] 81it [00:18, 4.46it/s] 82it [00:18, 4.46it/s] 83it [00:18, 4.51it/s] 84it [00:18, 4.56it/s] 85it [00:18, 4.47it/s] 86it [00:19, 4.49it/s] 87it [00:19, 4.58it/s] 88it [00:19, 4.56it/s] 89it [00:19, 4.59it/s] 90it [00:20, 4.64it/s] 91it [00:20, 4.63it/s] 92it [00:20, 4.65it/s] 93it [00:20, 4.68it/s] 94it [00:20, 4.68it/s] 95it [00:21, 4.50it/s] 96it [00:21, 4.41it/s] 97it [00:21, 4.46it/s] 98it [00:21, 4.50it/s] 99it [00:22, 4.54it/s] 100it [00:22, 4.58it/s]2025-05-25 22:18:52,457 - INFO - [Epoch 067 | Batch 0100] IWAE-loss 1387.3746 | mean log_px -0.0188 | KL -1049.04 + 101it [00:22, 4.56it/s] 102it [00:22, 4.44it/s] 103it [00:22, 4.51it/s] 104it [00:23, 4.55it/s] 105it [00:23, 4.58it/s] 106it [00:23, 4.59it/s] 107it [00:23, 4.60it/s] 108it [00:23, 4.60it/s] 109it [00:24, 4.46it/s] 110it [00:24, 4.52it/s] 111it [00:24, 4.52it/s] 112it [00:24, 4.55it/s] 113it [00:25, 4.58it/s] 114it [00:25, 4.59it/s] 115it [00:25, 4.61it/s] 116it [00:25, 4.33it/s] 117it [00:26, 4.30it/s] 118it [00:26, 4.38it/s] 119it [00:26, 4.47it/s] 120it [00:26, 4.50it/s] 121it [00:26, 4.54it/s] 122it [00:27, 4.56it/s] 123it [00:27, 4.58it/s] 124it [00:27, 4.32it/s] 125it [00:27, 4.30it/s] 126it [00:28, 4.38it/s] 127it [00:28, 4.45it/s] 128it [00:28, 4.36it/s] 129it [00:28, 4.42it/s] 130it [00:28, 4.49it/s] 131it [00:29, 4.52it/s] 132it [00:29, 4.54it/s] 133it [00:29, 4.40it/s] 134it [00:29, 4.47it/s] 135it [00:30, 4.52it/s] 136it [00:30, 4.54it/s] 137it [00:30, 4.39it/s] 138it [00:30, 4.43it/s] 139it [00:30, 4.49it/s] 140it [00:31, 4.54it/s] 141it [00:31, 4.56it/s] 142it [00:31, 4.59it/s] 143it [00:31, 4.58it/s] 144it [00:32, 4.59it/s] 145it [00:32, 4.47it/s] 146it [00:32, 4.50it/s] 147it [00:32, 4.40it/s] 148it [00:32, 4.35it/s] 149it [00:33, 4.42it/s] 150it [00:33, 4.47it/s]2025-05-25 22:19:03,611 - INFO - [Epoch 067 | Batch 0150] IWAE-loss 1194.1609 | mean log_px -0.0024 | KL -1048.20 + 151it [00:33, 4.52it/s] 152it [00:33, 4.55it/s] 153it [00:34, 4.55it/s] 154it [00:34, 4.56it/s] 155it [00:34, 4.57it/s] 156it [00:34, 4.56it/s] 157it [00:34, 4.42it/s] 158it [00:35, 4.48it/s] 159it [00:35, 4.37it/s] 160it [00:35, 4.36it/s] 161it [00:35, 4.41it/s] 162it [00:36, 4.46it/s] 163it [00:36, 4.50it/s] 164it [00:36, 4.51it/s] 165it [00:36, 4.35it/s] 166it [00:36, 4.31it/s] 167it [00:37, 4.36it/s] 168it [00:37, 4.42it/s] 169it [00:37, 4.47it/s] 170it [00:37, 4.42it/s] 171it [00:38, 4.33it/s] 172it [00:38, 4.38it/s] 173it [00:38, 4.43it/s] 174it [00:38, 4.34it/s] 175it [00:39, 4.37it/s] 176it [00:39, 4.43it/s] 177it [00:39, 4.46it/s] 178it [00:39, 4.49it/s] 179it [00:39, 4.37it/s] 180it [00:40, 4.27it/s] 181it [00:40, 4.26it/s] 182it [00:40, 4.33it/s] 183it [00:40, 4.39it/s] 184it [00:41, 4.45it/s] 185it [00:41, 4.34it/s] 186it [00:41, 4.30it/s] 187it [00:41, 4.22it/s] 188it [00:42, 4.09it/s] 189it [00:42, 4.23it/s] 190it [00:42, 4.20it/s] 191it [00:42, 4.24it/s] 192it [00:42, 4.26it/s] 193it [00:43, 4.09it/s] 194it [00:43, 4.11it/s] 195it [00:43, 4.00it/s] 196it [00:43, 4.14it/s] 196it [00:44, 4.45it/s] +2025-05-25 22:19:14,116 - INFO - Epoch: 67, Objective: tensor([1625.6294], device='cuda:0', grad_fn=), Loss: 0.012983052060008049, KL/n: 21.431779861450195 + 0it [00:00, ?it/s]2025-05-25 22:19:14,692 - INFO - [Epoch 068 | Batch 0000] IWAE-loss 1262.3419 | mean log_px -0.0057 | KL -1050.64 + 1it [00:00, 2.87it/s] 2it [00:00, 3.66it/s] 3it [00:00, 3.94it/s] 4it [00:01, 4.17it/s] 5it [00:01, 4.30it/s] 6it [00:01, 4.32it/s] 7it [00:01, 4.41it/s] 8it [00:01, 4.36it/s] 9it [00:02, 4.44it/s] 10it [00:02, 4.49it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.35it/s] 13it [00:03, 4.44it/s] 14it [00:03, 4.47it/s] 15it [00:03, 4.51it/s] 16it [00:03, 4.52it/s] 17it [00:03, 4.53it/s] 18it [00:04, 4.39it/s] 19it [00:04, 4.45it/s] 20it [00:04, 4.48it/s] 21it [00:04, 4.50it/s] 22it [00:05, 4.48it/s] 23it [00:05, 4.46it/s] 24it [00:05, 4.49it/s] 25it [00:05, 4.38it/s] 26it [00:05, 4.41it/s] 27it [00:06, 4.47it/s] 28it [00:06, 4.49it/s] 29it [00:06, 4.44it/s] 30it [00:06, 4.31it/s] 31it [00:07, 4.39it/s] 32it [00:07, 4.41it/s] 33it [00:07, 4.36it/s] 34it [00:07, 4.42it/s] 35it [00:07, 4.40it/s] 36it [00:08, 4.44it/s] 37it [00:08, 4.46it/s] 38it [00:08, 4.49it/s] 39it [00:08, 4.53it/s] 40it [00:09, 4.40it/s] 41it [00:09, 4.46it/s] 42it [00:09, 4.50it/s] 43it [00:09, 4.51it/s] 44it [00:09, 4.52it/s] 45it [00:10, 4.52it/s] 46it [00:10, 4.53it/s] 47it [00:10, 4.41it/s] 48it [00:10, 4.47it/s] 49it [00:11, 4.51it/s] 50it [00:11, 4.52it/s]2025-05-25 22:19:25,908 - INFO - [Epoch 068 | Batch 0050] IWAE-loss 1151.6068 | mean log_px -0.0023 | KL -1047.97 + 51it [00:11, 4.53it/s] 52it [00:11, 4.54it/s] 53it [00:11, 4.42it/s] 54it [00:12, 4.45it/s] 55it [00:12, 4.46it/s] 56it [00:12, 4.34it/s] 57it [00:12, 4.41it/s] 58it [00:13, 4.46it/s] 59it [00:13, 4.50it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.55it/s] 62it [00:14, 4.36it/s] 63it [00:14, 4.44it/s] 64it [00:14, 4.45it/s] 65it [00:14, 4.49it/s] 66it [00:14, 4.50it/s] 67it [00:15, 4.52it/s] 68it [00:15, 4.39it/s] 69it [00:15, 4.44it/s] 70it [00:15, 4.44it/s] 71it [00:16, 4.48it/s] 72it [00:16, 4.52it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.51it/s] 75it [00:16, 4.39it/s] 76it [00:17, 4.43it/s] 77it [00:17, 4.47it/s] 78it [00:17, 4.49it/s] 79it [00:17, 4.52it/s] 80it [00:18, 4.53it/s] 81it [00:18, 4.41it/s] 82it [00:18, 4.47it/s] 83it [00:18, 4.48it/s] 84it [00:18, 4.51it/s] 85it [00:19, 4.53it/s] 86it [00:19, 4.54it/s] 87it [00:19, 4.39it/s] 88it [00:19, 4.46it/s] 89it [00:20, 4.49it/s] 90it [00:20, 4.48it/s] 91it [00:20, 4.46it/s] 92it [00:20, 4.48it/s] 93it [00:20, 4.52it/s] 94it [00:21, 4.40it/s] 95it [00:21, 4.47it/s] 96it [00:21, 4.50it/s] 97it [00:21, 4.54it/s] 98it [00:22, 4.49it/s] 99it [00:22, 4.51it/s] 100it [00:22, 4.39it/s]2025-05-25 22:19:37,102 - INFO - [Epoch 068 | Batch 0100] IWAE-loss 1225.7665 | mean log_px -0.0087 | KL -1041.03 + 101it [00:22, 4.44it/s] 102it [00:22, 4.49it/s] 103it [00:23, 4.50it/s] 104it [00:23, 4.51it/s] 105it [00:23, 4.53it/s] 106it [00:23, 4.37it/s] 107it [00:24, 4.43it/s] 108it [00:24, 4.46it/s] 109it [00:24, 4.48it/s] 110it [00:24, 4.50it/s] 111it [00:24, 4.50it/s] 112it [00:25, 4.52it/s] 113it [00:25, 4.38it/s] 114it [00:25, 4.44it/s] 115it [00:25, 4.44it/s] 116it [00:26, 4.47it/s] 117it [00:26, 4.49it/s] 118it [00:26, 4.52it/s] 119it [00:26, 4.40it/s] 120it [00:26, 4.47it/s] 121it [00:27, 4.50it/s] 122it [00:27, 4.49it/s] 123it [00:27, 4.39it/s] 124it [00:27, 4.44it/s] 125it [00:28, 4.47it/s] 126it [00:28, 4.49it/s] 127it [00:28, 4.52it/s] 128it [00:28, 4.50it/s] 129it [00:28, 4.53it/s] 130it [00:29, 4.36it/s] 131it [00:29, 4.41it/s] 132it [00:29, 4.44it/s] 133it [00:29, 4.30it/s] 134it [00:30, 4.36it/s] 135it [00:30, 4.44it/s] 136it [00:30, 4.52it/s] 137it [00:30, 4.58it/s] 138it [00:31, 4.60it/s] 139it [00:31, 4.64it/s] 140it [00:31, 4.63it/s] 141it [00:31, 4.61it/s] 142it [00:31, 4.62it/s] 143it [00:32, 4.65it/s] 144it [00:32, 4.67it/s] 145it [00:32, 4.68it/s] 146it [00:32, 4.69it/s] 147it [00:32, 4.70it/s] 148it [00:33, 4.70it/s] 149it [00:33, 4.71it/s] 150it [00:33, 4.70it/s]2025-05-25 22:19:48,147 - INFO - [Epoch 068 | Batch 0150] IWAE-loss 1264.9144 | mean log_px -0.0035 | KL -1042.59 + 151it [00:33, 4.70it/s] 152it [00:33, 4.70it/s] 153it [00:34, 4.71it/s] 154it [00:34, 4.71it/s] 155it [00:34, 4.72it/s] 156it [00:34, 4.71it/s] 157it [00:35, 4.72it/s] 158it [00:35, 4.71it/s] 159it [00:35, 4.72it/s] 160it [00:35, 4.71it/s] 161it [00:35, 4.71it/s] 162it [00:36, 4.71it/s] 163it [00:36, 4.72it/s] 164it [00:36, 4.71it/s] 165it [00:36, 4.73it/s] 166it [00:36, 4.75it/s] 167it [00:37, 4.72it/s] 168it [00:37, 4.72it/s] 169it [00:37, 4.72it/s] 170it [00:37, 4.74it/s] 171it [00:38, 4.72it/s] 172it [00:38, 4.71it/s] 173it [00:38, 4.72it/s] 174it [00:38, 4.72it/s] 175it [00:38, 4.72it/s] 176it [00:39, 4.72it/s] 177it [00:39, 4.72it/s] 178it [00:39, 4.72it/s] 179it [00:39, 4.72it/s] 180it [00:39, 4.71it/s] 181it [00:40, 4.72it/s] 182it [00:40, 4.71it/s] 183it [00:40, 4.72it/s] 184it [00:40, 4.72it/s] 185it [00:40, 4.72it/s] 186it [00:41, 4.72it/s] 187it [00:41, 4.73it/s] 188it [00:41, 4.72it/s] 189it [00:41, 4.72it/s] 190it [00:42, 4.72it/s] 191it [00:42, 4.72it/s] 192it [00:42, 4.71it/s] 193it [00:42, 4.72it/s] 194it [00:42, 4.72it/s] 195it [00:43, 4.47it/s] 196it [00:43, 4.41it/s] 196it [00:43, 4.51it/s] +2025-05-25 22:19:57,879 - INFO - Epoch: 68, Objective: tensor([1242.0751], device='cuda:0', grad_fn=), Loss: 0.003887968137860298, KL/n: 21.28978157043457 + 0it [00:00, ?it/s]2025-05-25 22:19:58,280 - INFO - [Epoch 069 | Batch 0000] IWAE-loss 1280.5768 | mean log_px -0.0051 | KL -1042.65 + 1it [00:00, 3.05it/s] 2it [00:00, 3.65it/s] 3it [00:00, 3.90it/s] 4it [00:01, 4.01it/s] 5it [00:01, 4.12it/s] 6it [00:01, 4.16it/s] 7it [00:01, 4.19it/s] 8it [00:01, 4.25it/s] 9it [00:02, 4.39it/s] 10it [00:02, 4.48it/s] 11it [00:02, 4.42it/s] 12it [00:02, 4.47it/s] 13it [00:03, 4.55it/s] 14it [00:03, 3.64it/s] 15it [00:03, 3.88it/s] 16it [00:03, 4.09it/s] 17it [00:04, 4.14it/s] 18it [00:04, 4.15it/s] 19it [00:04, 4.24it/s] 20it [00:04, 4.34it/s] 21it [00:05, 4.34it/s] 22it [00:05, 4.33it/s] 23it [00:05, 4.32it/s] 24it [00:05, 4.31it/s] 25it [00:05, 4.20it/s] 26it [00:06, 4.33it/s] 27it [00:06, 4.31it/s] 28it [00:06, 4.31it/s] 29it [00:06, 4.39it/s] 30it [00:07, 4.48it/s] 31it [00:07, 4.40it/s] 32it [00:07, 4.49it/s] 33it [00:07, 4.56it/s] 34it [00:07, 4.59it/s] 35it [00:08, 4.66it/s] 36it [00:08, 4.66it/s] 37it [00:08, 4.68it/s] 38it [00:08, 4.63it/s] 39it [00:09, 4.60it/s] 40it [00:09, 4.50it/s] 41it [00:09, 4.40it/s] 42it [00:09, 4.46it/s] 43it [00:09, 4.25it/s] 44it [00:10, 4.36it/s] 45it [00:10, 4.42it/s] 46it [00:10, 4.48it/s] 47it [00:10, 4.48it/s] 48it [00:11, 4.13it/s] 49it [00:11, 4.20it/s] 50it [00:11, 4.26it/s]2025-05-25 22:20:09,780 - INFO - [Epoch 069 | Batch 0050] IWAE-loss 1204.5205 | mean log_px -0.0046 | KL -1043.10 + 51it [00:11, 4.35it/s] 52it [00:12, 4.32it/s] 53it [00:12, 4.39it/s] 54it [00:12, 4.31it/s] 55it [00:12, 4.32it/s] 56it [00:12, 4.41it/s] 57it [00:13, 4.52it/s] 58it [00:13, 4.55it/s] 59it [00:13, 4.59it/s] 60it [00:13, 4.62it/s] 61it [00:14, 4.52it/s] 62it [00:14, 4.58it/s] 63it [00:14, 4.43it/s] 64it [00:14, 4.50it/s] 65it [00:14, 4.53it/s] 66it [00:15, 4.58it/s] 67it [00:15, 4.64it/s] 68it [00:15, 4.53it/s] 69it [00:15, 4.44it/s] 70it [00:16, 4.51it/s] 71it [00:16, 4.45it/s] 72it [00:16, 4.42it/s] 73it [00:16, 4.48it/s] 74it [00:16, 4.52it/s] 75it [00:17, 4.49it/s] 76it [00:17, 4.55it/s] 77it [00:17, 4.57it/s] 78it [00:17, 4.40it/s] 79it [00:18, 4.42it/s] 80it [00:18, 4.48it/s] 81it [00:18, 4.40it/s] 82it [00:18, 4.45it/s] 83it [00:18, 4.51it/s] 84it [00:19, 4.54it/s] 85it [00:19, 4.48it/s] 86it [00:19, 4.39it/s] 87it [00:19, 4.47it/s] 88it [00:20, 4.52it/s] 89it [00:20, 4.56it/s] 90it [00:20, 4.57it/s] 91it [00:20, 4.60it/s] 92it [00:20, 4.56it/s] 93it [00:21, 4.47it/s] 94it [00:21, 4.50it/s] 95it [00:21, 4.56it/s] 96it [00:21, 4.48it/s] 97it [00:22, 4.50it/s] 98it [00:22, 4.41it/s] 99it [00:22, 4.43it/s] 100it [00:22, 4.51it/s]2025-05-25 22:20:20,892 - INFO - [Epoch 069 | Batch 0100] IWAE-loss 1164.3147 | mean log_px -0.0017 | KL -1040.04 + 101it [00:22, 4.56it/s] 102it [00:23, 4.48it/s] 103it [00:23, 4.51it/s] 104it [00:23, 4.56it/s] 105it [00:23, 4.61it/s] 106it [00:24, 4.63it/s] 107it [00:24, 4.52it/s] 108it [00:24, 4.44it/s] 109it [00:24, 4.39it/s] 110it [00:24, 4.47it/s] 111it [00:25, 4.54it/s] 112it [00:25, 4.57it/s] 113it [00:25, 4.60it/s] 114it [00:25, 4.60it/s] 115it [00:26, 4.60it/s] 116it [00:26, 4.61it/s] 117it [00:26, 4.65it/s] 118it [00:26, 4.65it/s] 119it [00:26, 4.67it/s] 120it [00:27, 4.67it/s] 121it [00:27, 4.52it/s] 122it [00:27, 4.57it/s] 123it [00:27, 4.57it/s] 124it [00:27, 4.61it/s] 125it [00:28, 4.59it/s] 126it [00:28, 4.62it/s] 127it [00:28, 4.64it/s] 128it [00:28, 4.49it/s] 129it [00:29, 4.45it/s] 130it [00:29, 4.38it/s] 131it [00:29, 4.34it/s] 132it [00:29, 4.32it/s] 133it [00:30, 4.29it/s] 134it [00:30, 4.28it/s] 135it [00:30, 4.26it/s] 136it [00:30, 4.37it/s] 137it [00:30, 4.45it/s] 138it [00:31, 4.52it/s] 139it [00:31, 4.57it/s] 140it [00:31, 4.60it/s] 141it [00:31, 4.63it/s] 142it [00:32, 4.63it/s] 143it [00:32, 4.64it/s] 144it [00:32, 4.65it/s] 145it [00:32, 4.66it/s] 146it [00:32, 4.51it/s] 147it [00:33, 4.55it/s] 148it [00:33, 4.56it/s] 149it [00:33, 4.56it/s] 150it [00:33, 4.56it/s]2025-05-25 22:20:31,923 - INFO - [Epoch 069 | Batch 0150] IWAE-loss 1321.3817 | mean log_px -0.0040 | KL -1039.04 + 151it [00:33, 4.57it/s] 152it [00:34, 4.57it/s] 153it [00:34, 4.46it/s] 154it [00:34, 4.40it/s] 155it [00:34, 4.36it/s] 156it [00:35, 4.29it/s] 157it [00:35, 4.30it/s] 158it [00:35, 4.27it/s] 159it [00:35, 4.35it/s] 160it [00:36, 4.32it/s] 161it [00:36, 4.27it/s] 162it [00:36, 4.36it/s] 163it [00:36, 4.40it/s] 164it [00:36, 4.35it/s] 165it [00:37, 4.41it/s] 166it [00:37, 4.46it/s] 167it [00:37, 4.40it/s] 168it [00:37, 4.47it/s] 169it [00:38, 4.37it/s] 170it [00:38, 4.45it/s] 171it [00:38, 4.52it/s] 172it [00:38, 4.52it/s] 173it [00:38, 4.54it/s] 174it [00:39, 4.44it/s] 175it [00:39, 4.46it/s] 176it [00:39, 4.47it/s] 177it [00:39, 4.44it/s] 178it [00:40, 4.48it/s] 179it [00:40, 4.41it/s] 180it [00:40, 4.23it/s] 181it [00:40, 4.29it/s] 182it [00:41, 4.26it/s] 183it [00:41, 4.24it/s] 184it [00:41, 4.35it/s] 185it [00:41, 4.42it/s] 186it [00:41, 4.48it/s] 187it [00:42, 4.38it/s] 188it [00:42, 4.23it/s] 189it [00:42, 4.32it/s] 190it [00:42, 4.29it/s] 191it [00:43, 4.27it/s] 192it [00:43, 4.34it/s] 193it [00:43, 4.41it/s] 194it [00:43, 4.35it/s] 195it [00:44, 4.31it/s] 196it [00:44, 4.39it/s] 196it [00:44, 4.42it/s] +2025-05-25 22:20:42,356 - INFO - Epoch: 69, Objective: tensor([1152.8077], device='cuda:0', grad_fn=), Loss: 0.006191767752170563, KL/n: 21.240211486816406 + 0it [00:00, ?it/s]2025-05-25 22:20:42,729 - INFO - [Epoch 070 | Batch 0000] IWAE-loss 1134.6925 | mean log_px -0.0031 | KL -1039.89 + 1it [00:00, 3.06it/s] 2it [00:00, 3.71it/s] 3it [00:00, 4.03it/s] 4it [00:00, 4.25it/s] 5it [00:01, 4.21it/s] 6it [00:01, 4.22it/s] 7it [00:01, 4.20it/s] 8it [00:01, 4.33it/s] 9it [00:02, 4.27it/s] 10it [00:02, 4.26it/s] 11it [00:02, 4.35it/s] 12it [00:02, 4.44it/s] 13it [00:03, 4.36it/s] 14it [00:03, 4.32it/s] 15it [00:03, 4.31it/s] 16it [00:03, 4.28it/s] 17it [00:04, 4.26it/s] 18it [00:04, 4.24it/s] 19it [00:04, 4.22it/s] 20it [00:04, 4.05it/s] 21it [00:04, 4.18it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.41it/s] 24it [00:05, 4.33it/s] 25it [00:05, 4.25it/s] 26it [00:06, 4.23it/s] 27it [00:06, 4.30it/s] 28it [00:06, 4.41it/s] 29it [00:06, 4.49it/s] 30it [00:07, 4.55it/s] 31it [00:07, 4.57it/s] 32it [00:07, 4.61it/s] 33it [00:07, 4.58it/s] 34it [00:07, 4.60it/s] 35it [00:08, 4.44it/s] 36it [00:08, 4.36it/s] 37it [00:08, 4.36it/s] 38it [00:08, 4.44it/s] 39it [00:09, 4.51it/s] 40it [00:09, 4.55it/s] 41it [00:09, 4.41it/s] 42it [00:09, 4.35it/s] 43it [00:09, 4.30it/s] 44it [00:10, 4.33it/s] 45it [00:10, 4.42it/s] 46it [00:10, 4.35it/s] 47it [00:10, 4.30it/s] 48it [00:11, 4.40it/s] 49it [00:11, 4.45it/s] 50it [00:11, 4.50it/s]2025-05-25 22:20:54,194 - INFO - [Epoch 070 | Batch 0050] IWAE-loss 1186.9631 | mean log_px -0.0027 | KL -1039.01 + 51it [00:11, 4.21it/s] 52it [00:12, 4.34it/s] 53it [00:12, 4.38it/s] 54it [00:12, 4.45it/s] 55it [00:12, 4.35it/s] 56it [00:12, 4.42it/s] 57it [00:13, 4.44it/s] 58it [00:13, 4.50it/s] 59it [00:13, 4.55it/s] 60it [00:13, 4.41it/s] 61it [00:14, 4.46it/s] 62it [00:14, 4.52it/s] 63it [00:14, 4.55it/s] 64it [00:14, 4.45it/s] 65it [00:14, 4.36it/s] 66it [00:15, 4.30it/s] 67it [00:15, 4.27it/s] 68it [00:15, 4.25it/s] 69it [00:15, 4.22it/s] 70it [00:16, 4.20it/s] 71it [00:16, 4.31it/s] 72it [00:16, 4.39it/s] 73it [00:16, 4.36it/s] 74it [00:17, 4.29it/s] 75it [00:17, 4.34it/s] 76it [00:17, 4.40it/s] 77it [00:17, 4.34it/s] 78it [00:17, 4.36it/s] 79it [00:18, 4.30it/s] 80it [00:18, 4.26it/s] 81it [00:18, 4.36it/s] 82it [00:18, 4.37it/s] 83it [00:19, 4.43it/s] 84it [00:19, 4.48it/s] 85it [00:19, 4.36it/s] 86it [00:19, 4.43it/s] 87it [00:20, 4.35it/s] 88it [00:20, 4.29it/s] 89it [00:20, 4.30it/s] 90it [00:20, 4.12it/s] 91it [00:20, 4.13it/s] 92it [00:21, 4.27it/s] 93it [00:21, 4.37it/s] 94it [00:21, 4.30it/s] 95it [00:21, 4.37it/s] 96it [00:22, 4.45it/s] 97it [00:22, 4.41it/s] 98it [00:22, 4.50it/s] 99it [00:22, 4.55it/s] 100it [00:22, 4.59it/s]2025-05-25 22:21:05,619 - INFO - [Epoch 070 | Batch 0100] IWAE-loss 1322.7841 | mean log_px -0.0044 | KL -1041.32 + 101it [00:23, 4.37it/s] 102it [00:23, 4.46it/s] 103it [00:23, 4.49it/s] 104it [00:23, 4.39it/s] 105it [00:24, 4.32it/s] 106it [00:24, 4.42it/s] 107it [00:24, 4.33it/s] 108it [00:24, 4.29it/s] 109it [00:25, 4.25it/s] 110it [00:25, 4.22it/s] 111it [00:25, 4.27it/s] 112it [00:25, 4.25it/s] 113it [00:26, 4.23it/s] 114it [00:26, 4.22it/s] 115it [00:26, 4.31it/s] 116it [00:26, 4.31it/s] 117it [00:26, 4.17it/s] 118it [00:27, 4.30it/s] 119it [00:27, 4.40it/s] 120it [00:27, 4.48it/s] 121it [00:27, 4.53it/s] 122it [00:28, 4.56it/s] 123it [00:28, 4.59it/s] 124it [00:28, 4.61it/s] 125it [00:28, 4.64it/s] 126it [00:28, 4.60it/s] 127it [00:29, 4.63it/s] 128it [00:29, 4.63it/s] 129it [00:29, 4.42it/s] 130it [00:29, 4.49it/s] 131it [00:30, 4.51it/s] 132it [00:30, 4.53it/s] 133it [00:30, 4.57it/s] 134it [00:30, 4.60it/s] 135it [00:30, 4.47it/s] 136it [00:31, 4.37it/s] 137it [00:31, 4.33it/s] 138it [00:31, 4.40it/s] 139it [00:31, 4.49it/s] 140it [00:32, 4.52it/s] 141it [00:32, 4.42it/s] 142it [00:32, 4.34it/s] 143it [00:32, 4.42it/s] 144it [00:32, 4.33it/s] 145it [00:33, 4.23it/s] 146it [00:33, 4.21it/s] 147it [00:33, 4.20it/s] 148it [00:33, 4.23it/s] 149it [00:34, 4.35it/s] 150it [00:34, 4.27it/s]2025-05-25 22:21:17,035 - INFO - [Epoch 070 | Batch 0150] IWAE-loss 1312.4045 | mean log_px -0.0061 | KL -1034.94 + 151it [00:34, 4.28it/s] 152it [00:34, 4.36it/s] 153it [00:35, 4.29it/s] 154it [00:35, 4.38it/s] 155it [00:35, 4.35it/s] 156it [00:35, 4.27it/s] 157it [00:35, 4.27it/s] 158it [00:36, 4.25it/s] 159it [00:36, 4.39it/s] 160it [00:36, 4.47it/s] 161it [00:36, 4.38it/s] 162it [00:37, 4.32it/s] 163it [00:37, 4.41it/s] 164it [00:37, 4.45it/s] 165it [00:37, 4.37it/s] 166it [00:38, 4.42it/s] 167it [00:38, 4.32it/s] 168it [00:38, 4.43it/s] 169it [00:38, 4.51it/s] 170it [00:38, 4.55it/s] 171it [00:39, 4.59it/s] 172it [00:39, 4.60it/s] 173it [00:39, 4.31it/s] 174it [00:39, 4.27it/s] 175it [00:40, 4.25it/s] 176it [00:40, 4.32it/s] 177it [00:40, 4.41it/s] 178it [00:40, 4.47it/s] 179it [00:40, 4.37it/s] 180it [00:41, 4.46it/s] 181it [00:41, 4.52it/s] 182it [00:41, 4.51it/s] 183it [00:41, 4.54it/s] 184it [00:42, 4.54it/s] 185it [00:42, 4.43it/s] 186it [00:42, 4.49it/s] 187it [00:42, 4.40it/s] 188it [00:42, 4.44it/s] 189it [00:43, 4.50it/s] 190it [00:43, 4.53it/s] 191it [00:43, 4.43it/s] 192it [00:43, 4.51it/s] 193it [00:44, 4.41it/s] 194it [00:44, 4.32it/s] 195it [00:44, 4.29it/s] 196it [00:44, 4.39it/s] 196it [00:44, 4.37it/s] +2025-05-25 22:21:27,353 - INFO - Epoch: 70, Objective: tensor([1542.3411], device='cuda:0', grad_fn=), Loss: 0.008527607657015324, KL/n: 21.169261932373047 + 0it [00:00, ?it/s]2025-05-25 22:21:27,934 - INFO - [Epoch 071 | Batch 0000] IWAE-loss 1529.1766 | mean log_px -0.0078 | KL -1036.11 + 1it [00:00, 2.84it/s] 2it [00:00, 3.60it/s] 3it [00:00, 3.94it/s] 4it [00:01, 4.16it/s] 5it [00:01, 4.27it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.42it/s] 8it [00:01, 4.51it/s] 9it [00:02, 4.39it/s] 10it [00:02, 4.47it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.57it/s] 13it [00:03, 4.54it/s] 14it [00:03, 4.59it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.63it/s] 19it [00:04, 4.60it/s] 20it [00:04, 4.66it/s] 21it [00:04, 4.62it/s] 22it [00:04, 4.48it/s] 23it [00:05, 4.55it/s] 24it [00:05, 4.57it/s] 25it [00:05, 4.59it/s] 26it [00:05, 4.56it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.64it/s] 31it [00:06, 4.62it/s] 32it [00:07, 4.42it/s] 33it [00:07, 4.47it/s] 34it [00:07, 4.51it/s] 35it [00:07, 4.51it/s] 36it [00:08, 4.51it/s] 37it [00:08, 4.55it/s] 38it [00:08, 4.41it/s] 39it [00:08, 4.48it/s] 40it [00:08, 4.47it/s] 41it [00:09, 4.53it/s] 42it [00:09, 4.58it/s] 43it [00:09, 4.54it/s] 44it [00:09, 4.55it/s] 45it [00:10, 4.37it/s] 46it [00:10, 4.49it/s] 47it [00:10, 4.47it/s] 48it [00:10, 4.51it/s] 49it [00:10, 4.53it/s] 50it [00:11, 4.54it/s]2025-05-25 22:21:38,968 - INFO - [Epoch 071 | Batch 0050] IWAE-loss 1191.1381 | mean log_px -0.0072 | KL -1032.97 + 51it [00:11, 4.59it/s] 52it [00:11, 4.62it/s] 53it [00:11, 4.64it/s] 54it [00:12, 4.60it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.38it/s] 57it [00:12, 4.41it/s] 58it [00:12, 4.46it/s] 59it [00:13, 4.45it/s] 60it [00:13, 4.45it/s] 61it [00:13, 4.54it/s] 62it [00:13, 4.59it/s] 63it [00:14, 4.61it/s] 64it [00:14, 4.53it/s] 65it [00:14, 4.52it/s] 66it [00:14, 4.54it/s] 67it [00:14, 4.58it/s] 68it [00:15, 4.49it/s] 69it [00:15, 4.53it/s] 70it [00:15, 4.58it/s] 71it [00:15, 4.53it/s] 72it [00:15, 4.54it/s] 73it [00:16, 4.51it/s] 74it [00:16, 4.51it/s] 75it [00:16, 4.43it/s] 76it [00:16, 4.48it/s] 77it [00:17, 4.41it/s] 78it [00:17, 4.44it/s] 79it [00:17, 4.48it/s] 80it [00:17, 4.53it/s] 81it [00:18, 4.52it/s] 82it [00:18, 4.45it/s] 83it [00:18, 4.39it/s] 84it [00:18, 4.37it/s] 85it [00:18, 4.42it/s] 86it [00:19, 4.47it/s] 87it [00:19, 4.48it/s] 88it [00:19, 4.49it/s] 89it [00:19, 4.45it/s] 90it [00:20, 4.48it/s] 91it [00:20, 4.51it/s] 92it [00:20, 4.51it/s] 93it [00:20, 4.50it/s] 94it [00:20, 4.51it/s] 95it [00:21, 4.50it/s] 96it [00:21, 4.37it/s] 97it [00:21, 4.39it/s] 98it [00:21, 4.47it/s] 99it [00:22, 4.44it/s] 100it [00:22, 4.39it/s]2025-05-25 22:21:50,123 - INFO - [Epoch 071 | Batch 0100] IWAE-loss 1299.5299 | mean log_px -0.0067 | KL -1027.02 + 101it [00:22, 4.39it/s] 102it [00:22, 4.47it/s] 103it [00:22, 4.49it/s] 104it [00:23, 4.43it/s] 105it [00:23, 4.51it/s] 106it [00:23, 4.52it/s] 107it [00:23, 4.56it/s] 108it [00:24, 4.57it/s] 109it [00:24, 4.57it/s] 110it [00:24, 4.55it/s] 111it [00:24, 4.41it/s] 112it [00:24, 4.51it/s] 113it [00:25, 4.49it/s] 114it [00:25, 4.56it/s] 115it [00:25, 4.47it/s] 116it [00:25, 4.53it/s] 117it [00:26, 4.36it/s] 118it [00:26, 4.44it/s] 119it [00:26, 4.47it/s] 120it [00:26, 4.54it/s] 121it [00:26, 4.53it/s] 122it [00:27, 4.41it/s] 123it [00:27, 4.51it/s] 124it [00:27, 4.52it/s] 125it [00:27, 4.56it/s] 126it [00:28, 4.60it/s] 127it [00:28, 4.51it/s] 128it [00:28, 4.54it/s] 129it [00:28, 4.55it/s] 130it [00:28, 4.56it/s] 131it [00:29, 4.57it/s] 132it [00:29, 4.44it/s] 133it [00:29, 4.55it/s] 134it [00:29, 4.58it/s] 135it [00:30, 4.50it/s] 136it [00:30, 4.52it/s] 137it [00:30, 4.52it/s] 138it [00:30, 4.58it/s] 139it [00:30, 4.56it/s] 140it [00:31, 4.59it/s] 141it [00:31, 4.64it/s] 142it [00:31, 4.57it/s] 143it [00:31, 4.58it/s] 144it [00:32, 4.54it/s] 145it [00:32, 4.54it/s] 146it [00:32, 4.59it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.58it/s] 149it [00:33, 4.50it/s] 150it [00:33, 4.59it/s]2025-05-25 22:22:01,138 - INFO - [Epoch 071 | Batch 0150] IWAE-loss 1175.8381 | mean log_px -0.0057 | KL -1027.57 + 151it [00:33, 4.60it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.63it/s] 154it [00:34, 4.65it/s] 155it [00:34, 4.61it/s] 156it [00:34, 4.55it/s] 157it [00:34, 4.58it/s] 158it [00:35, 4.60it/s] 159it [00:35, 4.57it/s] 160it [00:35, 4.60it/s] 161it [00:35, 4.61it/s] 162it [00:35, 4.62it/s] 163it [00:36, 4.38it/s] 164it [00:36, 4.47it/s] 165it [00:36, 4.52it/s] 166it [00:36, 4.52it/s] 167it [00:37, 4.54it/s] 168it [00:37, 4.61it/s] 169it [00:37, 4.56it/s] 170it [00:37, 4.60it/s] 171it [00:37, 4.63it/s] 172it [00:38, 4.60it/s] 173it [00:38, 4.60it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.60it/s] 176it [00:38, 4.62it/s] 177it [00:39, 4.43it/s] 178it [00:39, 4.51it/s] 179it [00:39, 4.54it/s] 180it [00:39, 4.54it/s] 181it [00:40, 4.54it/s] 182it [00:40, 4.58it/s] 183it [00:40, 4.63it/s] 184it [00:40, 4.55it/s] 185it [00:40, 4.58it/s] 186it [00:41, 4.52it/s] 187it [00:41, 4.60it/s] 188it [00:41, 4.52it/s] 189it [00:41, 4.56it/s] 190it [00:42, 4.43it/s] 191it [00:42, 4.50it/s] 192it [00:42, 4.54it/s] 193it [00:42, 4.60it/s] 194it [00:42, 4.62it/s] 195it [00:43, 4.53it/s] 196it [00:43, 4.60it/s] 196it [00:43, 4.51it/s] +2025-05-25 22:22:11,133 - INFO - Epoch: 71, Objective: tensor([1101.7721], device='cuda:0', grad_fn=), Loss: 0.003083721501752734, KL/n: 21.038372039794922 + 0it [00:00, ?it/s]2025-05-25 22:22:11,542 - INFO - [Epoch 072 | Batch 0000] IWAE-loss 1105.3588 | mean log_px -0.0021 | KL -1030.98 + 1it [00:00, 2.77it/s] 2it [00:00, 3.62it/s] 3it [00:00, 4.00it/s] 4it [00:01, 4.21it/s] 5it [00:01, 4.37it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.50it/s] 8it [00:01, 4.53it/s] 9it [00:02, 4.59it/s] 10it [00:02, 4.62it/s] 11it [00:02, 4.63it/s] 12it [00:02, 4.65it/s] 13it [00:02, 4.67it/s] 14it [00:03, 4.68it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.66it/s] 17it [00:03, 4.68it/s] 18it [00:04, 4.55it/s] 19it [00:04, 4.56it/s] 20it [00:04, 4.60it/s] 21it [00:04, 4.59it/s] 22it [00:04, 4.58it/s] 23it [00:05, 4.59it/s] 24it [00:05, 4.59it/s] 25it [00:05, 3.64it/s] 26it [00:05, 3.90it/s] 27it [00:06, 4.08it/s] 28it [00:06, 4.23it/s] 29it [00:06, 4.35it/s] 30it [00:06, 4.40it/s] 31it [00:07, 4.47it/s] 32it [00:07, 4.48it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.50it/s] 35it [00:07, 4.56it/s] 36it [00:08, 4.60it/s] 37it [00:08, 4.57it/s] 38it [00:08, 4.44it/s] 39it [00:08, 4.46it/s] 40it [00:09, 4.36it/s] 41it [00:09, 4.46it/s] 42it [00:09, 4.48it/s] 43it [00:09, 4.39it/s] 44it [00:09, 4.38it/s] 45it [00:10, 4.26it/s] 46it [00:10, 4.24it/s] 47it [00:10, 4.34it/s] 48it [00:10, 4.34it/s] 49it [00:11, 4.44it/s] 50it [00:11, 4.50it/s]2025-05-25 22:22:22,747 - INFO - [Epoch 072 | Batch 0050] IWAE-loss 1345.4274 | mean log_px -0.0059 | KL -1030.80 + 51it [00:11, 4.55it/s] 52it [00:11, 4.43it/s] 53it [00:11, 4.52it/s] 54it [00:12, 4.53it/s] 55it [00:12, 4.58it/s] 56it [00:12, 4.60it/s] 57it [00:12, 4.49it/s] 58it [00:13, 4.52it/s] 59it [00:13, 4.58it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.49it/s] 62it [00:13, 4.54it/s] 63it [00:14, 4.56it/s] 64it [00:14, 4.60it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.58it/s] 67it [00:15, 4.48it/s] 68it [00:15, 4.49it/s] 69it [00:15, 4.53it/s] 70it [00:15, 4.51it/s] 71it [00:15, 4.57it/s] 72it [00:16, 4.42it/s] 73it [00:16, 4.40it/s] 74it [00:16, 4.45it/s] 75it [00:16, 4.52it/s] 76it [00:17, 4.40it/s] 77it [00:17, 4.44it/s] 78it [00:17, 4.42it/s] 79it [00:17, 4.41it/s] 80it [00:17, 4.41it/s] 81it [00:18, 4.49it/s] 82it [00:18, 4.39it/s] 83it [00:18, 4.38it/s] 84it [00:18, 4.43it/s] 85it [00:19, 4.39it/s] 86it [00:19, 4.32it/s] 87it [00:19, 4.33it/s] 88it [00:19, 4.36it/s] 89it [00:20, 4.34it/s] 90it [00:20, 4.35it/s] 91it [00:20, 4.45it/s] 92it [00:20, 4.49it/s] 93it [00:20, 4.41it/s] 94it [00:21, 4.36it/s] 95it [00:21, 4.45it/s] 96it [00:21, 4.41it/s] 97it [00:21, 4.49it/s] 98it [00:22, 4.52it/s] 99it [00:22, 4.36it/s] 100it [00:22, 4.30it/s]2025-05-25 22:22:33,983 - INFO - [Epoch 072 | Batch 0100] IWAE-loss 1193.0322 | mean log_px -0.0023 | KL -1026.61 + 101it [00:22, 4.32it/s] 102it [00:23, 4.28it/s] 103it [00:23, 4.31it/s] 104it [00:23, 4.32it/s] 105it [00:23, 4.42it/s] 106it [00:23, 4.43it/s] 107it [00:24, 4.46it/s] 108it [00:24, 4.41it/s] 109it [00:24, 4.36it/s] 110it [00:24, 4.32it/s] 111it [00:25, 4.31it/s] 112it [00:25, 4.38it/s] 113it [00:25, 4.36it/s] 114it [00:25, 4.35it/s] 115it [00:25, 4.43it/s] 116it [00:26, 4.34it/s] 117it [00:26, 4.27it/s] 118it [00:26, 4.22it/s] 119it [00:26, 4.21it/s] 120it [00:27, 4.18it/s] 121it [00:27, 4.31it/s] 122it [00:27, 4.24it/s] 123it [00:27, 4.37it/s] 124it [00:28, 4.44it/s] 125it [00:28, 4.49it/s] 126it [00:28, 4.54it/s] 127it [00:28, 4.59it/s] 128it [00:28, 4.61it/s] 129it [00:29, 4.58it/s] 130it [00:29, 4.43it/s] 131it [00:29, 4.49it/s] 132it [00:29, 4.54it/s] 133it [00:30, 4.56it/s] 134it [00:30, 4.45it/s] 135it [00:30, 4.24it/s] 136it [00:30, 4.26it/s] 137it [00:30, 4.38it/s] 138it [00:31, 4.20it/s] 139it [00:31, 4.23it/s] 140it [00:31, 4.33it/s] 141it [00:31, 4.32it/s] 142it [00:32, 4.40it/s] 143it [00:32, 4.30it/s] 144it [00:32, 4.29it/s] 145it [00:32, 4.35it/s] 146it [00:33, 4.44it/s] 147it [00:33, 4.35it/s] 148it [00:33, 4.34it/s] 149it [00:33, 4.43it/s] 150it [00:33, 4.35it/s]2025-05-25 22:22:45,424 - INFO - [Epoch 072 | Batch 0150] IWAE-loss 1439.5580 | mean log_px -0.0069 | KL -1025.86 + 151it [00:34, 4.22it/s] 152it [00:34, 4.29it/s] 153it [00:34, 4.41it/s] 154it [00:34, 4.39it/s] 155it [00:35, 4.46it/s] 156it [00:35, 4.36it/s] 157it [00:35, 4.21it/s] 158it [00:35, 4.32it/s] 159it [00:36, 4.28it/s] 160it [00:36, 4.40it/s] 161it [00:36, 4.37it/s] 162it [00:36, 4.34it/s] 163it [00:37, 4.16it/s] 164it [00:37, 4.16it/s] 165it [00:37, 4.22it/s] 166it [00:37, 4.20it/s] 167it [00:37, 4.24it/s] 168it [00:38, 4.22it/s] 169it [00:38, 4.20it/s] 170it [00:38, 4.19it/s] 171it [00:38, 4.23it/s] 172it [00:39, 4.28it/s] 173it [00:39, 4.27it/s] 174it [00:39, 4.33it/s] 175it [00:39, 4.42it/s] 176it [00:40, 4.30it/s] 177it [00:40, 4.40it/s] 178it [00:40, 4.31it/s] 179it [00:40, 4.41it/s] 180it [00:40, 4.21it/s] 181it [00:41, 4.26it/s] 182it [00:41, 4.28it/s] 183it [00:41, 4.18it/s] 184it [00:41, 4.14it/s] 185it [00:42, 4.20it/s] 186it [00:42, 4.19it/s] 187it [00:42, 4.15it/s] 188it [00:42, 4.30it/s] 189it [00:43, 4.39it/s] 190it [00:43, 4.36it/s] 191it [00:43, 4.33it/s] 192it [00:43, 4.38it/s] 193it [00:44, 4.45it/s] 194it [00:44, 4.49it/s] 195it [00:44, 4.29it/s] 196it [00:44, 4.26it/s] 196it [00:44, 4.38it/s] +2025-05-25 22:22:56,063 - INFO - Epoch: 72, Objective: tensor([1084.2766], device='cuda:0', grad_fn=), Loss: 0.004034184850752354, KL/n: 20.965299606323242 + 0it [00:00, ?it/s]2025-05-25 22:22:56,470 - INFO - [Epoch 073 | Batch 0000] IWAE-loss 1114.9978 | mean log_px -0.0042 | KL -1030.27 + 1it [00:00, 3.00it/s] 2it [00:00, 3.61it/s] 3it [00:00, 3.88it/s] 4it [00:01, 4.05it/s] 5it [00:01, 4.27it/s] 6it [00:01, 4.37it/s] 7it [00:01, 4.19it/s] 8it [00:01, 4.30it/s] 9it [00:02, 4.42it/s] 10it [00:02, 4.35it/s] 11it [00:02, 4.46it/s] 12it [00:02, 4.36it/s] 13it [00:03, 4.26it/s] 14it [00:03, 4.32it/s] 15it [00:03, 4.41it/s] 16it [00:03, 4.33it/s] 17it [00:03, 4.40it/s] 18it [00:04, 4.48it/s] 19it [00:04, 4.51it/s] 20it [00:04, 4.24it/s] 21it [00:04, 4.36it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.28it/s] 24it [00:05, 4.28it/s] 25it [00:05, 4.24it/s] 26it [00:06, 4.24it/s] 27it [00:06, 4.31it/s] 28it [00:06, 4.31it/s] 29it [00:06, 4.35it/s] 30it [00:06, 4.42it/s] 31it [00:07, 4.40it/s] 32it [00:07, 4.25it/s] 33it [00:07, 4.35it/s] 34it [00:07, 4.29it/s] 35it [00:08, 4.39it/s] 36it [00:08, 4.47it/s] 37it [00:08, 4.22it/s] 38it [00:08, 4.24it/s] 39it [00:09, 4.37it/s] 40it [00:09, 4.30it/s] 41it [00:09, 4.41it/s] 42it [00:09, 4.32it/s] 43it [00:10, 4.25it/s] 44it [00:10, 4.32it/s] 45it [00:10, 4.34it/s] 46it [00:10, 4.31it/s] 47it [00:10, 4.34it/s] 48it [00:11, 4.33it/s] 49it [00:11, 4.16it/s] 50it [00:11, 4.17it/s]2025-05-25 22:23:08,035 - INFO - [Epoch 073 | Batch 0050] IWAE-loss 1135.3855 | mean log_px -0.0090 | KL -1023.86 + 51it [00:11, 4.21it/s] 52it [00:12, 4.31it/s] 53it [00:12, 4.42it/s] 54it [00:12, 4.50it/s] 55it [00:12, 4.30it/s] 56it [00:13, 4.31it/s] 57it [00:13, 4.27it/s] 58it [00:13, 4.29it/s] 59it [00:13, 4.36it/s] 60it [00:13, 4.28it/s] 61it [00:14, 4.41it/s] 62it [00:14, 4.48it/s] 63it [00:14, 4.44it/s] 64it [00:14, 4.52it/s] 65it [00:15, 4.48it/s] 66it [00:15, 4.28it/s] 67it [00:15, 4.42it/s] 68it [00:15, 4.37it/s] 69it [00:15, 4.46it/s] 70it [00:16, 4.33it/s] 71it [00:16, 4.33it/s] 72it [00:16, 4.40it/s] 73it [00:16, 4.22it/s] 74it [00:17, 4.21it/s] 75it [00:17, 4.25it/s] 76it [00:17, 4.22it/s] 77it [00:17, 4.36it/s] 78it [00:18, 4.45it/s] 79it [00:18, 4.32it/s] 80it [00:18, 4.32it/s] 81it [00:18, 4.28it/s] 82it [00:19, 4.30it/s] 83it [00:19, 4.26it/s] 84it [00:19, 4.27it/s] 85it [00:19, 4.24it/s] 86it [00:19, 4.24it/s] 87it [00:20, 4.22it/s] 88it [00:20, 4.23it/s] 89it [00:20, 4.22it/s] 90it [00:20, 4.24it/s] 91it [00:21, 4.25it/s] 92it [00:21, 4.21it/s] 93it [00:21, 4.10it/s] 94it [00:21, 4.25it/s] 95it [00:22, 4.23it/s] 96it [00:22, 4.33it/s] 97it [00:22, 4.32it/s] 98it [00:22, 4.30it/s] 99it [00:23, 4.27it/s] 100it [00:23, 4.24it/s]2025-05-25 22:23:19,615 - INFO - [Epoch 073 | Batch 0100] IWAE-loss 1121.1622 | mean log_px -0.0042 | KL -1021.58 + 101it [00:23, 4.23it/s] 102it [00:23, 4.25it/s] 103it [00:23, 4.36it/s] 104it [00:24, 4.38it/s] 105it [00:24, 4.47it/s] 106it [00:24, 4.37it/s] 107it [00:24, 4.46it/s] 108it [00:25, 4.51it/s] 109it [00:25, 4.43it/s] 110it [00:25, 4.30it/s] 111it [00:25, 4.29it/s] 112it [00:26, 4.24it/s] 113it [00:26, 4.21it/s] 114it [00:26, 4.28it/s] 115it [00:26, 4.40it/s] 116it [00:26, 4.43it/s] 117it [00:27, 4.44it/s] 118it [00:27, 4.30it/s] 119it [00:27, 4.35it/s] 120it [00:27, 4.40it/s] 121it [00:28, 4.30it/s] 122it [00:28, 4.31it/s] 123it [00:28, 4.34it/s] 124it [00:28, 4.30it/s] 125it [00:29, 4.28it/s] 126it [00:29, 4.25it/s] 127it [00:29, 4.21it/s] 128it [00:29, 4.23it/s] 129it [00:29, 4.20it/s] 130it [00:30, 4.21it/s] 131it [00:30, 4.20it/s] 132it [00:30, 4.10it/s] 133it [00:30, 4.11it/s] 134it [00:31, 4.15it/s] 135it [00:31, 4.17it/s] 136it [00:31, 4.17it/s] 137it [00:31, 4.30it/s] 138it [00:32, 4.39it/s] 139it [00:32, 4.47it/s] 140it [00:32, 4.32it/s] 141it [00:32, 4.33it/s] 142it [00:33, 4.25it/s] 143it [00:33, 4.28it/s] 144it [00:33, 4.35it/s] 145it [00:33, 4.21it/s] 146it [00:33, 4.27it/s] 147it [00:34, 4.37it/s] 148it [00:34, 4.30it/s] 149it [00:34, 4.41it/s] 150it [00:34, 4.31it/s]2025-05-25 22:23:31,246 - INFO - [Epoch 073 | Batch 0150] IWAE-loss 1471.0764 | mean log_px -0.0143 | KL -1019.94 + 151it [00:35, 4.30it/s] 152it [00:35, 4.25it/s] 153it [00:35, 4.25it/s] 154it [00:35, 4.19it/s] 155it [00:36, 4.21it/s] 156it [00:36, 4.14it/s] 157it [00:36, 4.21it/s] 158it [00:36, 4.16it/s] 159it [00:37, 4.18it/s] 160it [00:37, 4.14it/s] 161it [00:37, 4.28it/s] 162it [00:37, 4.24it/s] 163it [00:37, 4.32it/s] 164it [00:38, 4.25it/s] 165it [00:38, 4.27it/s] 166it [00:38, 4.35it/s] 167it [00:38, 4.43it/s] 168it [00:39, 4.33it/s] 169it [00:39, 4.42it/s] 170it [00:39, 4.42it/s] 171it [00:39, 4.36it/s] 172it [00:40, 4.30it/s] 173it [00:40, 4.28it/s] 174it [00:40, 4.32it/s] 175it [00:40, 4.33it/s] 176it [00:40, 4.42it/s] 177it [00:41, 4.47it/s] 178it [00:41, 4.52it/s] 179it [00:41, 4.52it/s] 180it [00:41, 4.30it/s] 181it [00:42, 4.26it/s] 182it [00:42, 4.24it/s] 183it [00:42, 4.23it/s] 184it [00:42, 4.22it/s] 185it [00:43, 4.34it/s] 186it [00:43, 4.25it/s] 187it [00:43, 4.14it/s] 188it [00:43, 4.27it/s] 189it [00:43, 4.23it/s] 190it [00:44, 4.24it/s] 191it [00:44, 4.26it/s] 192it [00:44, 4.36it/s] 193it [00:44, 4.24it/s] 194it [00:45, 4.22it/s] 195it [00:45, 4.17it/s] 196it [00:45, 4.28it/s] 196it [00:45, 4.29it/s] +2025-05-25 22:23:41,886 - INFO - Epoch: 73, Objective: tensor([1196.2977], device='cuda:0', grad_fn=), Loss: 0.0025322872679680586, KL/n: 20.85674285888672 + 0it [00:00, ?it/s]2025-05-25 22:23:42,468 - INFO - [Epoch 074 | Batch 0000] IWAE-loss 1272.5872 | mean log_px -0.0103 | KL -1021.67 + 1it [00:00, 3.02it/s] 2it [00:00, 3.67it/s] 3it [00:00, 3.81it/s] 4it [00:01, 3.98it/s] 5it [00:01, 4.14it/s] 6it [00:01, 4.27it/s] 7it [00:01, 4.38it/s] 8it [00:01, 4.30it/s] 9it [00:02, 4.32it/s] 10it [00:02, 4.18it/s] 11it [00:02, 4.22it/s] 12it [00:02, 4.18it/s] 13it [00:03, 4.23it/s] 14it [00:03, 4.34it/s] 15it [00:03, 4.26it/s] 16it [00:03, 4.25it/s] 17it [00:04, 4.09it/s] 18it [00:04, 4.11it/s] 19it [00:04, 4.16it/s] 20it [00:04, 4.29it/s] 21it [00:05, 4.14it/s] 22it [00:05, 4.19it/s] 23it [00:05, 4.21it/s] 24it [00:05, 4.24it/s] 25it [00:05, 4.23it/s] 26it [00:06, 4.14it/s] 27it [00:06, 4.18it/s] 28it [00:06, 4.18it/s] 29it [00:06, 4.14it/s] 30it [00:07, 4.25it/s] 31it [00:07, 4.30it/s] 32it [00:07, 4.37it/s] 33it [00:07, 4.36it/s] 34it [00:08, 4.40it/s] 35it [00:08, 4.45it/s] 36it [00:08, 4.32it/s] 37it [00:08, 4.31it/s] 38it [00:09, 4.34it/s] 39it [00:09, 4.31it/s] 40it [00:09, 4.32it/s] 41it [00:09, 4.39it/s] 42it [00:09, 4.40it/s] 43it [00:10, 4.46it/s] 44it [00:10, 4.35it/s] 45it [00:10, 4.34it/s] 46it [00:10, 4.33it/s] 47it [00:11, 4.31it/s] 48it [00:11, 4.31it/s] 49it [00:11, 4.33it/s] 50it [00:11, 4.32it/s]2025-05-25 22:23:54,152 - INFO - [Epoch 074 | Batch 0050] IWAE-loss 1296.5245 | mean log_px -0.0073 | KL -1021.05 + 51it [00:12, 4.29it/s] 52it [00:12, 4.30it/s] 53it [00:12, 4.37it/s] 54it [00:12, 4.44it/s] 55it [00:12, 4.42it/s] 56it [00:13, 4.37it/s] 57it [00:13, 4.29it/s] 58it [00:13, 4.20it/s] 59it [00:13, 4.24it/s] 60it [00:14, 4.20it/s] 61it [00:14, 4.12it/s] 62it [00:14, 4.23it/s] 63it [00:14, 4.27it/s] 64it [00:15, 4.34it/s] 65it [00:15, 4.32it/s] 66it [00:15, 4.32it/s] 67it [00:15, 4.27it/s] 68it [00:15, 4.26it/s] 69it [00:16, 4.28it/s] 70it [00:16, 4.29it/s] 71it [00:16, 4.41it/s] 72it [00:16, 4.34it/s] 73it [00:17, 4.22it/s] 74it [00:17, 4.24it/s] 75it [00:17, 4.22it/s] 76it [00:17, 4.26it/s] 77it [00:18, 4.27it/s] 78it [00:18, 4.24it/s] 79it [00:18, 4.24it/s] 80it [00:18, 4.22it/s] 81it [00:19, 4.20it/s] 82it [00:19, 4.22it/s] 83it [00:19, 4.20it/s] 84it [00:19, 4.31it/s] 85it [00:19, 4.27it/s] 86it [00:20, 4.24it/s] 87it [00:20, 4.23it/s] 88it [00:20, 4.35it/s] 89it [00:20, 4.45it/s] 90it [00:21, 4.37it/s] 91it [00:21, 4.33it/s] 92it [00:21, 4.33it/s] 93it [00:21, 4.21it/s] 94it [00:22, 4.34it/s] 95it [00:22, 4.40it/s] 96it [00:22, 4.32it/s] 97it [00:22, 4.27it/s] 98it [00:23, 4.13it/s] 99it [00:23, 4.26it/s] 100it [00:23, 4.31it/s]2025-05-25 22:24:05,811 - INFO - [Epoch 074 | Batch 0100] IWAE-loss 1122.7998 | mean log_px -0.0063 | KL -1019.44 + 101it [00:23, 4.37it/s] 102it [00:23, 4.42it/s] 103it [00:24, 4.45it/s] 104it [00:24, 4.28it/s] 105it [00:24, 4.33it/s] 106it [00:24, 4.42it/s] 107it [00:25, 4.49it/s] 108it [00:25, 4.39it/s] 109it [00:25, 4.48it/s] 110it [00:25, 4.31it/s] 111it [00:25, 4.28it/s] 112it [00:26, 4.39it/s] 113it [00:26, 4.29it/s] 114it [00:26, 4.31it/s] 115it [00:26, 4.26it/s] 116it [00:27, 4.13it/s] 117it [00:27, 4.18it/s] 118it [00:27, 4.18it/s] 119it [00:27, 4.18it/s] 120it [00:28, 4.29it/s] 121it [00:28, 4.31it/s] 122it [00:28, 4.17it/s] 123it [00:28, 4.18it/s] 124it [00:29, 4.31it/s] 125it [00:29, 4.39it/s] 126it [00:29, 4.34it/s] 127it [00:29, 4.45it/s] 128it [00:29, 4.27it/s] 129it [00:30, 4.26it/s] 130it [00:30, 4.35it/s] 131it [00:30, 4.44it/s] 132it [00:30, 4.40it/s] 133it [00:31, 4.49it/s] 134it [00:31, 4.33it/s] 135it [00:31, 4.31it/s] 136it [00:31, 4.25it/s] 137it [00:32, 4.26it/s] 138it [00:32, 4.22it/s] 139it [00:32, 4.22it/s] 140it [00:32, 4.20it/s] 141it [00:32, 4.10it/s] 142it [00:33, 4.12it/s] 143it [00:33, 4.16it/s] 144it [00:33, 4.17it/s] 145it [00:33, 4.29it/s] 146it [00:34, 4.30it/s] 147it [00:34, 4.29it/s] 148it [00:34, 4.23it/s] 149it [00:34, 4.35it/s] 150it [00:35, 4.42it/s]2025-05-25 22:24:17,433 - INFO - [Epoch 074 | Batch 0150] IWAE-loss 1158.7916 | mean log_px -0.0036 | KL -1011.06 + 151it [00:35, 4.46it/s] 152it [00:35, 4.52it/s] 153it [00:35, 4.39it/s] 154it [00:36, 4.23it/s] 155it [00:36, 4.33it/s] 156it [00:36, 4.28it/s] 157it [00:36, 4.38it/s] 158it [00:36, 4.29it/s] 159it [00:37, 4.16it/s] 160it [00:37, 4.26it/s] 161it [00:37, 4.23it/s] 162it [00:37, 4.34it/s] 163it [00:38, 4.37it/s] 164it [00:38, 4.31it/s] 165it [00:38, 4.38it/s] 166it [00:38, 4.31it/s] 167it [00:39, 4.39it/s] 168it [00:39, 4.41it/s] 169it [00:39, 4.45it/s] 170it [00:39, 4.24it/s] 171it [00:39, 4.21it/s] 172it [00:40, 4.19it/s] 173it [00:40, 4.15it/s] 174it [00:40, 4.17it/s] 175it [00:40, 4.15it/s] 176it [00:41, 4.18it/s] 177it [00:41, 4.16it/s] 178it [00:41, 4.26it/s] 179it [00:41, 4.38it/s] 180it [00:42, 4.29it/s] 181it [00:42, 4.28it/s] 182it [00:42, 4.39it/s] 183it [00:42, 4.19it/s] 184it [00:43, 4.30it/s] 185it [00:43, 4.31it/s] 186it [00:43, 4.42it/s] 187it [00:43, 4.38it/s] 188it [00:43, 4.32it/s] 189it [00:44, 4.33it/s] 190it [00:44, 4.29it/s] 191it [00:44, 4.37it/s] 192it [00:44, 4.29it/s] 193it [00:45, 4.35it/s] 194it [00:45, 4.39it/s] 195it [00:45, 4.33it/s] 196it [00:45, 4.25it/s] 196it [00:45, 4.27it/s] +2025-05-25 22:24:28,062 - INFO - Epoch: 74, Objective: tensor([1074.4708], device='cuda:0', grad_fn=), Loss: 0.0014531121123582125, KL/n: 20.634225845336914 + 0it [00:00, ?it/s]2025-05-25 22:24:28,476 - INFO - [Epoch 075 | Batch 0000] IWAE-loss 1407.3490 | mean log_px -0.0097 | KL -1012.06 + 1it [00:00, 2.89it/s] 2it [00:00, 3.64it/s] 3it [00:00, 4.04it/s] 4it [00:01, 4.27it/s] 5it [00:01, 4.23it/s] 6it [00:01, 4.07it/s] 7it [00:01, 4.14it/s] 8it [00:01, 4.19it/s] 9it [00:02, 4.34it/s] 10it [00:02, 4.33it/s] 11it [00:02, 4.31it/s] 12it [00:03, 3.45it/s] 13it [00:03, 3.67it/s] 14it [00:03, 3.72it/s] 15it [00:03, 3.86it/s] 16it [00:04, 3.85it/s] 17it [00:04, 3.97it/s] 18it [00:04, 4.07it/s] 19it [00:04, 4.22it/s] 20it [00:04, 4.33it/s] 21it [00:05, 4.34it/s] 22it [00:05, 4.17it/s] 23it [00:05, 4.22it/s] 24it [00:05, 4.26it/s] 25it [00:06, 4.28it/s] 26it [00:06, 4.28it/s] 27it [00:06, 4.32it/s] 28it [00:06, 4.31it/s] 29it [00:07, 4.32it/s] 30it [00:07, 4.16it/s] 31it [00:07, 4.31it/s] 32it [00:07, 4.29it/s] 33it [00:08, 4.32it/s] 34it [00:08, 4.32it/s] 35it [00:08, 4.33it/s] 36it [00:08, 4.35it/s] 37it [00:08, 4.37it/s] 38it [00:09, 4.35it/s] 39it [00:09, 4.31it/s] 40it [00:09, 4.44it/s] 41it [00:09, 4.41it/s] 42it [00:10, 4.38it/s] 43it [00:10, 4.33it/s] 44it [00:10, 4.42it/s] 45it [00:10, 4.48it/s] 46it [00:10, 4.43it/s] 47it [00:11, 4.38it/s] 48it [00:11, 4.41it/s] 49it [00:11, 4.37it/s] 50it [00:11, 4.34it/s]2025-05-25 22:24:40,257 - INFO - [Epoch 075 | Batch 0050] IWAE-loss 1448.6622 | mean log_px -0.0086 | KL -1008.97 + 51it [00:12, 4.17it/s] 52it [00:12, 4.23it/s] 53it [00:12, 4.35it/s] 54it [00:12, 4.34it/s] 55it [00:13, 4.30it/s] 56it [00:13, 4.33it/s] 57it [00:13, 4.14it/s] 58it [00:13, 4.19it/s] 59it [00:13, 4.35it/s] 60it [00:14, 4.32it/s] 61it [00:14, 4.28it/s] 62it [00:14, 4.42it/s] 63it [00:14, 4.36it/s] 64it [00:15, 4.33it/s] 65it [00:15, 4.32it/s] 66it [00:15, 4.32it/s] 67it [00:15, 4.33it/s] 68it [00:16, 4.43it/s] 69it [00:16, 4.39it/s] 70it [00:16, 4.33it/s] 71it [00:16, 4.32it/s] 72it [00:16, 4.35it/s] 73it [00:17, 4.35it/s] 74it [00:17, 4.42it/s] 75it [00:17, 4.45it/s] 76it [00:17, 4.47it/s] 77it [00:18, 4.31it/s] 78it [00:18, 4.38it/s] 79it [00:18, 4.48it/s] 80it [00:18, 4.54it/s] 81it [00:19, 4.48it/s] 82it [00:19, 4.35it/s] 83it [00:19, 4.33it/s] 84it [00:19, 4.46it/s] 85it [00:19, 4.53it/s] 86it [00:20, 4.46it/s] 87it [00:20, 4.45it/s] 88it [00:20, 4.53it/s] 89it [00:20, 4.53it/s] 90it [00:21, 4.56it/s] 91it [00:21, 4.52it/s] 92it [00:21, 4.30it/s] 93it [00:21, 4.33it/s] 94it [00:21, 4.41it/s] 95it [00:22, 4.47it/s] 96it [00:22, 4.43it/s] 97it [00:22, 4.43it/s] 98it [00:22, 4.42it/s] 99it [00:23, 4.51it/s] 100it [00:23, 4.28it/s]2025-05-25 22:24:51,665 - INFO - [Epoch 075 | Batch 0100] IWAE-loss 1112.7964 | mean log_px -0.0021 | KL -1007.40 + 101it [00:23, 4.39it/s] 102it [00:23, 4.43it/s] 103it [00:23, 4.51it/s] 104it [00:24, 4.44it/s] 105it [00:24, 4.44it/s] 106it [00:24, 4.38it/s] 107it [00:24, 4.29it/s] 108it [00:25, 4.36it/s] 109it [00:25, 4.35it/s] 110it [00:25, 4.32it/s] 111it [00:25, 4.44it/s] 112it [00:26, 4.42it/s] 113it [00:26, 4.49it/s] 114it [00:26, 4.26it/s] 115it [00:26, 4.30it/s] 116it [00:26, 4.33it/s] 117it [00:27, 4.29it/s] 118it [00:27, 4.27it/s] 119it [00:27, 4.27it/s] 120it [00:27, 4.29it/s] 121it [00:28, 4.19it/s] 122it [00:28, 4.34it/s] 123it [00:28, 4.29it/s] 124it [00:28, 4.28it/s] 125it [00:29, 4.28it/s] 126it [00:29, 4.29it/s] 127it [00:29, 4.25it/s] 128it [00:29, 4.34it/s] 129it [00:29, 4.43it/s] 130it [00:30, 4.47it/s] 131it [00:30, 4.21it/s] 132it [00:30, 4.32it/s] 133it [00:30, 4.37it/s] 134it [00:31, 4.44it/s] 135it [00:31, 4.52it/s] 136it [00:31, 4.56it/s] 137it [00:31, 4.48it/s] 138it [00:32, 4.39it/s] 139it [00:32, 4.32it/s] 140it [00:32, 4.42it/s] 141it [00:32, 4.47it/s] 142it [00:32, 4.56it/s] 143it [00:33, 4.61it/s] 144it [00:33, 4.61it/s] 145it [00:33, 4.52it/s] 146it [00:33, 4.51it/s] 147it [00:34, 4.43it/s] 148it [00:34, 4.25it/s] 149it [00:34, 4.35it/s] 150it [00:34, 4.33it/s]2025-05-25 22:25:03,072 - INFO - [Epoch 075 | Batch 0150] IWAE-loss 2491.0842 | mean log_px -0.0430 | KL -1002.79 + 151it [00:34, 4.44it/s] 152it [00:35, 4.53it/s] 153it [00:35, 4.48it/s] 154it [00:35, 4.38it/s] 155it [00:35, 4.48it/s] 156it [00:36, 4.45it/s] 157it [00:36, 4.55it/s] 158it [00:36, 4.49it/s] 159it [00:36, 4.30it/s] 160it [00:36, 4.31it/s] 161it [00:37, 4.34it/s] 162it [00:37, 4.36it/s] 163it [00:37, 4.39it/s] 164it [00:37, 4.45it/s] 165it [00:38, 4.52it/s] 166it [00:38, 4.59it/s] 167it [00:38, 4.63it/s] 168it [00:38, 4.65it/s] 169it [00:38, 4.67it/s] 170it [00:39, 4.65it/s] 171it [00:39, 4.63it/s] 172it [00:39, 4.66it/s] 173it [00:39, 4.64it/s] 174it [00:40, 4.59it/s] 175it [00:40, 4.65it/s] 176it [00:40, 4.51it/s] 177it [00:40, 4.37it/s] 178it [00:40, 4.34it/s] 179it [00:41, 4.37it/s] 180it [00:41, 4.35it/s] 181it [00:41, 4.44it/s] 182it [00:41, 4.50it/s] 183it [00:42, 4.56it/s] 184it [00:42, 4.45it/s] 185it [00:42, 4.54it/s] 186it [00:42, 4.45it/s] 187it [00:42, 4.40it/s] 188it [00:43, 4.37it/s] 189it [00:43, 4.49it/s] 190it [00:43, 4.41it/s] 191it [00:43, 4.32it/s] 192it [00:44, 4.39it/s] 193it [00:44, 4.50it/s] 194it [00:44, 4.55it/s] 195it [00:44, 4.51it/s] 196it [00:45, 4.26it/s] 196it [00:45, 4.35it/s] +2025-05-25 22:25:13,279 - INFO - Epoch: 75, Objective: tensor([1224.8317], device='cuda:0', grad_fn=), Loss: 0.005707655567675829, KL/n: 20.583492279052734 + 0it [00:00, ?it/s]2025-05-25 22:25:13,676 - INFO - [Epoch 076 | Batch 0000] IWAE-loss 3191.0737 | mean log_px -0.0381 | KL -1011.61 + 1it [00:00, 3.10it/s] 2it [00:00, 3.81it/s] 3it [00:00, 4.18it/s] 4it [00:00, 4.19it/s] 5it [00:01, 4.38it/s] 6it [00:01, 4.47it/s] 7it [00:01, 4.35it/s] 8it [00:01, 4.33it/s] 9it [00:02, 4.31it/s] 10it [00:02, 4.32it/s] 11it [00:02, 4.33it/s] 12it [00:02, 4.43it/s] 13it [00:03, 4.41it/s] 14it [00:03, 4.36it/s] 15it [00:03, 4.37it/s] 16it [00:03, 4.33it/s] 17it [00:03, 4.39it/s] 18it [00:04, 4.35it/s] 19it [00:04, 4.34it/s] 20it [00:04, 4.21it/s] 21it [00:04, 4.36it/s] 22it [00:05, 4.45it/s] 23it [00:05, 4.45it/s] 24it [00:05, 4.40it/s] 25it [00:05, 4.39it/s] 26it [00:06, 4.34it/s] 27it [00:06, 4.29it/s] 28it [00:06, 4.17it/s] 29it [00:06, 4.34it/s] 30it [00:06, 4.39it/s] 31it [00:07, 4.34it/s] 32it [00:07, 4.43it/s] 33it [00:07, 4.22it/s] 34it [00:07, 4.36it/s] 35it [00:08, 4.32it/s] 36it [00:08, 4.30it/s] 37it [00:08, 4.32it/s] 38it [00:08, 4.41it/s] 39it [00:09, 4.21it/s] 40it [00:09, 4.23it/s] 41it [00:09, 4.25it/s] 42it [00:09, 4.26it/s] 43it [00:09, 4.27it/s] 44it [00:10, 4.28it/s] 45it [00:10, 4.29it/s] 46it [00:10, 4.17it/s] 47it [00:10, 4.19it/s] 48it [00:11, 4.21it/s] 49it [00:11, 4.22it/s] 50it [00:11, 4.33it/s]2025-05-25 22:25:25,197 - INFO - [Epoch 076 | Batch 0050] IWAE-loss 1105.2787 | mean log_px -0.0032 | KL -1006.82 + 51it [00:11, 4.28it/s] 52it [00:12, 4.25it/s] 53it [00:12, 4.28it/s] 54it [00:12, 4.36it/s] 55it [00:12, 4.34it/s] 56it [00:13, 4.33it/s] 57it [00:13, 4.32it/s] 58it [00:13, 4.17it/s] 59it [00:13, 4.21it/s] 60it [00:13, 4.23it/s] 61it [00:14, 4.22it/s] 62it [00:14, 4.23it/s] 63it [00:14, 4.25it/s] 64it [00:14, 4.16it/s] 65it [00:15, 4.31it/s] 66it [00:15, 4.25it/s] 67it [00:15, 4.28it/s] 68it [00:15, 4.28it/s] 69it [00:16, 4.25it/s] 70it [00:16, 4.14it/s] 71it [00:16, 4.05it/s] 72it [00:16, 4.16it/s] 73it [00:17, 4.16it/s] 74it [00:17, 4.28it/s] 75it [00:17, 4.22it/s] 76it [00:17, 4.22it/s] 77it [00:18, 4.26it/s] 78it [00:18, 4.22it/s] 79it [00:18, 4.10it/s] 80it [00:18, 4.26it/s] 81it [00:18, 4.38it/s] 82it [00:19, 4.33it/s] 83it [00:19, 4.26it/s] 84it [00:19, 4.17it/s] 85it [00:19, 4.23it/s] 86it [00:20, 4.36it/s] 87it [00:20, 4.31it/s] 88it [00:20, 4.30it/s] 89it [00:20, 4.31it/s] 90it [00:21, 4.18it/s] 91it [00:21, 4.23it/s] 92it [00:21, 4.23it/s] 93it [00:21, 4.09it/s] 94it [00:22, 4.14it/s] 95it [00:22, 4.24it/s] 96it [00:22, 4.37it/s] 97it [00:22, 4.36it/s] 98it [00:22, 4.43it/s] 99it [00:23, 4.42it/s] 100it [00:23, 4.25it/s]2025-05-25 22:25:36,963 - INFO - [Epoch 076 | Batch 0100] IWAE-loss 1797.6439 | mean log_px -0.0222 | KL -1009.94 + 101it [00:23, 4.39it/s] 102it [00:23, 4.33it/s] 103it [00:24, 4.31it/s] 104it [00:24, 4.35it/s] 105it [00:24, 4.34it/s] 106it [00:24, 4.32it/s] 107it [00:24, 4.34it/s] 108it [00:25, 4.41it/s] 109it [00:25, 4.37it/s] 110it [00:25, 4.32it/s] 111it [00:25, 4.36it/s] 112it [00:26, 4.46it/s] 113it [00:26, 4.47it/s] 114it [00:26, 4.44it/s] 115it [00:26, 4.49it/s] 116it [00:27, 4.50it/s] 117it [00:27, 4.52it/s] 118it [00:27, 4.57it/s] 119it [00:27, 4.33it/s] 120it [00:27, 4.32it/s] 121it [00:28, 4.31it/s] 122it [00:28, 4.33it/s] 123it [00:28, 4.34it/s] 124it [00:28, 4.46it/s] 125it [00:29, 4.27it/s] 126it [00:29, 4.39it/s] 127it [00:29, 4.34it/s] 128it [00:29, 4.32it/s] 129it [00:30, 4.30it/s] 130it [00:30, 4.15it/s] 131it [00:30, 4.18it/s] 132it [00:30, 4.23it/s] 133it [00:30, 4.23it/s] 134it [00:31, 4.24it/s] 135it [00:31, 4.22it/s] 136it [00:31, 4.37it/s] 137it [00:31, 4.33it/s] 138it [00:32, 4.32it/s] 139it [00:32, 4.39it/s] 140it [00:32, 4.39it/s] 141it [00:32, 4.29it/s] 142it [00:33, 4.33it/s] 143it [00:33, 4.44it/s] 144it [00:33, 4.36it/s] 145it [00:33, 4.34it/s] 146it [00:33, 4.24it/s] 147it [00:34, 4.28it/s] 148it [00:34, 4.28it/s] 149it [00:34, 4.25it/s] 150it [00:34, 4.27it/s]2025-05-25 22:25:48,482 - INFO - [Epoch 076 | Batch 0150] IWAE-loss 1153.4496 | mean log_px -0.0023 | KL -1007.40 + 151it [00:35, 4.22it/s] 152it [00:35, 4.36it/s] 153it [00:35, 4.47it/s] 154it [00:35, 4.45it/s] 155it [00:36, 4.43it/s] 156it [00:36, 4.28it/s] 157it [00:36, 4.39it/s] 158it [00:36, 4.41it/s] 159it [00:36, 4.36it/s] 160it [00:37, 4.40it/s] 161it [00:37, 4.41it/s] 162it [00:37, 4.35it/s] 163it [00:37, 4.44it/s] 164it [00:38, 4.49it/s] 165it [00:38, 4.38it/s] 166it [00:38, 4.40it/s] 167it [00:38, 4.34it/s] 168it [00:39, 4.20it/s] 169it [00:39, 4.25it/s] 170it [00:39, 4.25it/s] 171it [00:39, 4.25it/s] 172it [00:39, 4.27it/s] 173it [00:40, 4.38it/s] 174it [00:40, 4.48it/s] 175it [00:40, 4.34it/s] 176it [00:40, 4.45it/s] 177it [00:41, 4.40it/s] 178it [00:41, 4.34it/s] 179it [00:41, 4.32it/s] 180it [00:41, 4.34it/s] 181it [00:42, 4.29it/s] 182it [00:42, 4.31it/s] 183it [00:42, 4.29it/s] 184it [00:42, 4.14it/s] 185it [00:42, 4.31it/s] 186it [00:43, 4.27it/s] 187it [00:43, 4.25it/s] 188it [00:43, 4.16it/s] 189it [00:43, 4.21it/s] 190it [00:44, 4.22it/s] 191it [00:44, 4.25it/s] 192it [00:44, 4.34it/s] 193it [00:44, 4.30it/s] 194it [00:45, 4.21it/s] 195it [00:45, 4.21it/s] 196it [00:45, 4.36it/s] 196it [00:45, 4.30it/s] +2025-05-25 22:25:59,021 - INFO - Epoch: 76, Objective: tensor([1119.1392], device='cuda:0', grad_fn=), Loss: 0.006396050099283457, KL/n: 20.540983200073242 + 0it [00:00, ?it/s]2025-05-25 22:25:59,589 - INFO - [Epoch 077 | Batch 0000] IWAE-loss 1210.2894 | mean log_px -0.0075 | KL -1004.59 + 1it [00:00, 3.17it/s] 2it [00:00, 3.77it/s] 3it [00:00, 3.93it/s] 4it [00:01, 4.08it/s] 5it [00:01, 4.16it/s] 6it [00:01, 4.32it/s] 7it [00:01, 4.30it/s] 8it [00:01, 4.30it/s] 9it [00:02, 4.07it/s] 10it [00:02, 4.25it/s] 11it [00:02, 4.32it/s] 12it [00:02, 4.42it/s] 13it [00:03, 4.35it/s] 14it [00:03, 4.22it/s] 15it [00:03, 4.38it/s] 16it [00:03, 4.31it/s] 17it [00:04, 4.30it/s] 18it [00:04, 4.28it/s] 19it [00:04, 4.28it/s] 20it [00:04, 4.24it/s] 21it [00:04, 4.15it/s] 22it [00:05, 4.33it/s] 23it [00:05, 4.41it/s] 24it [00:05, 4.49it/s] 25it [00:05, 4.48it/s] 26it [00:06, 4.53it/s] 27it [00:06, 4.60it/s] 28it [00:06, 4.62it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.66it/s] 31it [00:07, 4.63it/s] 32it [00:07, 4.45it/s] 33it [00:07, 4.46it/s] 34it [00:07, 4.53it/s] 35it [00:08, 4.60it/s] 36it [00:08, 4.50it/s] 37it [00:08, 4.35it/s] 38it [00:08, 4.46it/s] 39it [00:08, 4.55it/s] 40it [00:09, 4.57it/s] 41it [00:09, 4.59it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.48it/s] 44it [00:10, 4.34it/s] 45it [00:10, 4.38it/s] 46it [00:10, 4.34it/s] 47it [00:10, 4.43it/s] 48it [00:10, 4.51it/s] 49it [00:11, 4.58it/s] 50it [00:11, 4.43it/s]2025-05-25 22:26:10,906 - INFO - [Epoch 077 | Batch 0050] IWAE-loss 1236.3286 | mean log_px -0.0053 | KL -1002.10 + 51it [00:11, 4.27it/s] 52it [00:11, 4.25it/s] 53it [00:12, 4.29it/s] 54it [00:12, 4.27it/s] 55it [00:12, 4.42it/s] 56it [00:12, 4.35it/s] 57it [00:13, 4.43it/s] 58it [00:13, 4.50it/s] 59it [00:13, 4.56it/s] 60it [00:13, 4.41it/s] 61it [00:13, 4.23it/s] 62it [00:14, 4.32it/s] 63it [00:14, 4.44it/s] 64it [00:14, 4.38it/s] 65it [00:14, 4.39it/s] 66it [00:15, 4.40it/s] 67it [00:15, 4.47it/s] 68it [00:15, 4.53it/s] 69it [00:15, 4.59it/s] 70it [00:15, 4.63it/s] 71it [00:16, 4.64it/s] 72it [00:16, 4.61it/s] 73it [00:16, 4.51it/s] 74it [00:16, 4.51it/s] 75it [00:17, 4.45it/s] 76it [00:17, 4.26it/s] 77it [00:17, 4.26it/s] 78it [00:17, 4.25it/s] 79it [00:17, 4.39it/s] 80it [00:18, 4.39it/s] 81it [00:18, 4.36it/s] 82it [00:18, 4.33it/s] 83it [00:18, 4.36it/s] 84it [00:19, 4.24it/s] 85it [00:19, 4.25it/s] 86it [00:19, 4.38it/s] 87it [00:19, 4.28it/s] 88it [00:20, 4.30it/s] 89it [00:20, 4.13it/s] 90it [00:20, 4.31it/s] 91it [00:20, 4.27it/s] 92it [00:21, 4.30it/s] 93it [00:21, 4.22it/s] 94it [00:21, 4.17it/s] 95it [00:21, 4.19it/s] 96it [00:21, 4.13it/s] 97it [00:22, 4.16it/s] 98it [00:22, 4.19it/s] 99it [00:22, 4.25it/s] 100it [00:22, 4.23it/s]2025-05-25 22:26:22,442 - INFO - [Epoch 077 | Batch 0100] IWAE-loss 1310.2383 | mean log_px -0.0126 | KL -997.80 + 101it [00:23, 4.12it/s] 102it [00:23, 4.16it/s] 103it [00:23, 4.30it/s] 104it [00:23, 4.28it/s] 105it [00:24, 4.32it/s] 106it [00:24, 4.29it/s] 107it [00:24, 4.25it/s] 108it [00:24, 4.14it/s] 109it [00:25, 4.21it/s] 110it [00:25, 4.25it/s] 111it [00:25, 4.38it/s] 112it [00:25, 4.47it/s] 113it [00:25, 4.37it/s] 114it [00:26, 4.26it/s] 115it [00:26, 4.27it/s] 116it [00:26, 4.28it/s] 117it [00:26, 4.37it/s] 118it [00:27, 4.31it/s] 119it [00:27, 4.17it/s] 120it [00:27, 4.32it/s] 121it [00:27, 4.28it/s] 122it [00:28, 4.29it/s] 123it [00:28, 4.16it/s] 124it [00:28, 4.25it/s] 125it [00:28, 4.27it/s] 126it [00:29, 4.31it/s] 127it [00:29, 4.43it/s] 128it [00:29, 4.35it/s] 129it [00:29, 4.23it/s] 130it [00:29, 4.23it/s] 131it [00:30, 4.28it/s] 132it [00:30, 4.40it/s] 133it [00:30, 4.46it/s] 134it [00:30, 4.38it/s] 135it [00:31, 4.39it/s] 136it [00:31, 4.35it/s] 137it [00:31, 4.33it/s] 138it [00:31, 4.21it/s] 139it [00:32, 4.35it/s] 140it [00:32, 4.44it/s] 141it [00:32, 4.37it/s] 142it [00:32, 4.39it/s] 143it [00:32, 4.20it/s] 144it [00:33, 4.34it/s] 145it [00:33, 4.39it/s] 146it [00:33, 4.38it/s] 147it [00:33, 4.41it/s] 148it [00:34, 4.34it/s] 149it [00:34, 4.41it/s] 150it [00:34, 4.18it/s]2025-05-25 22:26:34,063 - INFO - [Epoch 077 | Batch 0150] IWAE-loss 1114.1711 | mean log_px -0.0020 | KL -998.09 + 151it [00:34, 4.24it/s] 152it [00:35, 4.24it/s] 153it [00:35, 4.22it/s] 154it [00:35, 4.25it/s] 155it [00:35, 4.38it/s] 156it [00:35, 4.45it/s] 157it [00:36, 4.37it/s] 158it [00:36, 4.33it/s] 159it [00:36, 4.40it/s] 160it [00:36, 4.34it/s] 161it [00:37, 4.33it/s] 162it [00:37, 4.26it/s] 163it [00:37, 4.21it/s] 164it [00:37, 4.23it/s] 165it [00:38, 4.30it/s] 166it [00:38, 4.26it/s] 167it [00:38, 4.21it/s] 168it [00:38, 4.34it/s] 169it [00:38, 4.45it/s] 170it [00:39, 4.48it/s] 171it [00:39, 4.55it/s] 172it [00:39, 4.59it/s] 173it [00:39, 4.63it/s] 174it [00:40, 4.65it/s] 175it [00:40, 4.67it/s] 176it [00:40, 4.64it/s] 177it [00:40, 4.67it/s] 178it [00:40, 4.68it/s] 179it [00:41, 4.69it/s] 180it [00:41, 4.52it/s] 181it [00:41, 4.56it/s] 182it [00:41, 4.61it/s] 183it [00:41, 4.55it/s] 184it [00:42, 4.61it/s] 185it [00:42, 4.63it/s] 186it [00:42, 4.66it/s] 187it [00:42, 4.52it/s] 188it [00:43, 4.59it/s] 189it [00:43, 4.63it/s] 190it [00:43, 4.66it/s] 191it [00:43, 4.68it/s] 192it [00:43, 4.63it/s] 193it [00:44, 4.68it/s] 194it [00:44, 4.67it/s] 195it [00:44, 4.60it/s] 196it [00:44, 4.63it/s] 196it [00:44, 4.37it/s] +2025-05-25 22:26:44,173 - INFO - Epoch: 77, Objective: tensor([1058.8920], device='cuda:0', grad_fn=), Loss: 0.0013972671004012227, KL/n: 20.369314193725586 + 0it [00:00, ?it/s]2025-05-25 22:26:44,589 - INFO - [Epoch 078 | Batch 0000] IWAE-loss 1110.0542 | mean log_px -0.0045 | KL -998.70 + 1it [00:00, 2.73it/s] 2it [00:00, 3.64it/s] 3it [00:00, 4.05it/s] 4it [00:01, 4.28it/s] 5it [00:01, 4.43it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.53it/s] 9it [00:02, 3.48it/s] 10it [00:02, 3.78it/s] 11it [00:02, 3.95it/s] 12it [00:02, 4.06it/s] 13it [00:03, 4.15it/s] 14it [00:03, 4.08it/s] 15it [00:03, 4.27it/s] 16it [00:03, 4.32it/s] 17it [00:04, 4.43it/s] 18it [00:04, 4.46it/s] 19it [00:04, 4.39it/s] 20it [00:04, 4.24it/s] 21it [00:05, 4.28it/s] 22it [00:05, 4.24it/s] 23it [00:05, 4.26it/s] 24it [00:05, 4.24it/s] 25it [00:06, 4.13it/s] 26it [00:06, 4.21it/s] 27it [00:06, 4.24it/s] 28it [00:06, 4.39it/s] 29it [00:06, 4.37it/s] 30it [00:07, 4.19it/s] 31it [00:07, 4.23it/s] 32it [00:07, 4.28it/s] 33it [00:07, 4.12it/s] 34it [00:08, 4.19it/s] 35it [00:08, 4.23it/s] 36it [00:08, 4.36it/s] 37it [00:08, 4.38it/s] 38it [00:09, 4.45it/s] 39it [00:09, 4.38it/s] 40it [00:09, 4.27it/s] 41it [00:09, 4.35it/s] 42it [00:09, 4.42it/s] 43it [00:10, 4.40it/s] 44it [00:10, 4.51it/s] 45it [00:10, 4.32it/s] 46it [00:10, 4.31it/s] 47it [00:11, 4.31it/s] 48it [00:11, 4.39it/s] 49it [00:11, 4.48it/s] 50it [00:11, 4.39it/s]2025-05-25 22:26:56,240 - INFO - [Epoch 078 | Batch 0050] IWAE-loss 1141.6960 | mean log_px -0.0026 | KL -994.03 + 51it [00:12, 4.25it/s] 52it [00:12, 4.26it/s] 53it [00:12, 4.27it/s] 54it [00:12, 4.30it/s] 55it [00:12, 4.32it/s] 56it [00:13, 4.40it/s] 57it [00:13, 4.23it/s] 58it [00:13, 4.37it/s] 59it [00:13, 4.35it/s] 60it [00:14, 4.35it/s] 61it [00:14, 4.44it/s] 62it [00:14, 4.39it/s] 63it [00:14, 4.34it/s] 64it [00:15, 4.22it/s] 65it [00:15, 4.26it/s] 66it [00:15, 4.26it/s] 67it [00:15, 4.26it/s] 68it [00:15, 4.38it/s] 69it [00:16, 4.43it/s] 70it [00:16, 4.48it/s] 71it [00:16, 4.33it/s] 72it [00:16, 4.44it/s] 73it [00:17, 4.52it/s] 74it [00:17, 4.56it/s] 75it [00:17, 4.56it/s] 76it [00:17, 4.60it/s] 77it [00:17, 4.62it/s] 78it [00:18, 4.66it/s] 79it [00:18, 4.68it/s] 80it [00:18, 4.69it/s] 81it [00:18, 4.48it/s] 82it [00:19, 4.54it/s] 83it [00:19, 4.50it/s] 84it [00:19, 4.48it/s] 85it [00:19, 4.44it/s] 86it [00:19, 4.48it/s] 87it [00:20, 4.49it/s] 88it [00:20, 4.46it/s] 89it [00:20, 4.44it/s] 90it [00:20, 4.49it/s] 91it [00:21, 4.50it/s] 92it [00:21, 4.37it/s] 93it [00:21, 4.36it/s] 94it [00:21, 4.25it/s] 95it [00:21, 4.28it/s] 96it [00:22, 4.27it/s] 97it [00:22, 4.31it/s] 98it [00:22, 4.28it/s] 99it [00:22, 4.27it/s] 100it [00:23, 4.18it/s]2025-05-25 22:27:07,627 - INFO - [Epoch 078 | Batch 0100] IWAE-loss 1110.1791 | mean log_px -0.0030 | KL -994.81 + 101it [00:23, 4.25it/s] 102it [00:23, 4.31it/s] 103it [00:23, 4.28it/s] 104it [00:24, 4.42it/s] 105it [00:24, 4.50it/s] 106it [00:24, 4.44it/s] 107it [00:24, 4.42it/s] 108it [00:24, 4.51it/s] 109it [00:25, 4.57it/s] 110it [00:25, 4.34it/s] 111it [00:25, 4.37it/s] 112it [00:25, 4.48it/s] 113it [00:26, 4.49it/s] 114it [00:26, 4.44it/s] 115it [00:26, 4.32it/s] 116it [00:26, 4.29it/s] 117it [00:27, 4.34it/s] 118it [00:27, 4.42it/s] 119it [00:27, 4.40it/s] 120it [00:27, 4.34it/s] 121it [00:27, 4.46it/s] 122it [00:28, 4.41it/s] 123it [00:28, 4.46it/s] 124it [00:28, 4.48it/s] 125it [00:28, 4.52it/s] 126it [00:29, 4.45it/s] 127it [00:29, 4.51it/s] 128it [00:29, 4.35it/s] 129it [00:29, 4.39it/s] 130it [00:29, 4.45it/s] 131it [00:30, 4.39it/s] 132it [00:30, 4.40it/s] 133it [00:30, 4.47it/s] 134it [00:30, 4.47it/s] 135it [00:31, 4.49it/s] 136it [00:31, 4.40it/s] 137it [00:31, 4.38it/s] 138it [00:31, 4.47it/s] 139it [00:31, 4.45it/s] 140it [00:32, 4.52it/s] 141it [00:32, 4.47it/s] 142it [00:32, 4.43it/s] 143it [00:32, 4.50it/s] 144it [00:33, 4.46it/s] 145it [00:33, 4.43it/s] 146it [00:33, 4.40it/s] 147it [00:33, 4.48it/s] 148it [00:33, 4.45it/s] 149it [00:34, 4.39it/s] 150it [00:34, 4.40it/s]2025-05-25 22:27:18,904 - INFO - [Epoch 078 | Batch 0150] IWAE-loss 1227.6323 | mean log_px -0.0173 | KL -994.20 + 151it [00:34, 4.26it/s] 152it [00:34, 4.40it/s] 153it [00:35, 4.50it/s] 154it [00:35, 4.52it/s] 155it [00:35, 4.47it/s] 156it [00:35, 4.41it/s] 157it [00:36, 4.39it/s] 158it [00:36, 4.28it/s] 159it [00:36, 4.29it/s] 160it [00:36, 4.31it/s] 161it [00:36, 4.41it/s] 162it [00:37, 4.47it/s] 163it [00:37, 4.52it/s] 164it [00:37, 4.57it/s] 165it [00:37, 4.51it/s] 166it [00:38, 4.28it/s] 167it [00:38, 4.39it/s] 168it [00:38, 4.44it/s] 169it [00:38, 4.53it/s] 170it [00:38, 4.54it/s] 171it [00:39, 4.49it/s] 172it [00:39, 4.26it/s] 173it [00:39, 4.31it/s] 174it [00:39, 4.35it/s] 175it [00:40, 4.30it/s] 176it [00:40, 4.32it/s] 177it [00:40, 4.16it/s] 178it [00:40, 4.21it/s] 179it [00:41, 4.37it/s] 180it [00:41, 4.36it/s] 181it [00:41, 4.42it/s] 182it [00:41, 4.47it/s] 183it [00:41, 4.33it/s] 184it [00:42, 4.41it/s] 185it [00:42, 4.49it/s] 186it [00:42, 4.52it/s] 187it [00:42, 4.48it/s] 188it [00:43, 4.54it/s] 189it [00:43, 4.45it/s] 190it [00:43, 4.31it/s] 191it [00:43, 4.41it/s] 192it [00:43, 4.47it/s] 193it [00:44, 4.40it/s] 194it [00:44, 4.37it/s] 195it [00:44, 4.34it/s] 196it [00:44, 4.48it/s] 196it [00:44, 4.36it/s] +2025-05-25 22:27:29,259 - INFO - Epoch: 78, Objective: tensor([2114.0513], device='cuda:0', grad_fn=), Loss: 0.018417079001665115, KL/n: 20.35153579711914 + 0it [00:00, ?it/s]2025-05-25 22:27:29,660 - INFO - [Epoch 079 | Batch 0000] IWAE-loss 1181.8622 | mean log_px -0.0096 | KL -996.42 + 1it [00:00, 2.81it/s] 2it [00:00, 3.49it/s] 3it [00:00, 3.77it/s] 4it [00:01, 3.89it/s] 5it [00:01, 4.00it/s] 6it [00:01, 4.17it/s] 7it [00:01, 4.31it/s] 8it [00:01, 4.40it/s] 9it [00:02, 4.30it/s] 10it [00:02, 4.27it/s] 11it [00:02, 4.24it/s] 12it [00:02, 4.27it/s] 13it [00:03, 4.22it/s] 14it [00:03, 4.24it/s] 15it [00:03, 4.22it/s] 16it [00:03, 4.31it/s] 17it [00:04, 4.26it/s] 18it [00:04, 4.38it/s] 19it [00:04, 4.34it/s] 20it [00:04, 4.43it/s] 21it [00:04, 4.40it/s] 22it [00:05, 4.20it/s] 23it [00:05, 4.17it/s] 24it [00:05, 4.21it/s] 25it [00:05, 4.27it/s] 26it [00:06, 4.21it/s] 27it [00:06, 4.20it/s] 28it [00:06, 4.07it/s] 29it [00:06, 4.15it/s] 30it [00:07, 4.28it/s] 31it [00:07, 4.22it/s] 32it [00:07, 4.27it/s] 33it [00:07, 4.31it/s] 34it [00:08, 4.39it/s] 35it [00:08, 4.36it/s] 36it [00:08, 4.34it/s] 37it [00:08, 4.23it/s] 38it [00:09, 4.25it/s] 39it [00:09, 4.24it/s] 40it [00:09, 4.37it/s] 41it [00:09, 4.48it/s] 42it [00:09, 4.39it/s] 43it [00:10, 4.33it/s] 44it [00:10, 4.18it/s] 45it [00:10, 4.24it/s] 46it [00:10, 4.28it/s] 47it [00:11, 4.26it/s] 48it [00:11, 4.25it/s] 49it [00:11, 4.37it/s] 50it [00:11, 4.46it/s]2025-05-25 22:27:41,319 - INFO - [Epoch 079 | Batch 0050] IWAE-loss 1083.8743 | mean log_px -0.0050 | KL -990.57 + 51it [00:11, 4.54it/s] 52it [00:12, 4.42it/s] 53it [00:12, 4.25it/s] 54it [00:12, 4.30it/s] 55it [00:12, 4.40it/s] 56it [00:13, 4.35it/s] 57it [00:13, 4.35it/s] 58it [00:13, 4.33it/s] 59it [00:13, 4.22it/s] 60it [00:14, 4.36it/s] 61it [00:14, 4.31it/s] 62it [00:14, 4.26it/s] 63it [00:14, 4.31it/s] 64it [00:15, 4.42it/s] 65it [00:15, 4.36it/s] 66it [00:15, 4.31it/s] 67it [00:15, 4.26it/s] 68it [00:15, 4.29it/s] 69it [00:16, 4.31it/s] 70it [00:16, 4.26it/s] 71it [00:16, 4.40it/s] 72it [00:16, 4.29it/s] 73it [00:17, 4.39it/s] 74it [00:17, 4.39it/s] 75it [00:17, 4.45it/s] 76it [00:17, 4.51it/s] 77it [00:17, 4.50it/s] 78it [00:18, 4.42it/s] 79it [00:18, 4.37it/s] 80it [00:18, 4.22it/s] 81it [00:18, 4.34it/s] 82it [00:19, 4.30it/s] 83it [00:19, 4.28it/s] 84it [00:19, 4.34it/s] 85it [00:19, 4.44it/s] 86it [00:20, 4.51it/s] 87it [00:20, 4.41it/s] 88it [00:20, 4.49it/s] 89it [00:20, 4.41it/s] 90it [00:20, 4.49it/s] 91it [00:21, 4.49it/s] 92it [00:21, 4.46it/s] 93it [00:21, 4.51it/s] 94it [00:21, 4.56it/s] 95it [00:22, 4.62it/s] 96it [00:22, 4.64it/s] 97it [00:22, 4.67it/s] 98it [00:22, 4.50it/s] 99it [00:22, 4.58it/s] 100it [00:23, 4.57it/s]2025-05-25 22:27:52,681 - INFO - [Epoch 079 | Batch 0100] IWAE-loss 1205.5616 | mean log_px -0.0082 | KL -991.58 + 101it [00:23, 4.55it/s] 102it [00:23, 4.55it/s] 103it [00:23, 4.53it/s] 104it [00:24, 4.58it/s] 105it [00:24, 4.52it/s] 106it [00:24, 4.48it/s] 107it [00:24, 4.46it/s] 108it [00:24, 4.32it/s] 109it [00:25, 4.42it/s] 110it [00:25, 4.50it/s] 111it [00:25, 4.57it/s] 112it [00:25, 4.48it/s] 113it [00:26, 4.45it/s] 114it [00:26, 4.50it/s] 115it [00:26, 4.42it/s] 116it [00:26, 4.52it/s] 117it [00:26, 4.54it/s] 118it [00:27, 4.49it/s] 119it [00:27, 4.48it/s] 120it [00:27, 4.29it/s] 121it [00:27, 4.24it/s] 122it [00:28, 4.37it/s] 123it [00:28, 4.34it/s] 124it [00:28, 4.36it/s] 125it [00:28, 4.15it/s] 126it [00:29, 4.21it/s] 127it [00:29, 4.21it/s] 128it [00:29, 4.33it/s] 129it [00:29, 4.45it/s] 130it [00:29, 4.22it/s] 131it [00:30, 4.25it/s] 132it [00:30, 4.38it/s] 133it [00:30, 4.40it/s] 134it [00:30, 4.36it/s] 135it [00:31, 4.37it/s] 136it [00:31, 4.32it/s] 137it [00:31, 4.45it/s] 138it [00:31, 4.36it/s] 139it [00:32, 4.35it/s] 140it [00:32, 4.46it/s] 141it [00:32, 4.41it/s] 142it [00:32, 4.39it/s] 143it [00:32, 4.37it/s] 144it [00:33, 4.36it/s] 145it [00:33, 4.44it/s] 146it [00:33, 4.51it/s] 147it [00:33, 4.57it/s] 148it [00:34, 4.45it/s] 149it [00:34, 4.52it/s] 150it [00:34, 4.58it/s]2025-05-25 22:28:03,998 - INFO - [Epoch 079 | Batch 0150] IWAE-loss 1199.3240 | mean log_px -0.0036 | KL -990.65 + 151it [00:34, 4.44it/s] 152it [00:34, 4.54it/s] 153it [00:35, 4.60it/s] 154it [00:35, 4.60it/s] 155it [00:35, 4.64it/s] 156it [00:35, 4.52it/s] 157it [00:35, 4.60it/s] 158it [00:36, 4.63it/s] 159it [00:36, 4.49it/s] 160it [00:36, 4.57it/s] 161it [00:36, 4.54it/s] 162it [00:37, 4.50it/s] 163it [00:37, 4.46it/s] 164it [00:37, 4.28it/s] 165it [00:37, 4.20it/s] 166it [00:38, 4.23it/s] 167it [00:38, 4.31it/s] 168it [00:38, 4.40it/s] 169it [00:38, 4.33it/s] 170it [00:38, 4.43it/s] 171it [00:39, 4.33it/s] 172it [00:39, 4.34it/s] 173it [00:39, 4.41it/s] 174it [00:39, 4.38it/s] 175it [00:40, 4.50it/s] 176it [00:40, 4.50it/s] 177it [00:40, 4.42it/s] 178it [00:40, 4.36it/s] 179it [00:40, 4.39it/s] 180it [00:41, 4.47it/s] 181it [00:41, 4.45it/s] 182it [00:41, 4.35it/s] 183it [00:41, 4.42it/s] 184it [00:42, 4.51it/s] 185it [00:42, 4.41it/s] 186it [00:42, 4.41it/s] 187it [00:42, 4.50it/s] 188it [00:43, 4.54it/s] 189it [00:43, 4.43it/s] 190it [00:43, 4.29it/s] 191it [00:43, 4.41it/s] 192it [00:43, 4.42it/s] 193it [00:44, 4.36it/s] 194it [00:44, 4.31it/s] 195it [00:44, 4.18it/s] 196it [00:44, 4.28it/s] 196it [00:44, 4.36it/s] +2025-05-25 22:28:14,338 - INFO - Epoch: 79, Objective: tensor([1057.2749], device='cuda:0', grad_fn=), Loss: 0.0020423263777047396, KL/n: 20.246395111083984 + 0it [00:00, ?it/s]2025-05-25 22:28:14,916 - INFO - [Epoch 080 | Batch 0000] IWAE-loss 1272.5481 | mean log_px -0.0040 | KL -991.26 + 1it [00:00, 3.09it/s] 2it [00:00, 3.82it/s] 3it [00:00, 4.19it/s] 4it [00:00, 4.38it/s] 5it [00:01, 4.51it/s] 6it [00:01, 4.58it/s] 7it [00:01, 4.46it/s] 8it [00:01, 4.56it/s] 9it [00:02, 4.62it/s] 10it [00:02, 4.64it/s] 11it [00:02, 4.67it/s] 12it [00:02, 4.69it/s] 13it [00:02, 4.71it/s] 14it [00:03, 4.58it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.68it/s] 17it [00:03, 4.69it/s] 18it [00:03, 4.69it/s] 19it [00:04, 4.71it/s] 20it [00:04, 4.55it/s] 21it [00:04, 4.62it/s] 22it [00:04, 4.64it/s] 23it [00:05, 4.68it/s] 24it [00:05, 4.69it/s] 25it [00:05, 4.54it/s] 26it [00:05, 4.59it/s] 27it [00:05, 4.63it/s] 28it [00:06, 4.66it/s] 29it [00:06, 4.69it/s] 30it [00:06, 4.69it/s] 31it [00:06, 4.71it/s] 32it [00:06, 4.71it/s] 33it [00:07, 4.72it/s] 34it [00:07, 4.71it/s] 35it [00:07, 4.72it/s] 36it [00:07, 4.54it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.67it/s] 40it [00:08, 4.47it/s] 41it [00:08, 4.49it/s] 42it [00:09, 4.55it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.63it/s] 45it [00:09, 4.67it/s] 46it [00:10, 4.68it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.63it/s] 49it [00:10, 4.66it/s] 50it [00:10, 4.68it/s]2025-05-25 22:28:25,677 - INFO - [Epoch 080 | Batch 0050] IWAE-loss 1194.4015 | mean log_px -0.0039 | KL -991.29 + 51it [00:11, 4.69it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.60it/s] 54it [00:11, 4.63it/s] 55it [00:11, 4.60it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.66it/s] 58it [00:12, 4.67it/s] 59it [00:12, 4.65it/s] 60it [00:13, 4.66it/s] 61it [00:13, 4.68it/s] 62it [00:13, 4.52it/s] 63it [00:13, 4.58it/s] 64it [00:13, 4.61it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.65it/s] 68it [00:14, 4.66it/s] 69it [00:15, 4.49it/s] 70it [00:15, 4.55it/s] 71it [00:15, 4.60it/s] 72it [00:15, 4.62it/s] 73it [00:15, 4.52it/s] 74it [00:16, 4.58it/s] 75it [00:16, 4.64it/s] 76it [00:16, 4.66it/s] 77it [00:16, 4.68it/s] 78it [00:16, 4.69it/s] 79it [00:17, 4.69it/s] 80it [00:17, 4.65it/s] 81it [00:17, 4.70it/s] 82it [00:17, 4.53it/s] 83it [00:18, 4.60it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.67it/s] 86it [00:18, 4.68it/s] 87it [00:18, 4.69it/s] 88it [00:19, 4.70it/s] 89it [00:19, 4.71it/s] 90it [00:19, 4.54it/s] 91it [00:19, 4.61it/s] 92it [00:19, 4.63it/s] 93it [00:20, 4.66it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.68it/s] 96it [00:20, 4.69it/s] 97it [00:21, 4.70it/s] 98it [00:21, 4.70it/s] 99it [00:21, 4.70it/s] 100it [00:21, 4.54it/s]2025-05-25 22:28:36,484 - INFO - [Epoch 080 | Batch 0100] IWAE-loss 1640.9240 | mean log_px -0.0125 | KL -990.32 + 101it [00:21, 4.61it/s] 102it [00:22, 4.63it/s] 103it [00:22, 4.67it/s] 104it [00:22, 4.69it/s] 105it [00:22, 4.70it/s] 106it [00:22, 4.68it/s] 107it [00:23, 4.70it/s] 108it [00:23, 4.70it/s] 109it [00:23, 4.71it/s] 110it [00:23, 4.49it/s] 111it [00:24, 4.55it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.63it/s] 114it [00:24, 4.65it/s] 115it [00:24, 4.66it/s] 116it [00:25, 4.67it/s] 117it [00:25, 4.69it/s] 118it [00:25, 4.70it/s] 119it [00:25, 4.53it/s] 120it [00:25, 4.60it/s] 121it [00:26, 4.64it/s] 122it [00:26, 4.65it/s] 123it [00:26, 4.67it/s] 124it [00:26, 4.68it/s] 125it [00:27, 4.53it/s] 126it [00:27, 4.59it/s] 127it [00:27, 4.63it/s] 128it [00:27, 4.64it/s] 129it [00:27, 4.67it/s] 130it [00:28, 4.55it/s] 131it [00:28, 4.61it/s] 132it [00:28, 4.56it/s] 133it [00:28, 4.60it/s] 134it [00:29, 4.47it/s] 135it [00:29, 4.56it/s] 136it [00:29, 4.60it/s] 137it [00:29, 4.65it/s] 138it [00:29, 4.66it/s] 139it [00:30, 4.68it/s] 140it [00:30, 4.67it/s] 141it [00:30, 4.69it/s] 142it [00:30, 4.70it/s] 143it [00:30, 4.71it/s] 144it [00:31, 4.71it/s] 145it [00:31, 4.55it/s] 146it [00:31, 4.61it/s] 147it [00:31, 4.65it/s] 148it [00:32, 4.66it/s] 149it [00:32, 4.68it/s] 150it [00:32, 4.69it/s]2025-05-25 22:28:47,256 - INFO - [Epoch 080 | Batch 0150] IWAE-loss 1795.7816 | mean log_px -0.0194 | KL -987.38 + 151it [00:32, 4.70it/s] 152it [00:32, 4.70it/s] 153it [00:33, 4.71it/s] 154it [00:33, 4.71it/s] 155it [00:33, 4.71it/s] 156it [00:33, 4.54it/s] 157it [00:33, 4.61it/s] 158it [00:34, 4.64it/s] 159it [00:34, 4.66it/s] 160it [00:34, 4.67it/s] 161it [00:34, 4.68it/s] 162it [00:35, 4.69it/s] 163it [00:35, 4.70it/s] 164it [00:35, 4.53it/s] 165it [00:35, 4.60it/s] 166it [00:35, 4.63it/s] 167it [00:36, 4.65it/s] 168it [00:36, 4.66it/s] 169it [00:36, 4.67it/s] 170it [00:36, 4.51it/s] 171it [00:36, 4.58it/s] 172it [00:37, 4.61it/s] 173it [00:37, 4.64it/s] 174it [00:37, 4.61it/s] 175it [00:37, 4.64it/s] 176it [00:38, 4.49it/s] 177it [00:38, 4.56it/s] 178it [00:38, 4.60it/s] 179it [00:38, 4.63it/s] 180it [00:38, 4.65it/s] 181it [00:39, 4.67it/s] 182it [00:39, 4.68it/s] 183it [00:39, 4.69it/s] 184it [00:39, 4.67it/s] 185it [00:39, 4.69it/s] 186it [00:40, 4.51it/s] 187it [00:40, 4.43it/s] 188it [00:40, 4.51it/s] 189it [00:40, 4.57it/s] 190it [00:41, 4.60it/s] 191it [00:41, 4.65it/s] 192it [00:41, 4.49it/s] 193it [00:41, 4.57it/s] 194it [00:41, 4.61it/s] 195it [00:42, 4.34it/s] 196it [00:42, 4.41it/s] 196it [00:42, 4.61it/s] +2025-05-25 22:28:57,186 - INFO - Epoch: 80, Objective: tensor([1140.7397], device='cuda:0', grad_fn=), Loss: 0.0032359547913074493, KL/n: 20.226318359375 + 0it [00:00, ?it/s]2025-05-25 22:28:57,775 - INFO - [Epoch 081 | Batch 0000] IWAE-loss 1103.5593 | mean log_px -0.0022 | KL -990.32 + 1it [00:00, 3.05it/s] 2it [00:00, 3.84it/s] 3it [00:00, 4.06it/s] 4it [00:01, 4.14it/s] 5it [00:01, 4.33it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.41it/s] 8it [00:01, 4.31it/s] 9it [00:02, 4.44it/s] 10it [00:02, 4.45it/s] 11it [00:02, 4.51it/s] 12it [00:02, 4.55it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.51it/s] 15it [00:03, 4.47it/s] 16it [00:03, 4.46it/s] 17it [00:03, 4.50it/s] 18it [00:04, 4.42it/s] 19it [00:04, 4.39it/s] 20it [00:04, 4.34it/s] 21it [00:04, 4.34it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.38it/s] 24it [00:05, 4.45it/s] 25it [00:05, 4.53it/s] 26it [00:05, 4.54it/s] 27it [00:06, 4.42it/s] 28it [00:06, 4.49it/s] 29it [00:06, 4.44it/s] 30it [00:06, 4.42it/s] 31it [00:07, 4.50it/s] 32it [00:07, 4.56it/s] 33it [00:07, 4.56it/s] 34it [00:07, 4.58it/s] 35it [00:07, 4.62it/s] 36it [00:08, 4.49it/s] 37it [00:08, 4.44it/s] 38it [00:08, 4.50it/s] 39it [00:08, 4.28it/s] 40it [00:09, 4.42it/s] 41it [00:09, 4.37it/s] 42it [00:09, 4.39it/s] 43it [00:09, 4.43it/s] 44it [00:09, 4.39it/s] 45it [00:10, 4.48it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.48it/s] 48it [00:10, 4.37it/s] 49it [00:11, 4.36it/s] 50it [00:11, 4.35it/s]2025-05-25 22:29:08,996 - INFO - [Epoch 081 | Batch 0050] IWAE-loss 1255.6204 | mean log_px -0.0048 | KL -987.30 + 51it [00:11, 4.42it/s] 52it [00:11, 4.38it/s] 53it [00:11, 4.47it/s] 54it [00:12, 4.54it/s] 55it [00:12, 4.38it/s] 56it [00:12, 4.40it/s] 57it [00:12, 4.40it/s] 58it [00:13, 4.47it/s] 59it [00:13, 4.42it/s] 60it [00:13, 4.46it/s] 61it [00:13, 4.49it/s] 62it [00:14, 4.44it/s] 63it [00:14, 4.48it/s] 64it [00:14, 4.35it/s] 65it [00:14, 4.37it/s] 66it [00:14, 4.35it/s] 67it [00:15, 4.40it/s] 68it [00:15, 4.48it/s] 69it [00:15, 4.31it/s] 70it [00:15, 4.44it/s] 71it [00:16, 4.37it/s] 72it [00:16, 4.39it/s] 73it [00:16, 4.36it/s] 74it [00:16, 4.37it/s] 75it [00:16, 4.35it/s] 76it [00:17, 4.44it/s] 77it [00:17, 4.40it/s] 78it [00:17, 4.47it/s] 79it [00:17, 4.54it/s] 80it [00:18, 4.61it/s] 81it [00:18, 4.65it/s] 82it [00:18, 4.52it/s] 83it [00:18, 4.51it/s] 84it [00:18, 4.54it/s] 85it [00:19, 4.47it/s] 86it [00:19, 4.39it/s] 87it [00:19, 4.38it/s] 88it [00:19, 4.34it/s] 89it [00:20, 4.46it/s] 90it [00:20, 4.49it/s] 91it [00:20, 4.47it/s] 92it [00:20, 4.40it/s] 93it [00:21, 4.37it/s] 94it [00:21, 4.44it/s] 95it [00:21, 4.32it/s] 96it [00:21, 4.44it/s] 97it [00:21, 4.53it/s] 98it [00:22, 4.44it/s] 99it [00:22, 4.40it/s] 100it [00:22, 4.48it/s]2025-05-25 22:29:20,251 - INFO - [Epoch 081 | Batch 0100] IWAE-loss 1271.0948 | mean log_px -0.0054 | KL -990.43 + 101it [00:22, 4.54it/s] 102it [00:23, 4.59it/s] 103it [00:23, 4.52it/s] 104it [00:23, 4.43it/s] 105it [00:23, 4.42it/s] 106it [00:23, 4.28it/s] 107it [00:24, 4.43it/s] 108it [00:24, 4.46it/s] 109it [00:24, 4.51it/s] 110it [00:24, 4.57it/s] 111it [00:25, 4.47it/s] 112it [00:25, 4.54it/s] 113it [00:25, 4.52it/s] 114it [00:25, 4.57it/s] 115it [00:25, 4.46it/s] 116it [00:26, 4.55it/s] 117it [00:26, 4.47it/s] 118it [00:26, 4.39it/s] 119it [00:26, 4.40it/s] 120it [00:27, 4.35it/s] 121it [00:27, 4.38it/s] 122it [00:27, 4.34it/s] 123it [00:27, 4.38it/s] 124it [00:27, 4.43it/s] 125it [00:28, 4.52it/s] 126it [00:28, 4.58it/s] 127it [00:28, 4.62it/s] 128it [00:28, 4.48it/s] 129it [00:29, 4.51it/s] 130it [00:29, 4.55it/s] 131it [00:29, 4.59it/s] 132it [00:29, 4.52it/s] 133it [00:29, 4.36it/s] 134it [00:30, 4.38it/s] 135it [00:30, 4.40it/s] 136it [00:30, 4.42it/s] 137it [00:30, 4.44it/s] 138it [00:31, 4.45it/s] 139it [00:31, 4.54it/s] 140it [00:31, 4.57it/s] 141it [00:31, 4.50it/s] 142it [00:31, 4.52it/s] 143it [00:32, 4.43it/s] 144it [00:32, 4.53it/s] 145it [00:32, 4.52it/s] 146it [00:32, 4.57it/s] 147it [00:33, 4.54it/s] 148it [00:33, 4.57it/s] 149it [00:33, 4.62it/s] 150it [00:33, 4.51it/s]2025-05-25 22:29:31,410 - INFO - [Epoch 081 | Batch 0150] IWAE-loss 1643.7526 | mean log_px -0.0269 | KL -987.94 + 151it [00:33, 4.49it/s] 152it [00:34, 4.49it/s] 153it [00:34, 4.55it/s] 154it [00:34, 4.59it/s] 155it [00:34, 4.47it/s] 156it [00:35, 4.41it/s] 157it [00:35, 4.39it/s] 158it [00:35, 4.48it/s] 159it [00:35, 4.47it/s] 160it [00:35, 4.53it/s] 161it [00:36, 4.43it/s] 162it [00:36, 4.53it/s] 163it [00:36, 4.59it/s] 164it [00:36, 4.62it/s] 165it [00:37, 4.66it/s] 166it [00:37, 4.41it/s] 167it [00:37, 4.51it/s] 168it [00:37, 4.56it/s] 169it [00:37, 4.61it/s] 170it [00:38, 4.50it/s] 171it [00:38, 4.52it/s] 172it [00:38, 4.40it/s] 173it [00:38, 4.26it/s] 174it [00:39, 4.39it/s] 175it [00:39, 4.43it/s] 176it [00:39, 4.40it/s] 177it [00:39, 4.45it/s] 178it [00:39, 4.53it/s] 179it [00:40, 4.45it/s] 180it [00:40, 4.22it/s] 181it [00:40, 4.29it/s] 182it [00:40, 4.37it/s] 183it [00:41, 4.48it/s] 184it [00:41, 4.42it/s] 185it [00:41, 4.44it/s] 186it [00:41, 4.50it/s] 187it [00:42, 4.48it/s] 188it [00:42, 4.52it/s] 189it [00:42, 4.43it/s] 190it [00:42, 4.51it/s] 191it [00:42, 4.27it/s] 192it [00:43, 4.30it/s] 193it [00:43, 4.31it/s] 194it [00:43, 4.40it/s] 195it [00:43, 4.27it/s] 196it [00:44, 4.42it/s] 196it [00:44, 4.44it/s] +2025-05-25 22:29:41,669 - INFO - Epoch: 81, Objective: tensor([1722.9547], device='cuda:0', grad_fn=), Loss: 0.013793299905955791, KL/n: 20.196060180664062 + 0it [00:00, ?it/s]2025-05-25 22:29:42,066 - INFO - [Epoch 082 | Batch 0000] IWAE-loss 1131.7792 | mean log_px -0.0034 | KL -989.71 + 1it [00:00, 2.80it/s] 2it [00:00, 3.53it/s] 3it [00:00, 3.83it/s] 4it [00:01, 4.12it/s] 5it [00:01, 4.23it/s] 6it [00:01, 4.34it/s] 7it [00:01, 4.46it/s] 8it [00:01, 4.50it/s] 9it [00:02, 4.56it/s] 10it [00:02, 4.46it/s] 11it [00:02, 4.32it/s] 12it [00:02, 4.40it/s] 13it [00:03, 4.49it/s] 14it [00:03, 4.42it/s] 15it [00:03, 4.51it/s] 16it [00:03, 4.47it/s] 17it [00:03, 4.28it/s] 18it [00:04, 4.28it/s] 19it [00:04, 4.28it/s] 20it [00:04, 4.27it/s] 21it [00:04, 4.42it/s] 22it [00:05, 4.35it/s] 23it [00:05, 4.14it/s] 24it [00:05, 4.10it/s] 25it [00:05, 4.15it/s] 26it [00:06, 4.17it/s] 27it [00:06, 4.32it/s] 28it [00:06, 4.29it/s] 29it [00:06, 4.35it/s] 30it [00:07, 4.27it/s] 31it [00:07, 4.27it/s] 32it [00:07, 4.27it/s] 33it [00:07, 4.33it/s] 34it [00:07, 4.33it/s] 35it [00:08, 4.40it/s] 36it [00:08, 4.35it/s] 37it [00:08, 4.28it/s] 38it [00:08, 4.22it/s] 39it [00:09, 4.30it/s] 40it [00:09, 4.34it/s] 41it [00:09, 4.30it/s] 42it [00:09, 4.28it/s] 43it [00:10, 4.34it/s] 44it [00:10, 4.37it/s] 45it [00:10, 4.33it/s] 46it [00:10, 4.18it/s] 47it [00:10, 4.33it/s] 48it [00:11, 4.29it/s] 49it [00:11, 4.39it/s] 50it [00:11, 4.37it/s]2025-05-25 22:29:53,603 - INFO - [Epoch 082 | Batch 0050] IWAE-loss 1399.6855 | mean log_px -0.0098 | KL -989.36 + 51it [00:11, 4.45it/s] 52it [00:12, 4.37it/s] 53it [00:12, 4.29it/s] 54it [00:12, 4.29it/s] 55it [00:12, 4.35it/s] 56it [00:13, 4.43it/s] 57it [00:13, 4.36it/s] 58it [00:13, 4.38it/s] 59it [00:13, 4.33it/s] 60it [00:13, 4.29it/s] 61it [00:14, 4.32it/s] 62it [00:14, 4.31it/s] 63it [00:14, 4.26it/s] 64it [00:14, 4.27it/s] 65it [00:15, 4.25it/s] 66it [00:15, 4.20it/s] 67it [00:15, 4.24it/s] 68it [00:15, 4.28it/s] 69it [00:16, 4.27it/s] 70it [00:16, 4.27it/s] 71it [00:16, 4.15it/s] 72it [00:16, 4.17it/s] 73it [00:17, 4.22it/s] 74it [00:17, 4.23it/s] 75it [00:17, 4.16it/s] 76it [00:17, 4.19it/s] 77it [00:17, 4.27it/s] 78it [00:18, 4.37it/s] 79it [00:18, 4.39it/s] 80it [00:18, 4.21it/s] 81it [00:18, 4.32it/s] 82it [00:19, 4.35it/s] 83it [00:19, 4.41it/s] 84it [00:19, 4.41it/s] 85it [00:19, 4.39it/s] 86it [00:20, 4.36it/s] 87it [00:20, 4.28it/s] 88it [00:20, 4.31it/s] 89it [00:20, 4.38it/s] 90it [00:20, 4.33it/s] 91it [00:21, 4.18it/s] 92it [00:21, 4.30it/s] 93it [00:21, 4.27it/s] 94it [00:21, 4.38it/s] 95it [00:22, 4.48it/s] 96it [00:22, 4.40it/s] 97it [00:22, 4.43it/s] 98it [00:22, 4.23it/s] 99it [00:23, 4.33it/s] 100it [00:23, 4.29it/s]2025-05-25 22:30:05,234 - INFO - [Epoch 082 | Batch 0100] IWAE-loss 1105.8473 | mean log_px -0.0035 | KL -983.66 + 101it [00:23, 4.34it/s] 102it [00:23, 4.26it/s] 103it [00:23, 4.26it/s] 104it [00:24, 4.31it/s] 105it [00:24, 4.30it/s] 106it [00:24, 4.37it/s] 107it [00:24, 4.48it/s] 108it [00:25, 4.53it/s] 109it [00:25, 4.28it/s] 110it [00:25, 4.32it/s] 111it [00:25, 4.29it/s] 112it [00:26, 4.32it/s] 113it [00:26, 4.40it/s] 114it [00:26, 4.35it/s] 115it [00:26, 4.28it/s] 116it [00:26, 4.24it/s] 117it [00:27, 4.23it/s] 118it [00:27, 4.22it/s] 119it [00:27, 4.27it/s] 120it [00:27, 4.14it/s] 121it [00:28, 4.24it/s] 122it [00:28, 4.21it/s] 123it [00:28, 4.18it/s] 124it [00:28, 4.33it/s] 125it [00:29, 4.29it/s] 126it [00:29, 4.30it/s] 127it [00:29, 4.30it/s] 128it [00:29, 4.16it/s] 129it [00:30, 4.26it/s] 130it [00:30, 4.27it/s] 131it [00:30, 4.25it/s] 132it [00:30, 4.30it/s] 133it [00:30, 4.22it/s] 134it [00:31, 4.21it/s] 135it [00:31, 4.19it/s] 136it [00:31, 4.21it/s] 137it [00:31, 4.32it/s] 138it [00:32, 4.21it/s] 139it [00:32, 4.25it/s] 140it [00:32, 4.30it/s] 141it [00:32, 4.35it/s] 142it [00:33, 4.30it/s] 143it [00:33, 4.24it/s] 144it [00:33, 4.35it/s] 145it [00:33, 4.45it/s] 146it [00:33, 4.37it/s] 147it [00:34, 4.36it/s] 148it [00:34, 4.45it/s] 149it [00:34, 4.41it/s] 150it [00:34, 4.22it/s]2025-05-25 22:30:16,900 - INFO - [Epoch 082 | Batch 0150] IWAE-loss 1394.0895 | mean log_px -0.0172 | KL -984.26 + 151it [00:35, 4.24it/s] 152it [00:35, 4.36it/s] 153it [00:35, 4.30it/s] 154it [00:35, 4.29it/s] 155it [00:36, 4.22it/s] 156it [00:36, 4.32it/s] 157it [00:36, 4.28it/s] 158it [00:36, 4.34it/s] 159it [00:36, 4.44it/s] 160it [00:37, 4.51it/s] 161it [00:37, 4.41it/s] 162it [00:37, 4.46it/s] 163it [00:37, 4.52it/s] 164it [00:38, 4.37it/s] 165it [00:38, 4.32it/s] 166it [00:38, 4.41it/s] 167it [00:38, 4.20it/s] 168it [00:39, 4.27it/s] 169it [00:39, 4.23it/s] 170it [00:39, 4.36it/s] 171it [00:39, 4.31it/s] 172it [00:39, 4.39it/s] 173it [00:40, 4.33it/s] 174it [00:40, 4.15it/s] 175it [00:40, 4.26it/s] 176it [00:40, 4.23it/s] 177it [00:41, 4.26it/s] 178it [00:41, 4.23it/s] 179it [00:41, 4.27it/s] 180it [00:41, 4.23it/s] 181it [00:42, 4.23it/s] 182it [00:42, 4.22it/s] 183it [00:42, 4.35it/s] 184it [00:42, 4.42it/s] 185it [00:43, 4.47it/s] 186it [00:43, 4.50it/s] 187it [00:43, 4.51it/s] 188it [00:43, 4.43it/s] 189it [00:43, 4.34it/s] 190it [00:44, 4.41it/s] 191it [00:44, 4.34it/s] 192it [00:44, 4.16it/s] 193it [00:44, 4.17it/s] 194it [00:45, 4.26it/s] 195it [00:45, 4.26it/s] 196it [00:45, 4.24it/s] 196it [00:45, 4.29it/s] +2025-05-25 22:30:27,441 - INFO - Epoch: 82, Objective: tensor([1214.3734], device='cuda:0', grad_fn=), Loss: 0.005592620465904474, KL/n: 20.130046844482422 + 0it [00:00, ?it/s]2025-05-25 22:30:28,016 - INFO - [Epoch 083 | Batch 0000] IWAE-loss 1186.2911 | mean log_px -0.0061 | KL -989.00 + 1it [00:00, 3.07it/s] 2it [00:00, 3.89it/s] 3it [00:00, 4.24it/s] 4it [00:00, 4.38it/s] 5it [00:01, 4.52it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.63it/s] 8it [00:01, 4.64it/s] 9it [00:02, 4.66it/s] 10it [00:02, 4.67it/s] 11it [00:02, 4.68it/s] 12it [00:02, 4.52it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.62it/s] 15it [00:03, 4.65it/s] 16it [00:03, 4.67it/s] 17it [00:03, 4.69it/s] 18it [00:03, 4.69it/s] 19it [00:04, 4.70it/s] 20it [00:04, 4.69it/s] 21it [00:04, 4.53it/s] 22it [00:04, 4.59it/s] 23it [00:05, 4.63it/s] 24it [00:05, 4.64it/s] 25it [00:05, 4.65it/s] 26it [00:05, 4.66it/s] 27it [00:05, 4.52it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.62it/s] 30it [00:06, 4.64it/s] 31it [00:06, 4.66it/s] 32it [00:06, 4.62it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.67it/s] 36it [00:07, 4.66it/s] 37it [00:08, 4.68it/s] 38it [00:08, 4.51it/s] 39it [00:08, 4.58it/s] 40it [00:08, 4.62it/s] 41it [00:08, 4.64it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.64it/s] 44it [00:09, 4.65it/s] 45it [00:09, 4.66it/s] 46it [00:10, 4.66it/s] 47it [00:10, 4.68it/s] 48it [00:10, 4.69it/s] 49it [00:10, 4.53it/s] 50it [00:10, 4.59it/s]2025-05-25 22:30:38,796 - INFO - [Epoch 083 | Batch 0050] IWAE-loss 1646.4308 | mean log_px -0.0101 | KL -982.95 + 51it [00:11, 4.61it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.66it/s] 54it [00:11, 4.68it/s] 55it [00:11, 4.69it/s] 56it [00:12, 4.69it/s] 57it [00:12, 4.54it/s] 58it [00:12, 4.60it/s] 59it [00:12, 4.63it/s] 60it [00:13, 4.65it/s] 61it [00:13, 4.67it/s] 62it [00:13, 4.68it/s] 63it [00:13, 4.53it/s] 64it [00:13, 4.59it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.51it/s] 67it [00:14, 4.55it/s] 68it [00:14, 4.59it/s] 69it [00:14, 4.60it/s] 70it [00:15, 4.62it/s] 71it [00:15, 4.63it/s] 72it [00:15, 4.64it/s] 73it [00:15, 4.66it/s] 74it [00:16, 4.49it/s] 75it [00:16, 4.46it/s] 76it [00:16, 4.50it/s] 77it [00:16, 4.54it/s] 78it [00:16, 4.56it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.59it/s] 81it [00:17, 4.63it/s] 82it [00:17, 4.64it/s] 83it [00:18, 4.50it/s] 84it [00:18, 4.56it/s] 85it [00:18, 4.60it/s] 86it [00:18, 4.63it/s] 87it [00:18, 4.65it/s] 88it [00:19, 4.65it/s] 89it [00:19, 4.50it/s] 90it [00:19, 4.56it/s] 91it [00:19, 4.60it/s] 92it [00:20, 4.63it/s] 93it [00:20, 4.64it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.57it/s] 96it [00:20, 4.59it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.64it/s] 99it [00:21, 4.49it/s] 100it [00:21, 4.54it/s]2025-05-25 22:30:49,676 - INFO - [Epoch 083 | Batch 0100] IWAE-loss 1244.4196 | mean log_px -0.0098 | KL -981.24 + 101it [00:21, 4.58it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.63it/s] 105it [00:22, 4.65it/s] 106it [00:23, 4.66it/s] 107it [00:23, 4.68it/s] 108it [00:23, 4.66it/s] 109it [00:23, 4.68it/s] 110it [00:23, 4.68it/s] 111it [00:24, 4.69it/s] 112it [00:24, 4.69it/s] 113it [00:24, 4.53it/s] 114it [00:24, 4.58it/s] 115it [00:24, 4.60it/s] 116it [00:25, 4.63it/s] 117it [00:25, 4.66it/s] 118it [00:25, 4.50it/s] 119it [00:25, 4.57it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.64it/s] 122it [00:26, 4.65it/s] 123it [00:26, 4.65it/s] 124it [00:26, 4.66it/s] 125it [00:27, 4.68it/s] 126it [00:27, 4.68it/s] 127it [00:27, 4.53it/s] 128it [00:27, 4.58it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.65it/s] 132it [00:28, 4.65it/s] 133it [00:28, 4.65it/s] 134it [00:29, 4.52it/s] 135it [00:29, 4.58it/s] 136it [00:29, 4.59it/s] 137it [00:29, 4.61it/s] 138it [00:29, 4.62it/s] 139it [00:30, 4.65it/s] 140it [00:30, 4.66it/s] 141it [00:30, 4.67it/s] 142it [00:30, 4.68it/s] 143it [00:31, 4.69it/s] 144it [00:31, 4.69it/s] 145it [00:31, 4.69it/s] 146it [00:31, 4.68it/s] 147it [00:31, 4.69it/s] 148it [00:32, 4.64it/s] 149it [00:32, 4.46it/s] 150it [00:32, 4.54it/s]2025-05-25 22:31:00,483 - INFO - [Epoch 083 | Batch 0150] IWAE-loss 1072.7214 | mean log_px -0.0020 | KL -980.33 + 151it [00:32, 4.58it/s] 152it [00:32, 4.61it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.65it/s] 155it [00:33, 4.49it/s] 156it [00:33, 4.55it/s] 157it [00:34, 4.59it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.64it/s] 160it [00:34, 4.65it/s] 161it [00:34, 4.66it/s] 162it [00:35, 4.66it/s] 163it [00:35, 4.56it/s] 164it [00:35, 4.60it/s] 165it [00:35, 4.63it/s] 166it [00:36, 4.57it/s] 167it [00:36, 4.62it/s] 168it [00:36, 4.62it/s] 169it [00:36, 4.65it/s] 170it [00:36, 4.65it/s] 171it [00:37, 4.65it/s] 172it [00:37, 4.66it/s] 173it [00:37, 4.50it/s] 174it [00:37, 4.56it/s] 175it [00:37, 4.60it/s] 176it [00:38, 4.62it/s] 177it [00:38, 4.65it/s] 178it [00:38, 4.49it/s] 179it [00:38, 4.57it/s] 180it [00:39, 4.60it/s] 181it [00:39, 4.64it/s] 182it [00:39, 4.64it/s] 183it [00:39, 4.66it/s] 184it [00:39, 4.66it/s] 185it [00:40, 4.68it/s] 186it [00:40, 4.68it/s] 187it [00:40, 4.69it/s] 188it [00:40, 4.52it/s] 189it [00:41, 4.56it/s] 190it [00:41, 4.60it/s] 191it [00:41, 4.63it/s] 192it [00:41, 4.62it/s] 193it [00:41, 4.63it/s] 194it [00:42, 4.65it/s] 195it [00:42, 4.31it/s] 196it [00:42, 4.42it/s] 196it [00:42, 4.60it/s] +2025-05-25 22:31:10,408 - INFO - Epoch: 83, Objective: tensor([1636.0144], device='cuda:0', grad_fn=), Loss: 0.006700733210891485, KL/n: 19.999908447265625 + 0it [00:00, ?it/s]2025-05-25 22:31:10,762 - INFO - [Epoch 084 | Batch 0000] IWAE-loss 1054.2181 | mean log_px -0.0055 | KL -978.12 + 1it [00:00, 3.57it/s] 2it [00:00, 3.88it/s] 3it [00:00, 4.08it/s] 4it [00:00, 4.25it/s] 5it [00:01, 4.23it/s] 6it [00:01, 4.16it/s] 7it [00:01, 3.40it/s] 8it [00:02, 3.69it/s] 9it [00:02, 3.84it/s] 10it [00:02, 3.96it/s] 11it [00:02, 4.08it/s] 12it [00:03, 4.03it/s] 13it [00:03, 4.19it/s] 14it [00:03, 4.20it/s] 15it [00:03, 4.22it/s] 16it [00:03, 4.22it/s] 17it [00:04, 4.13it/s] 18it [00:04, 4.27it/s] 19it [00:04, 4.18it/s] 20it [00:04, 4.27it/s] 21it [00:05, 4.32it/s] 22it [00:05, 4.30it/s] 23it [00:05, 4.37it/s] 24it [00:05, 4.16it/s] 25it [00:06, 4.23it/s] 26it [00:06, 4.26it/s] 27it [00:06, 4.29it/s] 28it [00:06, 4.30it/s] 29it [00:07, 4.33it/s] 30it [00:07, 4.35it/s] 31it [00:07, 4.44it/s] 32it [00:07, 4.51it/s] 33it [00:07, 4.50it/s] 34it [00:08, 4.45it/s] 35it [00:08, 4.48it/s] 36it [00:08, 4.41it/s] 37it [00:08, 4.36it/s] 38it [00:09, 4.36it/s] 39it [00:09, 4.30it/s] 40it [00:09, 4.32it/s] 41it [00:09, 4.27it/s] 42it [00:09, 4.28it/s] 43it [00:10, 4.29it/s] 44it [00:10, 4.28it/s] 45it [00:10, 4.28it/s] 46it [00:10, 4.38it/s] 47it [00:11, 4.27it/s] 48it [00:11, 4.39it/s] 49it [00:11, 4.42it/s] 50it [00:11, 4.45it/s]2025-05-25 22:31:22,497 - INFO - [Epoch 084 | Batch 0050] IWAE-loss 1040.5332 | mean log_px -0.0009 | KL -971.92 + 51it [00:12, 4.48it/s] 52it [00:12, 4.35it/s] 53it [00:12, 4.46it/s] 54it [00:12, 4.37it/s] 55it [00:12, 4.33it/s] 56it [00:13, 4.30it/s] 57it [00:13, 4.17it/s] 58it [00:13, 4.17it/s] 59it [00:13, 4.20it/s] 60it [00:14, 4.29it/s] 61it [00:14, 4.22it/s] 62it [00:14, 4.12it/s] 63it [00:14, 4.17it/s] 64it [00:15, 4.21it/s] 65it [00:15, 4.22it/s] 66it [00:15, 4.34it/s] 67it [00:15, 4.28it/s] 68it [00:16, 4.37it/s] 69it [00:16, 4.34it/s] 70it [00:16, 4.32it/s] 71it [00:16, 4.28it/s] 72it [00:16, 4.26it/s] 73it [00:17, 4.29it/s] 74it [00:17, 4.30it/s] 75it [00:17, 4.28it/s] 76it [00:17, 4.26it/s] 77it [00:18, 4.23it/s] 78it [00:18, 4.24it/s] 79it [00:18, 4.28it/s] 80it [00:18, 4.35it/s] 81it [00:19, 4.41it/s] 82it [00:19, 4.33it/s] 83it [00:19, 4.30it/s] 84it [00:19, 4.38it/s] 85it [00:19, 4.41it/s] 86it [00:20, 4.29it/s] 87it [00:20, 4.28it/s] 88it [00:20, 4.40it/s] 89it [00:20, 4.30it/s] 90it [00:21, 4.31it/s] 91it [00:21, 4.33it/s] 92it [00:21, 4.38it/s] 93it [00:21, 4.22it/s] 94it [00:22, 4.22it/s] 95it [00:22, 4.31it/s] 96it [00:22, 4.24it/s] 97it [00:22, 4.33it/s] 98it [00:22, 4.35it/s] 99it [00:23, 4.32it/s] 100it [00:23, 4.18it/s]2025-05-25 22:31:34,173 - INFO - [Epoch 084 | Batch 0100] IWAE-loss 1327.8715 | mean log_px -0.0200 | KL -971.95 + 101it [00:23, 4.29it/s] 102it [00:23, 4.24it/s] 103it [00:24, 4.27it/s] 104it [00:24, 4.36it/s] 105it [00:24, 4.31it/s] 106it [00:24, 4.31it/s] 107it [00:25, 4.30it/s] 108it [00:25, 4.28it/s] 109it [00:25, 4.38it/s] 110it [00:25, 4.33it/s] 111it [00:26, 4.31it/s] 112it [00:26, 4.16it/s] 113it [00:26, 4.18it/s] 114it [00:26, 4.18it/s] 115it [00:26, 4.21it/s] 116it [00:27, 4.29it/s] 117it [00:27, 4.39it/s] 118it [00:27, 4.34it/s] 119it [00:27, 4.25it/s] 120it [00:28, 4.25it/s] 121it [00:28, 4.33it/s] 122it [00:28, 4.32it/s] 123it [00:28, 4.34it/s] 124it [00:29, 4.30it/s] 125it [00:29, 4.39it/s] 126it [00:29, 4.34it/s] 127it [00:29, 4.43it/s] 128it [00:29, 4.33it/s] 129it [00:30, 4.30it/s] 130it [00:30, 4.26it/s] 131it [00:30, 4.16it/s] 132it [00:30, 4.16it/s] 133it [00:31, 4.18it/s] 134it [00:31, 4.21it/s] 135it [00:31, 4.15it/s] 136it [00:31, 4.15it/s] 137it [00:32, 4.27it/s] 138it [00:32, 4.23it/s] 139it [00:32, 4.33it/s] 140it [00:32, 4.13it/s] 141it [00:33, 4.18it/s] 142it [00:33, 4.27it/s] 143it [00:33, 4.26it/s] 144it [00:33, 4.26it/s] 145it [00:34, 4.23it/s] 146it [00:34, 4.10it/s] 147it [00:34, 4.24it/s] 148it [00:34, 4.22it/s] 149it [00:34, 4.27it/s] 150it [00:35, 4.22it/s]2025-05-25 22:31:45,917 - INFO - [Epoch 084 | Batch 0150] IWAE-loss 1146.8926 | mean log_px -0.0061 | KL -970.53 + 151it [00:35, 4.20it/s] 152it [00:35, 4.23it/s] 153it [00:35, 4.09it/s] 154it [00:36, 4.10it/s] 155it [00:36, 4.10it/s] 156it [00:36, 4.15it/s] 157it [00:36, 4.12it/s] 158it [00:37, 4.10it/s] 159it [00:37, 4.10it/s] 160it [00:37, 3.96it/s] 161it [00:37, 4.14it/s] 162it [00:38, 4.29it/s] 163it [00:38, 4.29it/s] 164it [00:38, 4.29it/s] 165it [00:38, 4.41it/s] 166it [00:39, 4.18it/s] 167it [00:39, 4.24it/s] 168it [00:39, 4.27it/s] 169it [00:39, 4.28it/s] 170it [00:39, 4.29it/s] 171it [00:40, 4.32it/s] 172it [00:40, 4.30it/s] 173it [00:40, 4.29it/s] 174it [00:40, 4.32it/s] 175it [00:41, 4.38it/s] 176it [00:41, 4.22it/s] 177it [00:41, 4.29it/s] 178it [00:41, 4.25it/s] 179it [00:42, 4.38it/s] 180it [00:42, 4.31it/s] 181it [00:42, 4.21it/s] 182it [00:42, 4.26it/s] 183it [00:42, 4.29it/s] 184it [00:43, 4.33it/s] 185it [00:43, 4.36it/s] 186it [00:43, 4.25it/s] 187it [00:43, 4.32it/s] 188it [00:44, 4.43it/s] 189it [00:44, 4.49it/s] 190it [00:44, 4.36it/s] 191it [00:44, 4.36it/s] 192it [00:45, 4.41it/s] 193it [00:45, 4.36it/s] 194it [00:45, 4.43it/s] 195it [00:45, 4.25it/s] 196it [00:45, 4.26it/s] 196it [00:46, 4.26it/s] +2025-05-25 22:31:56,602 - INFO - Epoch: 84, Objective: tensor([1178.6591], device='cuda:0', grad_fn=), Loss: 0.002942966530099511, KL/n: 19.77838897705078 + 0it [00:00, ?it/s]2025-05-25 22:31:57,007 - INFO - [Epoch 085 | Batch 0000] IWAE-loss 1131.1300 | mean log_px -0.0023 | KL -968.19 + 1it [00:00, 2.95it/s] 2it [00:00, 3.62it/s] 3it [00:00, 4.03it/s] 4it [00:00, 4.28it/s] 5it [00:01, 4.26it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.53it/s] 8it [00:01, 4.59it/s] 9it [00:02, 4.64it/s] 10it [00:02, 4.66it/s] 11it [00:02, 4.69it/s] 12it [00:02, 4.70it/s] 13it [00:02, 4.71it/s] 14it [00:03, 4.58it/s] 15it [00:03, 4.65it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.49it/s] 18it [00:04, 4.56it/s] 19it [00:04, 4.45it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.57it/s] 22it [00:04, 4.61it/s] 23it [00:05, 4.64it/s] 24it [00:05, 4.67it/s] 25it [00:05, 4.69it/s] 26it [00:05, 4.70it/s] 27it [00:05, 4.70it/s] 28it [00:06, 4.55it/s] 29it [00:06, 4.62it/s] 30it [00:06, 4.64it/s] 31it [00:06, 4.67it/s] 32it [00:07, 4.68it/s] 33it [00:07, 4.53it/s] 34it [00:07, 4.60it/s] 35it [00:07, 4.64it/s] 36it [00:07, 4.55it/s] 37it [00:08, 4.56it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.58it/s] 40it [00:08, 4.57it/s] 41it [00:09, 4.44it/s] 42it [00:09, 4.50it/s] 43it [00:09, 4.48it/s] 44it [00:09, 4.50it/s] 45it [00:09, 4.55it/s] 46it [00:10, 4.56it/s] 47it [00:10, 4.45it/s] 48it [00:10, 4.49it/s] 49it [00:10, 4.53it/s] 50it [00:11, 4.56it/s]2025-05-25 22:32:07,922 - INFO - [Epoch 085 | Batch 0050] IWAE-loss 1197.8279 | mean log_px -0.0056 | KL -967.47 + 51it [00:11, 4.58it/s] 52it [00:11, 4.59it/s] 53it [00:11, 4.58it/s] 54it [00:11, 4.58it/s] 55it [00:12, 4.59it/s] 56it [00:12, 4.60it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.61it/s] 59it [00:12, 4.61it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.62it/s] 62it [00:13, 4.61it/s] 63it [00:13, 4.61it/s] 64it [00:14, 4.59it/s] 65it [00:14, 4.60it/s] 66it [00:14, 4.37it/s] 67it [00:14, 4.48it/s] 68it [00:14, 4.53it/s] 69it [00:15, 4.59it/s] 70it [00:15, 4.62it/s] 71it [00:15, 4.67it/s] 72it [00:15, 4.68it/s] 73it [00:16, 4.67it/s] 74it [00:16, 4.53it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.64it/s] 77it [00:16, 4.68it/s] 78it [00:17, 4.70it/s] 79it [00:17, 4.71it/s] 80it [00:17, 4.72it/s] 81it [00:17, 4.73it/s] 82it [00:17, 4.69it/s] 83it [00:18, 4.55it/s] 84it [00:18, 4.61it/s] 85it [00:18, 4.66it/s] 86it [00:18, 4.68it/s] 87it [00:19, 4.69it/s] 88it [00:19, 4.70it/s] 89it [00:19, 4.55it/s] 90it [00:19, 4.62it/s] 91it [00:19, 4.65it/s] 92it [00:20, 4.67it/s] 93it [00:20, 4.70it/s] 94it [00:20, 4.71it/s] 95it [00:20, 4.72it/s] 96it [00:20, 4.72it/s] 97it [00:21, 4.68it/s] 98it [00:21, 4.52it/s] 99it [00:21, 4.60it/s] 100it [00:21, 4.63it/s]2025-05-25 22:32:18,722 - INFO - [Epoch 085 | Batch 0100] IWAE-loss 1239.2491 | mean log_px -0.0051 | KL -968.42 + 101it [00:22, 4.66it/s] 102it [00:22, 4.68it/s] 103it [00:22, 4.53it/s] 104it [00:22, 4.60it/s] 105it [00:22, 4.63it/s] 106it [00:23, 4.64it/s] 107it [00:23, 4.66it/s] 108it [00:23, 4.52it/s] 109it [00:23, 4.60it/s] 110it [00:23, 4.64it/s] 111it [00:24, 4.67it/s] 112it [00:24, 4.69it/s] 113it [00:24, 4.71it/s] 114it [00:24, 4.55it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.65it/s] 117it [00:25, 4.68it/s] 118it [00:25, 4.70it/s] 119it [00:25, 4.70it/s] 120it [00:26, 4.71it/s] 121it [00:26, 4.73it/s] 122it [00:26, 4.71it/s] 123it [00:26, 4.73it/s] 124it [00:26, 4.73it/s] 125it [00:27, 4.74it/s] 126it [00:27, 4.73it/s] 127it [00:27, 4.74it/s] 128it [00:27, 4.73it/s] 129it [00:28, 4.73it/s] 130it [00:28, 4.73it/s] 131it [00:28, 4.56it/s] 132it [00:28, 4.60it/s] 133it [00:28, 4.64it/s] 134it [00:29, 4.67it/s] 135it [00:29, 4.70it/s] 136it [00:29, 4.71it/s] 137it [00:29, 4.72it/s] 138it [00:29, 4.54it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.62it/s] 141it [00:30, 4.65it/s] 142it [00:30, 4.67it/s] 143it [00:31, 4.68it/s] 144it [00:31, 4.69it/s] 145it [00:31, 4.70it/s] 146it [00:31, 4.59it/s] 147it [00:31, 4.63it/s] 148it [00:32, 4.66it/s] 149it [00:32, 4.69it/s] 150it [00:32, 4.70it/s]2025-05-25 22:32:29,438 - INFO - [Epoch 085 | Batch 0150] IWAE-loss 1040.0924 | mean log_px -0.0081 | KL -968.21 + 151it [00:32, 4.54it/s] 152it [00:32, 4.60it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.66it/s] 155it [00:33, 4.69it/s] 156it [00:33, 4.53it/s] 157it [00:34, 4.60it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.66it/s] 160it [00:34, 4.67it/s] 161it [00:34, 4.68it/s] 162it [00:35, 4.67it/s] 163it [00:35, 4.70it/s] 164it [00:35, 4.70it/s] 165it [00:35, 4.55it/s] 166it [00:36, 4.60it/s] 167it [00:36, 4.63it/s] 168it [00:36, 4.66it/s] 169it [00:36, 4.67it/s] 170it [00:36, 4.52it/s] 171it [00:37, 4.58it/s] 172it [00:37, 4.60it/s] 173it [00:37, 4.65it/s] 174it [00:37, 4.68it/s] 175it [00:37, 4.67it/s] 176it [00:38, 4.68it/s] 177it [00:38, 4.66it/s] 178it [00:38, 4.50it/s] 179it [00:38, 4.59it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.66it/s] 182it [00:39, 4.68it/s] 183it [00:39, 4.52it/s] 184it [00:39, 4.59it/s] 185it [00:40, 4.62it/s] 186it [00:40, 4.64it/s] 187it [00:40, 4.67it/s] 188it [00:40, 4.68it/s] 189it [00:40, 4.70it/s] 190it [00:41, 4.71it/s] 191it [00:41, 4.55it/s] 192it [00:41, 4.61it/s] 193it [00:41, 4.64it/s] 194it [00:42, 4.66it/s] 195it [00:42, 4.45it/s] 196it [00:42, 4.24it/s] 196it [00:42, 4.60it/s] +2025-05-25 22:32:39,364 - INFO - Epoch: 85, Objective: tensor([1487.8380], device='cuda:0', grad_fn=), Loss: 0.007994958199560642, KL/n: 19.7778263092041 + 0it [00:00, ?it/s]2025-05-25 22:32:39,950 - INFO - [Epoch 086 | Batch 0000] IWAE-loss 1127.4233 | mean log_px -0.0047 | KL -967.19 + 1it [00:00, 3.01it/s] 2it [00:00, 3.64it/s] 3it [00:00, 4.02it/s] 4it [00:01, 4.24it/s] 5it [00:01, 4.29it/s] 6it [00:01, 4.40it/s] 7it [00:01, 4.33it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.43it/s] 10it [00:02, 4.47it/s] 11it [00:02, 4.30it/s] 12it [00:02, 4.26it/s] 13it [00:03, 4.30it/s] 14it [00:03, 4.41it/s] 15it [00:03, 4.49it/s] 16it [00:03, 4.56it/s] 17it [00:03, 4.61it/s] 18it [00:04, 4.63it/s] 19it [00:04, 4.47it/s] 20it [00:04, 4.38it/s] 21it [00:04, 4.36it/s] 22it [00:05, 4.44it/s] 23it [00:05, 4.51it/s] 24it [00:05, 4.42it/s] 25it [00:05, 4.36it/s] 26it [00:05, 4.21it/s] 27it [00:06, 4.34it/s] 28it [00:06, 4.28it/s] 29it [00:06, 4.27it/s] 30it [00:06, 4.23it/s] 31it [00:07, 4.24it/s] 32it [00:07, 4.16it/s] 33it [00:07, 4.19it/s] 34it [00:07, 4.19it/s] 35it [00:08, 4.26it/s] 36it [00:08, 4.36it/s] 37it [00:08, 4.46it/s] 38it [00:08, 4.22it/s] 39it [00:09, 4.37it/s] 40it [00:09, 4.34it/s] 41it [00:09, 4.40it/s] 42it [00:09, 4.30it/s] 43it [00:09, 4.30it/s] 44it [00:10, 4.36it/s] 45it [00:10, 4.31it/s] 46it [00:10, 4.14it/s] 47it [00:10, 4.20it/s] 48it [00:11, 4.20it/s] 49it [00:11, 4.32it/s] 50it [00:11, 4.42it/s]2025-05-25 22:32:51,409 - INFO - [Epoch 086 | Batch 0050] IWAE-loss 1551.1642 | mean log_px -0.0101 | KL -964.08 + 51it [00:11, 4.51it/s] 52it [00:12, 4.38it/s] 53it [00:12, 4.36it/s] 54it [00:12, 4.46it/s] 55it [00:12, 4.39it/s] 56it [00:12, 4.33it/s] 57it [00:13, 4.31it/s] 58it [00:13, 4.30it/s] 59it [00:13, 4.27it/s] 60it [00:13, 4.39it/s] 61it [00:14, 4.39it/s] 62it [00:14, 4.43it/s] 63it [00:14, 4.39it/s] 64it [00:14, 4.20it/s] 65it [00:15, 4.25it/s] 66it [00:15, 4.26it/s] 67it [00:15, 4.27it/s] 68it [00:15, 4.25it/s] 69it [00:15, 4.23it/s] 70it [00:16, 4.08it/s] 71it [00:16, 4.16it/s] 72it [00:16, 4.17it/s] 73it [00:16, 4.29it/s] 74it [00:17, 4.39it/s] 75it [00:17, 4.48it/s] 76it [00:17, 4.37it/s] 77it [00:17, 4.45it/s] 78it [00:18, 4.36it/s] 79it [00:18, 4.44it/s] 80it [00:18, 4.36it/s] 81it [00:18, 4.21it/s] 82it [00:18, 4.35it/s] 83it [00:19, 4.28it/s] 84it [00:19, 4.39it/s] 85it [00:19, 4.49it/s] 86it [00:19, 4.54it/s] 87it [00:20, 4.53it/s] 88it [00:20, 4.58it/s] 89it [00:20, 4.51it/s] 90it [00:20, 4.28it/s] 91it [00:21, 4.29it/s] 92it [00:21, 4.26it/s] 93it [00:21, 4.24it/s] 94it [00:21, 4.28it/s] 95it [00:21, 4.39it/s] 96it [00:22, 4.30it/s] 97it [00:22, 4.36it/s] 98it [00:22, 4.42it/s] 99it [00:22, 4.33it/s] 100it [00:23, 4.19it/s]2025-05-25 22:33:02,980 - INFO - [Epoch 086 | Batch 0100] IWAE-loss 1123.9008 | mean log_px -0.0059 | KL -964.63 + 101it [00:23, 4.19it/s] 102it [00:23, 4.20it/s] 103it [00:23, 4.34it/s] 104it [00:24, 4.44it/s] 105it [00:24, 4.51it/s] 106it [00:24, 4.56it/s] 107it [00:24, 4.26it/s] 108it [00:24, 4.26it/s] 109it [00:25, 4.24it/s] 110it [00:25, 4.22it/s] 111it [00:25, 4.22it/s] 112it [00:25, 4.22it/s] 113it [00:26, 4.24it/s] 114it [00:26, 4.14it/s] 115it [00:26, 4.18it/s] 116it [00:26, 4.30it/s] 117it [00:27, 4.26it/s] 118it [00:27, 4.24it/s] 119it [00:27, 4.24it/s] 120it [00:27, 4.16it/s] 121it [00:28, 4.18it/s] 122it [00:28, 4.31it/s] 123it [00:28, 4.42it/s] 124it [00:28, 4.48it/s] 125it [00:28, 4.23it/s] 126it [00:29, 4.35it/s] 127it [00:29, 4.44it/s] 128it [00:29, 4.52it/s] 129it [00:29, 4.55it/s] 130it [00:30, 4.59it/s] 131it [00:30, 4.44it/s] 132it [00:30, 4.39it/s] 133it [00:30, 4.24it/s] 134it [00:30, 4.39it/s] 135it [00:31, 4.33it/s] 136it [00:31, 4.29it/s] 137it [00:31, 4.33it/s] 138it [00:31, 4.31it/s] 139it [00:32, 4.31it/s] 140it [00:32, 4.30it/s] 141it [00:32, 4.40it/s] 142it [00:32, 4.32it/s] 143it [00:33, 4.43it/s] 144it [00:33, 4.35it/s] 145it [00:33, 4.33it/s] 146it [00:33, 4.34it/s] 147it [00:33, 4.29it/s] 148it [00:34, 4.31it/s] 149it [00:34, 4.29it/s] 150it [00:34, 4.15it/s]2025-05-25 22:33:14,564 - INFO - [Epoch 086 | Batch 0150] IWAE-loss 1505.1322 | mean log_px -0.0137 | KL -965.18 + 151it [00:34, 4.19it/s] 152it [00:35, 4.32it/s] 153it [00:35, 4.42it/s] 154it [00:35, 4.32it/s] 155it [00:35, 4.30it/s] 156it [00:36, 4.40it/s] 157it [00:36, 4.29it/s] 158it [00:36, 4.42it/s] 159it [00:36, 4.47it/s] 160it [00:36, 4.32it/s] 161it [00:37, 4.24it/s] 162it [00:37, 4.36it/s] 163it [00:37, 4.32it/s] 164it [00:37, 4.28it/s] 165it [00:38, 4.27it/s] 166it [00:38, 4.39it/s] 167it [00:38, 4.36it/s] 168it [00:38, 4.32it/s] 169it [00:39, 4.42it/s] 170it [00:39, 4.50it/s] 171it [00:39, 4.57it/s] 172it [00:39, 4.43it/s] 173it [00:39, 4.37it/s] 174it [00:40, 4.39it/s] 175it [00:40, 4.38it/s] 176it [00:40, 4.18it/s] 177it [00:40, 4.18it/s] 178it [00:41, 4.21it/s] 179it [00:41, 4.20it/s] 180it [00:41, 4.17it/s] 181it [00:41, 4.31it/s] 182it [00:42, 4.24it/s] 183it [00:42, 4.21it/s] 184it [00:42, 4.25it/s] 185it [00:42, 4.23it/s] 186it [00:43, 4.10it/s] 187it [00:43, 4.14it/s] 188it [00:43, 4.18it/s] 189it [00:43, 4.18it/s] 190it [00:44, 4.21it/s] 191it [00:44, 4.20it/s] 192it [00:44, 4.20it/s] 193it [00:44, 4.20it/s] 194it [00:44, 4.33it/s] 195it [00:45, 4.19it/s] 196it [00:45, 4.32it/s] 196it [00:45, 4.31it/s] +2025-05-25 22:33:25,157 - INFO - Epoch: 86, Objective: tensor([1302.8038], device='cuda:0', grad_fn=), Loss: 0.0075148637406528, KL/n: 19.660505294799805 + 0it [00:00, ?it/s]2025-05-25 22:33:25,552 - INFO - [Epoch 087 | Batch 0000] IWAE-loss 1044.9692 | mean log_px -0.0016 | KL -964.23 + 1it [00:00, 3.09it/s] 2it [00:00, 3.84it/s] 3it [00:00, 4.19it/s] 4it [00:00, 4.38it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.49it/s] 7it [00:01, 4.58it/s] 8it [00:01, 4.61it/s] 9it [00:02, 4.65it/s] 10it [00:02, 4.66it/s] 11it [00:02, 4.69it/s] 12it [00:02, 4.70it/s] 13it [00:02, 4.70it/s] 14it [00:03, 4.49it/s] 15it [00:03, 4.58it/s] 16it [00:03, 4.61it/s] 17it [00:03, 4.65it/s] 18it [00:04, 4.50it/s] 19it [00:04, 4.58it/s] 20it [00:04, 4.58it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.66it/s] 23it [00:05, 4.69it/s] 24it [00:05, 4.70it/s] 25it [00:05, 4.71it/s] 26it [00:05, 4.71it/s] 27it [00:05, 4.56it/s] 28it [00:06, 4.62it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.67it/s] 32it [00:06, 4.69it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.68it/s] 35it [00:07, 4.52it/s] 36it [00:07, 4.59it/s] 37it [00:08, 4.63it/s] 38it [00:08, 4.64it/s] 39it [00:08, 3.71it/s] 40it [00:08, 3.93it/s] 41it [00:09, 4.14it/s] 42it [00:09, 4.29it/s] 43it [00:09, 4.42it/s] 44it [00:09, 4.50it/s] 45it [00:09, 4.45it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.63it/s] 49it [00:10, 4.66it/s] 50it [00:11, 4.52it/s]2025-05-25 22:33:36,518 - INFO - [Epoch 087 | Batch 0050] IWAE-loss 1112.0288 | mean log_px -0.0045 | KL -961.18 + 51it [00:11, 4.58it/s] 52it [00:11, 4.61it/s] 53it [00:11, 4.65it/s] 54it [00:11, 4.67it/s] 55it [00:12, 4.69it/s] 56it [00:12, 4.70it/s] 57it [00:12, 4.55it/s] 58it [00:12, 4.62it/s] 59it [00:13, 4.66it/s] 60it [00:13, 4.68it/s] 61it [00:13, 4.71it/s] 62it [00:13, 4.71it/s] 63it [00:13, 4.72it/s] 64it [00:14, 4.72it/s] 65it [00:14, 4.71it/s] 66it [00:14, 4.51it/s] 67it [00:14, 4.58it/s] 68it [00:14, 4.60it/s] 69it [00:15, 4.65it/s] 70it [00:15, 4.66it/s] 71it [00:15, 4.68it/s] 72it [00:15, 4.69it/s] 73it [00:16, 4.53it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.64it/s] 77it [00:16, 4.67it/s] 78it [00:17, 4.51it/s] 79it [00:17, 4.57it/s] 80it [00:17, 4.62it/s] 81it [00:17, 4.65it/s] 82it [00:17, 4.67it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.66it/s] 86it [00:18, 4.67it/s] 87it [00:19, 4.53it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.68it/s] 92it [00:20, 4.69it/s] 93it [00:20, 4.71it/s] 94it [00:20, 4.71it/s] 95it [00:20, 4.72it/s] 96it [00:20, 4.72it/s] 97it [00:21, 4.55it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.63it/s] 100it [00:21, 4.66it/s]2025-05-25 22:33:47,280 - INFO - [Epoch 087 | Batch 0100] IWAE-loss 1093.4396 | mean log_px -0.0022 | KL -958.57 + 101it [00:22, 4.67it/s] 102it [00:22, 4.67it/s] 103it [00:22, 4.52it/s] 104it [00:22, 4.59it/s] 105it [00:22, 4.63it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.65it/s] 108it [00:23, 4.66it/s] 109it [00:23, 4.69it/s] 110it [00:23, 4.68it/s] 111it [00:24, 4.53it/s] 112it [00:24, 4.60it/s] 113it [00:24, 4.64it/s] 114it [00:24, 4.66it/s] 115it [00:25, 4.68it/s] 116it [00:25, 4.69it/s] 117it [00:25, 4.72it/s] 118it [00:25, 4.71it/s] 119it [00:25, 4.67it/s] 120it [00:26, 4.71it/s] 121it [00:26, 4.72it/s] 122it [00:26, 4.72it/s] 123it [00:26, 4.68it/s] 124it [00:27, 4.46it/s] 125it [00:27, 4.54it/s] 126it [00:27, 4.59it/s] 127it [00:27, 4.63it/s] 128it [00:27, 4.66it/s] 129it [00:28, 4.52it/s] 130it [00:28, 4.60it/s] 131it [00:28, 4.63it/s] 132it [00:28, 4.65it/s] 133it [00:28, 4.68it/s] 134it [00:29, 4.69it/s] 135it [00:29, 4.53it/s] 136it [00:29, 4.60it/s] 137it [00:29, 4.64it/s] 138it [00:30, 4.66it/s] 139it [00:30, 4.69it/s] 140it [00:30, 4.70it/s] 141it [00:30, 4.71it/s] 142it [00:30, 4.71it/s] 143it [00:31, 4.72it/s] 144it [00:31, 4.71it/s] 145it [00:31, 4.72it/s] 146it [00:31, 4.72it/s] 147it [00:31, 4.71it/s] 148it [00:32, 4.67it/s] 149it [00:32, 4.66it/s] 150it [00:32, 4.64it/s]2025-05-25 22:33:58,031 - INFO - [Epoch 087 | Batch 0150] IWAE-loss 1118.8979 | mean log_px -0.0022 | KL -959.16 + 151it [00:32, 4.51it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.63it/s] 154it [00:33, 4.66it/s] 155it [00:33, 4.68it/s] 156it [00:33, 4.69it/s] 157it [00:34, 4.70it/s] 158it [00:34, 4.65it/s] 159it [00:34, 4.68it/s] 160it [00:34, 4.69it/s] 161it [00:34, 4.70it/s] 162it [00:35, 4.71it/s] 163it [00:35, 4.71it/s] 164it [00:35, 4.71it/s] 165it [00:35, 4.72it/s] 166it [00:36, 4.72it/s] 167it [00:36, 4.70it/s] 168it [00:36, 4.71it/s] 169it [00:36, 4.71it/s] 170it [00:36, 4.71it/s] 171it [00:37, 4.72it/s] 172it [00:37, 4.70it/s] 173it [00:37, 4.70it/s] 174it [00:37, 4.70it/s] 175it [00:37, 4.72it/s] 176it [00:38, 4.72it/s] 177it [00:38, 4.56it/s] 178it [00:38, 4.62it/s] 179it [00:38, 4.67it/s] 180it [00:38, 4.68it/s] 181it [00:39, 4.69it/s] 182it [00:39, 4.69it/s] 183it [00:39, 4.70it/s] 184it [00:39, 4.52it/s] 185it [00:40, 4.59it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.66it/s] 188it [00:40, 4.66it/s] 189it [00:40, 4.69it/s] 190it [00:41, 4.69it/s] 191it [00:41, 4.53it/s] 192it [00:41, 4.60it/s] 193it [00:41, 4.65it/s] 194it [00:42, 4.66it/s] 195it [00:42, 4.46it/s] 196it [00:42, 4.44it/s] 196it [00:42, 4.61it/s] +2025-05-25 22:34:07,849 - INFO - Epoch: 87, Objective: tensor([1106.9209], device='cuda:0', grad_fn=), Loss: 0.006249045487493277, KL/n: 19.581295013427734 + 0it [00:00, ?it/s]2025-05-25 22:34:08,259 - INFO - [Epoch 088 | Batch 0000] IWAE-loss 1091.5936 | mean log_px -0.0041 | KL -957.80 + 1it [00:00, 2.75it/s] 2it [00:00, 3.47it/s] 3it [00:00, 3.82it/s] 4it [00:01, 4.12it/s] 5it [00:01, 4.29it/s] 6it [00:01, 4.42it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.54it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.36it/s] 12it [00:02, 4.44it/s] 13it [00:03, 4.49it/s] 14it [00:03, 4.40it/s] 15it [00:03, 4.45it/s] 16it [00:03, 4.50it/s] 17it [00:03, 4.41it/s] 18it [00:04, 4.45it/s] 19it [00:04, 4.53it/s] 20it [00:04, 4.43it/s] 21it [00:04, 4.39it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.23it/s] 24it [00:05, 4.27it/s] 25it [00:05, 4.31it/s] 26it [00:06, 4.34it/s] 27it [00:06, 4.27it/s] 28it [00:06, 4.36it/s] 29it [00:06, 4.38it/s] 30it [00:06, 4.31it/s] 31it [00:07, 4.29it/s] 32it [00:07, 4.37it/s] 33it [00:07, 4.46it/s] 34it [00:07, 4.53it/s] 35it [00:08, 4.41it/s] 36it [00:08, 4.42it/s] 37it [00:08, 4.38it/s] 38it [00:08, 4.38it/s] 39it [00:09, 4.17it/s] 40it [00:09, 4.32it/s] 41it [00:09, 4.42it/s] 42it [00:09, 4.40it/s] 43it [00:09, 4.33it/s] 44it [00:10, 4.32it/s] 45it [00:10, 4.42it/s] 46it [00:10, 4.49it/s] 47it [00:10, 4.55it/s] 48it [00:11, 4.52it/s] 49it [00:11, 4.42it/s] 50it [00:11, 4.36it/s]2025-05-25 22:34:19,630 - INFO - [Epoch 088 | Batch 0050] IWAE-loss 1129.9476 | mean log_px -0.0060 | KL -957.38 + 51it [00:11, 4.36it/s] 52it [00:11, 4.29it/s] 53it [00:12, 4.28it/s] 54it [00:12, 4.24it/s] 55it [00:12, 4.32it/s] 56it [00:12, 4.39it/s] 57it [00:13, 4.37it/s] 58it [00:13, 4.20it/s] 59it [00:13, 4.27it/s] 60it [00:13, 4.27it/s] 61it [00:14, 4.23it/s] 62it [00:14, 4.27it/s] 63it [00:14, 4.28it/s] 64it [00:14, 4.14it/s] 65it [00:15, 4.14it/s] 66it [00:15, 4.17it/s] 67it [00:15, 4.16it/s] 68it [00:15, 4.14it/s] 69it [00:15, 4.14it/s] 70it [00:16, 4.14it/s] 71it [00:16, 4.29it/s] 72it [00:16, 4.39it/s] 73it [00:16, 4.48it/s] 74it [00:17, 4.53it/s] 75it [00:17, 4.43it/s] 76it [00:17, 4.27it/s] 77it [00:17, 4.25it/s] 78it [00:18, 4.27it/s] 79it [00:18, 4.36it/s] 80it [00:18, 4.43it/s] 81it [00:18, 4.49it/s] 82it [00:18, 4.38it/s] 83it [00:19, 4.45it/s] 84it [00:19, 4.41it/s] 85it [00:19, 4.38it/s] 86it [00:19, 4.31it/s] 87it [00:20, 4.30it/s] 88it [00:20, 4.30it/s] 89it [00:20, 4.28it/s] 90it [00:20, 4.32it/s] 91it [00:21, 4.28it/s] 92it [00:21, 4.28it/s] 93it [00:21, 4.35it/s] 94it [00:21, 4.42it/s] 95it [00:21, 4.47it/s] 96it [00:22, 4.51it/s] 97it [00:22, 4.39it/s] 98it [00:22, 4.44it/s] 99it [00:22, 4.46it/s] 100it [00:23, 4.41it/s]2025-05-25 22:34:31,195 - INFO - [Epoch 088 | Batch 0100] IWAE-loss 1050.3236 | mean log_px -0.0014 | KL -958.19 + 101it [00:23, 4.41it/s] 102it [00:23, 4.47it/s] 103it [00:23, 4.40it/s] 104it [00:23, 4.43it/s] 105it [00:24, 4.40it/s] 106it [00:24, 4.44it/s] 107it [00:24, 4.38it/s] 108it [00:24, 4.35it/s] 109it [00:25, 4.30it/s] 110it [00:25, 4.37it/s] 111it [00:25, 4.31it/s] 112it [00:25, 4.31it/s] 113it [00:26, 4.38it/s] 114it [00:26, 4.39it/s] 115it [00:26, 4.46it/s] 116it [00:26, 4.35it/s] 117it [00:26, 4.39it/s] 118it [00:27, 4.35it/s] 119it [00:27, 4.39it/s] 120it [00:27, 4.33it/s] 121it [00:27, 4.30it/s] 122it [00:28, 4.26it/s] 123it [00:28, 4.34it/s] 124it [00:28, 4.27it/s] 125it [00:28, 4.36it/s] 126it [00:29, 4.40it/s] 127it [00:29, 4.27it/s] 128it [00:29, 4.30it/s] 129it [00:29, 4.36it/s] 130it [00:29, 4.38it/s] 131it [00:30, 4.26it/s] 132it [00:30, 4.23it/s] 133it [00:30, 4.21it/s] 134it [00:30, 4.32it/s] 135it [00:31, 4.33it/s] 136it [00:31, 4.32it/s] 137it [00:31, 4.28it/s] 138it [00:31, 4.34it/s] 139it [00:32, 4.33it/s] 140it [00:32, 4.27it/s] 141it [00:32, 4.12it/s] 142it [00:32, 4.23it/s] 143it [00:33, 4.20it/s] 144it [00:33, 4.24it/s] 145it [00:33, 4.30it/s] 146it [00:33, 4.26it/s] 147it [00:33, 4.11it/s] 148it [00:34, 4.13it/s] 149it [00:34, 4.19it/s] 150it [00:34, 4.27it/s]2025-05-25 22:34:42,819 - INFO - [Epoch 088 | Batch 0150] IWAE-loss 1027.6443 | mean log_px -0.0013 | KL -960.73 + 151it [00:34, 4.22it/s] 152it [00:35, 4.33it/s] 153it [00:35, 4.40it/s] 154it [00:35, 4.38it/s] 155it [00:35, 4.36it/s] 156it [00:36, 4.43it/s] 157it [00:36, 4.47it/s] 158it [00:36, 4.49it/s] 159it [00:36, 4.45it/s] 160it [00:36, 4.24it/s] 161it [00:37, 4.14it/s] 162it [00:37, 4.11it/s] 163it [00:37, 4.23it/s] 164it [00:37, 4.32it/s] 165it [00:38, 4.36it/s] 166it [00:38, 4.33it/s] 167it [00:38, 4.22it/s] 168it [00:38, 4.32it/s] 169it [00:39, 4.38it/s] 170it [00:39, 4.42it/s] 171it [00:39, 4.35it/s] 172it [00:39, 4.35it/s] 173it [00:39, 4.39it/s] 174it [00:40, 4.44it/s] 175it [00:40, 4.28it/s] 176it [00:40, 4.28it/s] 177it [00:40, 4.27it/s] 178it [00:41, 4.10it/s] 179it [00:41, 4.12it/s] 180it [00:41, 4.15it/s] 181it [00:41, 4.13it/s] 182it [00:42, 4.16it/s] 183it [00:42, 4.13it/s] 184it [00:42, 4.12it/s] 185it [00:42, 4.23it/s] 186it [00:43, 4.29it/s] 187it [00:43, 4.14it/s] 188it [00:43, 4.12it/s] 189it [00:43, 4.14it/s] 190it [00:44, 4.17it/s] 191it [00:44, 4.26it/s] 192it [00:44, 4.09it/s] 193it [00:44, 4.12it/s] 194it [00:44, 4.21it/s] 195it [00:45, 4.17it/s] 196it [00:45, 4.29it/s] 196it [00:45, 4.31it/s] +2025-05-25 22:34:53,505 - INFO - Epoch: 88, Objective: tensor([1130.0813], device='cuda:0', grad_fn=), Loss: 0.0030066303443163633, KL/n: 19.562442779541016 + 0it [00:00, ?it/s]2025-05-25 22:34:54,095 - INFO - [Epoch 089 | Batch 0000] IWAE-loss 1094.9982 | mean log_px -0.0019 | KL -957.34 + 1it [00:00, 2.74it/s] 2it [00:00, 3.54it/s] 3it [00:00, 3.96it/s] 4it [00:01, 3.91it/s] 5it [00:01, 3.94it/s] 6it [00:01, 4.08it/s] 7it [00:01, 4.12it/s] 8it [00:02, 4.19it/s] 9it [00:02, 4.19it/s] 10it [00:02, 4.28it/s] 11it [00:02, 4.37it/s] 12it [00:02, 4.34it/s] 13it [00:03, 4.30it/s] 14it [00:03, 4.31it/s] 15it [00:03, 4.26it/s] 16it [00:03, 4.32it/s] 17it [00:04, 4.37it/s] 18it [00:04, 4.42it/s] 19it [00:04, 4.32it/s] 20it [00:04, 4.36it/s] 21it [00:05, 4.29it/s] 22it [00:05, 4.20it/s] 23it [00:05, 4.22it/s] 24it [00:05, 4.22it/s] 25it [00:05, 4.22it/s] 26it [00:06, 4.17it/s] 27it [00:06, 4.22it/s] 28it [00:06, 4.17it/s] 29it [00:06, 4.22it/s] 30it [00:07, 4.16it/s] 31it [00:07, 4.23it/s] 32it [00:07, 4.18it/s] 33it [00:07, 4.19it/s] 34it [00:08, 4.17it/s] 35it [00:08, 4.20it/s] 36it [00:08, 4.14it/s] 37it [00:08, 4.19it/s] 38it [00:09, 4.18it/s] 39it [00:09, 4.10it/s] 40it [00:09, 4.07it/s] 41it [00:09, 4.15it/s] 42it [00:10, 4.18it/s] 43it [00:10, 4.30it/s] 44it [00:10, 4.29it/s] 45it [00:10, 4.28it/s] 46it [00:11, 4.08it/s] 47it [00:11, 4.14it/s] 48it [00:11, 4.19it/s] 49it [00:11, 4.29it/s] 50it [00:11, 4.32it/s]2025-05-25 22:35:05,923 - INFO - [Epoch 089 | Batch 0050] IWAE-loss 1109.4702 | mean log_px -0.0021 | KL -958.17 + 51it [00:12, 4.21it/s] 52it [00:12, 4.16it/s] 53it [00:12, 4.12it/s] 54it [00:12, 4.26it/s] 55it [00:13, 4.23it/s] 56it [00:13, 4.23it/s] 57it [00:13, 4.21it/s] 58it [00:13, 4.12it/s] 59it [00:14, 4.20it/s] 60it [00:14, 4.29it/s] 61it [00:14, 4.35it/s] 62it [00:14, 4.32it/s] 63it [00:14, 4.38it/s] 64it [00:15, 4.28it/s] 65it [00:15, 4.37it/s] 66it [00:15, 4.25it/s] 67it [00:15, 4.33it/s] 68it [00:16, 4.35it/s] 69it [00:16, 4.43it/s] 70it [00:16, 4.36it/s] 71it [00:16, 4.43it/s] 72it [00:17, 4.22it/s] 73it [00:17, 4.19it/s] 74it [00:17, 4.20it/s] 75it [00:17, 4.30it/s] 76it [00:18, 4.31it/s] 77it [00:18, 4.42it/s] 78it [00:18, 4.41it/s] 79it [00:18, 4.34it/s] 80it [00:18, 4.28it/s] 81it [00:19, 4.33it/s] 82it [00:19, 4.38it/s] 83it [00:19, 4.40it/s] 84it [00:19, 4.36it/s] 85it [00:20, 4.20it/s] 86it [00:20, 4.20it/s] 87it [00:20, 4.22it/s] 88it [00:20, 4.17it/s] 89it [00:21, 4.05it/s] 90it [00:21, 4.13it/s] 91it [00:21, 4.15it/s] 92it [00:21, 4.25it/s] 93it [00:21, 4.32it/s] 94it [00:22, 4.20it/s] 95it [00:22, 4.10it/s] 96it [00:22, 4.10it/s] 97it [00:22, 4.22it/s] 98it [00:23, 4.17it/s] 99it [00:23, 4.25it/s] 100it [00:23, 4.13it/s]2025-05-25 22:35:17,667 - INFO - [Epoch 089 | Batch 0100] IWAE-loss 1056.6552 | mean log_px -0.0079 | KL -953.52 + 101it [00:23, 4.25it/s] 102it [00:24, 4.31it/s] 103it [00:24, 4.33it/s] 104it [00:24, 4.28it/s] 105it [00:24, 4.33it/s] 106it [00:25, 4.27it/s] 107it [00:25, 4.24it/s] 108it [00:25, 4.24it/s] 109it [00:25, 4.33it/s] 110it [00:26, 4.25it/s] 111it [00:26, 4.24it/s] 112it [00:26, 4.23it/s] 113it [00:26, 4.21it/s] 114it [00:26, 4.24it/s] 115it [00:27, 4.33it/s] 116it [00:27, 4.35it/s] 117it [00:27, 4.42it/s] 118it [00:27, 4.32it/s] 119it [00:28, 4.22it/s] 120it [00:28, 4.24it/s] 121it [00:28, 4.36it/s] 122it [00:28, 4.27it/s] 123it [00:29, 4.25it/s] 124it [00:29, 4.25it/s] 125it [00:29, 4.11it/s] 126it [00:29, 4.06it/s] 127it [00:30, 4.12it/s] 128it [00:30, 4.12it/s] 129it [00:30, 4.24it/s] 130it [00:30, 4.30it/s] 131it [00:30, 4.25it/s] 132it [00:31, 4.25it/s] 133it [00:31, 4.20it/s] 134it [00:31, 4.18it/s] 135it [00:31, 4.16it/s] 136it [00:32, 4.10it/s] 137it [00:32, 4.13it/s] 138it [00:32, 4.14it/s] 139it [00:32, 4.17it/s] 140it [00:33, 4.19it/s] 141it [00:33, 4.27it/s] 142it [00:33, 4.29it/s] 143it [00:33, 4.30it/s] 144it [00:34, 4.34it/s] 145it [00:34, 4.26it/s] 146it [00:34, 4.32it/s] 147it [00:34, 4.32it/s] 148it [00:34, 4.40it/s] 149it [00:35, 4.30it/s] 150it [00:35, 4.25it/s]2025-05-25 22:35:29,430 - INFO - [Epoch 089 | Batch 0150] IWAE-loss 1259.3633 | mean log_px -0.0045 | KL -950.79 + 151it [00:35, 4.15it/s] 152it [00:35, 4.25it/s] 153it [00:36, 4.34it/s] 154it [00:36, 4.31it/s] 155it [00:36, 4.26it/s] 156it [00:36, 4.31it/s] 157it [00:37, 4.22it/s] 158it [00:37, 4.23it/s] 159it [00:37, 4.34it/s] 160it [00:37, 4.38it/s] 161it [00:38, 4.25it/s] 162it [00:38, 4.17it/s] 163it [00:38, 4.23it/s] 164it [00:38, 4.19it/s] 165it [00:38, 4.27it/s] 166it [00:39, 4.36it/s] 167it [00:39, 4.31it/s] 168it [00:39, 4.36it/s] 169it [00:39, 4.16it/s] 170it [00:40, 4.17it/s] 171it [00:40, 4.17it/s] 172it [00:40, 4.06it/s] 173it [00:40, 4.14it/s] 174it [00:41, 4.23it/s] 175it [00:41, 4.29it/s] 176it [00:41, 4.28it/s] 177it [00:41, 4.39it/s] 178it [00:42, 4.32it/s] 179it [00:42, 4.40it/s] 180it [00:42, 4.44it/s] 181it [00:42, 4.47it/s] 182it [00:42, 4.44it/s] 183it [00:43, 4.28it/s] 184it [00:43, 4.26it/s] 185it [00:43, 4.31it/s] 186it [00:43, 4.25it/s] 187it [00:44, 4.29it/s] 188it [00:44, 4.27it/s] 189it [00:44, 4.31it/s] 190it [00:44, 4.27it/s] 191it [00:45, 4.13it/s] 192it [00:45, 4.27it/s] 193it [00:45, 4.37it/s] 194it [00:45, 4.39it/s] 195it [00:45, 4.35it/s] 196it [00:46, 4.36it/s] 196it [00:46, 4.24it/s] +2025-05-25 22:35:40,069 - INFO - Epoch: 89, Objective: tensor([1205.1879], device='cuda:0', grad_fn=), Loss: 0.005796458572149277, KL/n: 19.43310546875 + 0it [00:00, ?it/s]2025-05-25 22:35:40,446 - INFO - [Epoch 090 | Batch 0000] IWAE-loss 1041.4233 | mean log_px -0.0023 | KL -952.96 + 1it [00:00, 3.10it/s] 2it [00:00, 3.84it/s] 3it [00:00, 4.18it/s] 4it [00:00, 4.18it/s] 5it [00:01, 4.38it/s] 6it [00:01, 4.41it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.50it/s] 9it [00:02, 4.56it/s] 10it [00:02, 4.59it/s] 11it [00:02, 3.54it/s] 12it [00:02, 3.84it/s] 13it [00:03, 4.07it/s] 14it [00:03, 4.23it/s] 15it [00:03, 4.36it/s] 16it [00:03, 4.45it/s] 17it [00:03, 4.53it/s] 18it [00:04, 4.41it/s] 19it [00:04, 4.51it/s] 20it [00:04, 4.56it/s] 21it [00:04, 4.61it/s] 22it [00:05, 4.64it/s] 23it [00:05, 4.62it/s] 24it [00:05, 4.49it/s] 25it [00:05, 4.58it/s] 26it [00:05, 4.61it/s] 27it [00:06, 4.64it/s] 28it [00:06, 4.66it/s] 29it [00:06, 4.67it/s] 30it [00:06, 4.68it/s] 31it [00:07, 4.69it/s] 32it [00:07, 4.70it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.60it/s] 35it [00:07, 4.64it/s] 36it [00:08, 4.65it/s] 37it [00:08, 4.67it/s] 38it [00:08, 4.68it/s] 39it [00:08, 4.52it/s] 40it [00:08, 4.59it/s] 41it [00:09, 4.63it/s] 42it [00:09, 4.65it/s] 43it [00:09, 4.67it/s] 44it [00:09, 4.67it/s] 45it [00:10, 4.69it/s] 46it [00:10, 4.53it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.63it/s] 49it [00:10, 4.66it/s] 50it [00:11, 4.67it/s]2025-05-25 22:35:51,482 - INFO - [Epoch 090 | Batch 0050] IWAE-loss 1354.5846 | mean log_px -0.0103 | KL -952.79 + 51it [00:11, 4.69it/s] 52it [00:11, 4.69it/s] 53it [00:11, 4.58it/s] 54it [00:11, 4.63it/s] 55it [00:12, 4.65it/s] 56it [00:12, 4.66it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.68it/s] 59it [00:13, 4.69it/s] 60it [00:13, 4.69it/s] 61it [00:13, 4.71it/s] 62it [00:13, 4.70it/s] 63it [00:13, 4.71it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.61it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.65it/s] 68it [00:15, 4.51it/s] 69it [00:15, 4.53it/s] 70it [00:15, 4.51it/s] 71it [00:15, 4.56it/s] 72it [00:15, 4.60it/s] 73it [00:16, 4.64it/s] 74it [00:16, 4.66it/s] 75it [00:16, 4.53it/s] 76it [00:16, 4.57it/s] 77it [00:16, 4.60it/s] 78it [00:17, 4.63it/s] 79it [00:17, 4.61it/s] 80it [00:17, 4.44it/s] 81it [00:17, 4.54it/s] 82it [00:18, 4.59it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.67it/s] 85it [00:18, 4.67it/s] 86it [00:18, 4.68it/s] 87it [00:19, 4.70it/s] 88it [00:19, 4.69it/s] 89it [00:19, 4.69it/s] 90it [00:19, 4.69it/s] 91it [00:20, 4.54it/s] 92it [00:20, 4.59it/s] 93it [00:20, 4.59it/s] 94it [00:20, 4.60it/s] 95it [00:20, 4.61it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.63it/s] 99it [00:21, 4.67it/s] 100it [00:21, 4.67it/s]2025-05-25 22:36:02,293 - INFO - [Epoch 090 | Batch 0100] IWAE-loss 1023.6895 | mean log_px -0.0019 | KL -951.39 + 101it [00:22, 4.68it/s] 102it [00:22, 4.68it/s] 103it [00:22, 4.52it/s] 104it [00:22, 4.58it/s] 105it [00:23, 4.61it/s] 106it [00:23, 4.61it/s] 107it [00:23, 4.64it/s] 108it [00:23, 4.62it/s] 109it [00:23, 4.62it/s] 110it [00:24, 4.50it/s] 111it [00:24, 4.56it/s] 112it [00:24, 4.57it/s] 113it [00:24, 4.60it/s] 114it [00:24, 4.62it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.62it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.64it/s] 119it [00:26, 4.64it/s] 120it [00:26, 4.45it/s] 121it [00:26, 4.46it/s] 122it [00:26, 4.52it/s] 123it [00:26, 4.56it/s] 124it [00:27, 4.43it/s] 125it [00:27, 4.51it/s] 126it [00:27, 4.55it/s] 127it [00:27, 4.58it/s] 128it [00:28, 4.57it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.61it/s] 131it [00:28, 4.62it/s] 132it [00:28, 4.62it/s] 133it [00:29, 4.64it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.62it/s] 137it [00:30, 4.62it/s] 138it [00:30, 4.49it/s] 139it [00:30, 4.54it/s] 140it [00:30, 4.56it/s] 141it [00:30, 4.57it/s] 142it [00:31, 4.58it/s] 143it [00:31, 4.59it/s] 144it [00:31, 4.53it/s] 145it [00:31, 4.48it/s] 146it [00:32, 4.53it/s] 147it [00:32, 4.55it/s] 148it [00:32, 4.57it/s] 149it [00:32, 4.59it/s] 150it [00:32, 4.58it/s]2025-05-25 22:36:13,228 - INFO - [Epoch 090 | Batch 0150] IWAE-loss 1153.8442 | mean log_px -0.0029 | KL -949.34 + 151it [00:33, 4.59it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.60it/s] 154it [00:33, 4.60it/s] 155it [00:33, 4.60it/s] 156it [00:34, 4.60it/s] 157it [00:34, 4.61it/s] 158it [00:34, 4.49it/s] 159it [00:34, 4.54it/s] 160it [00:35, 4.56it/s] 161it [00:35, 4.59it/s] 162it [00:35, 4.59it/s] 163it [00:35, 4.59it/s] 164it [00:35, 4.60it/s] 165it [00:36, 4.60it/s] 166it [00:36, 4.45it/s] 167it [00:36, 4.51it/s] 168it [00:36, 4.52it/s] 169it [00:37, 4.56it/s] 170it [00:37, 4.58it/s] 171it [00:37, 4.59it/s] 172it [00:37, 4.59it/s] 173it [00:37, 4.60it/s] 174it [00:38, 4.60it/s] 175it [00:38, 4.61it/s] 176it [00:38, 4.62it/s] 177it [00:38, 4.62it/s] 178it [00:38, 4.61it/s] 179it [00:39, 4.62it/s] 180it [00:39, 4.43it/s] 181it [00:39, 4.50it/s] 182it [00:39, 4.54it/s] 183it [00:40, 4.57it/s] 184it [00:40, 4.58it/s] 185it [00:40, 4.59it/s] 186it [00:40, 4.44it/s] 187it [00:40, 4.50it/s] 188it [00:41, 4.54it/s] 189it [00:41, 4.56it/s] 190it [00:41, 4.58it/s] 191it [00:41, 4.59it/s] 192it [00:42, 4.58it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.46it/s] 196it [00:42, 4.37it/s] 196it [00:43, 4.55it/s] +2025-05-25 22:36:23,249 - INFO - Epoch: 90, Objective: tensor([1778.1040], device='cuda:0', grad_fn=), Loss: 0.016707276925444603, KL/n: 19.43993377685547 + 0it [00:00, ?it/s]2025-05-25 22:36:23,643 - INFO - [Epoch 091 | Batch 0000] IWAE-loss 1187.3732 | mean log_px -0.0049 | KL -951.82 + 1it [00:00, 3.13it/s] 2it [00:00, 3.87it/s] 3it [00:00, 4.20it/s] 4it [00:00, 4.36it/s] 5it [00:01, 4.45it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.55it/s] 8it [00:01, 4.58it/s] 9it [00:02, 4.61it/s] 10it [00:02, 4.61it/s] 11it [00:02, 4.63it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.62it/s] 15it [00:03, 4.64it/s] 16it [00:03, 4.64it/s] 17it [00:03, 4.62it/s] 18it [00:03, 4.63it/s] 19it [00:04, 4.64it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.64it/s] 22it [00:04, 4.50it/s] 23it [00:05, 4.54it/s] 24it [00:05, 4.56it/s] 25it [00:05, 4.57it/s] 26it [00:05, 4.50it/s] 27it [00:05, 4.42it/s] 28it [00:06, 4.49it/s] 29it [00:06, 4.54it/s] 30it [00:06, 4.56it/s] 31it [00:06, 4.60it/s] 32it [00:07, 4.62it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.45it/s] 35it [00:07, 4.51it/s] 36it [00:07, 4.54it/s] 37it [00:08, 4.56it/s] 38it [00:08, 4.57it/s] 39it [00:08, 4.58it/s] 40it [00:08, 4.55it/s] 41it [00:09, 4.57it/s] 42it [00:09, 4.56it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.59it/s] 45it [00:09, 4.62it/s] 46it [00:10, 4.62it/s] 47it [00:10, 4.63it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.60it/s] 50it [00:10, 4.59it/s]2025-05-25 22:36:34,539 - INFO - [Epoch 091 | Batch 0050] IWAE-loss 1333.3361 | mean log_px -0.0116 | KL -948.98 + 51it [00:11, 4.60it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.47it/s] 54it [00:11, 4.53it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.57it/s] 57it [00:12, 4.60it/s] 58it [00:12, 4.61it/s] 59it [00:12, 4.62it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.63it/s] 62it [00:13, 4.62it/s] 63it [00:13, 4.63it/s] 64it [00:14, 4.63it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.62it/s] 68it [00:14, 4.61it/s] 69it [00:15, 4.62it/s] 70it [00:15, 4.60it/s] 71it [00:15, 4.56it/s] 72it [00:15, 4.59it/s] 73it [00:16, 4.46it/s] 74it [00:16, 4.51it/s] 75it [00:16, 4.55it/s] 76it [00:16, 4.56it/s] 77it [00:16, 4.58it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.59it/s] 80it [00:17, 4.59it/s] 81it [00:17, 4.47it/s] 82it [00:17, 4.52it/s] 83it [00:18, 4.54it/s] 84it [00:18, 4.53it/s] 85it [00:18, 4.46it/s] 86it [00:18, 4.50it/s] 87it [00:19, 4.51it/s] 88it [00:19, 4.54it/s] 89it [00:19, 4.56it/s] 90it [00:19, 4.59it/s] 91it [00:19, 4.61it/s] 92it [00:20, 4.61it/s] 93it [00:20, 4.62it/s] 94it [00:20, 4.61it/s] 95it [00:20, 4.61it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.60it/s] 100it [00:21, 4.61it/s]2025-05-25 22:36:45,459 - INFO - [Epoch 091 | Batch 0100] IWAE-loss 1001.7884 | mean log_px -0.0025 | KL -947.29 + 101it [00:22, 4.61it/s] 102it [00:22, 4.57it/s] 103it [00:22, 4.60it/s] 104it [00:22, 4.60it/s] 105it [00:23, 4.62it/s] 106it [00:23, 4.62it/s] 107it [00:23, 4.62it/s] 108it [00:23, 4.62it/s] 109it [00:23, 4.62it/s] 110it [00:24, 4.62it/s] 111it [00:24, 4.49it/s] 112it [00:24, 4.54it/s] 113it [00:24, 4.57it/s] 114it [00:24, 4.58it/s] 115it [00:25, 4.58it/s] 116it [00:25, 4.58it/s] 117it [00:25, 4.59it/s] 118it [00:25, 4.58it/s] 119it [00:26, 4.59it/s] 120it [00:26, 4.42it/s] 121it [00:26, 4.49it/s] 122it [00:26, 4.52it/s] 123it [00:26, 4.54it/s] 124it [00:27, 4.57it/s] 125it [00:27, 4.59it/s] 126it [00:27, 4.60it/s] 127it [00:27, 4.62it/s] 128it [00:28, 4.49it/s] 129it [00:28, 4.55it/s] 130it [00:28, 4.57it/s] 131it [00:28, 4.58it/s] 132it [00:28, 4.58it/s] 133it [00:29, 4.59it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.63it/s] 137it [00:29, 4.64it/s] 138it [00:30, 4.64it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.64it/s] 141it [00:30, 4.62it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.48it/s] 144it [00:31, 4.53it/s] 145it [00:31, 4.58it/s] 146it [00:31, 4.58it/s] 147it [00:32, 4.56it/s] 148it [00:32, 4.57it/s] 149it [00:32, 4.49it/s] 150it [00:32, 4.56it/s]2025-05-25 22:36:56,388 - INFO - [Epoch 091 | Batch 0150] IWAE-loss 1206.0220 | mean log_px -0.0106 | KL -951.12 + 151it [00:33, 4.59it/s] 152it [00:33, 4.61it/s] 153it [00:33, 4.62it/s] 154it [00:33, 4.63it/s] 155it [00:33, 4.63it/s] 156it [00:34, 4.62it/s] 157it [00:34, 4.48it/s] 158it [00:34, 4.52it/s] 159it [00:34, 4.57it/s] 160it [00:35, 4.57it/s] 161it [00:35, 4.60it/s] 162it [00:35, 4.61it/s] 163it [00:35, 4.62it/s] 164it [00:35, 4.63it/s] 165it [00:36, 4.63it/s] 166it [00:36, 4.64it/s] 167it [00:36, 4.64it/s] 168it [00:36, 4.65it/s] 169it [00:36, 4.66it/s] 170it [00:37, 4.44it/s] 171it [00:37, 4.46it/s] 172it [00:37, 4.52it/s] 173it [00:37, 4.56it/s] 174it [00:38, 4.59it/s] 175it [00:38, 4.58it/s] 176it [00:38, 4.57it/s] 177it [00:38, 4.59it/s] 178it [00:38, 4.46it/s] 179it [00:39, 4.51it/s] 180it [00:39, 4.54it/s] 181it [00:39, 4.58it/s] 182it [00:39, 4.58it/s] 183it [00:40, 4.60it/s] 184it [00:40, 4.62it/s] 185it [00:40, 4.63it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.64it/s] 188it [00:41, 4.64it/s] 189it [00:41, 4.49it/s] 190it [00:41, 4.54it/s] 191it [00:41, 4.52it/s] 192it [00:42, 4.57it/s] 193it [00:42, 4.61it/s] 194it [00:42, 4.60it/s] 195it [00:42, 4.32it/s] 196it [00:42, 4.43it/s] 196it [00:42, 4.56it/s] +2025-05-25 22:37:06,371 - INFO - Epoch: 91, Objective: tensor([1234.4763], device='cuda:0', grad_fn=), Loss: 0.004630007315427065, KL/n: 19.411489486694336 + 0it [00:00, ?it/s]2025-05-25 22:37:06,924 - INFO - [Epoch 092 | Batch 0000] IWAE-loss 1096.1681 | mean log_px -0.0068 | KL -950.23 + 1it [00:00, 3.29it/s] 2it [00:00, 3.97it/s] 3it [00:00, 4.28it/s] 4it [00:00, 4.44it/s] 5it [00:01, 4.54it/s] 6it [00:01, 4.60it/s] 7it [00:01, 4.63it/s] 8it [00:01, 4.65it/s] 9it [00:02, 4.67it/s] 10it [00:02, 4.68it/s] 11it [00:02, 4.69it/s] 12it [00:02, 4.54it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.63it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.67it/s] 17it [00:03, 4.69it/s] 18it [00:03, 4.69it/s] 19it [00:04, 4.69it/s] 20it [00:04, 4.70it/s] 21it [00:04, 4.71it/s] 22it [00:04, 4.70it/s] 23it [00:05, 4.70it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.60it/s] 26it [00:05, 4.62it/s] 27it [00:05, 4.65it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.67it/s] 31it [00:06, 4.68it/s] 32it [00:06, 4.68it/s] 33it [00:07, 4.69it/s] 34it [00:07, 4.53it/s] 35it [00:07, 4.60it/s] 36it [00:07, 4.62it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.63it/s] 39it [00:08, 4.65it/s] 40it [00:08, 4.66it/s] 41it [00:08, 4.67it/s] 42it [00:09, 4.68it/s] 43it [00:09, 4.69it/s] 44it [00:09, 4.54it/s] 45it [00:09, 4.60it/s] 46it [00:09, 4.61it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.65it/s] 49it [00:10, 4.52it/s] 50it [00:10, 4.59it/s]2025-05-25 22:37:17,686 - INFO - [Epoch 092 | Batch 0050] IWAE-loss 1275.9679 | mean log_px -0.0117 | KL -948.22 + 51it [00:11, 4.62it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.63it/s] 54it [00:11, 4.65it/s] 55it [00:11, 4.67it/s] 56it [00:12, 4.61it/s] 57it [00:12, 4.63it/s] 58it [00:12, 4.48it/s] 59it [00:12, 4.53it/s] 60it [00:13, 4.54it/s] 61it [00:13, 4.58it/s] 62it [00:13, 4.59it/s] 63it [00:13, 4.60it/s] 64it [00:13, 4.61it/s] 65it [00:14, 4.61it/s] 66it [00:14, 4.62it/s] 67it [00:14, 4.63it/s] 68it [00:14, 4.48it/s] 69it [00:14, 4.53it/s] 70it [00:15, 4.55it/s] 71it [00:15, 4.55it/s] 72it [00:15, 4.58it/s] 73it [00:15, 4.60it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.64it/s] 77it [00:16, 4.67it/s] 78it [00:16, 4.64it/s] 79it [00:17, 4.65it/s] 80it [00:17, 4.63it/s] 81it [00:17, 4.64it/s] 82it [00:17, 4.64it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.63it/s] 86it [00:18, 4.63it/s] 87it [00:18, 4.64it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.65it/s] 90it [00:19, 4.64it/s] 91it [00:19, 4.64it/s] 92it [00:19, 4.63it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.62it/s] 95it [00:20, 4.62it/s] 96it [00:20, 4.53it/s] 97it [00:21, 4.57it/s] 98it [00:21, 4.57it/s] 99it [00:21, 4.61it/s] 100it [00:21, 4.63it/s]2025-05-25 22:37:28,538 - INFO - [Epoch 092 | Batch 0100] IWAE-loss 1220.1927 | mean log_px -0.0129 | KL -944.11 + 101it [00:21, 4.63it/s] 102it [00:22, 4.63it/s] 103it [00:22, 4.64it/s] 104it [00:22, 4.62it/s] 105it [00:22, 4.62it/s] 106it [00:23, 4.53it/s] 107it [00:23, 4.58it/s] 108it [00:23, 4.59it/s] 109it [00:23, 4.61it/s] 110it [00:23, 4.61it/s] 111it [00:24, 4.49it/s] 112it [00:24, 4.53it/s] 113it [00:24, 4.57it/s] 114it [00:24, 4.58it/s] 115it [00:24, 4.61it/s] 116it [00:25, 4.56it/s] 117it [00:25, 4.53it/s] 118it [00:25, 4.39it/s] 119it [00:25, 4.43it/s] 120it [00:26, 4.45it/s] 121it [00:26, 4.46it/s] 122it [00:26, 4.49it/s] 123it [00:26, 4.54it/s] 124it [00:26, 4.57it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.61it/s] 128it [00:27, 4.62it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.48it/s] 131it [00:28, 4.53it/s] 132it [00:28, 4.55it/s] 133it [00:28, 4.57it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.59it/s] 136it [00:29, 4.59it/s] 137it [00:29, 4.60it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.61it/s] 140it [00:30, 4.61it/s] 141it [00:30, 4.61it/s] 142it [00:30, 4.62it/s] 143it [00:31, 4.61it/s] 144it [00:31, 4.61it/s] 145it [00:31, 4.62it/s] 146it [00:31, 4.63it/s] 147it [00:31, 4.62it/s] 148it [00:32, 4.63it/s] 149it [00:32, 4.62it/s] 150it [00:32, 4.56it/s]2025-05-25 22:37:39,475 - INFO - [Epoch 092 | Batch 0150] IWAE-loss 1267.1647 | mean log_px -0.0153 | KL -942.56 + 151it [00:32, 4.56it/s] 152it [00:33, 4.53it/s] 153it [00:33, 4.54it/s] 154it [00:33, 4.41it/s] 155it [00:33, 4.47it/s] 156it [00:33, 4.51it/s] 157it [00:34, 4.57it/s] 158it [00:34, 4.60it/s] 159it [00:34, 4.63it/s] 160it [00:34, 4.65it/s] 161it [00:35, 4.50it/s] 162it [00:35, 4.58it/s] 163it [00:35, 4.62it/s] 164it [00:35, 4.64it/s] 165it [00:35, 4.51it/s] 166it [00:36, 4.58it/s] 167it [00:36, 4.62it/s] 168it [00:36, 4.64it/s] 169it [00:36, 4.66it/s] 170it [00:37, 4.65it/s] 171it [00:37, 4.55it/s] 172it [00:37, 4.61it/s] 173it [00:37, 4.64it/s] 174it [00:37, 4.65it/s] 175it [00:38, 4.68it/s] 176it [00:38, 4.68it/s] 177it [00:38, 4.58it/s] 178it [00:38, 4.64it/s] 179it [00:38, 4.67it/s] 180it [00:39, 4.67it/s] 181it [00:39, 4.69it/s] 182it [00:39, 4.69it/s] 183it [00:39, 4.70it/s] 184it [00:40, 4.55it/s] 185it [00:40, 4.61it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.65it/s] 188it [00:40, 4.67it/s] 189it [00:41, 4.68it/s] 190it [00:41, 4.69it/s] 191it [00:41, 4.70it/s] 192it [00:41, 4.70it/s] 193it [00:41, 4.71it/s] 194it [00:42, 4.70it/s] 195it [00:42, 4.58it/s] 196it [00:42, 4.63it/s] 196it [00:42, 4.59it/s] +2025-05-25 22:37:49,344 - INFO - Epoch: 92, Objective: tensor([1376.6708], device='cuda:0', grad_fn=), Loss: 0.012566782534122467, KL/n: 19.321582794189453 + 0it [00:00, ?it/s]2025-05-25 22:37:49,722 - INFO - [Epoch 093 | Batch 0000] IWAE-loss 999.4476 | mean log_px -0.0021 | KL -946.94 + 1it [00:00, 3.31it/s] 2it [00:00, 4.00it/s] 3it [00:00, 4.30it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.40it/s] 7it [00:01, 4.46it/s] 8it [00:01, 4.47it/s] 9it [00:02, 4.41it/s] 10it [00:02, 3.40it/s] 11it [00:02, 3.63it/s] 12it [00:02, 3.89it/s] 13it [00:03, 4.01it/s] 14it [00:03, 4.08it/s] 15it [00:03, 4.27it/s] 16it [00:03, 4.28it/s] 17it [00:04, 4.31it/s] 18it [00:04, 4.28it/s] 19it [00:04, 4.32it/s] 20it [00:04, 4.30it/s] 21it [00:05, 4.30it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.38it/s] 24it [00:05, 4.31it/s] 25it [00:05, 4.32it/s] 26it [00:06, 4.29it/s] 27it [00:06, 4.17it/s] 28it [00:06, 4.19it/s] 29it [00:06, 4.24it/s] 30it [00:07, 4.34it/s] 31it [00:07, 4.30it/s] 32it [00:07, 4.28it/s] 33it [00:07, 4.28it/s] 34it [00:08, 4.38it/s] 35it [00:08, 4.48it/s] 36it [00:08, 4.53it/s] 37it [00:08, 4.43it/s] 38it [00:08, 4.37it/s] 39it [00:09, 4.33it/s] 40it [00:09, 4.32it/s] 41it [00:09, 4.34it/s] 42it [00:09, 4.33it/s] 43it [00:10, 4.33it/s] 44it [00:10, 4.26it/s] 45it [00:10, 4.27it/s] 46it [00:10, 4.29it/s] 47it [00:11, 4.34it/s] 48it [00:11, 4.40it/s] 49it [00:11, 4.38it/s] 50it [00:11, 4.34it/s]2025-05-25 22:38:01,374 - INFO - [Epoch 093 | Batch 0050] IWAE-loss 1235.3208 | mean log_px -0.0091 | KL -945.62 + 51it [00:11, 4.40it/s] 52it [00:12, 4.32it/s] 53it [00:12, 4.41it/s] 54it [00:12, 4.31it/s] 55it [00:12, 4.41it/s] 56it [00:13, 4.44it/s] 57it [00:13, 4.47it/s] 58it [00:13, 4.43it/s] 59it [00:13, 4.19it/s] 60it [00:14, 4.26it/s] 61it [00:14, 4.31it/s] 62it [00:14, 4.40it/s] 63it [00:14, 4.46it/s] 64it [00:14, 4.28it/s] 65it [00:15, 4.37it/s] 66it [00:15, 4.40it/s] 67it [00:15, 4.39it/s] 68it [00:15, 4.49it/s] 69it [00:16, 4.41it/s] 70it [00:16, 4.50it/s] 71it [00:16, 4.35it/s] 72it [00:16, 4.29it/s] 73it [00:17, 4.28it/s] 74it [00:17, 4.28it/s] 75it [00:17, 4.30it/s] 76it [00:17, 4.29it/s] 77it [00:17, 4.42it/s] 78it [00:18, 4.37it/s] 79it [00:18, 4.32it/s] 80it [00:18, 4.31it/s] 81it [00:18, 4.44it/s] 82it [00:19, 4.42it/s] 83it [00:19, 4.36it/s] 84it [00:19, 4.40it/s] 85it [00:19, 4.46it/s] 86it [00:19, 4.31it/s] 87it [00:20, 4.31it/s] 88it [00:20, 4.21it/s] 89it [00:20, 4.30it/s] 90it [00:20, 4.31it/s] 91it [00:21, 4.42it/s] 92it [00:21, 4.42it/s] 93it [00:21, 4.43it/s] 94it [00:21, 4.49it/s] 95it [00:22, 4.40it/s] 96it [00:22, 4.42it/s] 97it [00:22, 4.36it/s] 98it [00:22, 4.35it/s] 99it [00:22, 4.45it/s] 100it [00:23, 4.40it/s]2025-05-25 22:38:12,823 - INFO - [Epoch 093 | Batch 0100] IWAE-loss 1168.9042 | mean log_px -0.0071 | KL -945.60 + 101it [00:23, 4.36it/s] 102it [00:23, 4.32it/s] 103it [00:23, 4.30it/s] 104it [00:24, 4.28it/s] 105it [00:24, 4.29it/s] 106it [00:24, 4.35it/s] 107it [00:24, 4.42it/s] 108it [00:24, 4.52it/s] 109it [00:25, 4.58it/s] 110it [00:25, 4.62it/s] 111it [00:25, 4.52it/s] 112it [00:25, 4.47it/s] 113it [00:26, 4.41it/s] 114it [00:26, 4.49it/s] 115it [00:26, 4.41it/s] 116it [00:26, 4.34it/s] 117it [00:27, 4.37it/s] 118it [00:27, 4.31it/s] 119it [00:27, 4.32it/s] 120it [00:27, 4.41it/s] 121it [00:27, 4.43it/s] 122it [00:28, 4.38it/s] 123it [00:28, 4.42it/s] 124it [00:28, 4.35it/s] 125it [00:28, 4.31it/s] 126it [00:29, 4.40it/s] 127it [00:29, 4.26it/s] 128it [00:29, 4.36it/s] 129it [00:29, 4.45it/s] 130it [00:29, 4.52it/s] 131it [00:30, 4.55it/s] 132it [00:30, 4.33it/s] 133it [00:30, 4.30it/s] 134it [00:30, 4.43it/s] 135it [00:31, 4.39it/s] 136it [00:31, 4.46it/s] 137it [00:31, 4.40it/s] 138it [00:31, 4.34it/s] 139it [00:32, 4.18it/s] 140it [00:32, 4.21it/s] 141it [00:32, 4.36it/s] 142it [00:32, 4.46it/s] 143it [00:32, 4.35it/s] 144it [00:33, 4.31it/s] 145it [00:33, 4.36it/s] 146it [00:33, 4.46it/s] 147it [00:33, 4.41it/s] 148it [00:34, 4.37it/s] 149it [00:34, 4.37it/s] 150it [00:34, 4.37it/s]2025-05-25 22:38:24,227 - INFO - [Epoch 093 | Batch 0150] IWAE-loss 1105.6846 | mean log_px -0.0088 | KL -947.32 + 151it [00:34, 4.34it/s] 152it [00:35, 4.44it/s] 153it [00:35, 4.37it/s] 154it [00:35, 4.48it/s] 155it [00:35, 4.45it/s] 156it [00:35, 4.29it/s] 157it [00:36, 4.30it/s] 158it [00:36, 4.39it/s] 159it [00:36, 4.45it/s] 160it [00:36, 4.42it/s] 161it [00:37, 4.35it/s] 162it [00:37, 4.36it/s] 163it [00:37, 4.38it/s] 164it [00:37, 4.34it/s] 165it [00:38, 4.32it/s] 166it [00:38, 4.36it/s] 167it [00:38, 4.30it/s] 168it [00:38, 4.32it/s] 169it [00:38, 4.41it/s] 170it [00:39, 4.35it/s] 171it [00:39, 4.28it/s] 172it [00:39, 4.29it/s] 173it [00:39, 4.13it/s] 174it [00:40, 4.23it/s] 175it [00:40, 4.22it/s] 176it [00:40, 4.20it/s] 177it [00:40, 4.21it/s] 178it [00:41, 4.22it/s] 179it [00:41, 4.09it/s] 180it [00:41, 4.25it/s] 181it [00:41, 4.29it/s] 182it [00:41, 4.30it/s] 183it [00:42, 4.39it/s] 184it [00:42, 4.46it/s] 185it [00:42, 4.36it/s] 186it [00:42, 4.28it/s] 187it [00:43, 4.40it/s] 188it [00:43, 4.49it/s] 189it [00:43, 4.38it/s] 190it [00:43, 4.35it/s] 191it [00:44, 4.43it/s] 192it [00:44, 4.36it/s] 193it [00:44, 4.46it/s] 194it [00:44, 4.40it/s] 195it [00:44, 4.30it/s] 196it [00:45, 4.25it/s] 196it [00:45, 4.33it/s] +2025-05-25 22:38:34,740 - INFO - Epoch: 93, Objective: tensor([1070.6356], device='cuda:0', grad_fn=), Loss: 0.00409930944442749, KL/n: 19.31393051147461 + 0it [00:00, ?it/s]2025-05-25 22:38:35,131 - INFO - [Epoch 094 | Batch 0000] IWAE-loss 1022.8226 | mean log_px -0.0018 | KL -944.74 + 1it [00:00, 3.11it/s] 2it [00:00, 3.90it/s] 3it [00:00, 4.08it/s] 4it [00:00, 4.15it/s] 5it [00:01, 4.22it/s] 6it [00:01, 4.37it/s] 7it [00:01, 4.30it/s] 8it [00:01, 4.26it/s] 9it [00:02, 4.13it/s] 10it [00:02, 4.18it/s] 11it [00:02, 4.24it/s] 12it [00:02, 4.34it/s] 13it [00:03, 4.31it/s] 14it [00:03, 4.31it/s] 15it [00:03, 4.28it/s] 16it [00:03, 4.30it/s] 17it [00:04, 4.28it/s] 18it [00:04, 4.29it/s] 19it [00:04, 4.41it/s] 20it [00:04, 4.49it/s] 21it [00:04, 4.44it/s] 22it [00:05, 4.51it/s] 23it [00:05, 4.41it/s] 24it [00:05, 4.34it/s] 25it [00:05, 4.44it/s] 26it [00:06, 4.51it/s] 27it [00:06, 4.57it/s] 28it [00:06, 4.60it/s] 29it [00:06, 4.47it/s] 30it [00:06, 4.49it/s] 31it [00:07, 4.29it/s] 32it [00:07, 4.28it/s] 33it [00:07, 4.25it/s] 34it [00:07, 4.36it/s] 35it [00:08, 4.30it/s] 36it [00:08, 4.16it/s] 37it [00:08, 4.17it/s] 38it [00:08, 4.31it/s] 39it [00:09, 4.27it/s] 40it [00:09, 4.29it/s] 41it [00:09, 4.29it/s] 42it [00:09, 4.30it/s] 43it [00:09, 4.33it/s] 44it [00:10, 4.16it/s] 45it [00:10, 4.23it/s] 46it [00:10, 4.21it/s] 47it [00:10, 4.21it/s] 48it [00:11, 4.27it/s] 49it [00:11, 4.25it/s] 50it [00:11, 4.23it/s]2025-05-25 22:38:46,683 - INFO - [Epoch 094 | Batch 0050] IWAE-loss 1190.5052 | mean log_px -0.0090 | KL -945.57 + 51it [00:11, 4.34it/s] 52it [00:12, 4.26it/s] 53it [00:12, 4.27it/s] 54it [00:12, 4.23it/s] 55it [00:12, 4.21it/s] 56it [00:13, 4.33it/s] 57it [00:13, 4.29it/s] 58it [00:13, 4.42it/s] 59it [00:13, 4.33it/s] 60it [00:13, 4.30it/s] 61it [00:14, 4.08it/s] 62it [00:14, 4.14it/s] 63it [00:14, 4.16it/s] 64it [00:14, 4.22it/s] 65it [00:15, 4.32it/s] 66it [00:15, 4.30it/s] 67it [00:15, 4.42it/s] 68it [00:15, 4.47it/s] 69it [00:16, 4.24it/s] 70it [00:16, 4.26it/s] 71it [00:16, 4.37it/s] 72it [00:16, 4.44it/s] 73it [00:16, 4.45it/s] 74it [00:17, 4.36it/s] 75it [00:17, 4.44it/s] 76it [00:17, 4.34it/s] 77it [00:17, 4.22it/s] 78it [00:18, 4.23it/s] 79it [00:18, 4.24it/s] 80it [00:18, 4.27it/s] 81it [00:18, 4.25it/s] 82it [00:19, 4.35it/s] 83it [00:19, 4.45it/s] 84it [00:19, 4.50it/s] 85it [00:19, 4.26it/s] 86it [00:19, 4.37it/s] 87it [00:20, 4.34it/s] 88it [00:20, 4.44it/s] 89it [00:20, 4.52it/s] 90it [00:20, 4.40it/s] 91it [00:21, 4.36it/s] 92it [00:21, 4.31it/s] 93it [00:21, 4.32it/s] 94it [00:21, 4.34it/s] 95it [00:22, 4.43it/s] 96it [00:22, 4.37it/s] 97it [00:22, 4.41it/s] 98it [00:22, 4.49it/s] 99it [00:22, 4.40it/s] 100it [00:23, 4.34it/s]2025-05-25 22:38:58,219 - INFO - [Epoch 094 | Batch 0100] IWAE-loss 1009.5639 | mean log_px -0.0037 | KL -944.66 + 101it [00:23, 4.40it/s] 102it [00:23, 4.48it/s] 103it [00:23, 4.55it/s] 104it [00:24, 4.49it/s] 105it [00:24, 4.28it/s] 106it [00:24, 4.39it/s] 107it [00:24, 4.45it/s] 108it [00:24, 4.52it/s] 109it [00:25, 4.38it/s] 110it [00:25, 4.35it/s] 111it [00:25, 4.44it/s] 112it [00:25, 4.49it/s] 113it [00:26, 4.41it/s] 114it [00:26, 4.34it/s] 115it [00:26, 4.38it/s] 116it [00:26, 4.46it/s] 117it [00:27, 4.44it/s] 118it [00:27, 4.40it/s] 119it [00:27, 4.19it/s] 120it [00:27, 4.20it/s] 121it [00:27, 4.21it/s] 122it [00:28, 4.24it/s] 123it [00:28, 4.30it/s] 124it [00:28, 4.26it/s] 125it [00:28, 4.38it/s] 126it [00:29, 4.31it/s] 127it [00:29, 4.33it/s] 128it [00:29, 4.41it/s] 129it [00:29, 4.48it/s] 130it [00:30, 4.46it/s] 131it [00:30, 4.38it/s] 132it [00:30, 4.43it/s] 133it [00:30, 4.39it/s] 134it [00:30, 4.32it/s] 135it [00:31, 4.39it/s] 136it [00:31, 4.26it/s] 137it [00:31, 4.23it/s] 138it [00:31, 4.22it/s] 139it [00:32, 4.26it/s] 140it [00:32, 4.23it/s] 141it [00:32, 4.27it/s] 142it [00:32, 4.19it/s] 143it [00:33, 4.18it/s] 144it [00:33, 4.31it/s] 145it [00:33, 4.28it/s] 146it [00:33, 4.36it/s] 147it [00:33, 4.42it/s] 148it [00:34, 4.47it/s] 149it [00:34, 4.52it/s] 150it [00:34, 4.52it/s]2025-05-25 22:39:09,667 - INFO - [Epoch 094 | Batch 0150] IWAE-loss 1335.1519 | mean log_px -0.0069 | KL -943.56 + 151it [00:34, 4.55it/s] 152it [00:35, 4.34it/s] 153it [00:35, 4.40it/s] 154it [00:35, 4.35it/s] 155it [00:35, 4.30it/s] 156it [00:36, 4.26it/s] 157it [00:36, 4.21it/s] 158it [00:36, 4.14it/s] 159it [00:36, 4.21it/s] 160it [00:37, 4.07it/s] 161it [00:37, 4.10it/s] 162it [00:37, 4.10it/s] 163it [00:37, 4.17it/s] 164it [00:38, 4.07it/s] 165it [00:38, 4.10it/s] 166it [00:38, 4.09it/s] 167it [00:38, 4.13it/s] 168it [00:38, 4.21it/s] 169it [00:39, 4.23it/s] 170it [00:39, 4.27it/s] 171it [00:39, 4.32it/s] 172it [00:39, 4.23it/s] 173it [00:40, 4.34it/s] 174it [00:40, 4.41it/s] 175it [00:40, 4.24it/s] 176it [00:40, 4.26it/s] 177it [00:41, 4.32it/s] 178it [00:41, 4.29it/s] 179it [00:41, 4.27it/s] 180it [00:41, 4.25it/s] 181it [00:42, 4.14it/s] 182it [00:42, 4.17it/s] 183it [00:42, 4.30it/s] 184it [00:42, 4.26it/s] 185it [00:42, 4.37it/s] 186it [00:43, 4.45it/s] 187it [00:43, 4.47it/s] 188it [00:43, 4.40it/s] 189it [00:43, 4.33it/s] 190it [00:44, 4.31it/s] 191it [00:44, 4.35it/s] 192it [00:44, 4.31it/s] 193it [00:44, 4.22it/s] 194it [00:45, 4.21it/s] 195it [00:45, 4.22it/s] 196it [00:45, 4.34it/s] 196it [00:45, 4.31it/s] +2025-05-25 22:39:20,379 - INFO - Epoch: 94, Objective: tensor([1227.7629], device='cuda:0', grad_fn=), Loss: 0.007183433044701815, KL/n: 19.307418823242188 + 0it [00:00, ?it/s]2025-05-25 22:39:20,968 - INFO - [Epoch 095 | Batch 0000] IWAE-loss 1115.9677 | mean log_px -0.0096 | KL -943.85 + 1it [00:00, 3.10it/s] 2it [00:00, 3.70it/s] 3it [00:00, 4.02it/s] 4it [00:00, 4.22it/s] 5it [00:01, 4.24it/s] 6it [00:01, 4.30it/s] 7it [00:01, 4.42it/s] 8it [00:01, 4.43it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.60it/s] 12it [00:02, 4.50it/s] 13it [00:02, 4.51it/s] 14it [00:03, 4.46it/s] 15it [00:03, 4.28it/s] 16it [00:03, 4.32it/s] 17it [00:03, 4.29it/s] 18it [00:04, 4.33it/s] 19it [00:04, 4.30it/s] 20it [00:04, 4.33it/s] 21it [00:04, 4.41it/s] 22it [00:05, 4.49it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.61it/s] 25it [00:05, 4.49it/s] 26it [00:05, 4.41it/s] 27it [00:06, 4.46it/s] 28it [00:06, 4.42it/s] 29it [00:06, 4.37it/s] 30it [00:06, 4.20it/s] 31it [00:07, 4.31it/s] 32it [00:07, 4.41it/s] 33it [00:07, 4.45it/s] 34it [00:07, 4.30it/s] 35it [00:08, 4.42it/s] 36it [00:08, 4.47it/s] 37it [00:08, 4.52it/s] 38it [00:08, 4.54it/s] 39it [00:08, 4.58it/s] 40it [00:09, 4.60it/s] 41it [00:09, 4.63it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.61it/s] 44it [00:09, 4.55it/s] 45it [00:10, 4.46it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.55it/s] 48it [00:10, 4.58it/s] 49it [00:11, 4.39it/s] 50it [00:11, 4.42it/s]2025-05-25 22:39:32,199 - INFO - [Epoch 095 | Batch 0050] IWAE-loss 1069.6550 | mean log_px -0.0162 | KL -945.07 + 51it [00:11, 4.37it/s] 52it [00:11, 4.37it/s] 53it [00:12, 4.30it/s] 54it [00:12, 4.31it/s] 55it [00:12, 4.27it/s] 56it [00:12, 4.10it/s] 57it [00:12, 4.21it/s] 58it [00:13, 4.17it/s] 59it [00:13, 4.21it/s] 60it [00:13, 4.21it/s] 61it [00:13, 4.29it/s] 62it [00:14, 4.37it/s] 63it [00:14, 4.30it/s] 64it [00:14, 4.17it/s] 65it [00:14, 4.17it/s] 66it [00:15, 4.21it/s] 67it [00:15, 4.22it/s] 68it [00:15, 4.34it/s] 69it [00:15, 4.37it/s] 70it [00:16, 4.35it/s] 71it [00:16, 4.39it/s] 72it [00:16, 4.45it/s] 73it [00:16, 4.43it/s] 74it [00:16, 4.25it/s] 75it [00:17, 4.17it/s] 76it [00:17, 4.31it/s] 77it [00:17, 4.26it/s] 78it [00:17, 4.31it/s] 79it [00:18, 4.23it/s] 80it [00:18, 4.11it/s] 81it [00:18, 4.06it/s] 82it [00:18, 4.23it/s] 83it [00:19, 4.37it/s] 84it [00:19, 4.32it/s] 85it [00:19, 4.18it/s] 86it [00:19, 4.22it/s] 87it [00:20, 4.23it/s] 88it [00:20, 4.23it/s] 89it [00:20, 4.13it/s] 90it [00:20, 4.27it/s] 91it [00:20, 4.24it/s] 92it [00:21, 4.22it/s] 93it [00:21, 4.33it/s] 94it [00:21, 4.40it/s] 95it [00:21, 4.48it/s] 96it [00:22, 4.54it/s] 97it [00:22, 4.43it/s] 98it [00:22, 4.51it/s] 99it [00:22, 4.34it/s] 100it [00:22, 4.46it/s]2025-05-25 22:39:43,852 - INFO - [Epoch 095 | Batch 0100] IWAE-loss 1063.1974 | mean log_px -0.0022 | KL -944.21 + 101it [00:23, 4.47it/s] 102it [00:23, 4.42it/s] 103it [00:23, 4.22it/s] 104it [00:23, 4.33it/s] 105it [00:24, 4.36it/s] 106it [00:24, 4.35it/s] 107it [00:24, 4.35it/s] 108it [00:24, 4.36it/s] 109it [00:25, 4.40it/s] 110it [00:25, 4.47it/s] 111it [00:25, 4.54it/s] 112it [00:25, 4.56it/s] 113it [00:25, 4.45it/s] 114it [00:26, 4.40it/s] 115it [00:26, 4.36it/s] 116it [00:26, 4.45it/s] 117it [00:26, 4.43it/s] 118it [00:27, 4.50it/s] 119it [00:27, 4.50it/s] 120it [00:27, 4.27it/s] 121it [00:27, 4.26it/s] 122it [00:28, 4.25it/s] 123it [00:28, 4.32it/s] 124it [00:28, 4.41it/s] 125it [00:28, 4.42it/s] 126it [00:28, 4.23it/s] 127it [00:29, 4.31it/s] 128it [00:29, 4.42it/s] 129it [00:29, 4.49it/s] 130it [00:29, 4.50it/s] 131it [00:30, 4.35it/s] 132it [00:30, 4.33it/s] 133it [00:30, 4.35it/s] 134it [00:30, 4.32it/s] 135it [00:30, 4.39it/s] 136it [00:31, 4.48it/s] 137it [00:31, 4.23it/s] 138it [00:31, 4.27it/s] 139it [00:31, 4.36it/s] 140it [00:32, 4.46it/s] 141it [00:32, 4.54it/s] 142it [00:32, 4.56it/s] 143it [00:32, 4.61it/s] 144it [00:32, 4.49it/s] 145it [00:33, 4.50it/s] 146it [00:33, 4.41it/s] 147it [00:33, 4.36it/s] 148it [00:33, 4.47it/s] 149it [00:34, 4.29it/s] 150it [00:34, 4.42it/s]2025-05-25 22:39:55,241 - INFO - [Epoch 095 | Batch 0150] IWAE-loss 1082.0015 | mean log_px -0.0033 | KL -939.44 + 151it [00:34, 4.36it/s] 152it [00:34, 4.45it/s] 153it [00:35, 4.37it/s] 154it [00:35, 4.27it/s] 155it [00:35, 4.29it/s] 156it [00:35, 4.38it/s] 157it [00:35, 4.29it/s] 158it [00:36, 4.34it/s] 159it [00:36, 4.29it/s] 160it [00:36, 4.32it/s] 161it [00:36, 4.33it/s] 162it [00:37, 4.40it/s] 163it [00:37, 4.50it/s] 164it [00:37, 4.42it/s] 165it [00:37, 4.41it/s] 166it [00:38, 4.37it/s] 167it [00:38, 4.32it/s] 168it [00:38, 4.42it/s] 169it [00:38, 4.51it/s] 170it [00:38, 4.49it/s] 171it [00:39, 4.28it/s] 172it [00:39, 4.26it/s] 173it [00:39, 4.29it/s] 174it [00:39, 4.23it/s] 175it [00:40, 4.22it/s] 176it [00:40, 4.35it/s] 177it [00:40, 4.42it/s] 178it [00:40, 4.50it/s] 179it [00:40, 4.48it/s] 180it [00:41, 4.39it/s] 181it [00:41, 4.18it/s] 182it [00:41, 4.24it/s] 183it [00:41, 4.31it/s] 184it [00:42, 4.31it/s] 185it [00:42, 4.24it/s] 186it [00:42, 4.24it/s] 187it [00:42, 4.35it/s] 188it [00:43, 4.31it/s] 189it [00:43, 4.44it/s] 190it [00:43, 4.51it/s] 191it [00:43, 4.41it/s] 192it [00:44, 4.35it/s] 193it [00:44, 4.35it/s] 194it [00:44, 4.44it/s] 195it [00:44, 4.26it/s] 196it [00:44, 4.41it/s] 196it [00:44, 4.36it/s] +2025-05-25 22:40:05,701 - INFO - Epoch: 95, Objective: tensor([1025.7579], device='cuda:0', grad_fn=), Loss: 0.00621769716963172, KL/n: 19.164661407470703 + 0it [00:00, ?it/s]2025-05-25 22:40:06,074 - INFO - [Epoch 096 | Batch 0000] IWAE-loss 970.0466 | mean log_px -0.0005 | KL -939.20 + 1it [00:00, 3.30it/s] 2it [00:00, 3.99it/s] 3it [00:00, 4.29it/s] 4it [00:00, 4.42it/s] 5it [00:01, 4.52it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.62it/s] 8it [00:01, 4.64it/s] 9it [00:02, 4.67it/s] 10it [00:02, 4.64it/s] 11it [00:02, 4.66it/s] 12it [00:02, 4.67it/s] 13it [00:02, 4.69it/s] 14it [00:03, 4.69it/s] 15it [00:03, 4.48it/s] 16it [00:03, 4.43it/s] 17it [00:03, 4.49it/s] 18it [00:03, 4.51it/s] 19it [00:04, 4.53it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.56it/s] 22it [00:04, 4.56it/s] 23it [00:05, 4.59it/s] 24it [00:05, 4.46it/s] 25it [00:05, 4.55it/s] 26it [00:05, 4.59it/s] 27it [00:05, 4.62it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.51it/s] 31it [00:06, 4.56it/s] 32it [00:07, 4.62it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.50it/s] 35it [00:07, 4.58it/s] 36it [00:07, 4.61it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.66it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.51it/s] 41it [00:09, 4.59it/s] 42it [00:09, 4.62it/s] 43it [00:09, 4.64it/s] 44it [00:09, 4.64it/s] 45it [00:09, 4.67it/s] 46it [00:10, 4.50it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.61it/s] 49it [00:10, 4.61it/s] 50it [00:10, 4.62it/s]2025-05-25 22:40:16,940 - INFO - [Epoch 096 | Batch 0050] IWAE-loss 988.4781 | mean log_px -0.0008 | KL -937.70 + 51it [00:11, 4.61it/s] 52it [00:11, 4.62it/s] 53it [00:11, 4.64it/s] 54it [00:11, 4.63it/s] 55it [00:12, 4.40it/s] 56it [00:12, 4.48it/s] 57it [00:12, 4.53it/s] 58it [00:12, 4.57it/s] 59it [00:12, 4.60it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.62it/s] 62it [00:13, 4.59it/s] 63it [00:13, 4.60it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.64it/s] 68it [00:14, 4.64it/s] 69it [00:15, 4.64it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.64it/s] 72it [00:15, 4.63it/s] 73it [00:15, 4.60it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.65it/s] 76it [00:16, 4.66it/s] 77it [00:16, 4.51it/s] 78it [00:17, 4.58it/s] 79it [00:17, 4.62it/s] 80it [00:17, 4.64it/s] 81it [00:17, 4.65it/s] 82it [00:17, 4.67it/s] 83it [00:18, 4.69it/s] 84it [00:18, 4.69it/s] 85it [00:18, 4.70it/s] 86it [00:18, 4.68it/s] 87it [00:18, 4.54it/s] 88it [00:19, 4.58it/s] 89it [00:19, 4.61it/s] 90it [00:19, 4.58it/s] 91it [00:20, 3.65it/s] 92it [00:20, 3.90it/s] 93it [00:20, 4.10it/s] 94it [00:20, 4.13it/s] 95it [00:20, 4.28it/s] 96it [00:21, 4.37it/s] 97it [00:21, 4.45it/s] 98it [00:21, 4.50it/s] 99it [00:21, 4.54it/s] 100it [00:21, 4.57it/s]2025-05-25 22:40:27,984 - INFO - [Epoch 096 | Batch 0100] IWAE-loss 1141.4642 | mean log_px -0.0031 | KL -935.62 + 101it [00:22, 4.59it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.60it/s] 104it [00:22, 4.62it/s] 105it [00:23, 4.63it/s] 106it [00:23, 4.63it/s] 107it [00:23, 4.64it/s] 108it [00:23, 4.64it/s] 109it [00:23, 4.65it/s] 110it [00:24, 4.63it/s] 111it [00:24, 4.64it/s] 112it [00:24, 4.61it/s] 113it [00:24, 4.63it/s] 114it [00:25, 4.51it/s] 115it [00:25, 4.55it/s] 116it [00:25, 4.57it/s] 117it [00:25, 4.58it/s] 118it [00:25, 4.61it/s] 119it [00:26, 4.45it/s] 120it [00:26, 4.49it/s] 121it [00:26, 4.53it/s] 122it [00:26, 4.57it/s] 123it [00:27, 4.59it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.62it/s] 127it [00:27, 4.49it/s] 128it [00:28, 4.54it/s] 129it [00:28, 4.58it/s] 130it [00:28, 4.58it/s] 131it [00:28, 4.60it/s] 132it [00:28, 4.56it/s] 133it [00:29, 4.61it/s] 134it [00:29, 4.57it/s] 135it [00:29, 4.59it/s] 136it [00:29, 4.61it/s] 137it [00:30, 4.61it/s] 138it [00:30, 4.61it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.61it/s] 141it [00:30, 4.53it/s] 142it [00:31, 4.57it/s] 143it [00:31, 4.59it/s] 144it [00:31, 4.60it/s] 145it [00:31, 4.62it/s] 146it [00:32, 4.62it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.62it/s] 150it [00:32, 4.64it/s]2025-05-25 22:40:38,868 - INFO - [Epoch 096 | Batch 0150] IWAE-loss 1193.1945 | mean log_px -0.0053 | KL -933.20 + 151it [00:33, 4.49it/s] 152it [00:33, 4.56it/s] 153it [00:33, 4.61it/s] 154it [00:33, 4.64it/s] 155it [00:33, 4.65it/s] 156it [00:34, 4.67it/s] 157it [00:34, 4.68it/s] 158it [00:34, 4.68it/s] 159it [00:34, 4.37it/s] 160it [00:35, 4.45it/s] 161it [00:35, 4.52it/s] 162it [00:35, 4.56it/s] 163it [00:35, 4.59it/s] 164it [00:35, 4.60it/s] 165it [00:36, 4.62it/s] 166it [00:36, 4.60it/s] 167it [00:36, 4.61it/s] 168it [00:36, 4.64it/s] 169it [00:37, 4.51it/s] 170it [00:37, 4.58it/s] 171it [00:37, 4.62it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.66it/s] 174it [00:38, 4.55it/s] 175it [00:38, 4.61it/s] 176it [00:38, 4.63it/s] 177it [00:38, 4.66it/s] 178it [00:38, 4.66it/s] 179it [00:39, 4.52it/s] 180it [00:39, 4.59it/s] 181it [00:39, 4.63it/s] 182it [00:39, 4.66it/s] 183it [00:40, 4.67it/s] 184it [00:40, 4.69it/s] 185it [00:40, 4.70it/s] 186it [00:40, 4.69it/s] 187it [00:40, 4.52it/s] 188it [00:41, 4.58it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.63it/s] 191it [00:41, 4.64it/s] 192it [00:42, 4.65it/s] 193it [00:42, 4.68it/s] 194it [00:42, 4.68it/s] 195it [00:42, 4.45it/s] 196it [00:42, 4.23it/s] 196it [00:43, 4.56it/s] +2025-05-25 22:40:48,842 - INFO - Epoch: 96, Objective: tensor([1514.7576], device='cuda:0', grad_fn=), Loss: 0.014402041211724281, KL/n: 19.02967071533203 + 0it [00:00, ?it/s]2025-05-25 22:40:49,237 - INFO - [Epoch 097 | Batch 0000] IWAE-loss 1021.1172 | mean log_px -0.0019 | KL -929.78 + 1it [00:00, 3.09it/s] 2it [00:00, 3.84it/s] 3it [00:00, 4.20it/s] 4it [00:00, 4.39it/s] 5it [00:01, 4.51it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.63it/s] 8it [00:01, 4.65it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.59it/s] 11it [00:02, 4.63it/s] 12it [00:02, 4.66it/s] 13it [00:02, 4.68it/s] 14it [00:03, 4.69it/s] 15it [00:03, 4.70it/s] 16it [00:03, 4.70it/s] 17it [00:03, 4.56it/s] 18it [00:03, 4.62it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.68it/s] 21it [00:04, 4.67it/s] 22it [00:04, 4.69it/s] 23it [00:05, 4.71it/s] 24it [00:05, 4.71it/s] 25it [00:05, 4.71it/s] 26it [00:05, 4.72it/s] 27it [00:05, 4.72it/s] 28it [00:06, 4.71it/s] 29it [00:06, 4.71it/s] 30it [00:06, 4.72it/s] 31it [00:06, 4.72it/s] 32it [00:06, 4.72it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.61it/s] 35it [00:07, 4.66it/s] 36it [00:07, 4.65it/s] 37it [00:08, 4.67it/s] 38it [00:08, 4.51it/s] 39it [00:08, 4.58it/s] 40it [00:08, 4.62it/s] 41it [00:08, 4.65it/s] 42it [00:09, 4.66it/s] 43it [00:09, 4.68it/s] 44it [00:09, 4.69it/s] 45it [00:09, 4.54it/s] 46it [00:09, 4.60it/s] 47it [00:10, 4.65it/s] 48it [00:10, 4.66it/s] 49it [00:10, 4.66it/s] 50it [00:10, 4.68it/s]2025-05-25 22:40:59,963 - INFO - [Epoch 097 | Batch 0050] IWAE-loss 1236.9264 | mean log_px -0.0168 | KL -931.44 + 51it [00:11, 4.69it/s] 52it [00:11, 4.69it/s] 53it [00:11, 4.70it/s] 54it [00:11, 4.71it/s] 55it [00:11, 4.72it/s] 56it [00:12, 4.71it/s] 57it [00:12, 4.54it/s] 58it [00:12, 4.59it/s] 59it [00:12, 4.63it/s] 60it [00:12, 4.62it/s] 61it [00:13, 4.55it/s] 62it [00:13, 4.61it/s] 63it [00:13, 4.65it/s] 64it [00:13, 4.67it/s] 65it [00:14, 4.68it/s] 66it [00:14, 4.69it/s] 67it [00:14, 4.70it/s] 68it [00:14, 4.71it/s] 69it [00:14, 4.71it/s] 70it [00:15, 4.71it/s] 71it [00:15, 4.71it/s] 72it [00:15, 4.70it/s] 73it [00:15, 4.55it/s] 74it [00:15, 4.61it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.48it/s] 77it [00:16, 4.56it/s] 78it [00:16, 4.60it/s] 79it [00:17, 4.64it/s] 80it [00:17, 4.66it/s] 81it [00:17, 4.68it/s] 82it [00:17, 4.53it/s] 83it [00:17, 4.60it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.66it/s] 86it [00:18, 4.68it/s] 87it [00:18, 4.70it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.65it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.68it/s] 92it [00:19, 4.69it/s] 93it [00:20, 4.71it/s] 94it [00:20, 4.71it/s] 95it [00:20, 4.71it/s] 96it [00:20, 4.72it/s] 97it [00:20, 4.72it/s] 98it [00:21, 4.72it/s] 99it [00:21, 4.72it/s] 100it [00:21, 4.72it/s]2025-05-25 22:41:10,696 - INFO - [Epoch 097 | Batch 0100] IWAE-loss 1532.8635 | mean log_px -0.0209 | KL -929.81 + 101it [00:21, 4.55it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.65it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.68it/s] 106it [00:22, 4.67it/s] 107it [00:23, 4.47it/s] 108it [00:23, 4.52it/s] 109it [00:23, 4.58it/s] 110it [00:23, 4.59it/s] 111it [00:23, 4.59it/s] 112it [00:24, 4.61it/s] 113it [00:24, 4.64it/s] 114it [00:24, 4.67it/s] 115it [00:24, 4.69it/s] 116it [00:25, 4.69it/s] 117it [00:25, 4.72it/s] 118it [00:25, 4.71it/s] 119it [00:25, 4.72it/s] 120it [00:25, 4.72it/s] 121it [00:26, 4.72it/s] 122it [00:26, 4.73it/s] 123it [00:26, 4.73it/s] 124it [00:26, 4.72it/s] 125it [00:26, 4.73it/s] 126it [00:27, 4.72it/s] 127it [00:27, 4.70it/s] 128it [00:27, 4.55it/s] 129it [00:27, 4.62it/s] 130it [00:28, 4.64it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.68it/s] 133it [00:28, 4.53it/s] 134it [00:28, 4.60it/s] 135it [00:29, 4.64it/s] 136it [00:29, 4.66it/s] 137it [00:29, 4.67it/s] 138it [00:29, 4.52it/s] 139it [00:29, 4.59it/s] 140it [00:30, 4.61it/s] 141it [00:30, 4.65it/s] 142it [00:30, 4.66it/s] 143it [00:30, 4.68it/s] 144it [00:31, 4.70it/s] 145it [00:31, 4.70it/s] 146it [00:31, 4.70it/s] 147it [00:31, 4.55it/s] 148it [00:31, 4.61it/s] 149it [00:32, 4.65it/s] 150it [00:32, 4.67it/s]2025-05-25 22:41:21,463 - INFO - [Epoch 097 | Batch 0150] IWAE-loss 995.0831 | mean log_px -0.0014 | KL -931.08 + 151it [00:32, 4.69it/s] 152it [00:32, 4.53it/s] 153it [00:32, 4.60it/s] 154it [00:33, 4.63it/s] 155it [00:33, 4.66it/s] 156it [00:33, 4.67it/s] 157it [00:33, 4.52it/s] 158it [00:34, 4.60it/s] 159it [00:34, 4.64it/s] 160it [00:34, 4.65it/s] 161it [00:34, 4.68it/s] 162it [00:34, 4.68it/s] 163it [00:35, 4.70it/s] 164it [00:35, 4.71it/s] 165it [00:35, 4.71it/s] 166it [00:35, 4.51it/s] 167it [00:36, 4.59it/s] 168it [00:36, 4.62it/s] 169it [00:36, 4.65it/s] 170it [00:36, 4.67it/s] 171it [00:36, 4.70it/s] 172it [00:37, 4.70it/s] 173it [00:37, 4.71it/s] 174it [00:37, 4.72it/s] 175it [00:37, 4.55it/s] 176it [00:37, 4.61it/s] 177it [00:38, 4.64it/s] 178it [00:38, 4.67it/s] 179it [00:38, 4.69it/s] 180it [00:38, 4.65it/s] 181it [00:39, 4.68it/s] 182it [00:39, 4.70it/s] 183it [00:39, 4.70it/s] 184it [00:39, 4.70it/s] 185it [00:39, 4.71it/s] 186it [00:40, 4.70it/s] 187it [00:40, 4.56it/s] 188it [00:40, 4.62it/s] 189it [00:40, 4.65it/s] 190it [00:40, 4.65it/s] 191it [00:41, 4.67it/s] 192it [00:41, 4.69it/s] 193it [00:41, 4.71it/s] 194it [00:41, 4.54it/s] 195it [00:42, 4.50it/s] 196it [00:42, 4.45it/s] 196it [00:42, 4.63it/s] +2025-05-25 22:41:31,305 - INFO - Epoch: 97, Objective: tensor([1209.1625], device='cuda:0', grad_fn=), Loss: 0.0060317241586744785, KL/n: 19.005821228027344 + 0it [00:00, ?it/s]2025-05-25 22:41:31,880 - INFO - [Epoch 098 | Batch 0000] IWAE-loss 1119.8661 | mean log_px -0.0051 | KL -930.75 + 1it [00:00, 3.08it/s] 2it [00:00, 3.73it/s] 3it [00:00, 4.11it/s] 4it [00:00, 4.32it/s] 5it [00:01, 4.13it/s] 6it [00:01, 4.19it/s] 7it [00:01, 4.22it/s] 8it [00:01, 4.33it/s] 9it [00:02, 4.33it/s] 10it [00:02, 4.35it/s] 11it [00:02, 4.32it/s] 12it [00:02, 4.32it/s] 13it [00:03, 4.17it/s] 14it [00:03, 4.26it/s] 15it [00:03, 4.29it/s] 16it [00:03, 4.37it/s] 17it [00:03, 4.48it/s] 18it [00:04, 4.50it/s] 19it [00:04, 4.56it/s] 20it [00:04, 4.46it/s] 21it [00:04, 4.41it/s] 22it [00:05, 4.25it/s] 23it [00:05, 4.31it/s] 24it [00:05, 4.27it/s] 25it [00:05, 4.32it/s] 26it [00:06, 4.40it/s] 27it [00:06, 4.49it/s] 28it [00:06, 4.30it/s] 29it [00:06, 4.42it/s] 30it [00:06, 4.38it/s] 31it [00:07, 4.47it/s] 32it [00:07, 4.41it/s] 33it [00:07, 4.49it/s] 34it [00:07, 4.54it/s] 35it [00:08, 4.59it/s] 36it [00:08, 4.52it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.46it/s] 39it [00:08, 4.44it/s] 40it [00:09, 4.27it/s] 41it [00:09, 4.40it/s] 42it [00:09, 4.39it/s] 43it [00:09, 4.39it/s] 44it [00:10, 4.46it/s] 45it [00:10, 4.53it/s] 46it [00:10, 4.42it/s] 47it [00:10, 4.40it/s] 48it [00:10, 4.44it/s] 49it [00:11, 4.40it/s] 50it [00:11, 4.34it/s]2025-05-25 22:41:43,252 - INFO - [Epoch 098 | Batch 0050] IWAE-loss 1496.3966 | mean log_px -0.0128 | KL -928.12 + 51it [00:11, 4.37it/s] 52it [00:11, 4.39it/s] 53it [00:12, 4.29it/s] 54it [00:12, 4.27it/s] 55it [00:12, 4.32it/s] 56it [00:12, 4.28it/s] 57it [00:13, 4.31it/s] 58it [00:13, 4.40it/s] 59it [00:13, 4.29it/s] 60it [00:13, 4.26it/s] 61it [00:14, 4.38it/s] 62it [00:14, 4.46it/s] 63it [00:14, 4.55it/s] 64it [00:14, 4.43it/s] 65it [00:14, 4.43it/s] 66it [00:15, 4.22it/s] 67it [00:15, 4.38it/s] 68it [00:15, 4.35it/s] 69it [00:15, 4.44it/s] 70it [00:16, 4.52it/s] 71it [00:16, 4.43it/s] 72it [00:16, 4.43it/s] 73it [00:16, 4.42it/s] 74it [00:16, 4.37it/s] 75it [00:17, 4.24it/s] 76it [00:17, 4.36it/s] 77it [00:17, 4.42it/s] 78it [00:17, 4.45it/s] 79it [00:18, 4.48it/s] 80it [00:18, 4.47it/s] 81it [00:18, 4.55it/s] 82it [00:18, 4.44it/s] 83it [00:18, 4.49it/s] 84it [00:19, 4.35it/s] 85it [00:19, 4.37it/s] 86it [00:19, 4.30it/s] 87it [00:19, 4.35it/s] 88it [00:20, 4.30it/s] 89it [00:20, 4.33it/s] 90it [00:20, 4.29it/s] 91it [00:20, 4.14it/s] 92it [00:21, 4.19it/s] 93it [00:21, 4.20it/s] 94it [00:21, 4.25it/s] 95it [00:21, 4.24it/s] 96it [00:22, 4.28it/s] 97it [00:22, 4.34it/s] 98it [00:22, 4.41it/s] 99it [00:22, 4.51it/s] 100it [00:22, 4.40it/s]2025-05-25 22:41:54,714 - INFO - [Epoch 098 | Batch 0100] IWAE-loss 1277.2687 | mean log_px -0.0050 | KL -925.47 + 101it [00:23, 4.25it/s] 102it [00:23, 4.33it/s] 103it [00:23, 4.43it/s] 104it [00:23, 4.49it/s] 105it [00:24, 4.55it/s] 106it [00:24, 4.49it/s] 107it [00:24, 4.55it/s] 108it [00:24, 4.50it/s] 109it [00:24, 4.49it/s] 110it [00:25, 4.26it/s] 111it [00:25, 4.36it/s] 112it [00:25, 4.46it/s] 113it [00:25, 4.40it/s] 114it [00:26, 4.37it/s] 115it [00:26, 4.46it/s] 116it [00:26, 4.42it/s] 117it [00:26, 4.49it/s] 118it [00:26, 4.51it/s] 119it [00:27, 4.31it/s] 120it [00:27, 4.41it/s] 121it [00:27, 4.45it/s] 122it [00:27, 4.50it/s] 123it [00:28, 4.51it/s] 124it [00:28, 4.45it/s] 125it [00:28, 4.46it/s] 126it [00:28, 4.53it/s] 127it [00:29, 4.45it/s] 128it [00:29, 4.24it/s] 129it [00:29, 4.30it/s] 130it [00:29, 4.33it/s] 131it [00:29, 4.34it/s] 132it [00:30, 4.31it/s] 133it [00:30, 4.27it/s] 134it [00:30, 4.37it/s] 135it [00:30, 4.47it/s] 136it [00:31, 4.34it/s] 137it [00:31, 4.32it/s] 138it [00:31, 4.29it/s] 139it [00:31, 4.33it/s] 140it [00:32, 4.29it/s] 141it [00:32, 4.34it/s] 142it [00:32, 4.25it/s] 143it [00:32, 4.37it/s] 144it [00:32, 4.40it/s] 145it [00:33, 4.37it/s] 146it [00:33, 4.31it/s] 147it [00:33, 4.35it/s] 148it [00:33, 4.42it/s] 149it [00:34, 4.36it/s] 150it [00:34, 4.44it/s]2025-05-25 22:42:06,080 - INFO - [Epoch 098 | Batch 0150] IWAE-loss 1349.3285 | mean log_px -0.0118 | KL -923.47 + 151it [00:34, 4.51it/s] 152it [00:34, 4.42it/s] 153it [00:34, 4.37it/s] 154it [00:35, 4.36it/s] 155it [00:35, 4.47it/s] 156it [00:35, 4.51it/s] 157it [00:35, 4.59it/s] 158it [00:36, 4.58it/s] 159it [00:36, 4.51it/s] 160it [00:36, 4.55it/s] 161it [00:36, 4.60it/s] 162it [00:36, 4.62it/s] 163it [00:37, 4.48it/s] 164it [00:37, 4.51it/s] 165it [00:37, 4.58it/s] 166it [00:37, 4.43it/s] 167it [00:38, 4.45it/s] 168it [00:38, 4.37it/s] 169it [00:38, 4.38it/s] 170it [00:38, 4.45it/s] 171it [00:38, 4.49it/s] 172it [00:39, 4.38it/s] 173it [00:39, 4.45it/s] 174it [00:39, 4.50it/s] 175it [00:39, 4.57it/s] 176it [00:40, 4.60it/s] 177it [00:40, 4.51it/s] 178it [00:40, 4.41it/s] 179it [00:40, 4.39it/s] 180it [00:41, 4.39it/s] 181it [00:41, 4.48it/s] 182it [00:41, 4.55it/s] 183it [00:41, 4.57it/s] 184it [00:41, 4.55it/s] 185it [00:42, 4.57it/s] 186it [00:42, 4.57it/s] 187it [00:42, 4.46it/s] 188it [00:42, 4.56it/s] 189it [00:42, 4.60it/s] 190it [00:43, 4.47it/s] 191it [00:43, 4.54it/s] 192it [00:43, 4.22it/s] 193it [00:43, 4.36it/s] 194it [00:44, 4.42it/s] 195it [00:44, 4.38it/s] 196it [00:44, 4.35it/s] 196it [00:44, 4.39it/s] +2025-05-25 22:42:16,277 - INFO - Epoch: 98, Objective: tensor([995.9705], device='cuda:0', grad_fn=), Loss: 0.005432826466858387, KL/n: 18.876163482666016 + 0it [00:00, ?it/s]2025-05-25 22:42:16,680 - INFO - [Epoch 099 | Batch 0000] IWAE-loss 1048.8071 | mean log_px -0.0020 | KL -923.30 + 1it [00:00, 2.99it/s] 2it [00:00, 3.84it/s] 3it [00:00, 3.84it/s] 4it [00:01, 4.13it/s] 5it [00:01, 4.33it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.48it/s] 8it [00:01, 4.42it/s] 9it [00:02, 4.37it/s] 10it [00:02, 4.24it/s] 11it [00:02, 4.36it/s] 12it [00:02, 4.31it/s] 13it [00:03, 4.33it/s] 14it [00:03, 4.32it/s] 15it [00:03, 4.29it/s] 16it [00:03, 4.29it/s] 17it [00:04, 4.28it/s] 18it [00:04, 4.28it/s] 19it [00:04, 4.32it/s] 20it [00:04, 4.27it/s] 21it [00:04, 4.30it/s] 22it [00:05, 4.33it/s] 23it [00:05, 4.44it/s] 24it [00:05, 4.45it/s] 25it [00:05, 4.50it/s] 26it [00:06, 4.43it/s] 27it [00:06, 4.39it/s] 28it [00:06, 4.40it/s] 29it [00:06, 4.46it/s] 30it [00:06, 4.41it/s] 31it [00:07, 4.27it/s] 32it [00:07, 4.34it/s] 33it [00:07, 4.33it/s] 34it [00:07, 4.42it/s] 35it [00:08, 4.47it/s] 36it [00:08, 4.21it/s] 37it [00:08, 4.30it/s] 38it [00:08, 4.34it/s] 39it [00:09, 4.31it/s] 40it [00:09, 4.33it/s] 41it [00:09, 4.35it/s] 42it [00:09, 4.37it/s] 43it [00:09, 4.23it/s] 44it [00:10, 4.29it/s] 45it [00:10, 4.29it/s] 46it [00:10, 4.33it/s] 47it [00:10, 4.31it/s] 48it [00:11, 4.20it/s] 49it [00:11, 4.27it/s] 50it [00:11, 4.30it/s]2025-05-25 22:42:28,194 - INFO - [Epoch 099 | Batch 0050] IWAE-loss 1050.6475 | mean log_px -0.0048 | KL -926.41 + 51it [00:11, 4.27it/s] 52it [00:12, 4.27it/s] 53it [00:12, 4.24it/s] 54it [00:12, 4.38it/s] 55it [00:12, 4.33it/s] 56it [00:12, 4.33it/s] 57it [00:13, 4.32it/s] 58it [00:13, 4.33it/s] 59it [00:13, 4.35it/s] 60it [00:13, 4.45it/s] 61it [00:14, 4.45it/s] 62it [00:14, 4.24it/s] 63it [00:14, 4.29it/s] 64it [00:15, 3.52it/s] 65it [00:15, 3.82it/s] 66it [00:15, 4.00it/s] 67it [00:15, 4.19it/s] 68it [00:15, 4.23it/s] 69it [00:16, 4.22it/s] 70it [00:16, 4.22it/s] 71it [00:16, 4.28it/s] 72it [00:16, 4.30it/s] 73it [00:17, 4.40it/s] 74it [00:17, 4.39it/s] 75it [00:17, 4.37it/s] 76it [00:17, 4.35it/s] 77it [00:17, 4.44it/s] 78it [00:18, 4.40it/s] 79it [00:18, 4.33it/s] 80it [00:18, 4.40it/s] 81it [00:18, 4.36it/s] 82it [00:19, 4.31it/s] 83it [00:19, 4.31it/s] 84it [00:19, 4.38it/s] 85it [00:19, 4.38it/s] 86it [00:20, 4.47it/s] 87it [00:20, 4.48it/s] 88it [00:20, 4.44it/s] 89it [00:20, 4.41it/s] 90it [00:20, 4.37it/s] 91it [00:21, 4.29it/s] 92it [00:21, 4.41it/s] 93it [00:21, 4.34it/s] 94it [00:21, 4.44it/s] 95it [00:22, 4.44it/s] 96it [00:22, 4.52it/s] 97it [00:22, 4.47it/s] 98it [00:22, 4.41it/s] 99it [00:22, 4.42it/s] 100it [00:23, 4.30it/s]2025-05-25 22:42:39,788 - INFO - [Epoch 099 | Batch 0100] IWAE-loss 1040.0406 | mean log_px -0.0042 | KL -928.02 + 101it [00:23, 4.26it/s] 102it [00:23, 4.32it/s] 103it [00:23, 4.32it/s] 104it [00:24, 4.36it/s] 105it [00:24, 4.34it/s] 106it [00:24, 4.19it/s] 107it [00:24, 4.33it/s] 108it [00:25, 4.35it/s] 109it [00:25, 4.47it/s] 110it [00:25, 4.53it/s] 111it [00:25, 4.37it/s] 112it [00:25, 4.32it/s] 113it [00:26, 4.36it/s] 114it [00:26, 4.30it/s] 115it [00:26, 4.36it/s] 116it [00:26, 4.31it/s] 117it [00:27, 4.31it/s] 118it [00:27, 4.27it/s] 119it [00:27, 4.30it/s] 120it [00:27, 4.28it/s] 121it [00:28, 4.26it/s] 122it [00:28, 4.26it/s] 123it [00:28, 4.31it/s] 124it [00:28, 4.30it/s] 125it [00:29, 4.17it/s] 126it [00:29, 4.24it/s] 127it [00:29, 4.35it/s] 128it [00:29, 4.44it/s] 129it [00:29, 4.52it/s] 130it [00:30, 4.42it/s] 131it [00:30, 4.36it/s] 132it [00:30, 4.23it/s] 133it [00:30, 4.36it/s] 134it [00:31, 4.31it/s] 135it [00:31, 4.43it/s] 136it [00:31, 4.45it/s] 137it [00:31, 4.51it/s] 138it [00:31, 4.49it/s] 139it [00:32, 4.36it/s] 140it [00:32, 4.35it/s] 141it [00:32, 4.47it/s] 142it [00:32, 4.53it/s] 143it [00:33, 4.44it/s] 144it [00:33, 4.45it/s] 145it [00:33, 4.52it/s] 146it [00:33, 4.41it/s] 147it [00:33, 4.42it/s] 148it [00:34, 4.41it/s] 149it [00:34, 4.39it/s] 150it [00:34, 4.42it/s]2025-05-25 22:42:51,228 - INFO - [Epoch 099 | Batch 0150] IWAE-loss 1044.7759 | mean log_px -0.0017 | KL -930.69 + 151it [00:34, 4.38it/s] 152it [00:35, 4.40it/s] 153it [00:35, 4.32it/s] 154it [00:35, 4.18it/s] 155it [00:35, 4.34it/s] 156it [00:36, 4.29it/s] 157it [00:36, 4.32it/s] 158it [00:36, 4.30it/s] 159it [00:36, 4.31it/s] 160it [00:36, 4.36it/s] 161it [00:37, 4.46it/s] 162it [00:37, 4.47it/s] 163it [00:37, 4.54it/s] 164it [00:37, 4.44it/s] 165it [00:38, 4.39it/s] 166it [00:38, 4.44it/s] 167it [00:38, 4.52it/s] 168it [00:38, 4.57it/s] 169it [00:38, 4.45it/s] 170it [00:39, 4.34it/s] 171it [00:39, 4.41it/s] 172it [00:39, 4.39it/s] 173it [00:39, 4.37it/s] 174it [00:40, 4.40it/s] 175it [00:40, 4.21it/s] 176it [00:40, 4.34it/s] 177it [00:40, 4.31it/s] 178it [00:41, 4.31it/s] 179it [00:41, 4.31it/s] 180it [00:41, 4.31it/s] 181it [00:41, 4.38it/s] 182it [00:41, 4.36it/s] 183it [00:42, 4.45it/s] 184it [00:42, 4.37it/s] 185it [00:42, 4.44it/s] 186it [00:42, 4.37it/s] 187it [00:43, 4.41it/s] 188it [00:43, 4.46it/s] 189it [00:43, 4.53it/s] 190it [00:43, 4.45it/s] 191it [00:43, 4.53it/s] 192it [00:44, 4.47it/s] 193it [00:44, 4.54it/s] 194it [00:44, 4.54it/s] 195it [00:44, 4.36it/s] 196it [00:45, 4.34it/s] 196it [00:45, 4.34it/s] +2025-05-25 22:43:01,607 - INFO - Epoch: 99, Objective: tensor([1112.6666], device='cuda:0', grad_fn=), Loss: 0.0035745336208492517, KL/n: 18.98943328857422 +2025-05-25 22:43:01,612 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 1it [00:00, 9.58it/s] 4it [00:00, 21.15it/s] 7it [00:00, 24.77it/s] 10it [00:00, 26.10it/s] 13it [00:00, 27.14it/s] 17it [00:00, 27.94it/s] 21it [00:00, 28.66it/s] 24it [00:00, 28.18it/s] 28it [00:01, 28.58it/s] 31it [00:01, 28.29it/s] 34it [00:01, 28.62it/s] 37it [00:01, 28.53it/s] 40it [00:01, 28.93it/s] 43it [00:01, 28.79it/s] 46it [00:01, 29.08it/s] 50it [00:01, 29.49it/s] 53it [00:01, 28.75it/s] 57it [00:02, 29.17it/s] 60it [00:02, 28.83it/s] 64it [00:02, 29.27it/s] 67it [00:02, 28.99it/s] 71it [00:02, 29.28it/s] 74it [00:02, 29.02it/s] 77it [00:02, 29.03it/s] 80it [00:02, 28.99it/s] 83it [00:02, 27.92it/s] 86it [00:03, 28.46it/s] 89it [00:03, 27.94it/s] 92it [00:03, 28.34it/s] 95it [00:03, 28.13it/s] 98it [00:03, 28.20it/s] 102it [00:03, 28.60it/s] 105it [00:03, 28.32it/s] 109it [00:03, 28.40it/s] 113it [00:04, 28.46it/s] 117it [00:04, 28.93it/s] 120it [00:04, 28.53it/s] 123it [00:04, 28.47it/s] 126it [00:04, 28.50it/s] 129it [00:04, 28.52it/s] 133it [00:04, 28.93it/s] 136it [00:04, 28.08it/s] 140it [00:04, 28.43it/s] 144it [00:05, 29.03it/s] 147it [00:05, 28.06it/s] 150it [00:05, 28.01it/s] 153it [00:05, 27.89it/s] 156it [00:05, 28.22it/s] 159it [00:05, 28.59it/s] 162it [00:05, 28.34it/s] 165it [00:05, 28.72it/s] 169it [00:05, 29.18it/s] 172it [00:06, 28.60it/s] 175it [00:06, 28.67it/s] 178it [00:06, 28.57it/s] 181it [00:06, 28.81it/s] 184it [00:06, 28.68it/s] 187it [00:06, 28.90it/s] 191it [00:06, 29.24it/s] 194it [00:06, 28.45it/s] 198it [00:06, 28.86it/s] 201it [00:07, 28.52it/s] 204it [00:07, 28.88it/s] 208it [00:07, 29.32it/s] 211it [00:07, 28.32it/s] 215it [00:07, 29.21it/s] 218it [00:07, 29.05it/s] 221it [00:07, 28.32it/s] 225it [00:07, 29.17it/s] 228it [00:08, 28.38it/s] 232it [00:08, 29.27it/s] 235it [00:08, 28.27it/s] 239it [00:08, 28.23it/s] 243it [00:08, 28.75it/s] 246it [00:08, 28.05it/s] 249it [00:08, 28.32it/s] 252it [00:08, 28.34it/s] 255it [00:08, 28.51it/s] 258it [00:09, 27.81it/s] 261it [00:09, 28.24it/s] 264it [00:09, 27.93it/s] 267it [00:09, 28.27it/s] 270it [00:09, 27.89it/s] 273it [00:09, 28.04it/s] 276it [00:09, 27.43it/s] 279it [00:09, 25.60it/s] 280it [00:09, 28.14it/s] +2025-05-25 22:43:11,726 - INFO - Epoch: 0, Objective: 0.012997487559914589, Loss: 0.004764337092638016, KL/n: 0.008233150467276573 + 0%| | 0/84 [00:00), Loss: 0.11140021681785583, KL/n: 71.59821319580078 + 0it [00:00, ?it/s]2025-05-25 22:55:42,997 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 11894.2480 | mean log_px -0.1369 | KL -3499.28 + 1it [00:00, 3.00it/s] 2it [00:00, 3.61it/s] 3it [00:00, 3.88it/s] 4it [00:01, 4.03it/s] 5it [00:01, 4.25it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.51it/s] 8it [00:01, 4.57it/s] 9it [00:02, 4.63it/s] 10it [00:02, 4.66it/s] 11it [00:02, 4.68it/s] 12it [00:02, 4.69it/s] 13it [00:02, 4.71it/s] 14it [00:03, 4.72it/s] 15it [00:03, 4.73it/s] 16it [00:03, 4.73it/s] 17it [00:03, 4.74it/s] 18it [00:04, 4.71it/s] 19it [00:04, 4.71it/s] 20it [00:04, 4.53it/s] 21it [00:04, 4.41it/s] 22it [00:04, 4.49it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.28it/s] 25it [00:05, 4.35it/s] 26it [00:05, 4.43it/s] 27it [00:06, 4.44it/s] 28it [00:06, 4.49it/s] 29it [00:06, 4.54it/s] 30it [00:06, 4.43it/s] 31it [00:06, 4.52it/s] 32it [00:07, 4.46it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.51it/s] 35it [00:07, 4.52it/s] 36it [00:08, 4.53it/s] 37it [00:08, 4.46it/s] 38it [00:08, 4.54it/s] 39it [00:08, 4.31it/s] 40it [00:08, 4.29it/s] 41it [00:09, 4.31it/s] 42it [00:09, 4.40it/s] 43it [00:09, 4.38it/s] 44it [00:09, 4.30it/s] 45it [00:10, 4.44it/s] 46it [00:10, 4.46it/s] 47it [00:10, 4.40it/s] 48it [00:10, 4.45it/s] 49it [00:11, 4.36it/s] 50it [00:11, 4.28it/s]2025-05-25 22:55:54,166 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 11227.0039 | mean log_px -0.1305 | KL -3490.07 + 51it [00:11, 4.22it/s] 52it [00:11, 4.23it/s] 53it [00:11, 4.36it/s] 54it [00:12, 4.43it/s] 55it [00:12, 4.41it/s] 56it [00:12, 4.36it/s] 57it [00:12, 4.33it/s] 58it [00:13, 4.13it/s] 59it [00:13, 4.17it/s] 60it [00:13, 4.24it/s] 61it [00:13, 4.34it/s] 62it [00:14, 4.36it/s] 63it [00:14, 4.13it/s] 64it [00:14, 4.31it/s] 65it [00:14, 4.26it/s] 66it [00:14, 4.39it/s] 67it [00:15, 4.38it/s] 68it [00:15, 4.44it/s] 69it [00:15, 4.38it/s] 70it [00:15, 4.37it/s] 71it [00:16, 4.33it/s] 72it [00:16, 4.46it/s] 73it [00:16, 4.41it/s] 74it [00:16, 4.46it/s] 75it [00:16, 4.55it/s] 76it [00:17, 4.60it/s] 77it [00:17, 4.61it/s] 78it [00:17, 4.54it/s] 79it [00:17, 4.43it/s] 80it [00:18, 4.51it/s] 81it [00:18, 4.40it/s] 82it [00:18, 4.34it/s] 83it [00:18, 4.46it/s] 84it [00:19, 4.52it/s] 85it [00:19, 4.41it/s] 86it [00:19, 4.48it/s] 87it [00:19, 4.43it/s] 88it [00:19, 4.48it/s] 89it [00:20, 4.52it/s] 90it [00:20, 4.46it/s] 91it [00:20, 4.25it/s] 92it [00:20, 4.38it/s] 93it [00:21, 4.33it/s] 94it [00:21, 4.35it/s] 95it [00:21, 4.30it/s] 96it [00:21, 4.40it/s] 97it [00:21, 4.34it/s] 98it [00:22, 4.43it/s] 99it [00:22, 4.37it/s] 100it [00:22, 4.30it/s]2025-05-25 22:56:05,578 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 8575.6543 | mean log_px -0.0730 | KL -3466.15 + 101it [00:22, 4.44it/s] 102it [00:23, 4.39it/s] 103it [00:23, 4.51it/s] 104it [00:23, 4.57it/s] 105it [00:23, 4.46it/s] 106it [00:24, 4.44it/s] 107it [00:24, 4.49it/s] 108it [00:24, 4.56it/s] 109it [00:24, 4.33it/s] 110it [00:24, 4.23it/s] 111it [00:25, 4.38it/s] 112it [00:25, 4.46it/s] 113it [00:25, 4.42it/s] 114it [00:25, 4.19it/s] 115it [00:26, 4.31it/s] 116it [00:26, 4.27it/s] 117it [00:26, 4.30it/s] 118it [00:26, 4.25it/s] 119it [00:26, 4.39it/s] 120it [00:27, 4.33it/s] 121it [00:27, 4.42it/s] 122it [00:27, 4.50it/s] 123it [00:27, 4.34it/s] 124it [00:28, 4.40it/s] 125it [00:28, 4.50it/s] 126it [00:28, 4.53it/s] 127it [00:28, 4.47it/s] 128it [00:29, 4.37it/s] 129it [00:29, 4.33it/s] 130it [00:29, 4.32it/s] 131it [00:29, 4.45it/s] 132it [00:29, 4.52it/s] 133it [00:30, 4.45it/s] 134it [00:30, 4.36it/s] 135it [00:30, 4.32it/s] 136it [00:30, 4.42it/s] 137it [00:31, 4.51it/s] 138it [00:31, 4.56it/s] 139it [00:31, 4.43it/s] 140it [00:31, 4.22it/s] 141it [00:31, 4.33it/s] 142it [00:32, 4.32it/s] 143it [00:32, 4.27it/s] 144it [00:32, 4.23it/s] 145it [00:32, 4.37it/s] 146it [00:33, 4.38it/s] 147it [00:33, 4.38it/s] 148it [00:33, 4.35it/s] 149it [00:33, 4.45it/s] 150it [00:34, 4.38it/s]2025-05-25 22:56:16,975 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 10918.8730 | mean log_px -0.1088 | KL -3451.89 + 151it [00:34, 4.26it/s] 152it [00:34, 4.22it/s] 153it [00:34, 4.25it/s] 154it [00:35, 4.24it/s] 155it [00:35, 4.22it/s] 156it [00:35, 4.36it/s] 157it [00:35, 4.44it/s] 158it [00:35, 4.52it/s] 159it [00:36, 4.48it/s] 160it [00:36, 4.53it/s] 161it [00:36, 4.59it/s] 162it [00:36, 4.45it/s] 163it [00:37, 4.53it/s] 164it [00:37, 4.55it/s] 165it [00:37, 4.61it/s] 166it [00:37, 4.64it/s] 167it [00:37, 4.64it/s] 168it [00:38, 4.47it/s] 169it [00:38, 4.41it/s] 170it [00:38, 4.37it/s] 171it [00:38, 4.45it/s] 172it [00:38, 4.53it/s] 173it [00:39, 4.43it/s] 174it [00:39, 4.52it/s] 175it [00:39, 4.42it/s] 176it [00:39, 4.50it/s] 177it [00:40, 4.37it/s] 178it [00:40, 4.30it/s] 179it [00:40, 4.28it/s] 180it [00:40, 4.37it/s] 181it [00:41, 4.36it/s] 182it [00:41, 4.44it/s] 183it [00:41, 4.52it/s] 184it [00:41, 4.15it/s] 185it [00:42, 4.13it/s] 186it [00:42, 4.22it/s] 187it [00:42, 4.24it/s] 188it [00:42, 4.13it/s] 189it [00:42, 4.25it/s] 190it [00:43, 4.38it/s] 191it [00:43, 4.45it/s] 192it [00:43, 4.53it/s] 193it [00:43, 4.58it/s] 194it [00:44, 4.62it/s] 195it [00:44, 4.58it/s] 196it [00:44, 4.62it/s] 196it [00:44, 4.40it/s] +2025-05-25 22:56:27,263 - INFO - Epoch: 1, Objective: tensor([9172.7520], device='cuda:0', grad_fn=), Loss: 0.07874009013175964, KL/n: 70.15756225585938 + 0it [00:00, ?it/s]2025-05-25 22:56:27,802 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 7225.7852 | mean log_px -0.0616 | KL -3439.12 + 1it [00:00, 3.12it/s] 2it [00:00, 3.89it/s] 3it [00:00, 4.25it/s] 4it [00:00, 4.42it/s] 5it [00:01, 4.52it/s] 6it [00:01, 4.40it/s] 7it [00:01, 4.51it/s] 8it [00:01, 4.57it/s] 9it [00:02, 4.63it/s] 10it [00:02, 4.66it/s] 11it [00:02, 4.55it/s] 12it [00:02, 4.49it/s] 13it [00:02, 4.58it/s] 14it [00:03, 4.61it/s] 15it [00:03, 4.65it/s] 16it [00:03, 4.66it/s] 17it [00:03, 4.52it/s] 18it [00:04, 4.57it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.65it/s] 21it [00:04, 4.68it/s] 22it [00:04, 4.63it/s] 23it [00:05, 4.66it/s] 24it [00:05, 4.69it/s] 25it [00:05, 4.70it/s] 26it [00:05, 4.68it/s] 27it [00:05, 4.72it/s] 28it [00:06, 4.71it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.67it/s] 32it [00:06, 4.68it/s] 33it [00:07, 4.70it/s] 34it [00:07, 4.71it/s] 35it [00:07, 4.72it/s] 36it [00:07, 4.55it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.67it/s] 40it [00:08, 4.68it/s] 41it [00:08, 4.56it/s] 42it [00:09, 4.62it/s] 43it [00:09, 4.65it/s] 44it [00:09, 4.65it/s] 45it [00:09, 4.67it/s] 46it [00:10, 4.68it/s] 47it [00:10, 4.70it/s] 48it [00:10, 4.70it/s] 49it [00:10, 4.54it/s] 50it [00:10, 4.59it/s]2025-05-25 22:56:38,602 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 7740.6035 | mean log_px -0.0618 | KL -3413.71 + 51it [00:11, 4.61it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.66it/s] 54it [00:11, 4.63it/s] 55it [00:11, 4.65it/s] 56it [00:12, 4.67it/s] 57it [00:12, 4.69it/s] 58it [00:12, 4.53it/s] 59it [00:12, 4.60it/s] 60it [00:13, 4.64it/s] 61it [00:13, 4.67it/s] 62it [00:13, 4.68it/s] 63it [00:13, 4.53it/s] 64it [00:13, 4.59it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.63it/s] 68it [00:14, 4.62it/s] 69it [00:14, 4.59it/s] 70it [00:15, 4.60it/s] 71it [00:15, 4.60it/s] 72it [00:15, 4.59it/s] 73it [00:15, 4.47it/s] 74it [00:16, 4.55it/s] 75it [00:16, 4.55it/s] 76it [00:16, 4.59it/s] 77it [00:16, 4.63it/s] 78it [00:16, 4.65it/s] 79it [00:17, 4.55it/s] 80it [00:17, 4.61it/s] 81it [00:17, 4.65it/s] 82it [00:17, 4.67it/s] 83it [00:18, 4.69it/s] 84it [00:18, 4.69it/s] 85it [00:18, 4.71it/s] 86it [00:18, 4.54it/s] 87it [00:18, 4.58it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.52it/s] 92it [00:19, 4.59it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.66it/s] 95it [00:20, 4.68it/s] 96it [00:20, 4.69it/s] 97it [00:21, 4.71it/s] 98it [00:21, 4.71it/s] 99it [00:21, 4.72it/s] 100it [00:21, 4.71it/s]2025-05-25 22:56:49,398 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 10890.5635 | mean log_px -0.1134 | KL -3399.14 + 101it [00:21, 4.55it/s] 102it [00:22, 4.57it/s] 103it [00:22, 4.61it/s] 104it [00:22, 4.64it/s] 105it [00:22, 4.67it/s] 106it [00:23, 4.51it/s] 107it [00:23, 4.59it/s] 108it [00:23, 4.63it/s] 109it [00:23, 4.66it/s] 110it [00:23, 4.67it/s] 111it [00:24, 4.69it/s] 112it [00:24, 4.53it/s] 113it [00:24, 4.59it/s] 114it [00:24, 4.63it/s] 115it [00:24, 4.65it/s] 116it [00:25, 4.66it/s] 117it [00:25, 4.51it/s] 118it [00:25, 4.57it/s] 119it [00:25, 4.60it/s] 120it [00:26, 4.63it/s] 121it [00:26, 4.66it/s] 122it [00:26, 4.68it/s] 123it [00:26, 4.69it/s] 124it [00:26, 4.70it/s] 125it [00:27, 4.71it/s] 126it [00:27, 4.71it/s] 127it [00:27, 4.53it/s] 128it [00:27, 4.59it/s] 129it [00:27, 4.63it/s] 130it [00:28, 4.66it/s] 131it [00:28, 4.57it/s] 132it [00:28, 4.55it/s] 133it [00:28, 4.57it/s] 134it [00:29, 4.59it/s] 135it [00:29, 4.41it/s] 136it [00:29, 4.46it/s] 137it [00:29, 4.53it/s] 138it [00:29, 4.57it/s] 139it [00:30, 4.61it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.65it/s] 142it [00:30, 4.66it/s] 143it [00:31, 4.68it/s] 144it [00:31, 4.69it/s] 145it [00:31, 4.70it/s] 146it [00:31, 4.70it/s] 147it [00:31, 4.54it/s] 148it [00:32, 4.59it/s] 149it [00:32, 4.62it/s] 150it [00:32, 4.64it/s]2025-05-25 22:57:00,247 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 6388.3467 | mean log_px -0.0455 | KL -3380.82 + 151it [00:32, 4.64it/s] 152it [00:32, 4.65it/s] 153it [00:33, 4.50it/s] 154it [00:33, 4.56it/s] 155it [00:33, 4.59it/s] 156it [00:33, 4.61it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.64it/s] 159it [00:34, 4.65it/s] 160it [00:34, 4.67it/s] 161it [00:34, 4.68it/s] 162it [00:35, 4.65it/s] 163it [00:35, 4.66it/s] 164it [00:35, 4.64it/s] 165it [00:35, 4.47it/s] 166it [00:36, 4.44it/s] 167it [00:36, 4.48it/s] 168it [00:36, 4.51it/s] 169it [00:36, 4.49it/s] 170it [00:36, 4.55it/s] 171it [00:37, 4.57it/s] 172it [00:37, 4.61it/s] 173it [00:37, 4.64it/s] 174it [00:37, 4.66it/s] 175it [00:37, 4.68it/s] 176it [00:38, 4.68it/s] 177it [00:38, 4.53it/s] 178it [00:38, 4.59it/s] 179it [00:38, 4.63it/s] 180it [00:39, 4.60it/s] 181it [00:39, 4.63it/s] 182it [00:39, 4.65it/s] 183it [00:39, 4.67it/s] 184it [00:39, 4.52it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.60it/s] 187it [00:40, 4.63it/s] 188it [00:40, 4.65it/s] 189it [00:40, 4.65it/s] 190it [00:41, 4.67it/s] 191it [00:41, 4.69it/s] 192it [00:41, 4.69it/s] 193it [00:41, 4.53it/s] 194it [00:42, 4.59it/s] 195it [00:42, 4.41it/s] 196it [00:42, 4.35it/s] 196it [00:42, 4.60it/s] +2025-05-25 22:57:10,208 - INFO - Epoch: 2, Objective: tensor([7126.1548], device='cuda:0', grad_fn=), Loss: 0.05375305190682411, KL/n: 68.71427154541016 + 0it [00:00, ?it/s]2025-05-25 22:57:10,586 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 6548.8511 | mean log_px -0.0590 | KL -3364.44 + 1it [00:00, 3.27it/s] 2it [00:00, 3.98it/s] 3it [00:00, 4.28it/s] 4it [00:00, 4.42it/s] 5it [00:01, 4.52it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.61it/s] 8it [00:01, 4.47it/s] 9it [00:02, 4.55it/s] 10it [00:02, 4.58it/s] 11it [00:02, 4.60it/s] 12it [00:02, 4.62it/s] 13it [00:02, 4.65it/s] 14it [00:03, 4.49it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.60it/s] 17it [00:03, 4.62it/s] 18it [00:03, 4.62it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.48it/s] 22it [00:04, 4.55it/s] 23it [00:05, 4.59it/s] 24it [00:05, 4.62it/s] 25it [00:05, 4.64it/s] 26it [00:05, 4.64it/s] 27it [00:05, 4.66it/s] 28it [00:06, 4.66it/s] 29it [00:06, 4.67it/s] 30it [00:06, 4.67it/s] 31it [00:06, 4.68it/s] 32it [00:07, 4.52it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.61it/s] 35it [00:07, 4.59it/s] 36it [00:07, 4.62it/s] 37it [00:08, 4.65it/s] 38it [00:08, 4.60it/s] 39it [00:08, 4.64it/s] 40it [00:08, 4.65it/s] 41it [00:08, 4.66it/s] 42it [00:09, 4.56it/s] 43it [00:09, 4.61it/s] 44it [00:09, 4.41it/s] 45it [00:09, 4.38it/s] 46it [00:10, 4.47it/s] 47it [00:10, 4.54it/s] 48it [00:10, 4.52it/s] 49it [00:10, 4.55it/s] 50it [00:10, 4.57it/s]2025-05-25 22:57:21,463 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 6395.8638 | mean log_px -0.0435 | KL -3348.27 + 51it [00:11, 4.42it/s] 52it [00:11, 4.50it/s] 53it [00:11, 4.54it/s] 54it [00:11, 4.56it/s] 55it [00:12, 4.57it/s] 56it [00:12, 4.58it/s] 57it [00:12, 4.60it/s] 58it [00:12, 4.60it/s] 59it [00:12, 4.44it/s] 60it [00:13, 4.44it/s] 61it [00:13, 4.50it/s] 62it [00:13, 4.54it/s] 63it [00:13, 4.57it/s] 64it [00:14, 3.69it/s] 65it [00:14, 3.93it/s] 66it [00:14, 4.11it/s] 67it [00:14, 4.13it/s] 68it [00:15, 4.28it/s] 69it [00:15, 4.37it/s] 70it [00:15, 4.43it/s] 71it [00:15, 4.48it/s] 72it [00:15, 4.51it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.53it/s] 75it [00:16, 4.56it/s] 76it [00:16, 4.54it/s] 77it [00:17, 4.35it/s] 78it [00:17, 4.42it/s] 79it [00:17, 4.47it/s] 80it [00:17, 4.34it/s] 81it [00:18, 4.43it/s] 82it [00:18, 4.43it/s] 83it [00:18, 4.51it/s] 84it [00:18, 4.51it/s] 85it [00:18, 4.54it/s] 86it [00:19, 4.52it/s] 87it [00:19, 4.54it/s] 88it [00:19, 4.55it/s] 89it [00:19, 4.56it/s] 90it [00:19, 4.57it/s] 91it [00:20, 4.56it/s] 92it [00:20, 4.55it/s] 93it [00:20, 4.56it/s] 94it [00:20, 4.57it/s] 95it [00:21, 4.57it/s] 96it [00:21, 4.57it/s] 97it [00:21, 4.58it/s] 98it [00:21, 4.58it/s] 99it [00:21, 4.59it/s] 100it [00:22, 4.59it/s]2025-05-25 22:57:32,669 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 6408.8643 | mean log_px -0.0460 | KL -3327.64 + 101it [00:22, 4.45it/s] 102it [00:22, 4.50it/s] 103it [00:22, 4.54it/s] 104it [00:23, 4.56it/s] 105it [00:23, 4.57it/s] 106it [00:23, 4.56it/s] 107it [00:23, 4.58it/s] 108it [00:23, 4.59it/s] 109it [00:24, 4.44it/s] 110it [00:24, 4.45it/s] 111it [00:24, 4.50it/s] 112it [00:24, 4.52it/s] 113it [00:25, 4.54it/s] 114it [00:25, 4.55it/s] 115it [00:25, 4.41it/s] 116it [00:25, 4.47it/s] 117it [00:25, 4.47it/s] 118it [00:26, 4.51it/s] 119it [00:26, 4.53it/s] 120it [00:26, 4.54it/s] 121it [00:26, 4.57it/s] 122it [00:27, 4.57it/s] 123it [00:27, 4.59it/s] 124it [00:27, 4.59it/s] 125it [00:27, 4.50it/s] 126it [00:27, 4.54it/s] 127it [00:28, 4.56it/s] 128it [00:28, 4.57it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.59it/s] 131it [00:29, 4.41it/s] 132it [00:29, 4.49it/s] 133it [00:29, 4.38it/s] 134it [00:29, 4.43it/s] 135it [00:29, 4.49it/s] 136it [00:30, 4.53it/s] 137it [00:30, 4.40it/s] 138it [00:30, 4.43it/s] 139it [00:30, 4.44it/s] 140it [00:31, 4.49it/s] 141it [00:31, 4.53it/s] 142it [00:31, 4.55it/s] 143it [00:31, 4.53it/s] 144it [00:31, 4.55it/s] 145it [00:32, 4.56it/s] 146it [00:32, 4.44it/s] 147it [00:32, 4.49it/s] 148it [00:32, 4.53it/s] 149it [00:33, 4.53it/s] 150it [00:33, 4.55it/s]2025-05-25 22:57:43,753 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 6867.9688 | mean log_px -0.0538 | KL -3303.91 + 151it [00:33, 4.56it/s] 152it [00:33, 4.54it/s] 153it [00:33, 4.57it/s] 154it [00:34, 4.57it/s] 155it [00:34, 4.59it/s] 156it [00:34, 4.59it/s] 157it [00:34, 4.61it/s] 158it [00:34, 4.60it/s] 159it [00:35, 4.61it/s] 160it [00:35, 4.61it/s] 161it [00:35, 4.61it/s] 162it [00:35, 4.61it/s] 163it [00:36, 4.61it/s] 164it [00:36, 4.60it/s] 165it [00:36, 4.62it/s] 166it [00:36, 4.61it/s] 167it [00:36, 4.62it/s] 168it [00:37, 4.61it/s] 169it [00:37, 4.61it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.61it/s] 172it [00:38, 4.61it/s] 173it [00:38, 4.61it/s] 174it [00:38, 4.61it/s] 175it [00:38, 4.62it/s] 176it [00:38, 4.61it/s] 177it [00:39, 4.60it/s] 178it [00:39, 4.60it/s] 179it [00:39, 4.61it/s] 180it [00:39, 4.61it/s] 181it [00:39, 4.62it/s] 182it [00:40, 4.62it/s] 183it [00:40, 4.62it/s] 184it [00:40, 4.61it/s] 185it [00:40, 4.61it/s] 186it [00:41, 4.60it/s] 187it [00:41, 4.60it/s] 188it [00:41, 4.60it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.61it/s] 191it [00:42, 4.59it/s] 192it [00:42, 4.60it/s] 193it [00:42, 4.60it/s] 194it [00:42, 4.60it/s] 195it [00:43, 4.38it/s] 196it [00:43, 4.34it/s] 196it [00:43, 4.52it/s] +2025-05-25 22:57:53,713 - INFO - Epoch: 3, Objective: tensor([5746.6787], device='cuda:0', grad_fn=), Loss: 0.046654097735881805, KL/n: 67.17630004882812 + 0it [00:00, ?it/s]2025-05-25 22:57:54,098 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 5883.0645 | mean log_px -0.0408 | KL -3290.14 + 1it [00:00, 2.91it/s] 2it [00:00, 3.70it/s] 3it [00:00, 4.08it/s] 4it [00:00, 4.29it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.47it/s] 7it [00:01, 4.53it/s] 8it [00:01, 4.55it/s] 9it [00:02, 4.42it/s] 10it [00:02, 4.39it/s] 11it [00:02, 4.45it/s] 12it [00:02, 4.39it/s] 13it [00:03, 4.40it/s] 14it [00:03, 4.43it/s] 15it [00:03, 4.40it/s] 16it [00:03, 4.27it/s] 17it [00:03, 4.29it/s] 18it [00:04, 4.37it/s] 19it [00:04, 4.30it/s] 20it [00:04, 4.19it/s] 21it [00:04, 4.23it/s] 22it [00:05, 4.28it/s] 23it [00:05, 4.35it/s] 24it [00:05, 4.28it/s] 25it [00:05, 4.18it/s] 26it [00:06, 4.27it/s] 27it [00:06, 4.36it/s] 28it [00:06, 4.43it/s] 29it [00:06, 4.49it/s] 30it [00:06, 4.36it/s] 31it [00:07, 4.35it/s] 32it [00:07, 4.14it/s] 33it [00:07, 4.16it/s] 34it [00:07, 4.14it/s] 35it [00:08, 4.21it/s] 36it [00:08, 4.32it/s] 37it [00:08, 4.25it/s] 38it [00:08, 4.34it/s] 39it [00:09, 4.15it/s] 40it [00:09, 4.12it/s] 41it [00:09, 4.17it/s] 42it [00:09, 4.29it/s] 43it [00:10, 4.20it/s] 44it [00:10, 4.31it/s] 45it [00:10, 4.37it/s] 46it [00:10, 4.44it/s] 47it [00:10, 4.30it/s] 48it [00:11, 4.41it/s] 49it [00:11, 4.47it/s] 50it [00:11, 4.51it/s]2025-05-25 22:58:05,604 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 4895.3418 | mean log_px -0.0286 | KL -3262.91 + 51it [00:11, 4.55it/s] 52it [00:12, 4.39it/s] 53it [00:12, 4.44it/s] 54it [00:12, 4.47it/s] 55it [00:12, 4.52it/s] 56it [00:12, 4.48it/s] 57it [00:13, 4.49it/s] 58it [00:13, 4.53it/s] 59it [00:13, 4.57it/s] 60it [00:13, 4.38it/s] 61it [00:14, 4.46it/s] 62it [00:14, 4.50it/s] 63it [00:14, 4.51it/s] 64it [00:14, 4.34it/s] 65it [00:14, 4.39it/s] 66it [00:15, 4.27it/s] 67it [00:15, 4.36it/s] 68it [00:15, 4.43it/s] 69it [00:15, 4.48it/s] 70it [00:16, 4.40it/s] 71it [00:16, 4.47it/s] 72it [00:16, 4.23it/s] 73it [00:16, 4.34it/s] 74it [00:17, 4.25it/s] 75it [00:17, 4.34it/s] 76it [00:17, 4.40it/s] 77it [00:17, 4.40it/s] 78it [00:17, 4.27it/s] 79it [00:18, 4.21it/s] 80it [00:18, 4.25it/s] 81it [00:18, 4.35it/s] 82it [00:18, 4.41it/s] 83it [00:19, 4.40it/s] 84it [00:19, 4.29it/s] 85it [00:19, 4.25it/s] 86it [00:19, 4.19it/s] 87it [00:20, 4.31it/s] 88it [00:20, 4.17it/s] 89it [00:20, 4.25it/s] 90it [00:20, 4.32it/s] 91it [00:20, 4.41it/s] 92it [00:21, 4.13it/s] 93it [00:21, 4.13it/s] 94it [00:21, 4.24it/s] 95it [00:21, 4.35it/s] 96it [00:22, 4.37it/s] 97it [00:22, 4.26it/s] 98it [00:22, 4.32it/s] 99it [00:22, 4.39it/s] 100it [00:23, 4.43it/s]2025-05-25 22:58:17,084 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 5435.9736 | mean log_px -0.0313 | KL -3245.03 + 101it [00:23, 4.49it/s] 102it [00:23, 4.50it/s] 103it [00:23, 4.44it/s] 104it [00:24, 4.30it/s] 105it [00:24, 4.29it/s] 106it [00:24, 4.22it/s] 107it [00:24, 4.32it/s] 108it [00:24, 4.35it/s] 109it [00:25, 4.42it/s] 110it [00:25, 4.40it/s] 111it [00:25, 4.30it/s] 112it [00:25, 4.31it/s] 113it [00:26, 4.26it/s] 114it [00:26, 4.20it/s] 115it [00:26, 4.17it/s] 116it [00:26, 4.14it/s] 117it [00:27, 4.23it/s] 118it [00:27, 4.15it/s] 119it [00:27, 4.28it/s] 120it [00:27, 4.20it/s] 121it [00:27, 4.32it/s] 122it [00:28, 4.40it/s] 123it [00:28, 4.45it/s] 124it [00:28, 4.48it/s] 125it [00:28, 4.51it/s] 126it [00:29, 4.38it/s] 127it [00:29, 4.43it/s] 128it [00:29, 4.47it/s] 129it [00:29, 4.48it/s] 130it [00:30, 4.33it/s] 131it [00:30, 4.28it/s] 132it [00:30, 4.35it/s] 133it [00:30, 4.41it/s] 134it [00:30, 4.45it/s] 135it [00:31, 4.48it/s] 136it [00:31, 4.49it/s] 137it [00:31, 4.51it/s] 138it [00:31, 4.52it/s] 139it [00:32, 4.35it/s] 140it [00:32, 4.40it/s] 141it [00:32, 4.45it/s] 142it [00:32, 4.48it/s] 143it [00:32, 4.50it/s] 144it [00:33, 4.51it/s] 145it [00:33, 4.39it/s] 146it [00:33, 4.43it/s] 147it [00:33, 4.47it/s] 148it [00:34, 4.50it/s] 149it [00:34, 4.52it/s] 150it [00:34, 4.54it/s]2025-05-25 22:58:28,494 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 4805.7720 | mean log_px -0.0276 | KL -3228.11 + 151it [00:34, 4.47it/s] 152it [00:34, 4.49it/s] 153it [00:35, 4.51it/s] 154it [00:35, 4.51it/s] 155it [00:35, 4.48it/s] 156it [00:35, 4.41it/s] 157it [00:36, 4.40it/s] 158it [00:36, 4.26it/s] 159it [00:36, 4.26it/s] 160it [00:36, 4.25it/s] 161it [00:37, 4.18it/s] 162it [00:37, 4.11it/s] 163it [00:37, 4.21it/s] 164it [00:37, 4.14it/s] 165it [00:37, 4.25it/s] 166it [00:38, 4.32it/s] 167it [00:38, 4.39it/s] 168it [00:38, 4.45it/s] 169it [00:38, 4.49it/s] 170it [00:39, 4.52it/s] 171it [00:39, 4.48it/s] 172it [00:39, 4.46it/s] 173it [00:39, 4.51it/s] 174it [00:39, 4.54it/s] 175it [00:40, 4.55it/s] 176it [00:40, 4.55it/s] 177it [00:40, 4.52it/s] 178it [00:40, 4.52it/s] 179it [00:41, 4.54it/s] 180it [00:41, 4.36it/s] 181it [00:41, 4.35it/s] 182it [00:41, 4.40it/s] 183it [00:41, 4.45it/s] 184it [00:42, 4.47it/s] 185it [00:42, 4.50it/s] 186it [00:42, 4.52it/s] 187it [00:42, 4.54it/s] 188it [00:43, 4.37it/s] 189it [00:43, 4.39it/s] 190it [00:43, 4.21it/s] 191it [00:43, 4.32it/s] 192it [00:44, 4.39it/s] 193it [00:44, 4.42it/s] 194it [00:44, 4.28it/s] 195it [00:44, 4.25it/s] 196it [00:44, 4.36it/s] 196it [00:45, 4.35it/s] +2025-05-25 22:58:38,875 - INFO - Epoch: 4, Objective: tensor([5635.8784], device='cuda:0', grad_fn=), Loss: 0.03690037503838539, KL/n: 65.52703094482422 + 0it [00:00, ?it/s]2025-05-25 22:58:39,449 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 6954.7480 | mean log_px -0.0605 | KL -3211.71 + 1it [00:00, 3.02it/s] 2it [00:00, 3.72it/s] 3it [00:00, 4.06it/s] 4it [00:01, 4.16it/s] 5it [00:01, 4.31it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.44it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.43it/s] 11it [00:02, 4.40it/s] 12it [00:02, 4.25it/s] 13it [00:03, 4.33it/s] 14it [00:03, 4.39it/s] 15it [00:03, 4.35it/s] 16it [00:03, 4.43it/s] 17it [00:03, 4.49it/s] 18it [00:04, 4.50it/s] 19it [00:04, 4.51it/s] 20it [00:04, 4.36it/s] 21it [00:04, 4.43it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.27it/s] 24it [00:05, 4.21it/s] 25it [00:05, 4.16it/s] 26it [00:06, 4.28it/s] 27it [00:06, 4.20it/s] 28it [00:06, 4.20it/s] 29it [00:06, 4.24it/s] 30it [00:06, 4.33it/s] 31it [00:07, 4.39it/s] 32it [00:07, 4.42it/s] 33it [00:07, 4.47it/s] 34it [00:07, 4.50it/s] 35it [00:08, 4.51it/s] 36it [00:08, 4.31it/s] 37it [00:08, 4.04it/s] 38it [00:08, 4.07it/s] 39it [00:09, 4.10it/s] 40it [00:09, 4.22it/s] 41it [00:09, 4.31it/s] 42it [00:09, 4.29it/s] 43it [00:09, 4.32it/s] 44it [00:10, 4.28it/s] 45it [00:10, 4.24it/s] 46it [00:10, 4.23it/s] 47it [00:10, 4.07it/s] 48it [00:11, 4.15it/s] 49it [00:11, 4.13it/s] 50it [00:11, 4.10it/s]2025-05-25 22:58:51,054 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 6567.6064 | mean log_px -0.0585 | KL -3187.38 + 51it [00:11, 4.13it/s] 52it [00:12, 4.16it/s] 53it [00:12, 3.93it/s] 54it [00:12, 3.98it/s] 55it [00:12, 3.98it/s] 56it [00:13, 4.04it/s] 57it [00:13, 4.14it/s] 58it [00:13, 4.11it/s] 59it [00:13, 4.15it/s] 60it [00:14, 4.15it/s] 61it [00:14, 4.02it/s] 62it [00:14, 4.08it/s] 63it [00:14, 4.16it/s] 64it [00:15, 4.15it/s] 65it [00:15, 4.20it/s] 66it [00:15, 4.17it/s] 67it [00:15, 4.28it/s] 68it [00:16, 4.30it/s] 69it [00:16, 4.27it/s] 70it [00:16, 4.20it/s] 71it [00:16, 4.10it/s] 72it [00:17, 4.12it/s] 73it [00:17, 4.24it/s] 74it [00:17, 4.18it/s] 75it [00:17, 4.15it/s] 76it [00:17, 4.15it/s] 77it [00:18, 4.18it/s] 78it [00:18, 4.08it/s] 79it [00:18, 4.10it/s] 80it [00:18, 4.04it/s] 81it [00:19, 4.11it/s] 82it [00:19, 4.19it/s] 83it [00:19, 4.20it/s] 84it [00:19, 4.29it/s] 85it [00:20, 4.22it/s] 86it [00:20, 4.04it/s] 87it [00:20, 4.04it/s] 88it [00:20, 4.08it/s] 89it [00:21, 4.12it/s] 90it [00:21, 4.10it/s] 91it [00:21, 4.11it/s] 92it [00:21, 4.15it/s] 93it [00:22, 4.23it/s] 94it [00:22, 4.18it/s] 95it [00:22, 4.25it/s] 96it [00:22, 4.34it/s] 97it [00:23, 4.32it/s] 98it [00:23, 4.40it/s] 99it [00:23, 4.34it/s] 100it [00:23, 4.43it/s]2025-05-25 22:59:03,034 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 5110.2051 | mean log_px -0.0323 | KL -3168.64 + 101it [00:23, 4.37it/s] 102it [00:24, 4.33it/s] 103it [00:24, 4.36it/s] 104it [00:24, 4.33it/s] 105it [00:24, 4.39it/s] 106it [00:25, 4.16it/s] 107it [00:25, 4.29it/s] 108it [00:25, 4.41it/s] 109it [00:25, 4.50it/s] 110it [00:25, 4.51it/s] 111it [00:26, 4.42it/s] 112it [00:26, 4.37it/s] 113it [00:26, 4.25it/s] 114it [00:26, 4.25it/s] 115it [00:27, 4.37it/s] 116it [00:27, 4.46it/s] 117it [00:27, 4.54it/s] 118it [00:27, 4.40it/s] 119it [00:28, 4.25it/s] 120it [00:28, 4.23it/s] 121it [00:28, 4.25it/s] 122it [00:28, 4.27it/s] 123it [00:28, 4.31it/s] 124it [00:29, 4.34it/s] 125it [00:29, 4.44it/s] 126it [00:29, 4.38it/s] 127it [00:29, 4.48it/s] 128it [00:30, 4.39it/s] 129it [00:30, 4.42it/s] 130it [00:30, 4.46it/s] 131it [00:30, 4.53it/s] 132it [00:30, 4.48it/s] 133it [00:31, 4.38it/s] 134it [00:31, 4.37it/s] 135it [00:31, 4.45it/s] 136it [00:31, 4.51it/s] 137it [00:32, 4.43it/s] 138it [00:32, 4.52it/s] 139it [00:32, 4.56it/s] 140it [00:32, 4.37it/s] 141it [00:33, 4.27it/s] 142it [00:33, 4.37it/s] 143it [00:33, 4.44it/s] 144it [00:33, 4.38it/s] 145it [00:33, 4.47it/s] 146it [00:34, 4.44it/s] 147it [00:34, 4.53it/s] 148it [00:34, 4.29it/s] 149it [00:34, 4.35it/s] 150it [00:35, 4.34it/s]2025-05-25 22:59:14,437 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 3932.0217 | mean log_px -0.0119 | KL -3150.20 + 151it [00:35, 4.35it/s] 152it [00:35, 4.42it/s] 153it [00:35, 4.24it/s] 154it [00:36, 4.27it/s] 155it [00:36, 4.29it/s] 156it [00:36, 4.30it/s] 157it [00:36, 4.32it/s] 158it [00:36, 4.29it/s] 159it [00:37, 4.13it/s] 160it [00:37, 4.18it/s] 161it [00:37, 4.23it/s] 162it [00:37, 4.26it/s] 163it [00:38, 4.27it/s] 164it [00:38, 4.29it/s] 165it [00:38, 4.31it/s] 166it [00:38, 4.21it/s] 167it [00:39, 4.24it/s] 168it [00:39, 4.23it/s] 169it [00:39, 4.28it/s] 170it [00:39, 4.29it/s] 171it [00:40, 4.29it/s] 172it [00:40, 4.40it/s] 173it [00:40, 4.42it/s] 174it [00:40, 4.33it/s] 175it [00:40, 4.30it/s] 176it [00:41, 4.15it/s] 177it [00:41, 4.20it/s] 178it [00:41, 4.34it/s] 179it [00:41, 4.45it/s] 180it [00:42, 4.51it/s] 181it [00:42, 4.56it/s] 182it [00:42, 4.42it/s] 183it [00:42, 4.53it/s] 184it [00:42, 4.58it/s] 185it [00:43, 4.45it/s] 186it [00:43, 4.38it/s] 187it [00:43, 4.47it/s] 188it [00:43, 4.38it/s] 189it [00:44, 4.44it/s] 190it [00:44, 4.39it/s] 191it [00:44, 4.40it/s] 192it [00:44, 4.33it/s] 193it [00:45, 4.34it/s] 194it [00:45, 4.13it/s] 195it [00:45, 4.19it/s] 196it [00:45, 4.33it/s] 196it [00:45, 4.28it/s] +2025-05-25 22:59:24,975 - INFO - Epoch: 5, Objective: tensor([4262.7358], device='cuda:0', grad_fn=), Loss: 0.01855652406811714, KL/n: 64.05235290527344 + 0it [00:00, ?it/s]2025-05-25 22:59:25,384 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 4869.3335 | mean log_px -0.0318 | KL -3135.65 + 1it [00:00, 2.99it/s] 2it [00:00, 3.75it/s] 3it [00:00, 4.10it/s] 4it [00:01, 4.13it/s] 5it [00:01, 4.34it/s] 6it [00:01, 4.44it/s] 7it [00:01, 4.54it/s] 8it [00:01, 4.59it/s] 9it [00:02, 4.63it/s] 10it [00:02, 4.66it/s] 11it [00:02, 4.68it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.51it/s] 15it [00:03, 4.59it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.66it/s] 18it [00:04, 4.68it/s] 19it [00:04, 4.70it/s] 20it [00:04, 4.70it/s] 21it [00:04, 4.72it/s] 22it [00:04, 4.72it/s] 23it [00:05, 4.72it/s] 24it [00:05, 4.56it/s] 25it [00:05, 4.63it/s] 26it [00:05, 3.72it/s] 27it [00:06, 3.97it/s] 28it [00:06, 4.17it/s] 29it [00:06, 4.33it/s] 30it [00:06, 4.44it/s] 31it [00:06, 4.52it/s] 32it [00:07, 4.42it/s] 33it [00:07, 4.53it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.49it/s] 36it [00:08, 4.57it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.67it/s] 40it [00:08, 4.68it/s] 41it [00:09, 4.70it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.62it/s] 45it [00:09, 4.65it/s] 46it [00:10, 4.66it/s] 47it [00:10, 4.67it/s] 48it [00:10, 4.68it/s] 49it [00:10, 4.54it/s] 50it [00:11, 4.61it/s]2025-05-25 22:59:36,348 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 7057.3750 | mean log_px -0.0627 | KL -3113.32 + 51it [00:11, 4.64it/s] 52it [00:11, 4.65it/s] 53it [00:11, 4.69it/s] 54it [00:11, 4.56it/s] 55it [00:12, 4.63it/s] 56it [00:12, 4.65it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.68it/s] 59it [00:13, 4.71it/s] 60it [00:13, 4.54it/s] 61it [00:13, 4.61it/s] 62it [00:13, 4.65it/s] 63it [00:13, 4.67it/s] 64it [00:14, 4.68it/s] 65it [00:14, 4.71it/s] 66it [00:14, 4.71it/s] 67it [00:14, 4.72it/s] 68it [00:14, 4.72it/s] 69it [00:15, 4.73it/s] 70it [00:15, 4.72it/s] 71it [00:15, 4.73it/s] 72it [00:15, 4.73it/s] 73it [00:15, 4.69it/s] 74it [00:16, 4.70it/s] 75it [00:16, 4.52it/s] 76it [00:16, 4.32it/s] 77it [00:16, 4.32it/s] 78it [00:17, 4.41it/s] 79it [00:17, 4.46it/s] 80it [00:17, 4.56it/s] 81it [00:17, 4.47it/s] 82it [00:18, 4.52it/s] 83it [00:18, 4.59it/s] 84it [00:18, 4.43it/s] 85it [00:18, 4.44it/s] 86it [00:18, 4.37it/s] 87it [00:19, 4.32it/s] 88it [00:19, 4.40it/s] 89it [00:19, 4.45it/s] 90it [00:19, 4.53it/s] 91it [00:20, 4.59it/s] 92it [00:20, 4.42it/s] 93it [00:20, 4.43it/s] 94it [00:20, 4.26it/s] 95it [00:20, 4.42it/s] 96it [00:21, 4.36it/s] 97it [00:21, 4.44it/s] 98it [00:21, 4.47it/s] 99it [00:21, 4.54it/s] 100it [00:22, 4.42it/s]2025-05-25 22:59:47,357 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 6381.2471 | mean log_px -0.0664 | KL -3103.59 + 101it [00:22, 4.51it/s] 102it [00:22, 4.55it/s] 103it [00:22, 4.54it/s] 104it [00:22, 4.43it/s] 105it [00:23, 4.25it/s] 106it [00:23, 4.40it/s] 107it [00:23, 4.41it/s] 108it [00:23, 4.37it/s] 109it [00:24, 4.29it/s] 110it [00:24, 4.28it/s] 111it [00:24, 4.29it/s] 112it [00:24, 4.39it/s] 113it [00:25, 4.36it/s] 114it [00:25, 4.27it/s] 115it [00:25, 4.35it/s] 116it [00:25, 4.44it/s] 117it [00:25, 4.36it/s] 118it [00:26, 4.34it/s] 119it [00:26, 4.31it/s] 120it [00:26, 4.18it/s] 121it [00:26, 4.25it/s] 122it [00:27, 4.24it/s] 123it [00:27, 4.35it/s] 124it [00:27, 4.36it/s] 125it [00:27, 4.33it/s] 126it [00:28, 4.31it/s] 127it [00:28, 4.43it/s] 128it [00:28, 4.37it/s] 129it [00:28, 4.45it/s] 130it [00:28, 4.40it/s] 131it [00:29, 4.23it/s] 132it [00:29, 4.21it/s] 133it [00:29, 4.22it/s] 134it [00:29, 4.28it/s] 135it [00:30, 4.39it/s] 136it [00:30, 4.36it/s] 137it [00:30, 4.44it/s] 138it [00:30, 4.36it/s] 139it [00:31, 4.29it/s] 140it [00:31, 4.24it/s] 141it [00:31, 4.36it/s] 142it [00:31, 4.30it/s] 143it [00:32, 4.16it/s] 144it [00:32, 4.32it/s] 145it [00:32, 4.43it/s] 146it [00:32, 4.50it/s] 147it [00:32, 4.57it/s] 148it [00:33, 4.42it/s] 149it [00:33, 4.51it/s] 150it [00:33, 4.57it/s]2025-05-25 22:59:58,818 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 4548.9775 | mean log_px -0.0281 | KL -3080.35 + 151it [00:33, 4.60it/s] 152it [00:33, 4.64it/s] 153it [00:34, 4.67it/s] 154it [00:34, 4.68it/s] 155it [00:34, 4.53it/s] 156it [00:34, 4.60it/s] 157it [00:35, 4.64it/s] 158it [00:35, 4.66it/s] 159it [00:35, 4.68it/s] 160it [00:35, 4.68it/s] 161it [00:35, 4.67it/s] 162it [00:36, 4.69it/s] 163it [00:36, 4.65it/s] 164it [00:36, 4.46it/s] 165it [00:36, 4.52it/s] 166it [00:37, 4.55it/s] 167it [00:37, 4.54it/s] 168it [00:37, 4.37it/s] 169it [00:37, 4.47it/s] 170it [00:37, 4.36it/s] 171it [00:38, 4.43it/s] 172it [00:38, 4.51it/s] 173it [00:38, 4.55it/s] 174it [00:38, 4.60it/s] 175it [00:39, 4.30it/s] 176it [00:39, 4.38it/s] 177it [00:39, 4.37it/s] 178it [00:39, 4.48it/s] 179it [00:39, 4.53it/s] 180it [00:40, 4.57it/s] 181it [00:40, 4.59it/s] 182it [00:40, 4.53it/s] 183it [00:40, 4.53it/s] 184it [00:41, 4.59it/s] 185it [00:41, 4.46it/s] 186it [00:41, 4.50it/s] 187it [00:41, 4.44it/s] 188it [00:41, 4.49it/s] 189it [00:42, 4.41it/s] 190it [00:42, 4.39it/s] 191it [00:42, 4.46it/s] 192it [00:42, 4.54it/s] 193it [00:43, 4.60it/s] 194it [00:43, 4.63it/s] 195it [00:43, 4.57it/s] 196it [00:43, 4.62it/s] 196it [00:43, 4.48it/s] +2025-05-25 23:00:08,876 - INFO - Epoch: 6, Objective: tensor([7316.6924], device='cuda:0', grad_fn=), Loss: 0.06832034140825272, KL/n: 62.47688674926758 + 0it [00:00, ?it/s]2025-05-25 23:00:09,256 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 5764.2217 | mean log_px -0.0439 | KL -3059.68 + 1it [00:00, 3.02it/s] 2it [00:00, 3.75it/s] 3it [00:00, 4.15it/s] 4it [00:00, 4.29it/s] 5it [00:01, 4.43it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.58it/s] 8it [00:01, 4.63it/s] 9it [00:02, 4.67it/s] 10it [00:02, 4.67it/s] 11it [00:02, 4.69it/s] 12it [00:02, 4.70it/s] 13it [00:02, 4.70it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.61it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.65it/s] 18it [00:03, 4.66it/s] 19it [00:04, 4.68it/s] 20it [00:04, 4.69it/s] 21it [00:04, 4.71it/s] 22it [00:04, 4.71it/s] 23it [00:05, 4.72it/s] 24it [00:05, 4.55it/s] 25it [00:05, 4.60it/s] 26it [00:05, 4.63it/s] 27it [00:05, 4.66it/s] 28it [00:06, 4.67it/s] 29it [00:06, 4.69it/s] 30it [00:06, 4.69it/s] 31it [00:06, 4.54it/s] 32it [00:06, 4.60it/s] 33it [00:07, 4.64it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.68it/s] 36it [00:07, 4.68it/s] 37it [00:08, 4.69it/s] 38it [00:08, 4.70it/s] 39it [00:08, 4.70it/s] 40it [00:08, 4.70it/s] 41it [00:08, 4.71it/s] 42it [00:09, 4.71it/s] 43it [00:09, 4.72it/s] 44it [00:09, 4.52it/s] 45it [00:09, 4.60it/s] 46it [00:09, 4.63it/s] 47it [00:10, 4.66it/s] 48it [00:10, 4.67it/s] 49it [00:10, 4.53it/s] 50it [00:10, 4.60it/s]2025-05-25 23:00:20,030 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 4438.1538 | mean log_px -0.0305 | KL -3042.06 + 51it [00:11, 4.60it/s] 52it [00:11, 4.61it/s] 53it [00:11, 4.66it/s] 54it [00:11, 4.67it/s] 55it [00:11, 4.66it/s] 56it [00:12, 4.67it/s] 57it [00:12, 4.69it/s] 58it [00:12, 4.69it/s] 59it [00:12, 4.70it/s] 60it [00:12, 4.71it/s] 61it [00:13, 4.71it/s] 62it [00:13, 4.71it/s] 63it [00:13, 4.72it/s] 64it [00:13, 4.72it/s] 65it [00:14, 4.55it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.64it/s] 68it [00:14, 4.65it/s] 69it [00:14, 4.67it/s] 70it [00:15, 4.66it/s] 71it [00:15, 4.52it/s] 72it [00:15, 4.59it/s] 73it [00:15, 4.62it/s] 74it [00:16, 4.64it/s] 75it [00:16, 4.50it/s] 76it [00:16, 4.57it/s] 77it [00:16, 4.61it/s] 78it [00:16, 4.64it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.51it/s] 81it [00:17, 4.58it/s] 82it [00:17, 4.61it/s] 83it [00:17, 4.64it/s] 84it [00:18, 4.65it/s] 85it [00:18, 4.50it/s] 86it [00:18, 4.56it/s] 87it [00:18, 4.61it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.49it/s] 90it [00:19, 4.56it/s] 91it [00:19, 4.61it/s] 92it [00:19, 4.64it/s] 93it [00:20, 4.66it/s] 94it [00:20, 4.67it/s] 95it [00:20, 4.52it/s] 96it [00:20, 4.59it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.66it/s] 100it [00:21, 4.67it/s]2025-05-25 23:00:30,834 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 3706.3210 | mean log_px -0.0132 | KL -3016.29 + 101it [00:21, 4.68it/s] 102it [00:22, 4.52it/s] 103it [00:22, 4.59it/s] 104it [00:22, 4.62it/s] 105it [00:22, 4.65it/s] 106it [00:22, 4.64it/s] 107it [00:23, 4.65it/s] 108it [00:23, 4.62it/s] 109it [00:23, 4.66it/s] 110it [00:23, 4.68it/s] 111it [00:24, 4.69it/s] 112it [00:24, 4.69it/s] 113it [00:24, 4.70it/s] 114it [00:24, 4.70it/s] 115it [00:24, 4.71it/s] 116it [00:25, 4.71it/s] 117it [00:25, 4.71it/s] 118it [00:25, 4.69it/s] 119it [00:25, 4.53it/s] 120it [00:25, 4.59it/s] 121it [00:26, 4.62it/s] 122it [00:26, 4.64it/s] 123it [00:26, 4.57it/s] 124it [00:26, 4.59it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.46it/s] 128it [00:27, 4.47it/s] 129it [00:27, 4.51it/s] 130it [00:28, 4.55it/s] 131it [00:28, 4.58it/s] 132it [00:28, 4.60it/s] 133it [00:28, 4.48it/s] 134it [00:29, 4.54it/s] 135it [00:29, 4.58it/s] 136it [00:29, 4.60it/s] 137it [00:29, 4.61it/s] 138it [00:29, 4.62it/s] 139it [00:30, 4.63it/s] 140it [00:30, 4.49it/s] 141it [00:30, 4.55it/s] 142it [00:30, 4.58it/s] 143it [00:31, 4.59it/s] 144it [00:31, 4.60it/s] 145it [00:31, 4.61it/s] 146it [00:31, 4.62it/s] 147it [00:31, 4.64it/s] 148it [00:32, 4.63it/s] 149it [00:32, 4.63it/s] 150it [00:32, 4.63it/s]2025-05-25 23:00:41,685 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 6590.7559 | mean log_px -0.0561 | KL -2995.29 + 151it [00:32, 4.65it/s] 152it [00:32, 4.62it/s] 153it [00:33, 4.48it/s] 154it [00:33, 4.54it/s] 155it [00:33, 4.57it/s] 156it [00:33, 4.59it/s] 157it [00:34, 4.61it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.62it/s] 160it [00:34, 4.61it/s] 161it [00:34, 4.62it/s] 162it [00:35, 4.64it/s] 163it [00:35, 4.65it/s] 164it [00:35, 4.62it/s] 165it [00:35, 4.49it/s] 166it [00:36, 4.55it/s] 167it [00:36, 4.59it/s] 168it [00:36, 4.60it/s] 169it [00:36, 4.61it/s] 170it [00:36, 4.61it/s] 171it [00:37, 4.63it/s] 172it [00:37, 4.61it/s] 173it [00:37, 4.63it/s] 174it [00:37, 4.64it/s] 175it [00:37, 4.64it/s] 176it [00:38, 4.64it/s] 177it [00:38, 4.65it/s] 178it [00:38, 4.65it/s] 179it [00:38, 4.61it/s] 180it [00:39, 4.60it/s] 181it [00:39, 4.62it/s] 182it [00:39, 4.62it/s] 183it [00:39, 4.64it/s] 184it [00:39, 4.64it/s] 185it [00:40, 4.63it/s] 186it [00:40, 4.62it/s] 187it [00:40, 4.63it/s] 188it [00:40, 4.64it/s] 189it [00:40, 4.65it/s] 190it [00:41, 4.65it/s] 191it [00:41, 4.50it/s] 192it [00:41, 4.55it/s] 193it [00:41, 4.58it/s] 194it [00:42, 4.60it/s] 195it [00:42, 4.32it/s] 196it [00:42, 4.42it/s] 196it [00:42, 4.60it/s] +2025-05-25 23:00:51,625 - INFO - Epoch: 7, Objective: tensor([5831.9897], device='cuda:0', grad_fn=), Loss: 0.03322037681937218, KL/n: 60.5771369934082 + 0it [00:00, ?it/s]2025-05-25 23:00:52,206 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 3881.9414 | mean log_px -0.0130 | KL -2970.20 + 1it [00:00, 3.01it/s] 2it [00:00, 3.76it/s] 3it [00:00, 4.10it/s] 4it [00:00, 4.29it/s] 5it [00:01, 4.26it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.57it/s] 10it [00:02, 4.58it/s] 11it [00:02, 4.60it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.64it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.61it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.62it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.62it/s] 23it [00:05, 4.37it/s] 24it [00:05, 4.39it/s] 25it [00:05, 4.45it/s] 26it [00:05, 4.50it/s] 27it [00:06, 4.55it/s] 28it [00:06, 4.57it/s] 29it [00:06, 4.45it/s] 30it [00:06, 4.51it/s] 31it [00:06, 4.54it/s] 32it [00:07, 4.57it/s] 33it [00:07, 4.58it/s] 34it [00:07, 4.60it/s] 35it [00:07, 4.58it/s] 36it [00:08, 4.61it/s] 37it [00:08, 4.47it/s] 38it [00:08, 4.53it/s] 39it [00:08, 4.50it/s] 40it [00:08, 4.54it/s] 41it [00:09, 4.58it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.61it/s] 44it [00:09, 4.47it/s] 45it [00:09, 4.52it/s] 46it [00:10, 4.50it/s] 47it [00:10, 4.51it/s] 48it [00:10, 4.55it/s] 49it [00:10, 4.58it/s] 50it [00:11, 4.59it/s]2025-05-25 23:01:03,181 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 4140.3315 | mean log_px -0.0194 | KL -2946.16 + 51it [00:11, 4.47it/s] 52it [00:11, 4.53it/s] 53it [00:11, 4.56it/s] 54it [00:11, 4.59it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.61it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.47it/s] 59it [00:13, 4.53it/s] 60it [00:13, 4.56it/s] 61it [00:13, 4.59it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.61it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.47it/s] 66it [00:14, 4.49it/s] 67it [00:14, 4.49it/s] 68it [00:15, 4.47it/s] 69it [00:15, 4.45it/s] 70it [00:15, 4.51it/s] 71it [00:15, 4.41it/s] 72it [00:15, 4.49it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.61it/s] 77it [00:17, 4.47it/s] 78it [00:17, 4.53it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.58it/s] 81it [00:17, 4.61it/s] 82it [00:18, 4.63it/s] 83it [00:18, 4.62it/s] 84it [00:18, 4.48it/s] 85it [00:18, 4.52it/s] 86it [00:19, 4.56it/s] 87it [00:19, 4.58it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.61it/s] 90it [00:19, 4.61it/s] 91it [00:20, 4.48it/s] 92it [00:20, 4.53it/s] 93it [00:20, 4.57it/s] 94it [00:20, 4.59it/s] 95it [00:20, 4.60it/s] 96it [00:21, 4.47it/s] 97it [00:21, 4.54it/s] 98it [00:21, 4.56it/s] 99it [00:21, 4.59it/s] 100it [00:22, 4.61it/s]2025-05-25 23:01:14,168 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 3203.0884 | mean log_px -0.0045 | KL -2923.38 + 101it [00:22, 4.61it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.65it/s] 104it [00:22, 4.43it/s] 105it [00:23, 4.50it/s] 106it [00:23, 4.54it/s] 107it [00:23, 4.58it/s] 108it [00:23, 4.60it/s] 109it [00:24, 4.61it/s] 110it [00:24, 4.62it/s] 111it [00:24, 4.63it/s] 112it [00:24, 4.63it/s] 113it [00:24, 4.63it/s] 114it [00:25, 4.63it/s] 115it [00:25, 4.50it/s] 116it [00:25, 4.55it/s] 117it [00:25, 4.55it/s] 118it [00:26, 4.58it/s] 119it [00:26, 4.60it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.48it/s] 122it [00:26, 4.53it/s] 123it [00:27, 4.55it/s] 124it [00:27, 4.56it/s] 125it [00:27, 4.58it/s] 126it [00:27, 4.58it/s] 127it [00:27, 4.59it/s] 128it [00:28, 4.59it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.60it/s] 131it [00:28, 4.60it/s] 132it [00:29, 4.61it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.47it/s] 137it [00:30, 4.54it/s] 138it [00:30, 4.53it/s] 139it [00:30, 4.55it/s] 140it [00:30, 4.56it/s] 141it [00:31, 4.58it/s] 142it [00:31, 4.54it/s] 143it [00:31, 4.43it/s] 144it [00:31, 4.50it/s] 145it [00:31, 4.53it/s] 146it [00:32, 4.54it/s] 147it [00:32, 4.57it/s] 148it [00:32, 4.57it/s] 149it [00:32, 4.56it/s] 150it [00:33, 4.59it/s]2025-05-25 23:01:25,120 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 3672.0759 | mean log_px -0.0163 | KL -2904.56 + 151it [00:33, 4.58it/s] 152it [00:33, 4.58it/s] 153it [00:33, 4.58it/s] 154it [00:33, 4.59it/s] 155it [00:34, 4.55it/s] 156it [00:34, 4.57it/s] 157it [00:34, 4.56it/s] 158it [00:34, 4.57it/s] 159it [00:34, 4.56it/s] 160it [00:35, 4.58it/s] 161it [00:35, 4.59it/s] 162it [00:35, 4.51it/s] 163it [00:35, 4.55it/s] 164it [00:36, 4.57it/s] 165it [00:36, 4.58it/s] 166it [00:36, 4.60it/s] 167it [00:36, 4.59it/s] 168it [00:36, 4.60it/s] 169it [00:37, 4.61it/s] 170it [00:37, 4.57it/s] 171it [00:37, 4.56it/s] 172it [00:37, 4.56it/s] 173it [00:38, 4.45it/s] 174it [00:38, 4.50it/s] 175it [00:38, 4.54it/s] 176it [00:38, 4.57it/s] 177it [00:38, 4.57it/s] 178it [00:39, 4.58it/s] 179it [00:39, 4.60it/s] 180it [00:39, 4.60it/s] 181it [00:39, 4.62it/s] 182it [00:40, 4.61it/s] 183it [00:40, 4.55it/s] 184it [00:40, 4.56it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.59it/s] 187it [00:41, 4.61it/s] 188it [00:41, 4.59it/s] 189it [00:41, 4.60it/s] 190it [00:41, 4.60it/s] 191it [00:41, 4.61it/s] 192it [00:42, 4.61it/s] 193it [00:42, 4.60it/s] 194it [00:42, 4.59it/s] 195it [00:42, 4.20it/s] 196it [00:43, 4.24it/s] 196it [00:43, 4.53it/s] +2025-05-25 23:01:35,169 - INFO - Epoch: 8, Objective: tensor([4215.5410], device='cuda:0', grad_fn=), Loss: 0.014363881200551987, KL/n: 58.71515655517578 + 0it [00:00, ?it/s]2025-05-25 23:01:35,548 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 3831.5950 | mean log_px -0.0261 | KL -2873.97 + 1it [00:00, 3.26it/s] 2it [00:00, 3.94it/s] 3it [00:00, 4.23it/s] 4it [00:00, 4.37it/s] 5it [00:01, 4.47it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.59it/s] 8it [00:01, 4.59it/s] 9it [00:02, 4.60it/s] 10it [00:02, 4.60it/s] 11it [00:02, 4.63it/s] 12it [00:02, 3.67it/s] 13it [00:03, 3.80it/s] 14it [00:03, 3.96it/s] 15it [00:03, 4.15it/s] 16it [00:03, 4.29it/s] 17it [00:03, 4.39it/s] 18it [00:04, 4.44it/s] 19it [00:04, 4.49it/s] 20it [00:04, 4.45it/s] 21it [00:04, 4.51it/s] 22it [00:05, 4.55it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.55it/s] 26it [00:05, 4.42it/s] 27it [00:06, 4.47it/s] 28it [00:06, 4.51it/s] 29it [00:06, 4.55it/s] 30it [00:06, 4.55it/s] 31it [00:07, 4.54it/s] 32it [00:07, 4.56it/s] 33it [00:07, 4.58it/s] 34it [00:07, 4.58it/s] 35it [00:07, 4.59it/s] 36it [00:08, 4.60it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.63it/s] 40it [00:09, 4.62it/s] 41it [00:09, 4.64it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.63it/s] 44it [00:09, 4.63it/s] 45it [00:10, 4.64it/s] 46it [00:10, 4.62it/s] 47it [00:10, 4.63it/s] 48it [00:10, 4.45it/s] 49it [00:10, 4.52it/s] 50it [00:11, 4.53it/s]2025-05-25 23:01:46,660 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 3554.7034 | mean log_px -0.0139 | KL -2847.36 + 51it [00:11, 4.55it/s] 52it [00:11, 4.56it/s] 53it [00:11, 4.58it/s] 54it [00:12, 4.60it/s] 55it [00:12, 4.47it/s] 56it [00:12, 4.54it/s] 57it [00:12, 4.56it/s] 58it [00:12, 4.58it/s] 59it [00:13, 4.61it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.62it/s] 62it [00:13, 4.63it/s] 63it [00:14, 4.64it/s] 64it [00:14, 4.63it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.48it/s] 67it [00:14, 4.53it/s] 68it [00:15, 4.56it/s] 69it [00:15, 4.59it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.61it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.48it/s] 76it [00:16, 4.50it/s] 77it [00:17, 4.54it/s] 78it [00:17, 4.57it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.59it/s] 81it [00:17, 4.62it/s] 82it [00:18, 4.60it/s] 83it [00:18, 4.64it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.63it/s] 86it [00:19, 4.63it/s] 87it [00:19, 4.65it/s] 88it [00:19, 4.49it/s] 89it [00:19, 4.55it/s] 90it [00:19, 4.57it/s] 91it [00:20, 4.60it/s] 92it [00:20, 4.61it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.63it/s] 95it [00:21, 4.65it/s] 96it [00:21, 4.64it/s] 97it [00:21, 4.48it/s] 98it [00:21, 4.53it/s] 99it [00:21, 4.57it/s] 100it [00:22, 4.52it/s]2025-05-25 23:01:57,585 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 3406.7056 | mean log_px -0.0110 | KL -2821.77 + 101it [00:22, 4.48it/s] 102it [00:22, 4.50it/s] 103it [00:22, 4.54it/s] 104it [00:22, 4.56it/s] 105it [00:23, 4.59it/s] 106it [00:23, 4.60it/s] 107it [00:23, 4.61it/s] 108it [00:23, 4.62it/s] 109it [00:24, 4.62it/s] 110it [00:24, 4.62it/s] 111it [00:24, 4.63it/s] 112it [00:24, 4.63it/s] 113it [00:24, 4.64it/s] 114it [00:25, 4.63it/s] 115it [00:25, 4.63it/s] 116it [00:25, 4.63it/s] 117it [00:25, 4.64it/s] 118it [00:26, 4.63it/s] 119it [00:26, 4.64it/s] 120it [00:26, 4.63it/s] 121it [00:26, 4.62it/s] 122it [00:26, 4.46it/s] 123it [00:27, 4.53it/s] 124it [00:27, 4.54it/s] 125it [00:27, 4.57it/s] 126it [00:27, 4.58it/s] 127it [00:27, 4.59it/s] 128it [00:28, 4.44it/s] 129it [00:28, 4.35it/s] 130it [00:28, 4.41it/s] 131it [00:28, 4.49it/s] 132it [00:29, 4.52it/s] 133it [00:29, 4.56it/s] 134it [00:29, 4.57it/s] 135it [00:29, 4.59it/s] 136it [00:30, 4.44it/s] 137it [00:30, 4.51it/s] 138it [00:30, 4.53it/s] 139it [00:30, 4.56it/s] 140it [00:30, 4.56it/s] 141it [00:31, 4.59it/s] 142it [00:31, 4.59it/s] 143it [00:31, 4.60it/s] 144it [00:31, 4.49it/s] 145it [00:31, 4.50it/s] 146it [00:32, 4.53it/s] 147it [00:32, 4.57it/s] 148it [00:32, 4.57it/s] 149it [00:32, 4.51it/s] 150it [00:33, 4.54it/s]2025-05-25 23:02:08,537 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 5147.5215 | mean log_px -0.0361 | KL -2803.57 + 151it [00:33, 4.57it/s] 152it [00:33, 4.57it/s] 153it [00:33, 4.43it/s] 154it [00:33, 4.50it/s] 155it [00:34, 4.54it/s] 156it [00:34, 4.55it/s] 157it [00:34, 4.50it/s] 158it [00:34, 4.52it/s] 159it [00:35, 4.53it/s] 160it [00:35, 4.54it/s] 161it [00:35, 4.55it/s] 162it [00:35, 4.56it/s] 163it [00:35, 4.59it/s] 164it [00:36, 4.60it/s] 165it [00:36, 4.61it/s] 166it [00:36, 4.60it/s] 167it [00:36, 4.61it/s] 168it [00:37, 4.60it/s] 169it [00:37, 4.61it/s] 170it [00:37, 4.49it/s] 171it [00:37, 4.54it/s] 172it [00:37, 4.56it/s] 173it [00:38, 4.57it/s] 174it [00:38, 4.58it/s] 175it [00:38, 4.59it/s] 176it [00:38, 4.60it/s] 177it [00:38, 4.60it/s] 178it [00:39, 4.60it/s] 179it [00:39, 4.58it/s] 180it [00:39, 4.57it/s] 181it [00:39, 4.59it/s] 182it [00:40, 4.60it/s] 183it [00:40, 4.61it/s] 184it [00:40, 4.45it/s] 185it [00:40, 4.52it/s] 186it [00:40, 4.54it/s] 187it [00:41, 4.57it/s] 188it [00:41, 4.58it/s] 189it [00:41, 4.58it/s] 190it [00:41, 4.57it/s] 191it [00:42, 4.59it/s] 192it [00:42, 4.60it/s] 193it [00:42, 4.60it/s] 194it [00:42, 4.61it/s] 195it [00:42, 4.21it/s] 196it [00:43, 4.33it/s] 196it [00:43, 4.53it/s] +2025-05-25 23:02:18,584 - INFO - Epoch: 9, Objective: tensor([4143.1064], device='cuda:0', grad_fn=), Loss: 0.02341052144765854, KL/n: 56.89252471923828 + 0it [00:00, ?it/s]2025-05-25 23:02:18,989 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 3292.7747 | mean log_px -0.0090 | KL -2785.48 + 1it [00:00, 3.00it/s] 2it [00:00, 3.76it/s] 3it [00:00, 4.13it/s] 4it [00:00, 4.26it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.46it/s] 8it [00:01, 4.50it/s] 9it [00:02, 4.53it/s] 10it [00:02, 4.55it/s] 11it [00:02, 4.58it/s] 12it [00:02, 4.57it/s] 13it [00:02, 4.59it/s] 14it [00:03, 4.60it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.60it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.60it/s] 19it [00:04, 4.61it/s] 20it [00:04, 4.59it/s] 21it [00:04, 4.61it/s] 22it [00:04, 4.61it/s] 23it [00:05, 4.61it/s] 24it [00:05, 4.59it/s] 25it [00:05, 4.57it/s] 26it [00:05, 4.55it/s] 27it [00:06, 4.57it/s] 28it [00:06, 4.57it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.60it/s] 31it [00:06, 4.60it/s] 32it [00:07, 4.47it/s] 33it [00:07, 4.52it/s] 34it [00:07, 4.52it/s] 35it [00:07, 4.56it/s] 36it [00:07, 4.57it/s] 37it [00:08, 4.60it/s] 38it [00:08, 4.59it/s] 39it [00:08, 4.40it/s] 40it [00:08, 4.46it/s] 41it [00:09, 4.51it/s] 42it [00:09, 4.53it/s] 43it [00:09, 4.56it/s] 44it [00:09, 4.57it/s] 45it [00:09, 4.58it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.61it/s] 50it [00:11, 4.61it/s]2025-05-25 23:02:29,927 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 3255.0281 | mean log_px -0.0100 | KL -2764.80 + 51it [00:11, 4.59it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.60it/s] 54it [00:11, 4.59it/s] 55it [00:12, 4.60it/s] 56it [00:12, 4.51it/s] 57it [00:12, 4.54it/s] 58it [00:12, 4.56it/s] 59it [00:13, 4.58it/s] 60it [00:13, 4.60it/s] 61it [00:13, 4.60it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.61it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.59it/s] 67it [00:14, 4.60it/s] 68it [00:14, 4.61it/s] 69it [00:15, 4.61it/s] 70it [00:15, 4.56it/s] 71it [00:15, 4.58it/s] 72it [00:15, 4.58it/s] 73it [00:16, 4.45it/s] 74it [00:16, 4.50it/s] 75it [00:16, 4.55it/s] 76it [00:16, 4.55it/s] 77it [00:16, 4.57it/s] 78it [00:17, 4.58it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.60it/s] 81it [00:17, 4.59it/s] 82it [00:18, 4.62it/s] 83it [00:18, 4.65it/s] 84it [00:18, 4.65it/s] 85it [00:18, 4.67it/s] 86it [00:18, 4.51it/s] 87it [00:19, 4.57it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.67it/s] 92it [00:20, 4.68it/s] 93it [00:20, 4.69it/s] 94it [00:20, 4.70it/s] 95it [00:20, 4.66it/s] 96it [00:21, 4.68it/s] 97it [00:21, 4.70it/s] 98it [00:21, 4.69it/s] 99it [00:21, 4.66it/s] 100it [00:21, 4.50it/s]2025-05-25 23:02:40,797 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 3816.2234 | mean log_px -0.0176 | KL -2740.36 + 101it [00:22, 4.57it/s] 102it [00:22, 4.58it/s] 103it [00:22, 4.54it/s] 104it [00:22, 4.54it/s] 105it [00:23, 4.59it/s] 106it [00:23, 4.59it/s] 107it [00:23, 4.61it/s] 108it [00:23, 4.47it/s] 109it [00:23, 4.52it/s] 110it [00:24, 4.55it/s] 111it [00:24, 4.58it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.61it/s] 114it [00:24, 4.61it/s] 115it [00:25, 4.61it/s] 116it [00:25, 4.61it/s] 117it [00:25, 4.62it/s] 118it [00:25, 4.63it/s] 119it [00:26, 4.50it/s] 120it [00:26, 4.55it/s] 121it [00:26, 4.58it/s] 122it [00:26, 4.59it/s] 123it [00:26, 4.61it/s] 124it [00:27, 4.63it/s] 125it [00:27, 4.64it/s] 126it [00:27, 4.63it/s] 127it [00:27, 4.64it/s] 128it [00:28, 4.63it/s] 129it [00:28, 4.63it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.63it/s] 132it [00:28, 4.63it/s] 133it [00:29, 4.50it/s] 134it [00:29, 4.54it/s] 135it [00:29, 4.56it/s] 136it [00:29, 4.58it/s] 137it [00:29, 4.59it/s] 138it [00:30, 4.59it/s] 139it [00:30, 4.59it/s] 140it [00:30, 4.59it/s] 141it [00:30, 4.60it/s] 142it [00:31, 4.61it/s] 143it [00:31, 4.62it/s] 144it [00:31, 4.49it/s] 145it [00:31, 4.55it/s] 146it [00:31, 4.58it/s] 147it [00:32, 4.60it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.61it/s] 150it [00:32, 4.62it/s]2025-05-25 23:02:51,687 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 4118.2427 | mean log_px -0.0299 | KL -2717.40 + 151it [00:33, 4.62it/s] 152it [00:33, 4.63it/s] 153it [00:33, 4.63it/s] 154it [00:33, 4.62it/s] 155it [00:33, 4.63it/s] 156it [00:34, 4.62it/s] 157it [00:34, 4.63it/s] 158it [00:34, 4.63it/s] 159it [00:34, 4.64it/s] 160it [00:34, 4.63it/s] 161it [00:35, 4.64it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.65it/s] 164it [00:35, 4.64it/s] 165it [00:36, 4.50it/s] 166it [00:36, 4.55it/s] 167it [00:36, 4.58it/s] 168it [00:36, 4.58it/s] 169it [00:36, 4.60it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.61it/s] 172it [00:37, 4.62it/s] 173it [00:37, 4.62it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.64it/s] 176it [00:38, 4.62it/s] 177it [00:38, 4.62it/s] 178it [00:38, 4.61it/s] 179it [00:39, 4.62it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.63it/s] 182it [00:39, 4.63it/s] 183it [00:39, 4.64it/s] 184it [00:40, 4.64it/s] 185it [00:40, 4.65it/s] 186it [00:40, 4.64it/s] 187it [00:40, 4.64it/s] 188it [00:41, 4.64it/s] 189it [00:41, 4.64it/s] 190it [00:41, 4.65it/s] 191it [00:41, 4.63it/s] 192it [00:41, 4.61it/s] 193it [00:42, 4.62it/s] 194it [00:42, 4.61it/s] 195it [00:42, 4.28it/s] 196it [00:42, 4.39it/s] 196it [00:42, 4.57it/s] +2025-05-25 23:03:01,608 - INFO - Epoch: 10, Objective: tensor([2976.3257], device='cuda:0', grad_fn=), Loss: 0.00489531084895134, KL/n: 55.191680908203125 + 0it [00:00, ?it/s]2025-05-25 23:03:02,196 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 3065.4336 | mean log_px -0.0064 | KL -2701.94 + 1it [00:00, 2.77it/s] 2it [00:00, 3.65it/s] 3it [00:00, 3.86it/s] 4it [00:01, 4.15it/s] 5it [00:01, 4.33it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.22it/s] 8it [00:01, 4.24it/s] 9it [00:02, 4.37it/s] 10it [00:02, 4.45it/s] 11it [00:02, 4.43it/s] 12it [00:02, 4.46it/s] 13it [00:03, 4.53it/s] 14it [00:03, 4.44it/s] 15it [00:03, 4.33it/s] 16it [00:03, 4.44it/s] 17it [00:03, 4.44it/s] 18it [00:04, 4.51it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.54it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.46it/s] 24it [00:05, 4.52it/s] 25it [00:05, 4.52it/s] 26it [00:05, 4.51it/s] 27it [00:06, 4.54it/s] 28it [00:06, 4.36it/s] 29it [00:06, 4.46it/s] 30it [00:06, 4.49it/s] 31it [00:07, 4.53it/s] 32it [00:07, 4.49it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.52it/s] 35it [00:07, 4.55it/s] 36it [00:08, 4.53it/s] 37it [00:08, 4.52it/s] 38it [00:08, 4.59it/s] 39it [00:08, 4.60it/s] 40it [00:09, 4.57it/s] 41it [00:09, 4.63it/s] 42it [00:09, 4.64it/s] 43it [00:09, 4.65it/s] 44it [00:09, 4.63it/s] 45it [00:10, 4.54it/s] 46it [00:10, 4.56it/s] 47it [00:10, 4.54it/s] 48it [00:10, 4.45it/s] 49it [00:11, 4.30it/s] 50it [00:11, 4.41it/s]2025-05-25 23:03:13,350 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 3133.4580 | mean log_px -0.0073 | KL -2682.37 + 51it [00:11, 4.47it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.49it/s] 54it [00:12, 4.47it/s] 55it [00:12, 4.52it/s] 56it [00:12, 4.58it/s] 57it [00:12, 4.55it/s] 58it [00:13, 4.59it/s] 59it [00:13, 4.50it/s] 60it [00:13, 4.56it/s] 61it [00:13, 4.57it/s] 62it [00:13, 4.57it/s] 63it [00:14, 4.57it/s] 64it [00:14, 4.55it/s] 65it [00:14, 4.54it/s] 66it [00:14, 4.56it/s] 67it [00:14, 4.59it/s] 68it [00:15, 4.57it/s] 69it [00:15, 4.53it/s] 70it [00:15, 4.55it/s] 71it [00:15, 4.57it/s] 72it [00:16, 4.60it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.46it/s] 76it [00:16, 4.54it/s] 77it [00:17, 4.58it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.62it/s] 80it [00:17, 4.62it/s] 81it [00:18, 4.60it/s] 82it [00:18, 4.45it/s] 83it [00:18, 4.50it/s] 84it [00:18, 4.52it/s] 85it [00:18, 4.52it/s] 86it [00:19, 4.52it/s] 87it [00:19, 4.53it/s] 88it [00:19, 4.41it/s] 89it [00:19, 4.44it/s] 90it [00:20, 4.47it/s] 91it [00:20, 4.48it/s] 92it [00:20, 4.52it/s] 93it [00:20, 4.54it/s] 94it [00:20, 4.55it/s] 95it [00:21, 4.37it/s] 96it [00:21, 4.42it/s] 97it [00:21, 4.42it/s] 98it [00:21, 4.50it/s] 99it [00:22, 4.53it/s] 100it [00:22, 4.53it/s]2025-05-25 23:03:24,376 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 4312.6279 | mean log_px -0.0334 | KL -2658.71 + 101it [00:22, 4.58it/s] 102it [00:22, 4.57it/s] 103it [00:22, 4.58it/s] 104it [00:23, 4.60it/s] 105it [00:23, 4.63it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.67it/s] 108it [00:24, 4.62it/s] 109it [00:24, 4.42it/s] 110it [00:24, 4.49it/s] 111it [00:24, 4.56it/s] 112it [00:24, 4.52it/s] 113it [00:25, 4.51it/s] 114it [00:25, 4.42it/s] 115it [00:25, 4.44it/s] 116it [00:25, 4.49it/s] 117it [00:26, 4.56it/s] 118it [00:26, 4.44it/s] 119it [00:26, 4.39it/s] 120it [00:26, 4.44it/s] 121it [00:26, 4.52it/s] 122it [00:27, 4.53it/s] 123it [00:27, 4.48it/s] 124it [00:27, 4.51it/s] 125it [00:27, 4.30it/s] 126it [00:28, 4.38it/s] 127it [00:28, 4.46it/s] 128it [00:28, 4.54it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.62it/s] 131it [00:29, 4.63it/s] 132it [00:29, 4.62it/s] 133it [00:29, 4.50it/s] 134it [00:29, 4.49it/s] 135it [00:30, 4.48it/s] 136it [00:30, 4.46it/s] 137it [00:30, 4.49it/s] 138it [00:30, 4.55it/s] 139it [00:30, 4.60it/s] 140it [00:31, 4.61it/s] 141it [00:31, 4.61it/s] 142it [00:31, 4.59it/s] 143it [00:31, 4.59it/s] 144it [00:32, 4.61it/s] 145it [00:32, 4.64it/s] 146it [00:32, 4.65it/s] 147it [00:32, 4.45it/s] 148it [00:32, 4.54it/s] 149it [00:33, 4.56it/s] 150it [00:33, 4.58it/s]2025-05-25 23:03:35,402 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 3104.3960 | mean log_px -0.0096 | KL -2631.08 + 151it [00:33, 4.58it/s] 152it [00:33, 4.56it/s] 153it [00:33, 4.46it/s] 154it [00:34, 4.54it/s] 155it [00:34, 4.55it/s] 156it [00:34, 4.56it/s] 157it [00:34, 4.57it/s] 158it [00:35, 4.58it/s] 159it [00:35, 4.44it/s] 160it [00:35, 4.51it/s] 161it [00:35, 4.54it/s] 162it [00:35, 4.54it/s] 163it [00:36, 4.51it/s] 164it [00:36, 4.42it/s] 165it [00:36, 4.46it/s] 166it [00:36, 4.50it/s] 167it [00:37, 4.50it/s] 168it [00:37, 4.40it/s] 169it [00:37, 4.45it/s] 170it [00:37, 4.53it/s] 171it [00:37, 4.54it/s] 172it [00:38, 4.55it/s] 173it [00:38, 4.58it/s] 174it [00:38, 4.62it/s] 175it [00:38, 4.63it/s] 176it [00:39, 4.62it/s] 177it [00:39, 4.62it/s] 178it [00:39, 4.42it/s] 179it [00:39, 4.44it/s] 180it [00:39, 4.46it/s] 181it [00:40, 4.51it/s] 182it [00:40, 4.44it/s] 183it [00:40, 4.50it/s] 184it [00:40, 4.29it/s] 185it [00:41, 4.35it/s] 186it [00:41, 4.45it/s] 187it [00:41, 4.50it/s] 188it [00:41, 4.55it/s] 189it [00:41, 4.56it/s] 190it [00:42, 4.32it/s] 191it [00:42, 4.40it/s] 192it [00:42, 4.47it/s] 193it [00:42, 4.48it/s] 194it [00:43, 4.50it/s] 195it [00:43, 4.40it/s] 196it [00:43, 4.44it/s] 196it [00:43, 4.49it/s] +2025-05-25 23:03:45,570 - INFO - Epoch: 11, Objective: tensor([4247.3716], device='cuda:0', grad_fn=), Loss: 0.031174693256616592, KL/n: 53.34761047363281 + 0it [00:00, ?it/s]2025-05-25 23:03:45,982 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 3012.1206 | mean log_px -0.0057 | KL -2611.20 + 1it [00:00, 2.73it/s] 2it [00:00, 3.63it/s] 3it [00:00, 4.01it/s] 4it [00:01, 4.23it/s] 5it [00:01, 4.38it/s] 6it [00:01, 4.46it/s] 7it [00:01, 4.37it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.54it/s] 11it [00:02, 3.55it/s] 12it [00:02, 3.82it/s] 13it [00:03, 4.04it/s] 14it [00:03, 4.22it/s] 15it [00:03, 4.33it/s] 16it [00:03, 4.41it/s] 17it [00:04, 4.35it/s] 18it [00:04, 4.43it/s] 19it [00:04, 4.49it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.53it/s] 22it [00:05, 4.57it/s] 23it [00:05, 4.46it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.57it/s] 26it [00:06, 4.60it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.50it/s] 30it [00:06, 4.56it/s] 31it [00:07, 4.59it/s] 32it [00:07, 4.61it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.63it/s] 35it [00:07, 4.51it/s] 36it [00:08, 4.56it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.60it/s] 39it [00:08, 4.62it/s] 40it [00:09, 4.60it/s] 41it [00:09, 4.48it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.60it/s] 45it [00:10, 4.63it/s] 46it [00:10, 4.64it/s] 47it [00:10, 4.50it/s] 48it [00:10, 4.56it/s] 49it [00:11, 4.59it/s] 50it [00:11, 4.61it/s]2025-05-25 23:03:57,122 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 3992.2141 | mean log_px -0.0251 | KL -2592.65 + 51it [00:11, 4.62it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.46it/s] 54it [00:12, 4.53it/s] 55it [00:12, 4.54it/s] 56it [00:12, 4.55it/s] 57it [00:12, 4.59it/s] 58it [00:13, 4.62it/s] 59it [00:13, 4.64it/s] 60it [00:13, 4.50it/s] 61it [00:13, 4.57it/s] 62it [00:13, 4.59it/s] 63it [00:14, 4.58it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.64it/s] 67it [00:14, 4.65it/s] 68it [00:15, 4.66it/s] 69it [00:15, 4.52it/s] 70it [00:15, 4.57it/s] 71it [00:15, 4.60it/s] 72it [00:16, 4.62it/s] 73it [00:16, 4.64it/s] 74it [00:16, 4.64it/s] 75it [00:16, 4.55it/s] 76it [00:16, 4.60it/s] 77it [00:17, 4.63it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.51it/s] 80it [00:17, 4.57it/s] 81it [00:18, 4.60it/s] 82it [00:18, 4.62it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.49it/s] 85it [00:18, 4.56it/s] 86it [00:19, 4.59it/s] 87it [00:19, 4.62it/s] 88it [00:19, 4.62it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.64it/s] 91it [00:20, 4.66it/s] 92it [00:20, 4.51it/s] 93it [00:20, 4.57it/s] 94it [00:20, 4.60it/s] 95it [00:21, 4.62it/s] 96it [00:21, 4.64it/s] 97it [00:21, 4.65it/s] 98it [00:21, 4.65it/s] 99it [00:21, 4.66it/s] 100it [00:22, 4.66it/s]2025-05-25 23:04:07,990 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 7227.1890 | mean log_px -0.0753 | KL -2570.68 + 101it [00:22, 4.67it/s] 102it [00:22, 4.53it/s] 103it [00:22, 4.57it/s] 104it [00:23, 4.61it/s] 105it [00:23, 4.59it/s] 106it [00:23, 4.61it/s] 107it [00:23, 4.63it/s] 108it [00:23, 4.50it/s] 109it [00:24, 4.56it/s] 110it [00:24, 4.59it/s] 111it [00:24, 4.46it/s] 112it [00:24, 4.52it/s] 113it [00:24, 4.56it/s] 114it [00:25, 4.57it/s] 115it [00:25, 4.61it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.46it/s] 118it [00:26, 4.51it/s] 119it [00:26, 4.54it/s] 120it [00:26, 4.43it/s] 121it [00:26, 4.50it/s] 122it [00:26, 4.52it/s] 123it [00:27, 4.57it/s] 124it [00:27, 4.59it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.47it/s] 127it [00:28, 4.53it/s] 128it [00:28, 4.56it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.57it/s] 131it [00:28, 4.60it/s] 132it [00:29, 4.61it/s] 133it [00:29, 4.63it/s] 134it [00:29, 4.64it/s] 135it [00:29, 4.55it/s] 136it [00:30, 4.50it/s] 137it [00:30, 4.55it/s] 138it [00:30, 4.44it/s] 139it [00:30, 4.51it/s] 140it [00:30, 4.54it/s] 141it [00:31, 4.58it/s] 142it [00:31, 4.59it/s] 143it [00:31, 4.61it/s] 144it [00:31, 4.46it/s] 145it [00:32, 4.52it/s] 146it [00:32, 4.56it/s] 147it [00:32, 4.58it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.61it/s] 150it [00:33, 4.63it/s]2025-05-25 23:04:18,966 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 3201.9055 | mean log_px -0.0163 | KL -2551.84 + 151it [00:33, 4.64it/s] 152it [00:33, 4.64it/s] 153it [00:33, 4.66it/s] 154it [00:33, 4.46it/s] 155it [00:34, 4.53it/s] 156it [00:34, 4.56it/s] 157it [00:34, 4.56it/s] 158it [00:34, 4.58it/s] 159it [00:35, 4.61it/s] 160it [00:35, 4.62it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.64it/s] 163it [00:35, 4.55it/s] 164it [00:36, 4.60it/s] 165it [00:36, 4.61it/s] 166it [00:36, 4.62it/s] 167it [00:36, 4.63it/s] 168it [00:37, 4.64it/s] 169it [00:37, 4.64it/s] 170it [00:37, 4.64it/s] 171it [00:37, 4.64it/s] 172it [00:37, 4.50it/s] 173it [00:38, 4.55it/s] 174it [00:38, 4.57it/s] 175it [00:38, 4.60it/s] 176it [00:38, 4.61it/s] 177it [00:38, 4.63it/s] 178it [00:39, 4.62it/s] 179it [00:39, 4.63it/s] 180it [00:39, 4.64it/s] 181it [00:39, 4.63it/s] 182it [00:40, 4.50it/s] 183it [00:40, 4.55it/s] 184it [00:40, 4.57it/s] 185it [00:40, 4.61it/s] 186it [00:40, 4.62it/s] 187it [00:41, 4.63it/s] 188it [00:41, 4.49it/s] 189it [00:41, 4.54it/s] 190it [00:41, 4.56it/s] 191it [00:42, 4.55it/s] 192it [00:42, 4.58it/s] 193it [00:42, 4.61it/s] 194it [00:42, 4.62it/s] 195it [00:42, 4.51it/s] 196it [00:43, 4.55it/s] 196it [00:43, 4.54it/s] +2025-05-25 23:04:28,914 - INFO - Epoch: 12, Objective: tensor([2863.8979], device='cuda:0', grad_fn=), Loss: 0.006043643224984407, KL/n: 51.6978874206543 + 0it [00:00, ?it/s]2025-05-25 23:04:29,296 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 2755.2402 | mean log_px -0.0041 | KL -2532.30 + 1it [00:00, 2.97it/s] 2it [00:00, 3.78it/s] 3it [00:00, 4.15it/s] 4it [00:00, 4.33it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.55it/s] 8it [00:01, 4.58it/s] 9it [00:02, 4.61it/s] 10it [00:02, 4.60it/s] 11it [00:02, 4.48it/s] 12it [00:02, 4.45it/s] 13it [00:02, 4.51it/s] 14it [00:03, 4.57it/s] 15it [00:03, 4.59it/s] 16it [00:03, 4.61it/s] 17it [00:03, 4.63it/s] 18it [00:04, 4.65it/s] 19it [00:04, 4.51it/s] 20it [00:04, 4.56it/s] 21it [00:04, 4.60it/s] 22it [00:04, 4.62it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.40it/s] 25it [00:05, 4.49it/s] 26it [00:05, 4.54it/s] 27it [00:06, 4.43it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.54it/s] 30it [00:06, 4.59it/s] 31it [00:06, 4.62it/s] 32it [00:07, 4.64it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.67it/s] 36it [00:07, 4.62it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.43it/s] 40it [00:08, 4.50it/s] 41it [00:09, 4.55it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.63it/s] 44it [00:09, 4.65it/s] 45it [00:09, 4.67it/s] 46it [00:10, 4.52it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.65it/s] 50it [00:11, 4.66it/s]2025-05-25 23:04:40,215 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 2921.4778 | mean log_px -0.0094 | KL -2503.91 + 51it [00:11, 4.68it/s] 52it [00:11, 4.52it/s] 53it [00:11, 4.57it/s] 54it [00:11, 4.60it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.65it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.63it/s] 59it [00:12, 4.49it/s] 60it [00:13, 4.55it/s] 61it [00:13, 4.58it/s] 62it [00:13, 4.61it/s] 63it [00:13, 4.64it/s] 64it [00:14, 4.64it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.51it/s] 68it [00:14, 4.56it/s] 69it [00:15, 4.60it/s] 70it [00:15, 4.62it/s] 71it [00:15, 4.44it/s] 72it [00:15, 4.52it/s] 73it [00:16, 4.57it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.63it/s] 77it [00:16, 4.65it/s] 78it [00:17, 4.66it/s] 79it [00:17, 4.63it/s] 80it [00:17, 4.65it/s] 81it [00:17, 4.65it/s] 82it [00:17, 4.45it/s] 83it [00:18, 4.51it/s] 84it [00:18, 4.54it/s] 85it [00:18, 4.58it/s] 86it [00:18, 4.40it/s] 87it [00:19, 4.48it/s] 88it [00:19, 4.50it/s] 89it [00:19, 4.56it/s] 90it [00:19, 4.58it/s] 91it [00:19, 4.61it/s] 92it [00:20, 4.63it/s] 93it [00:20, 4.65it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.52it/s] 96it [00:21, 4.58it/s] 97it [00:21, 4.61it/s] 98it [00:21, 4.63it/s] 99it [00:21, 4.57it/s] 100it [00:21, 4.54it/s]2025-05-25 23:04:51,136 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 3051.0591 | mean log_px -0.0105 | KL -2480.72 + 101it [00:22, 4.58it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.45it/s] 104it [00:22, 4.50it/s] 105it [00:23, 4.54it/s] 106it [00:23, 4.57it/s] 107it [00:23, 4.60it/s] 108it [00:23, 4.61it/s] 109it [00:23, 4.49it/s] 110it [00:24, 4.54it/s] 111it [00:24, 4.58it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.61it/s] 114it [00:24, 4.62it/s] 115it [00:25, 4.63it/s] 116it [00:25, 4.64it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.64it/s] 119it [00:26, 4.49it/s] 120it [00:26, 4.55it/s] 121it [00:26, 4.58it/s] 122it [00:26, 4.60it/s] 123it [00:26, 4.62it/s] 124it [00:27, 4.64it/s] 125it [00:27, 4.65it/s] 126it [00:27, 4.65it/s] 127it [00:27, 4.51it/s] 128it [00:28, 4.55it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.59it/s] 131it [00:28, 4.61it/s] 132it [00:28, 4.61it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.53it/s] 135it [00:29, 4.58it/s] 136it [00:29, 4.59it/s] 137it [00:30, 4.58it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.64it/s] 142it [00:31, 4.64it/s] 143it [00:31, 4.50it/s] 144it [00:31, 4.54it/s] 145it [00:31, 4.59it/s] 146it [00:31, 4.60it/s] 147it [00:32, 4.63it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.58it/s] 150it [00:32, 4.59it/s]2025-05-25 23:05:02,033 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 2694.3430 | mean log_px -0.0060 | KL -2454.87 + 151it [00:33, 4.61it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.58it/s] 154it [00:33, 4.59it/s] 155it [00:33, 4.62it/s] 156it [00:34, 4.63it/s] 157it [00:34, 4.64it/s] 158it [00:34, 4.64it/s] 159it [00:34, 4.65it/s] 160it [00:34, 4.64it/s] 161it [00:35, 4.66it/s] 162it [00:35, 4.65it/s] 163it [00:35, 4.66it/s] 164it [00:35, 4.67it/s] 165it [00:36, 4.66it/s] 166it [00:36, 4.66it/s] 167it [00:36, 4.64it/s] 168it [00:36, 4.52it/s] 169it [00:36, 4.51it/s] 170it [00:37, 4.54it/s] 171it [00:37, 4.59it/s] 172it [00:37, 4.61it/s] 173it [00:37, 4.64it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.63it/s] 176it [00:38, 4.64it/s] 177it [00:38, 4.65it/s] 178it [00:38, 4.65it/s] 179it [00:39, 4.66it/s] 180it [00:39, 4.66it/s] 181it [00:39, 4.67it/s] 182it [00:39, 4.66it/s] 183it [00:39, 4.68it/s] 184it [00:40, 4.67it/s] 185it [00:40, 4.67it/s] 186it [00:40, 4.64it/s] 187it [00:40, 4.66it/s] 188it [00:41, 4.67it/s] 189it [00:41, 4.67it/s] 190it [00:41, 4.67it/s] 191it [00:41, 4.67it/s] 192it [00:41, 4.66it/s] 193it [00:42, 4.67it/s] 194it [00:42, 4.67it/s] 195it [00:42, 4.53it/s] 196it [00:42, 4.56it/s] 196it [00:42, 4.58it/s] +2025-05-25 23:05:11,860 - INFO - Epoch: 13, Objective: tensor([4922.8945], device='cuda:0', grad_fn=), Loss: 0.041003212332725525, KL/n: 49.89161682128906 + 0it [00:00, ?it/s]2025-05-25 23:05:12,426 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 2859.6846 | mean log_px -0.0121 | KL -2441.73 + 1it [00:00, 2.92it/s] 2it [00:00, 3.57it/s] 3it [00:00, 4.01it/s] 4it [00:01, 4.21it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.26it/s] 7it [00:01, 4.30it/s] 8it [00:01, 4.26it/s] 9it [00:02, 4.28it/s] 10it [00:02, 4.37it/s] 11it [00:02, 4.46it/s] 12it [00:02, 4.50it/s] 13it [00:03, 4.46it/s] 14it [00:03, 4.45it/s] 15it [00:03, 4.52it/s] 16it [00:03, 4.34it/s] 17it [00:03, 4.35it/s] 18it [00:04, 4.43it/s] 19it [00:04, 4.41it/s] 20it [00:04, 4.50it/s] 21it [00:04, 4.34it/s] 22it [00:05, 4.30it/s] 23it [00:05, 4.32it/s] 24it [00:05, 4.28it/s] 25it [00:05, 4.39it/s] 26it [00:06, 4.32it/s] 27it [00:06, 4.26it/s] 28it [00:06, 4.28it/s] 29it [00:06, 4.27it/s] 30it [00:06, 4.35it/s] 31it [00:07, 4.39it/s] 32it [00:07, 4.30it/s] 33it [00:07, 4.32it/s] 34it [00:07, 4.26it/s] 35it [00:08, 4.29it/s] 36it [00:08, 4.34it/s] 37it [00:08, 4.44it/s] 38it [00:08, 4.33it/s] 39it [00:09, 4.33it/s] 40it [00:09, 4.25it/s] 41it [00:09, 4.37it/s] 42it [00:09, 4.44it/s] 43it [00:09, 4.42it/s] 44it [00:10, 4.48it/s] 45it [00:10, 4.50it/s] 46it [00:10, 4.43it/s] 47it [00:10, 4.50it/s] 48it [00:11, 4.52it/s] 49it [00:11, 4.55it/s] 50it [00:11, 4.44it/s]2025-05-25 23:05:23,847 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 3013.0603 | mean log_px -0.0122 | KL -2423.46 + 51it [00:11, 4.37it/s] 52it [00:11, 4.40it/s] 53it [00:12, 4.32it/s] 54it [00:12, 4.39it/s] 55it [00:12, 4.33it/s] 56it [00:12, 4.40it/s] 57it [00:13, 4.35it/s] 58it [00:13, 4.44it/s] 59it [00:13, 4.33it/s] 60it [00:13, 4.44it/s] 61it [00:14, 4.50it/s] 62it [00:14, 4.33it/s] 63it [00:14, 4.34it/s] 64it [00:14, 4.28it/s] 65it [00:14, 4.26it/s] 66it [00:15, 4.37it/s] 67it [00:15, 4.31it/s] 68it [00:15, 4.41it/s] 69it [00:15, 4.41it/s] 70it [00:16, 4.32it/s] 71it [00:16, 4.30it/s] 72it [00:16, 4.27it/s] 73it [00:16, 4.39it/s] 74it [00:17, 4.35it/s] 75it [00:17, 4.32it/s] 76it [00:17, 4.40it/s] 77it [00:17, 4.47it/s] 78it [00:17, 4.34it/s] 79it [00:18, 4.33it/s] 80it [00:18, 4.42it/s] 81it [00:18, 4.38it/s] 82it [00:18, 4.47it/s] 83it [00:19, 4.39it/s] 84it [00:19, 4.20it/s] 85it [00:19, 4.22it/s] 86it [00:19, 4.22it/s] 87it [00:20, 4.23it/s] 88it [00:20, 4.17it/s] 89it [00:20, 4.11it/s] 90it [00:20, 4.22it/s] 91it [00:20, 4.35it/s] 92it [00:21, 4.27it/s] 93it [00:21, 4.38it/s] 94it [00:21, 4.28it/s] 95it [00:21, 4.29it/s] 96it [00:22, 4.11it/s] 97it [00:22, 4.12it/s] 98it [00:22, 4.22it/s] 99it [00:22, 4.27it/s] 100it [00:23, 4.37it/s]2025-05-25 23:05:35,427 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 3804.5000 | mean log_px -0.0205 | KL -2399.92 + 101it [00:23, 4.30it/s] 102it [00:23, 4.38it/s] 103it [00:23, 4.40it/s] 104it [00:23, 4.45it/s] 105it [00:24, 4.53it/s] 106it [00:24, 4.38it/s] 107it [00:24, 4.36it/s] 108it [00:24, 4.28it/s] 109it [00:25, 4.40it/s] 110it [00:25, 4.31it/s] 111it [00:25, 4.33it/s] 112it [00:25, 4.26it/s] 113it [00:26, 4.29it/s] 114it [00:26, 4.35it/s] 115it [00:26, 4.37it/s] 116it [00:26, 4.37it/s] 117it [00:26, 4.28it/s] 118it [00:27, 4.25it/s] 119it [00:27, 4.35it/s] 120it [00:27, 4.28it/s] 121it [00:27, 4.25it/s] 122it [00:28, 4.22it/s] 123it [00:28, 4.31it/s] 124it [00:28, 4.41it/s] 125it [00:28, 4.49it/s] 126it [00:29, 4.41it/s] 127it [00:29, 4.34it/s] 128it [00:29, 4.32it/s] 129it [00:29, 4.30it/s] 130it [00:30, 4.28it/s] 131it [00:30, 4.40it/s] 132it [00:30, 4.34it/s] 133it [00:30, 4.30it/s] 134it [00:30, 4.27it/s] 135it [00:31, 4.35it/s] 136it [00:31, 4.43it/s] 137it [00:31, 4.50it/s] 138it [00:31, 4.54it/s] 139it [00:32, 4.44it/s] 140it [00:32, 4.37it/s] 141it [00:32, 4.32it/s] 142it [00:32, 4.31it/s] 143it [00:32, 4.36it/s] 144it [00:33, 4.30it/s] 145it [00:33, 4.15it/s] 146it [00:33, 4.19it/s] 147it [00:33, 4.31it/s] 148it [00:34, 4.37it/s] 149it [00:34, 4.41it/s] 150it [00:34, 4.39it/s]2025-05-25 23:05:46,915 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 3109.0154 | mean log_px -0.0184 | KL -2386.44 + 151it [00:34, 4.28it/s] 152it [00:35, 4.27it/s] 153it [00:35, 4.25it/s] 154it [00:35, 4.27it/s] 155it [00:35, 4.26it/s] 156it [00:36, 4.25it/s] 157it [00:36, 4.13it/s] 158it [00:36, 4.16it/s] 159it [00:36, 4.22it/s] 160it [00:36, 4.33it/s] 161it [00:37, 4.31it/s] 162it [00:37, 4.32it/s] 163it [00:37, 4.14it/s] 164it [00:37, 4.15it/s] 165it [00:38, 4.17it/s] 166it [00:38, 4.28it/s] 167it [00:38, 4.11it/s] 168it [00:38, 4.15it/s] 169it [00:39, 4.25it/s] 170it [00:39, 4.28it/s] 171it [00:39, 4.27it/s] 172it [00:39, 4.26it/s] 173it [00:40, 4.23it/s] 174it [00:40, 4.20it/s] 175it [00:40, 4.22it/s] 176it [00:40, 4.19it/s] 177it [00:40, 4.22it/s] 178it [00:41, 4.34it/s] 179it [00:41, 4.27it/s] 180it [00:41, 4.37it/s] 181it [00:41, 4.43it/s] 182it [00:42, 4.48it/s] 183it [00:42, 4.33it/s] 184it [00:42, 4.43it/s] 185it [00:42, 4.46it/s] 186it [00:43, 4.43it/s] 187it [00:43, 4.35it/s] 188it [00:43, 4.37it/s] 189it [00:43, 4.38it/s] 190it [00:43, 4.43it/s] 191it [00:44, 4.50it/s] 192it [00:44, 4.33it/s] 193it [00:44, 4.33it/s] 194it [00:44, 4.42it/s] 195it [00:45, 4.35it/s] 196it [00:45, 4.28it/s] 196it [00:45, 4.32it/s] +2025-05-25 23:05:57,563 - INFO - Epoch: 14, Objective: tensor([2733.1536], device='cuda:0', grad_fn=), Loss: 0.013086755760014057, KL/n: 48.29157638549805 + 0it [00:00, ?it/s]2025-05-25 23:05:57,931 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 3566.3582 | mean log_px -0.0216 | KL -2368.83 + 1it [00:00, 3.37it/s] 2it [00:00, 4.02it/s] 3it [00:00, 4.29it/s] 4it [00:00, 4.41it/s] 5it [00:01, 4.52it/s] 6it [00:01, 4.55it/s] 7it [00:01, 4.59it/s] 8it [00:01, 4.44it/s] 9it [00:02, 3.57it/s] 10it [00:02, 3.84it/s] 11it [00:02, 4.06it/s] 12it [00:02, 4.21it/s] 13it [00:03, 4.34it/s] 14it [00:03, 4.43it/s] 15it [00:03, 4.49it/s] 16it [00:03, 4.40it/s] 17it [00:03, 4.47it/s] 18it [00:04, 4.53it/s] 19it [00:04, 4.56it/s] 20it [00:04, 4.59it/s] 21it [00:04, 4.60it/s] 22it [00:05, 4.60it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.60it/s] 25it [00:05, 4.62it/s] 26it [00:05, 4.48it/s] 27it [00:06, 4.53it/s] 28it [00:06, 4.57it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.62it/s] 31it [00:07, 4.65it/s] 32it [00:07, 4.65it/s] 33it [00:07, 4.66it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.67it/s] 36it [00:08, 4.52it/s] 37it [00:08, 4.56it/s] 38it [00:08, 4.59it/s] 39it [00:08, 4.62it/s] 40it [00:08, 4.63it/s] 41it [00:09, 4.65it/s] 42it [00:09, 4.65it/s] 43it [00:09, 4.55it/s] 44it [00:09, 4.59it/s] 45it [00:10, 4.62it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.65it/s] 48it [00:10, 4.51it/s] 49it [00:10, 4.58it/s] 50it [00:11, 4.61it/s]2025-05-25 23:06:08,987 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 2586.0901 | mean log_px -0.0101 | KL -2342.14 + 51it [00:11, 4.62it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.62it/s] 54it [00:12, 4.49it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.59it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.62it/s] 59it [00:13, 4.60it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.60it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.48it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.58it/s] 66it [00:14, 4.60it/s] 67it [00:14, 4.61it/s] 68it [00:15, 4.61it/s] 69it [00:15, 4.63it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.50it/s] 72it [00:15, 4.55it/s] 73it [00:16, 4.58it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.59it/s] 77it [00:17, 4.62it/s] 78it [00:17, 4.48it/s] 79it [00:17, 4.55it/s] 80it [00:17, 4.58it/s] 81it [00:17, 4.61it/s] 82it [00:18, 4.63it/s] 83it [00:18, 4.65it/s] 84it [00:18, 4.58it/s] 85it [00:18, 4.61it/s] 86it [00:18, 4.62it/s] 87it [00:19, 4.64it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.66it/s] 90it [00:19, 4.65it/s] 91it [00:20, 4.66it/s] 92it [00:20, 4.67it/s] 93it [00:20, 4.67it/s] 94it [00:20, 4.67it/s] 95it [00:20, 4.67it/s] 96it [00:21, 4.67it/s] 97it [00:21, 4.68it/s] 98it [00:21, 4.68it/s] 99it [00:21, 4.68it/s] 100it [00:21, 4.67it/s]2025-05-25 23:06:19,825 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 2982.4482 | mean log_px -0.0107 | KL -2318.40 + 101it [00:22, 4.67it/s] 102it [00:22, 4.67it/s] 103it [00:22, 4.67it/s] 104it [00:22, 4.65it/s] 105it [00:23, 4.66it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.41it/s] 108it [00:23, 4.43it/s] 109it [00:23, 4.46it/s] 110it [00:24, 4.48it/s] 111it [00:24, 4.49it/s] 112it [00:24, 4.48it/s] 113it [00:24, 4.53it/s] 114it [00:25, 4.56it/s] 115it [00:25, 4.44it/s] 116it [00:25, 4.49it/s] 117it [00:25, 4.54it/s] 118it [00:25, 4.57it/s] 119it [00:26, 4.59it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.61it/s] 122it [00:26, 4.61it/s] 123it [00:27, 4.47it/s] 124it [00:27, 4.52it/s] 125it [00:27, 4.56it/s] 126it [00:27, 4.57it/s] 127it [00:27, 4.59it/s] 128it [00:28, 4.56it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.60it/s] 131it [00:28, 4.60it/s] 132it [00:28, 4.61it/s] 133it [00:29, 4.61it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.63it/s] 136it [00:29, 4.60it/s] 137it [00:30, 4.61it/s] 138it [00:30, 4.62it/s] 139it [00:30, 4.49it/s] 140it [00:30, 4.54it/s] 141it [00:30, 4.57it/s] 142it [00:31, 4.58it/s] 143it [00:31, 4.61it/s] 144it [00:31, 4.47it/s] 145it [00:31, 4.52it/s] 146it [00:32, 4.56it/s] 147it [00:32, 4.59it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.61it/s] 150it [00:32, 4.62it/s]2025-05-25 23:06:30,782 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 3421.2581 | mean log_px -0.0186 | KL -2299.48 + 151it [00:33, 4.62it/s] 152it [00:33, 4.63it/s] 153it [00:33, 4.48it/s] 154it [00:33, 4.54it/s] 155it [00:34, 4.57it/s] 156it [00:34, 4.59it/s] 157it [00:34, 4.60it/s] 158it [00:34, 4.61it/s] 159it [00:34, 4.62it/s] 160it [00:35, 4.63it/s] 161it [00:35, 4.64it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.48it/s] 164it [00:35, 4.52it/s] 165it [00:36, 4.56it/s] 166it [00:36, 4.58it/s] 167it [00:36, 4.59it/s] 168it [00:36, 4.60it/s] 169it [00:37, 4.61it/s] 170it [00:37, 4.62it/s] 171it [00:37, 4.62it/s] 172it [00:37, 4.48it/s] 173it [00:37, 4.47it/s] 174it [00:38, 4.52it/s] 175it [00:38, 4.54it/s] 176it [00:38, 4.54it/s] 177it [00:38, 4.55it/s] 178it [00:39, 4.54it/s] 179it [00:39, 4.58it/s] 180it [00:39, 4.41it/s] 181it [00:39, 4.45it/s] 182it [00:39, 4.50it/s] 183it [00:40, 4.50it/s] 184it [00:40, 4.53it/s] 185it [00:40, 4.57it/s] 186it [00:40, 4.58it/s] 187it [00:41, 4.60it/s] 188it [00:41, 4.61it/s] 189it [00:41, 4.48it/s] 190it [00:41, 4.53it/s] 191it [00:41, 4.57it/s] 192it [00:42, 4.58it/s] 193it [00:42, 4.59it/s] 194it [00:42, 4.61it/s] 195it [00:42, 4.50it/s] 196it [00:43, 4.56it/s] 196it [00:43, 4.55it/s] +2025-05-25 23:06:40,792 - INFO - Epoch: 15, Objective: tensor([2673.8301], device='cuda:0', grad_fn=), Loss: 0.006941231433302164, KL/n: 46.54920196533203 + 0it [00:00, ?it/s]2025-05-25 23:06:41,163 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 2568.5730 | mean log_px -0.0058 | KL -2277.45 + 1it [00:00, 3.10it/s] 2it [00:00, 3.80it/s] 3it [00:00, 4.16it/s] 4it [00:00, 4.32it/s] 5it [00:01, 4.42it/s] 6it [00:01, 4.49it/s] 7it [00:01, 4.54it/s] 8it [00:01, 4.41it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.54it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.48it/s] 15it [00:03, 4.55it/s] 16it [00:03, 4.58it/s] 17it [00:03, 4.62it/s] 18it [00:04, 4.63it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.50it/s] 21it [00:04, 4.56it/s] 22it [00:04, 4.59it/s] 23it [00:05, 4.62it/s] 24it [00:05, 4.63it/s] 25it [00:05, 4.63it/s] 26it [00:05, 4.49it/s] 27it [00:06, 4.56it/s] 28it [00:06, 4.57it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.61it/s] 31it [00:06, 4.62it/s] 32it [00:07, 4.49it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.57it/s] 35it [00:07, 4.57it/s] 36it [00:07, 4.59it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.48it/s] 39it [00:08, 4.54it/s] 40it [00:08, 4.52it/s] 41it [00:09, 4.57it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.62it/s] 44it [00:09, 4.62it/s] 45it [00:09, 4.65it/s] 46it [00:10, 4.65it/s] 47it [00:10, 4.66it/s] 48it [00:10, 4.66it/s] 49it [00:10, 4.52it/s] 50it [00:11, 4.58it/s]2025-05-25 23:06:52,097 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 2469.5354 | mean log_px -0.0050 | KL -2246.70 + 51it [00:11, 4.60it/s] 52it [00:11, 4.52it/s] 53it [00:11, 4.47it/s] 54it [00:11, 4.51it/s] 55it [00:12, 4.54it/s] 56it [00:12, 4.56it/s] 57it [00:12, 4.58it/s] 58it [00:12, 4.45it/s] 59it [00:13, 4.48it/s] 60it [00:13, 4.54it/s] 61it [00:13, 4.59it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.63it/s] 64it [00:14, 4.49it/s] 65it [00:14, 4.54it/s] 66it [00:14, 4.57it/s] 67it [00:14, 4.60it/s] 68it [00:14, 4.61it/s] 69it [00:15, 4.63it/s] 70it [00:15, 4.64it/s] 71it [00:15, 4.50it/s] 72it [00:15, 4.55it/s] 73it [00:16, 4.58it/s] 74it [00:16, 4.51it/s] 75it [00:16, 4.57it/s] 76it [00:16, 4.59it/s] 77it [00:16, 4.62it/s] 78it [00:17, 4.63it/s] 79it [00:17, 4.50it/s] 80it [00:17, 4.55it/s] 81it [00:17, 4.59it/s] 82it [00:18, 4.61it/s] 83it [00:18, 4.62it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.49it/s] 86it [00:18, 4.55it/s] 87it [00:19, 4.55it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.62it/s] 90it [00:19, 4.63it/s] 91it [00:20, 4.48it/s] 92it [00:20, 4.54it/s] 93it [00:20, 4.58it/s] 94it [00:20, 4.59it/s] 95it [00:20, 4.61it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.47it/s] 98it [00:21, 4.53it/s] 99it [00:21, 4.57it/s] 100it [00:21, 4.59it/s]2025-05-25 23:07:03,052 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 2823.7253 | mean log_px -0.0109 | KL -2227.54 + 101it [00:22, 4.60it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.49it/s] 104it [00:22, 4.54it/s] 105it [00:23, 4.58it/s] 106it [00:23, 4.60it/s] 107it [00:23, 4.62it/s] 108it [00:23, 4.63it/s] 109it [00:23, 4.50it/s] 110it [00:24, 4.55it/s] 111it [00:24, 4.59it/s] 112it [00:24, 4.60it/s] 113it [00:24, 4.63it/s] 114it [00:25, 4.64it/s] 115it [00:25, 4.49it/s] 116it [00:25, 4.54it/s] 117it [00:25, 4.58it/s] 118it [00:25, 4.60it/s] 119it [00:26, 4.47it/s] 120it [00:26, 4.53it/s] 121it [00:26, 4.56it/s] 122it [00:26, 4.59it/s] 123it [00:27, 4.61it/s] 124it [00:27, 4.62it/s] 125it [00:27, 4.48it/s] 126it [00:27, 4.55it/s] 127it [00:27, 4.58it/s] 128it [00:28, 4.60it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.49it/s] 132it [00:28, 4.54it/s] 133it [00:29, 4.58it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.63it/s] 137it [00:30, 4.48it/s] 138it [00:30, 4.53it/s] 139it [00:30, 4.57it/s] 140it [00:30, 4.55it/s] 141it [00:30, 4.58it/s] 142it [00:31, 4.59it/s] 143it [00:31, 4.44it/s] 144it [00:31, 4.51it/s] 145it [00:31, 4.55it/s] 146it [00:32, 4.57it/s] 147it [00:32, 4.60it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.48it/s] 150it [00:32, 4.54it/s]2025-05-25 23:07:14,011 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 2373.7930 | mean log_px -0.0035 | KL -2207.88 + 151it [00:33, 4.58it/s] 152it [00:33, 4.60it/s] 153it [00:33, 4.62it/s] 154it [00:33, 4.63it/s] 155it [00:34, 4.46it/s] 156it [00:34, 4.53it/s] 157it [00:34, 4.57it/s] 158it [00:34, 4.59it/s] 159it [00:34, 4.62it/s] 160it [00:35, 4.63it/s] 161it [00:35, 4.48it/s] 162it [00:35, 4.54it/s] 163it [00:35, 4.58it/s] 164it [00:35, 4.60it/s] 165it [00:36, 4.62it/s] 166it [00:36, 4.63it/s] 167it [00:36, 4.48it/s] 168it [00:36, 4.54it/s] 169it [00:37, 4.59it/s] 170it [00:37, 4.60it/s] 171it [00:37, 4.62it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.50it/s] 174it [00:38, 4.56it/s] 175it [00:38, 4.59it/s] 176it [00:38, 4.60it/s] 177it [00:38, 4.62it/s] 178it [00:39, 4.64it/s] 179it [00:39, 4.49it/s] 180it [00:39, 4.55it/s] 181it [00:39, 4.58it/s] 182it [00:39, 4.60it/s] 183it [00:40, 4.62it/s] 184it [00:40, 4.48it/s] 185it [00:40, 4.54it/s] 186it [00:40, 4.57it/s] 187it [00:41, 4.61it/s] 188it [00:41, 4.62it/s] 189it [00:41, 4.63it/s] 190it [00:41, 4.48it/s] 191it [00:41, 4.54it/s] 192it [00:42, 4.55it/s] 193it [00:42, 4.59it/s] 194it [00:42, 4.60it/s] 195it [00:42, 4.39it/s] 196it [00:43, 4.26it/s] 196it [00:43, 4.55it/s] +2025-05-25 23:07:24,037 - INFO - Epoch: 16, Objective: tensor([2848.4922], device='cuda:0', grad_fn=), Loss: 0.02026955410838127, KL/n: 44.883338928222656 + 0it [00:00, ?it/s]2025-05-25 23:07:24,588 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 2439.9866 | mean log_px -0.0047 | KL -2197.12 + 1it [00:00, 3.31it/s] 2it [00:00, 3.98it/s] 3it [00:00, 4.27it/s] 4it [00:00, 4.41it/s] 5it [00:01, 4.47it/s] 6it [00:01, 4.52it/s] 7it [00:01, 4.57it/s] 8it [00:01, 4.55it/s] 9it [00:02, 4.59it/s] 10it [00:02, 4.60it/s] 11it [00:02, 4.61it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.60it/s] 15it [00:03, 4.62it/s] 16it [00:03, 4.62it/s] 17it [00:03, 4.63it/s] 18it [00:03, 4.65it/s] 19it [00:04, 4.66it/s] 20it [00:04, 4.66it/s] 21it [00:04, 4.68it/s] 22it [00:04, 4.67it/s] 23it [00:05, 4.67it/s] 24it [00:05, 4.51it/s] 25it [00:05, 4.57it/s] 26it [00:05, 4.59it/s] 27it [00:05, 4.62it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.64it/s] 30it [00:06, 4.48it/s] 31it [00:06, 4.54it/s] 32it [00:07, 4.58it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.58it/s] 35it [00:07, 4.61it/s] 36it [00:07, 4.62it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.66it/s] 41it [00:08, 4.67it/s] 42it [00:09, 4.51it/s] 43it [00:09, 4.54it/s] 44it [00:09, 4.55it/s] 45it [00:09, 4.58it/s] 46it [00:10, 4.59it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.46it/s] 49it [00:10, 4.54it/s] 50it [00:10, 4.57it/s]2025-05-25 23:07:35,449 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 3817.5354 | mean log_px -0.0287 | KL -2182.09 + 51it [00:11, 4.59it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.63it/s] 54it [00:11, 4.65it/s] 55it [00:12, 4.50it/s] 56it [00:12, 4.55it/s] 57it [00:12, 4.59it/s] 58it [00:12, 4.61it/s] 59it [00:12, 4.63it/s] 60it [00:13, 4.48it/s] 61it [00:13, 4.54it/s] 62it [00:13, 4.43it/s] 63it [00:13, 4.52it/s] 64it [00:14, 4.57it/s] 65it [00:14, 4.60it/s] 66it [00:14, 4.62it/s] 67it [00:14, 4.64it/s] 68it [00:14, 4.65it/s] 69it [00:15, 4.51it/s] 70it [00:15, 4.52it/s] 71it [00:15, 4.56it/s] 72it [00:15, 4.60it/s] 73it [00:15, 4.62it/s] 74it [00:16, 4.64it/s] 75it [00:16, 4.66it/s] 76it [00:16, 4.51it/s] 77it [00:16, 4.56it/s] 78it [00:17, 4.58it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.63it/s] 81it [00:17, 4.65it/s] 82it [00:17, 4.65it/s] 83it [00:18, 4.66it/s] 84it [00:18, 4.66it/s] 85it [00:18, 4.51it/s] 86it [00:18, 4.56it/s] 87it [00:19, 4.60it/s] 88it [00:19, 4.62it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.63it/s] 91it [00:19, 4.38it/s] 92it [00:20, 4.48it/s] 93it [00:20, 4.55it/s] 94it [00:20, 4.58it/s] 95it [00:20, 4.62it/s] 96it [00:20, 4.63it/s] 97it [00:21, 4.47it/s] 98it [00:21, 4.54it/s] 99it [00:21, 4.53it/s] 100it [00:21, 4.57it/s]2025-05-25 23:07:46,371 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 2449.2668 | mean log_px -0.0059 | KL -2174.15 + 101it [00:22, 4.61it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.64it/s] 104it [00:22, 4.48it/s] 105it [00:22, 4.54it/s] 106it [00:23, 4.57it/s] 107it [00:23, 4.61it/s] 108it [00:23, 4.62it/s] 109it [00:23, 4.63it/s] 110it [00:24, 4.65it/s] 111it [00:24, 4.67it/s] 112it [00:24, 4.66it/s] 113it [00:24, 4.63it/s] 114it [00:24, 4.63it/s] 115it [00:25, 4.46it/s] 116it [00:25, 4.51it/s] 117it [00:25, 4.55it/s] 118it [00:25, 4.57it/s] 119it [00:26, 4.57it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.61it/s] 122it [00:26, 4.62it/s] 123it [00:26, 4.63it/s] 124it [00:27, 4.48it/s] 125it [00:27, 4.55it/s] 126it [00:27, 4.58it/s] 127it [00:27, 4.60it/s] 128it [00:27, 4.61it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.62it/s] 131it [00:28, 4.64it/s] 132it [00:28, 4.64it/s] 133it [00:29, 4.48it/s] 134it [00:29, 4.54it/s] 135it [00:29, 4.59it/s] 136it [00:29, 4.61it/s] 137it [00:29, 4.62it/s] 138it [00:30, 4.62it/s] 139it [00:30, 4.48it/s] 140it [00:30, 4.53it/s] 141it [00:30, 4.52it/s] 142it [00:31, 4.49it/s] 143it [00:31, 4.56it/s] 144it [00:31, 4.59it/s] 145it [00:31, 4.62it/s] 146it [00:31, 4.63it/s] 147it [00:32, 4.49it/s] 148it [00:32, 4.56it/s] 149it [00:32, 4.58it/s] 150it [00:32, 4.60it/s]2025-05-25 23:07:57,286 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 2379.8494 | mean log_px -0.0040 | KL -2152.76 + 151it [00:33, 4.57it/s] 152it [00:33, 4.54it/s] 153it [00:33, 4.57it/s] 154it [00:33, 4.58it/s] 155it [00:33, 4.61it/s] 156it [00:34, 4.61it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.63it/s] 159it [00:34, 4.63it/s] 160it [00:34, 4.63it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.62it/s] 164it [00:35, 4.62it/s] 165it [00:36, 4.48it/s] 166it [00:36, 4.53it/s] 167it [00:36, 4.56it/s] 168it [00:36, 4.57it/s] 169it [00:36, 4.60it/s] 170it [00:37, 4.60it/s] 171it [00:37, 4.60it/s] 172it [00:37, 4.61it/s] 173it [00:37, 4.63it/s] 174it [00:37, 4.61it/s] 175it [00:38, 4.62it/s] 176it [00:38, 4.60it/s] 177it [00:38, 4.61it/s] 178it [00:38, 4.61it/s] 179it [00:39, 4.63it/s] 180it [00:39, 4.63it/s] 181it [00:39, 4.65it/s] 182it [00:39, 4.64it/s] 183it [00:39, 4.50it/s] 184it [00:40, 4.55it/s] 185it [00:40, 4.53it/s] 186it [00:40, 4.56it/s] 187it [00:40, 4.58it/s] 188it [00:41, 4.60it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.61it/s] 191it [00:41, 4.62it/s] 192it [00:41, 4.49it/s] 193it [00:42, 4.56it/s] 194it [00:42, 4.57it/s] 195it [00:42, 4.33it/s] 196it [00:42, 4.42it/s] 196it [00:42, 4.57it/s] +2025-05-25 23:08:07,260 - INFO - Epoch: 17, Objective: tensor([2270.9153], device='cuda:0', grad_fn=), Loss: 0.004182320553809404, KL/n: 43.6452751159668 + 0it [00:00, ?it/s]2025-05-25 23:08:07,637 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 2706.3704 | mean log_px -0.0173 | KL -2135.82 + 1it [00:00, 3.01it/s] 2it [00:00, 3.75it/s] 3it [00:00, 4.11it/s] 4it [00:00, 4.23it/s] 5it [00:01, 4.29it/s] 6it [00:01, 4.29it/s] 7it [00:01, 3.46it/s] 8it [00:02, 3.71it/s] 9it [00:02, 3.94it/s] 10it [00:02, 4.09it/s] 11it [00:02, 4.20it/s] 12it [00:02, 4.16it/s] 13it [00:03, 4.29it/s] 14it [00:03, 4.36it/s] 15it [00:03, 4.45it/s] 16it [00:03, 4.33it/s] 17it [00:04, 4.37it/s] 18it [00:04, 4.45it/s] 19it [00:04, 4.48it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.49it/s] 22it [00:05, 4.37it/s] 23it [00:05, 4.45it/s] 24it [00:05, 4.40it/s] 25it [00:05, 4.42it/s] 26it [00:06, 4.48it/s] 27it [00:06, 4.51it/s] 28it [00:06, 4.52it/s] 29it [00:06, 4.49it/s] 30it [00:07, 4.32it/s] 31it [00:07, 4.29it/s] 32it [00:07, 4.35it/s] 33it [00:07, 4.43it/s] 34it [00:07, 4.47it/s] 35it [00:08, 4.45it/s] 36it [00:08, 4.49it/s] 37it [00:08, 4.52it/s] 38it [00:08, 4.54it/s] 39it [00:09, 4.56it/s] 40it [00:09, 4.41it/s] 41it [00:09, 4.47it/s] 42it [00:09, 4.48it/s] 43it [00:09, 4.51it/s] 44it [00:10, 4.55it/s] 45it [00:10, 4.55it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.59it/s] 48it [00:11, 4.59it/s] 49it [00:11, 4.61it/s] 50it [00:11, 4.60it/s]2025-05-25 23:08:19,027 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 2571.1865 | mean log_px -0.0093 | KL -2121.10 + 51it [00:11, 4.45it/s] 52it [00:11, 4.34it/s] 53it [00:12, 4.43it/s] 54it [00:12, 4.48it/s] 55it [00:12, 4.53it/s] 56it [00:12, 4.39it/s] 57it [00:13, 4.46it/s] 58it [00:13, 4.35it/s] 59it [00:13, 4.42it/s] 60it [00:13, 4.32it/s] 61it [00:13, 4.42it/s] 62it [00:14, 4.43it/s] 63it [00:14, 4.52it/s] 64it [00:14, 4.55it/s] 65it [00:14, 4.42it/s] 66it [00:15, 4.31it/s] 67it [00:15, 4.41it/s] 68it [00:15, 4.33it/s] 69it [00:15, 4.27it/s] 70it [00:16, 4.36it/s] 71it [00:16, 4.44it/s] 72it [00:16, 4.49it/s] 73it [00:16, 4.52it/s] 74it [00:16, 4.55it/s] 75it [00:17, 4.42it/s] 76it [00:17, 4.48it/s] 77it [00:17, 4.51it/s] 78it [00:17, 4.52it/s] 79it [00:18, 4.48it/s] 80it [00:18, 4.51it/s] 81it [00:18, 4.31it/s] 82it [00:18, 4.39it/s] 83it [00:18, 4.45it/s] 84it [00:19, 4.30it/s] 85it [00:19, 4.17it/s] 86it [00:19, 4.15it/s] 87it [00:19, 4.03it/s] 88it [00:20, 4.06it/s] 89it [00:20, 4.18it/s] 90it [00:20, 4.12it/s] 91it [00:20, 4.04it/s] 92it [00:21, 4.05it/s] 93it [00:21, 4.13it/s] 94it [00:21, 4.13it/s] 95it [00:21, 4.13it/s] 96it [00:22, 4.21it/s] 97it [00:22, 4.19it/s] 98it [00:22, 4.16it/s] 99it [00:22, 4.15it/s] 100it [00:23, 4.30it/s]2025-05-25 23:08:30,586 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 2327.6116 | mean log_px -0.0041 | KL -2106.47 + 101it [00:23, 4.39it/s] 102it [00:23, 4.47it/s] 103it [00:23, 4.52it/s] 104it [00:23, 4.40it/s] 105it [00:24, 4.12it/s] 106it [00:24, 4.26it/s] 107it [00:24, 4.25it/s] 108it [00:24, 4.21it/s] 109it [00:25, 4.23it/s] 110it [00:25, 4.20it/s] 111it [00:25, 4.32it/s] 112it [00:25, 4.25it/s] 113it [00:26, 4.25it/s] 114it [00:26, 4.20it/s] 115it [00:26, 4.27it/s] 116it [00:26, 4.32it/s] 117it [00:27, 4.18it/s] 118it [00:27, 4.19it/s] 119it [00:27, 4.30it/s] 120it [00:27, 4.21it/s] 121it [00:27, 4.22it/s] 122it [00:28, 4.19it/s] 123it [00:28, 4.30it/s] 124it [00:28, 4.38it/s] 125it [00:28, 4.29it/s] 126it [00:29, 4.36it/s] 127it [00:29, 4.42it/s] 128it [00:29, 4.47it/s] 129it [00:29, 4.41it/s] 130it [00:29, 4.46it/s] 131it [00:30, 4.50it/s] 132it [00:30, 4.53it/s] 133it [00:30, 4.37it/s] 134it [00:30, 4.42it/s] 135it [00:31, 4.48it/s] 136it [00:31, 4.38it/s] 137it [00:31, 4.29it/s] 138it [00:31, 4.37it/s] 139it [00:32, 4.29it/s] 140it [00:32, 4.24it/s] 141it [00:32, 4.33it/s] 142it [00:32, 4.37it/s] 143it [00:32, 4.36it/s] 144it [00:33, 4.15it/s] 145it [00:33, 4.18it/s] 146it [00:33, 4.15it/s] 147it [00:33, 4.18it/s] 148it [00:34, 4.29it/s] 149it [00:34, 4.13it/s] 150it [00:34, 4.26it/s]2025-05-25 23:08:42,211 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 3520.7913 | mean log_px -0.0254 | KL -2092.53 + 151it [00:34, 4.35it/s] 152it [00:35, 4.26it/s] 153it [00:35, 4.26it/s] 154it [00:35, 4.18it/s] 155it [00:35, 4.31it/s] 156it [00:36, 4.40it/s] 157it [00:36, 4.47it/s] 158it [00:36, 4.51it/s] 159it [00:36, 4.55it/s] 160it [00:36, 4.57it/s] 161it [00:37, 4.49it/s] 162it [00:37, 4.34it/s] 163it [00:37, 4.31it/s] 164it [00:37, 4.12it/s] 165it [00:38, 4.27it/s] 166it [00:38, 4.36it/s] 167it [00:38, 4.28it/s] 168it [00:38, 4.37it/s] 169it [00:38, 4.45it/s] 170it [00:39, 4.50it/s] 171it [00:39, 4.55it/s] 172it [00:39, 4.46it/s] 173it [00:39, 4.52it/s] 174it [00:40, 4.55it/s] 175it [00:40, 4.47it/s] 176it [00:40, 4.54it/s] 177it [00:40, 4.39it/s] 178it [00:41, 4.45it/s] 179it [00:41, 4.35it/s] 180it [00:41, 4.42it/s] 181it [00:41, 4.32it/s] 182it [00:41, 4.40it/s] 183it [00:42, 4.47it/s] 184it [00:42, 4.32it/s] 185it [00:42, 4.21it/s] 186it [00:42, 4.19it/s] 187it [00:43, 4.18it/s] 188it [00:43, 4.16it/s] 189it [00:43, 4.23it/s] 190it [00:43, 4.17it/s] 191it [00:44, 4.18it/s] 192it [00:44, 4.30it/s] 193it [00:44, 4.39it/s] 194it [00:44, 4.31it/s] 195it [00:44, 4.29it/s] 196it [00:45, 4.38it/s] 196it [00:45, 4.33it/s] +2025-05-25 23:08:52,653 - INFO - Epoch: 18, Objective: tensor([2600.6919], device='cuda:0', grad_fn=), Loss: 0.01254788413643837, KL/n: 42.441864013671875 + 0it [00:00, ?it/s]2025-05-25 23:08:53,041 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 2569.3970 | mean log_px -0.0069 | KL -2083.59 + 1it [00:00, 3.13it/s] 2it [00:00, 3.85it/s] 3it [00:00, 4.20it/s] 4it [00:00, 4.36it/s] 5it [00:01, 4.44it/s] 6it [00:01, 4.35it/s] 7it [00:01, 4.41it/s] 8it [00:01, 4.49it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.55it/s] 11it [00:02, 4.58it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.64it/s] 14it [00:03, 4.66it/s] 15it [00:03, 4.69it/s] 16it [00:03, 4.69it/s] 17it [00:03, 4.54it/s] 18it [00:04, 4.60it/s] 19it [00:04, 4.64it/s] 20it [00:04, 4.50it/s] 21it [00:04, 4.58it/s] 22it [00:04, 4.62it/s] 23it [00:05, 4.66it/s] 24it [00:05, 4.65it/s] 25it [00:05, 4.45it/s] 26it [00:05, 4.53it/s] 27it [00:05, 4.58it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.64it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.67it/s] 32it [00:07, 4.68it/s] 33it [00:07, 4.70it/s] 34it [00:07, 4.70it/s] 35it [00:07, 4.55it/s] 36it [00:07, 4.60it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.66it/s] 39it [00:08, 4.68it/s] 40it [00:08, 4.69it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.65it/s] 44it [00:09, 4.66it/s] 45it [00:09, 4.68it/s] 46it [00:10, 4.68it/s] 47it [00:10, 4.70it/s] 48it [00:10, 4.70it/s] 49it [00:10, 4.71it/s] 50it [00:10, 4.54it/s]2025-05-25 23:09:03,874 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 2562.2981 | mean log_px -0.0159 | KL -2057.50 + 51it [00:11, 4.61it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.67it/s] 54it [00:11, 4.68it/s] 55it [00:12, 4.53it/s] 56it [00:12, 4.60it/s] 57it [00:12, 4.64it/s] 58it [00:12, 4.63it/s] 59it [00:12, 4.64it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.66it/s] 62it [00:13, 4.68it/s] 63it [00:13, 4.70it/s] 64it [00:13, 4.70it/s] 65it [00:14, 4.71it/s] 66it [00:14, 4.71it/s] 67it [00:14, 4.72it/s] 68it [00:14, 4.72it/s] 69it [00:14, 4.73it/s] 70it [00:15, 4.72it/s] 71it [00:15, 4.73it/s] 72it [00:15, 4.72it/s] 73it [00:15, 4.73it/s] 74it [00:16, 4.72it/s] 75it [00:16, 4.73it/s] 76it [00:16, 4.72it/s] 77it [00:16, 4.73it/s] 78it [00:16, 4.73it/s] 79it [00:17, 4.73it/s] 80it [00:17, 4.73it/s] 81it [00:17, 4.73it/s] 82it [00:17, 4.73it/s] 83it [00:17, 4.73it/s] 84it [00:18, 4.73it/s] 85it [00:18, 4.73it/s] 86it [00:18, 4.73it/s] 87it [00:18, 4.73it/s] 88it [00:19, 4.73it/s] 89it [00:19, 4.72it/s] 90it [00:19, 4.72it/s] 91it [00:19, 4.72it/s] 92it [00:19, 4.72it/s] 93it [00:20, 4.72it/s] 94it [00:20, 4.72it/s] 95it [00:20, 4.72it/s] 96it [00:20, 4.72it/s] 97it [00:20, 4.73it/s] 98it [00:21, 4.64it/s] 99it [00:21, 4.67it/s] 100it [00:21, 4.68it/s]2025-05-25 23:09:14,501 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 2413.2510 | mean log_px -0.0084 | KL -2045.86 + 101it [00:21, 4.70it/s] 102it [00:21, 4.70it/s] 103it [00:22, 4.71it/s] 104it [00:22, 4.71it/s] 105it [00:22, 4.72it/s] 106it [00:22, 4.72it/s] 107it [00:23, 4.72it/s] 108it [00:23, 4.72it/s] 109it [00:23, 4.73it/s] 110it [00:23, 4.72it/s] 111it [00:23, 4.73it/s] 112it [00:24, 4.72it/s] 113it [00:24, 4.71it/s] 114it [00:24, 4.54it/s] 115it [00:24, 4.61it/s] 116it [00:24, 4.64it/s] 117it [00:25, 4.67it/s] 118it [00:25, 4.68it/s] 119it [00:25, 4.70it/s] 120it [00:25, 4.71it/s] 121it [00:26, 4.71it/s] 122it [00:26, 4.72it/s] 123it [00:26, 4.73it/s] 124it [00:26, 4.73it/s] 125it [00:26, 4.53it/s] 126it [00:27, 4.60it/s] 127it [00:27, 4.64it/s] 128it [00:27, 4.67it/s] 129it [00:27, 4.69it/s] 130it [00:27, 4.69it/s] 131it [00:28, 4.71it/s] 132it [00:28, 4.55it/s] 133it [00:28, 4.61it/s] 134it [00:28, 4.64it/s] 135it [00:29, 4.67it/s] 136it [00:29, 4.67it/s] 137it [00:29, 4.52it/s] 138it [00:29, 4.59it/s] 139it [00:29, 4.62it/s] 140it [00:30, 4.65it/s] 141it [00:30, 4.67it/s] 142it [00:30, 4.69it/s] 143it [00:30, 4.54it/s] 144it [00:31, 4.61it/s] 145it [00:31, 4.64it/s] 146it [00:31, 4.67it/s] 147it [00:31, 4.68it/s] 148it [00:31, 4.69it/s] 149it [00:32, 4.71it/s] 150it [00:32, 4.71it/s]2025-05-25 23:09:25,214 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 2499.8535 | mean log_px -0.0090 | KL -2029.06 + 151it [00:32, 4.71it/s] 152it [00:32, 4.44it/s] 153it [00:32, 4.47it/s] 154it [00:33, 4.50it/s] 155it [00:33, 4.51it/s] 156it [00:33, 4.53it/s] 157it [00:33, 4.55it/s] 158it [00:34, 4.55it/s] 159it [00:34, 4.57it/s] 160it [00:34, 4.57it/s] 161it [00:34, 4.44it/s] 162it [00:34, 4.48it/s] 163it [00:35, 4.51it/s] 164it [00:35, 4.53it/s] 165it [00:35, 4.52it/s] 166it [00:35, 4.54it/s] 167it [00:36, 4.57it/s] 168it [00:36, 4.57it/s] 169it [00:36, 4.59it/s] 170it [00:36, 4.47it/s] 171it [00:36, 4.48it/s] 172it [00:37, 4.52it/s] 173it [00:37, 4.53it/s] 174it [00:37, 4.53it/s] 175it [00:37, 4.55it/s] 176it [00:38, 4.54it/s] 177it [00:38, 4.57it/s] 178it [00:38, 4.55it/s] 179it [00:38, 4.54it/s] 180it [00:38, 4.57it/s] 181it [00:39, 4.59it/s] 182it [00:39, 4.57it/s] 183it [00:39, 4.61it/s] 184it [00:39, 4.60it/s] 185it [00:39, 4.60it/s] 186it [00:40, 4.59it/s] 187it [00:40, 4.59it/s] 188it [00:40, 4.47it/s] 189it [00:40, 4.53it/s] 190it [00:41, 4.56it/s] 191it [00:41, 4.58it/s] 192it [00:41, 4.58it/s] 193it [00:41, 4.61it/s] 194it [00:41, 4.48it/s] 195it [00:42, 4.39it/s] 196it [00:42, 4.36it/s] 196it [00:42, 4.61it/s] +2025-05-25 23:09:35,304 - INFO - Epoch: 19, Objective: tensor([2346.0564], device='cuda:0', grad_fn=), Loss: 0.010250546969473362, KL/n: 41.190834045410156 + 0it [00:00, ?it/s]2025-05-25 23:09:35,877 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 2297.0408 | mean log_px -0.0067 | KL -2018.12 + 1it [00:00, 3.03it/s] 2it [00:00, 3.83it/s] 3it [00:00, 4.19it/s] 4it [00:00, 4.35it/s] 5it [00:01, 4.44it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.51it/s] 8it [00:01, 4.54it/s] 9it [00:02, 4.57it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.42it/s] 12it [00:02, 4.49it/s] 13it [00:02, 4.55it/s] 14it [00:03, 4.57it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.48it/s] 18it [00:04, 4.53it/s] 19it [00:04, 4.53it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.57it/s] 22it [00:04, 4.58it/s] 23it [00:05, 4.60it/s] 24it [00:05, 4.61it/s] 25it [00:05, 4.46it/s] 26it [00:05, 4.51it/s] 27it [00:06, 4.55it/s] 28it [00:06, 4.56it/s] 29it [00:06, 4.58it/s] 30it [00:06, 4.59it/s] 31it [00:06, 4.60it/s] 32it [00:07, 4.45it/s] 33it [00:07, 4.52it/s] 34it [00:07, 4.55it/s] 35it [00:07, 4.57it/s] 36it [00:08, 4.58it/s] 37it [00:08, 4.60it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.47it/s] 40it [00:08, 4.51it/s] 41it [00:09, 4.51it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.56it/s] 44it [00:09, 4.58it/s] 45it [00:09, 4.60it/s] 46it [00:10, 4.46it/s] 47it [00:10, 4.52it/s] 48it [00:10, 4.54it/s] 49it [00:10, 4.57it/s] 50it [00:11, 4.59it/s]2025-05-25 23:09:46,851 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 2567.9041 | mean log_px -0.0136 | KL -1997.04 + 51it [00:11, 4.61it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.62it/s] 54it [00:11, 4.61it/s] 55it [00:12, 4.47it/s] 56it [00:12, 4.52it/s] 57it [00:12, 4.55it/s] 58it [00:12, 4.56it/s] 59it [00:13, 4.59it/s] 60it [00:13, 4.58it/s] 61it [00:13, 4.56it/s] 62it [00:13, 4.57it/s] 63it [00:13, 4.58it/s] 64it [00:14, 4.45it/s] 65it [00:14, 4.51it/s] 66it [00:14, 4.54it/s] 67it [00:14, 4.56it/s] 68it [00:15, 4.57it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.57it/s] 72it [00:15, 4.59it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.45it/s] 75it [00:16, 4.52it/s] 76it [00:16, 4.53it/s] 77it [00:17, 4.55it/s] 78it [00:17, 4.57it/s] 79it [00:17, 4.44it/s] 80it [00:17, 4.49it/s] 81it [00:17, 4.54it/s] 82it [00:18, 4.57it/s] 83it [00:18, 4.58it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.60it/s] 86it [00:19, 4.46it/s] 87it [00:19, 4.54it/s] 88it [00:19, 4.56it/s] 89it [00:19, 4.60it/s] 90it [00:19, 4.59it/s] 91it [00:20, 4.60it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.44it/s] 94it [00:20, 4.51it/s] 95it [00:20, 4.55it/s] 96it [00:21, 4.58it/s] 97it [00:21, 4.59it/s] 98it [00:21, 4.44it/s] 99it [00:21, 4.48it/s] 100it [00:22, 4.53it/s]2025-05-25 23:09:57,851 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 3235.3687 | mean log_px -0.0223 | KL -1973.44 + 101it [00:22, 4.44it/s] 102it [00:22, 4.51it/s] 103it [00:22, 4.55it/s] 104it [00:22, 4.57it/s] 105it [00:23, 4.59it/s] 106it [00:23, 4.59it/s] 107it [00:23, 4.59it/s] 108it [00:23, 4.44it/s] 109it [00:24, 4.50it/s] 110it [00:24, 4.55it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.58it/s] 114it [00:25, 4.59it/s] 115it [00:25, 4.49it/s] 116it [00:25, 4.35it/s] 117it [00:25, 4.35it/s] 118it [00:26, 4.37it/s] 119it [00:26, 4.43it/s] 120it [00:26, 4.44it/s] 121it [00:26, 4.39it/s] 122it [00:26, 4.42it/s] 123it [00:27, 4.49it/s] 124it [00:27, 4.52it/s] 125it [00:27, 4.56it/s] 126it [00:27, 4.43it/s] 127it [00:28, 4.50it/s] 128it [00:28, 4.54it/s] 129it [00:28, 4.57it/s] 130it [00:28, 4.56it/s] 131it [00:28, 4.56it/s] 132it [00:29, 4.60it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.47it/s] 135it [00:29, 4.53it/s] 136it [00:30, 4.55it/s] 137it [00:30, 4.59it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.57it/s] 140it [00:30, 4.60it/s] 141it [00:31, 4.60it/s] 142it [00:31, 4.47it/s] 143it [00:31, 4.52it/s] 144it [00:31, 4.40it/s] 145it [00:32, 4.47it/s] 146it [00:32, 4.52it/s] 147it [00:32, 4.56it/s] 148it [00:32, 4.57it/s] 149it [00:32, 4.58it/s] 150it [00:33, 4.44it/s]2025-05-25 23:10:08,930 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 2351.8418 | mean log_px -0.0055 | KL -1967.71 + 151it [00:33, 4.51it/s] 152it [00:33, 4.54it/s] 153it [00:33, 4.57it/s] 154it [00:34, 4.56it/s] 155it [00:34, 4.44it/s] 156it [00:34, 4.51it/s] 157it [00:34, 4.56it/s] 158it [00:34, 4.43it/s] 159it [00:35, 4.49it/s] 160it [00:35, 4.54it/s] 161it [00:35, 4.56it/s] 162it [00:35, 4.56it/s] 163it [00:36, 4.59it/s] 164it [00:36, 4.60it/s] 165it [00:36, 4.46it/s] 166it [00:36, 4.49it/s] 167it [00:36, 4.54it/s] 168it [00:37, 4.54it/s] 169it [00:37, 4.57it/s] 170it [00:37, 4.58it/s] 171it [00:37, 4.59it/s] 172it [00:38, 4.45it/s] 173it [00:38, 4.51it/s] 174it [00:38, 4.48it/s] 175it [00:38, 4.52it/s] 176it [00:38, 4.55it/s] 177it [00:39, 4.57it/s] 178it [00:39, 4.57it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.45it/s] 181it [00:39, 4.51it/s] 182it [00:40, 4.53it/s] 183it [00:40, 4.55it/s] 184it [00:40, 4.57it/s] 185it [00:40, 4.58it/s] 186it [00:41, 4.44it/s] 187it [00:41, 4.51it/s] 188it [00:41, 4.54it/s] 189it [00:41, 4.57it/s] 190it [00:41, 4.57it/s] 191it [00:42, 4.58it/s] 192it [00:42, 4.60it/s] 193it [00:42, 4.47it/s] 194it [00:42, 4.52it/s] 195it [00:43, 4.33it/s] 196it [00:43, 4.41it/s] 196it [00:43, 4.52it/s] +2025-05-25 23:10:19,022 - INFO - Epoch: 20, Objective: tensor([2321.2383], device='cuda:0', grad_fn=), Loss: 0.013511824421584606, KL/n: 39.98223876953125 + 0it [00:00, ?it/s]2025-05-25 23:10:19,394 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 2518.2864 | mean log_px -0.0100 | KL -1959.45 + 1it [00:00, 3.29it/s] 2it [00:00, 3.73it/s] 3it [00:00, 4.10it/s] 4it [00:01, 4.12it/s] 5it [00:01, 4.29it/s] 6it [00:01, 4.34it/s] 7it [00:01, 4.43it/s] 8it [00:01, 4.48it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.43it/s] 12it [00:02, 4.43it/s] 13it [00:03, 4.36it/s] 14it [00:03, 4.42it/s] 15it [00:03, 4.47it/s] 16it [00:03, 4.35it/s] 17it [00:03, 4.28it/s] 18it [00:04, 4.36it/s] 19it [00:04, 4.45it/s] 20it [00:04, 4.46it/s] 21it [00:04, 4.53it/s] 22it [00:05, 4.56it/s] 23it [00:05, 4.55it/s] 24it [00:05, 4.52it/s] 25it [00:05, 4.55it/s] 26it [00:05, 4.59it/s] 27it [00:06, 4.60it/s] 28it [00:06, 4.62it/s] 29it [00:06, 4.61it/s] 30it [00:06, 4.63it/s] 31it [00:06, 4.63it/s] 32it [00:07, 4.47it/s] 33it [00:07, 4.36it/s] 34it [00:07, 4.28it/s] 35it [00:07, 4.23it/s] 36it [00:08, 4.19it/s] 37it [00:08, 4.27it/s] 38it [00:08, 4.38it/s] 39it [00:08, 4.47it/s] 40it [00:09, 4.53it/s] 41it [00:09, 4.57it/s] 42it [00:09, 4.45it/s] 43it [00:09, 4.51it/s] 44it [00:09, 4.55it/s] 45it [00:10, 4.56it/s] 46it [00:10, 4.59it/s] 47it [00:10, 4.61it/s] 48it [00:10, 4.62it/s] 49it [00:11, 4.65it/s] 50it [00:11, 4.48it/s]2025-05-25 23:10:30,563 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 2608.6096 | mean log_px -0.0148 | KL -1939.67 + 51it [00:11, 4.54it/s] 52it [00:11, 4.58it/s] 53it [00:11, 4.57it/s] 54it [00:12, 4.40it/s] 55it [00:12, 4.35it/s] 56it [00:12, 4.43it/s] 57it [00:12, 4.51it/s] 58it [00:13, 4.54it/s] 59it [00:13, 4.19it/s] 60it [00:13, 4.31it/s] 61it [00:13, 4.25it/s] 62it [00:13, 4.35it/s] 63it [00:14, 4.27it/s] 64it [00:14, 4.23it/s] 65it [00:14, 4.31it/s] 66it [00:15, 3.45it/s] 67it [00:15, 3.75it/s] 68it [00:15, 3.95it/s] 69it [00:15, 4.15it/s] 70it [00:15, 4.29it/s] 71it [00:16, 4.40it/s] 72it [00:16, 4.48it/s] 73it [00:16, 4.38it/s] 74it [00:16, 4.47it/s] 75it [00:17, 4.53it/s] 76it [00:17, 4.41it/s] 77it [00:17, 4.31it/s] 78it [00:17, 4.40it/s] 79it [00:18, 4.29it/s] 80it [00:18, 4.22it/s] 81it [00:18, 4.15it/s] 82it [00:18, 4.14it/s] 83it [00:18, 4.17it/s] 84it [00:19, 4.16it/s] 85it [00:19, 4.29it/s] 86it [00:19, 4.25it/s] 87it [00:19, 4.36it/s] 88it [00:20, 4.45it/s] 89it [00:20, 4.42it/s] 90it [00:20, 4.49it/s] 91it [00:20, 4.54it/s] 92it [00:21, 4.47it/s] 93it [00:21, 4.54it/s] 94it [00:21, 4.57it/s] 95it [00:21, 4.59it/s] 96it [00:21, 4.62it/s] 97it [00:22, 4.48it/s] 98it [00:22, 4.35it/s] 99it [00:22, 4.43it/s] 100it [00:22, 4.47it/s]2025-05-25 23:10:42,102 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 2265.2100 | mean log_px -0.0051 | KL -1927.49 + 101it [00:23, 4.53it/s] 102it [00:23, 4.36it/s] 103it [00:23, 4.17it/s] 104it [00:23, 4.29it/s] 105it [00:23, 4.40it/s] 106it [00:24, 4.32it/s] 107it [00:24, 4.25it/s] 108it [00:24, 4.20it/s] 109it [00:24, 4.22it/s] 110it [00:25, 4.32it/s] 111it [00:25, 4.24it/s] 112it [00:25, 4.18it/s] 113it [00:25, 4.25it/s] 114it [00:26, 4.36it/s] 115it [00:26, 4.27it/s] 116it [00:26, 4.23it/s] 117it [00:26, 4.20it/s] 118it [00:27, 4.31it/s] 119it [00:27, 4.41it/s] 120it [00:27, 4.31it/s] 121it [00:27, 4.13it/s] 122it [00:27, 4.14it/s] 123it [00:28, 4.28it/s] 124it [00:28, 4.23it/s] 125it [00:28, 4.35it/s] 126it [00:28, 4.44it/s] 127it [00:29, 4.19it/s] 128it [00:29, 4.28it/s] 129it [00:29, 4.38it/s] 130it [00:29, 4.45it/s] 131it [00:30, 4.47it/s] 132it [00:30, 4.38it/s] 133it [00:30, 4.26it/s] 134it [00:30, 4.38it/s] 135it [00:30, 4.28it/s] 136it [00:31, 4.24it/s] 137it [00:31, 4.35it/s] 138it [00:31, 4.27it/s] 139it [00:31, 4.33it/s] 140it [00:32, 4.23it/s] 141it [00:32, 4.24it/s] 142it [00:32, 4.22it/s] 143it [00:32, 4.35it/s] 144it [00:33, 4.44it/s] 145it [00:33, 4.33it/s] 146it [00:33, 4.14it/s] 147it [00:33, 4.13it/s] 148it [00:34, 4.13it/s] 149it [00:34, 4.28it/s] 150it [00:34, 4.40it/s]2025-05-25 23:10:53,782 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 2249.6196 | mean log_px -0.0076 | KL -1918.02 + 151it [00:34, 4.25it/s] 152it [00:34, 4.38it/s] 153it [00:35, 4.45it/s] 154it [00:35, 4.52it/s] 155it [00:35, 4.57it/s] 156it [00:35, 4.44it/s] 157it [00:36, 4.35it/s] 158it [00:36, 4.29it/s] 159it [00:36, 4.32it/s] 160it [00:36, 4.27it/s] 161it [00:36, 4.24it/s] 162it [00:37, 4.06it/s] 163it [00:37, 4.09it/s] 164it [00:37, 4.10it/s] 165it [00:37, 4.23it/s] 166it [00:38, 4.33it/s] 167it [00:38, 4.27it/s] 168it [00:38, 4.33it/s] 169it [00:38, 4.41it/s] 170it [00:39, 4.46it/s] 171it [00:39, 4.38it/s] 172it [00:39, 4.44it/s] 173it [00:39, 4.34it/s] 174it [00:40, 4.41it/s] 175it [00:40, 4.35it/s] 176it [00:40, 4.23it/s] 177it [00:40, 4.33it/s] 178it [00:40, 4.42it/s] 179it [00:41, 4.48it/s] 180it [00:41, 4.52it/s] 181it [00:41, 4.56it/s] 182it [00:41, 4.55it/s] 183it [00:42, 4.58it/s] 184it [00:42, 4.58it/s] 185it [00:42, 4.61it/s] 186it [00:42, 4.47it/s] 187it [00:42, 4.53it/s] 188it [00:43, 4.56it/s] 189it [00:43, 4.58it/s] 190it [00:43, 4.59it/s] 191it [00:43, 4.60it/s] 192it [00:43, 4.61it/s] 193it [00:44, 4.62it/s] 194it [00:44, 4.44it/s] 195it [00:44, 4.34it/s] 196it [00:44, 4.45it/s] 196it [00:44, 4.36it/s] +2025-05-25 23:11:04,114 - INFO - Epoch: 21, Objective: tensor([2395.0178], device='cuda:0', grad_fn=), Loss: 0.009308933280408382, KL/n: 39.00183868408203 + 0it [00:00, ?it/s]2025-05-25 23:11:04,483 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 2293.9033 | mean log_px -0.0119 | KL -1907.14 + 1it [00:00, 3.33it/s] 2it [00:00, 3.74it/s] 3it [00:00, 4.11it/s] 4it [00:00, 4.27it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.14it/s] 7it [00:01, 4.28it/s] 8it [00:01, 4.38it/s] 9it [00:02, 4.46it/s] 10it [00:02, 4.50it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.55it/s] 13it [00:02, 4.58it/s] 14it [00:03, 4.27it/s] 15it [00:03, 4.36it/s] 16it [00:03, 4.44it/s] 17it [00:03, 4.41it/s] 18it [00:04, 4.39it/s] 19it [00:04, 4.33it/s] 20it [00:04, 4.26it/s] 21it [00:04, 4.35it/s] 22it [00:05, 4.43it/s] 23it [00:05, 4.45it/s] 24it [00:05, 4.51it/s] 25it [00:05, 4.37it/s] 26it [00:05, 4.44it/s] 27it [00:06, 4.35it/s] 28it [00:06, 4.29it/s] 29it [00:06, 4.36it/s] 30it [00:06, 4.42it/s] 31it [00:07, 4.36it/s] 32it [00:07, 4.27it/s] 33it [00:07, 4.27it/s] 34it [00:07, 4.22it/s] 35it [00:08, 4.16it/s] 36it [00:08, 4.26it/s] 37it [00:08, 4.34it/s] 38it [00:08, 4.42it/s] 39it [00:08, 4.48it/s] 40it [00:09, 4.54it/s] 41it [00:09, 4.58it/s] 42it [00:09, 4.62it/s] 43it [00:09, 4.47it/s] 44it [00:10, 4.39it/s] 45it [00:10, 4.49it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.43it/s] 48it [00:10, 4.49it/s] 49it [00:11, 4.54it/s] 50it [00:11, 4.57it/s]2025-05-25 23:11:15,799 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 2142.6248 | mean log_px -0.0071 | KL -1895.51 + 51it [00:11, 4.39it/s] 52it [00:11, 4.50it/s] 53it [00:12, 4.38it/s] 54it [00:12, 4.31it/s] 55it [00:12, 4.24it/s] 56it [00:12, 4.20it/s] 57it [00:13, 4.32it/s] 58it [00:13, 4.21it/s] 59it [00:13, 4.11it/s] 60it [00:13, 4.13it/s] 61it [00:14, 4.28it/s] 62it [00:14, 4.24it/s] 63it [00:14, 4.21it/s] 64it [00:14, 4.21it/s] 65it [00:14, 4.33it/s] 66it [00:15, 4.25it/s] 67it [00:15, 4.26it/s] 68it [00:15, 4.19it/s] 69it [00:15, 4.23it/s] 70it [00:16, 4.26it/s] 71it [00:16, 4.39it/s] 72it [00:16, 4.47it/s] 73it [00:16, 4.45it/s] 74it [00:17, 4.36it/s] 75it [00:17, 4.16it/s] 76it [00:17, 4.17it/s] 77it [00:17, 4.27it/s] 78it [00:17, 4.27it/s] 79it [00:18, 4.23it/s] 80it [00:18, 4.17it/s] 81it [00:18, 4.16it/s] 82it [00:18, 4.15it/s] 83it [00:19, 4.19it/s] 84it [00:19, 4.18it/s] 85it [00:19, 4.17it/s] 86it [00:19, 4.30it/s] 87it [00:20, 4.41it/s] 88it [00:20, 4.46it/s] 89it [00:20, 4.53it/s] 90it [00:20, 4.57it/s] 91it [00:20, 4.48it/s] 92it [00:21, 4.38it/s] 93it [00:21, 4.46it/s] 94it [00:21, 4.37it/s] 95it [00:21, 4.29it/s] 96it [00:22, 4.10it/s] 97it [00:22, 4.16it/s] 98it [00:22, 4.14it/s] 99it [00:22, 4.27it/s] 100it [00:23, 4.38it/s]2025-05-25 23:11:27,516 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 2433.9939 | mean log_px -0.0126 | KL -1877.79 + 101it [00:23, 4.29it/s] 102it [00:23, 4.38it/s] 103it [00:23, 4.47it/s] 104it [00:23, 4.54it/s] 105it [00:24, 4.41it/s] 106it [00:24, 4.48it/s] 107it [00:24, 4.37it/s] 108it [00:24, 4.31it/s] 109it [00:25, 4.26it/s] 110it [00:25, 4.21it/s] 111it [00:25, 4.17it/s] 112it [00:25, 4.19it/s] 113it [00:26, 4.32it/s] 114it [00:26, 4.26it/s] 115it [00:26, 4.38it/s] 116it [00:26, 4.47it/s] 117it [00:26, 4.51it/s] 118it [00:27, 4.55it/s] 119it [00:27, 4.44it/s] 120it [00:27, 4.50it/s] 121it [00:27, 4.55it/s] 122it [00:28, 4.59it/s] 123it [00:28, 4.62it/s] 124it [00:28, 4.60it/s] 125it [00:28, 4.39it/s] 126it [00:28, 4.33it/s] 127it [00:29, 4.41it/s] 128it [00:29, 4.32it/s] 129it [00:29, 4.42it/s] 130it [00:29, 4.31it/s] 131it [00:30, 4.40it/s] 132it [00:30, 4.47it/s] 133it [00:30, 4.33it/s] 134it [00:30, 4.08it/s] 135it [00:31, 4.23it/s] 136it [00:31, 4.36it/s] 137it [00:31, 4.46it/s] 138it [00:31, 4.53it/s] 139it [00:31, 4.56it/s] 140it [00:32, 4.41it/s] 141it [00:32, 4.37it/s] 142it [00:32, 4.30it/s] 143it [00:32, 4.34it/s] 144it [00:33, 4.44it/s] 145it [00:33, 4.34it/s] 146it [00:33, 4.30it/s] 147it [00:33, 4.43it/s] 148it [00:34, 4.51it/s] 149it [00:34, 4.57it/s] 150it [00:34, 4.41it/s]2025-05-25 23:11:38,879 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 2279.8452 | mean log_px -0.0095 | KL -1866.57 + 151it [00:34, 4.38it/s] 152it [00:34, 4.32it/s] 153it [00:35, 4.42it/s] 154it [00:35, 4.19it/s] 155it [00:35, 4.19it/s] 156it [00:35, 4.31it/s] 157it [00:36, 4.41it/s] 158it [00:36, 4.49it/s] 159it [00:36, 4.38it/s] 160it [00:36, 4.31it/s] 161it [00:37, 4.34it/s] 162it [00:37, 4.29it/s] 163it [00:37, 4.24it/s] 164it [00:37, 4.20it/s] 165it [00:37, 4.10it/s] 166it [00:38, 4.14it/s] 167it [00:38, 4.12it/s] 168it [00:38, 4.10it/s] 169it [00:38, 4.16it/s] 170it [00:39, 4.15it/s] 171it [00:39, 4.30it/s] 172it [00:39, 4.38it/s] 173it [00:39, 4.48it/s] 174it [00:40, 4.54it/s] 175it [00:40, 4.59it/s] 176it [00:40, 4.61it/s] 177it [00:40, 4.45it/s] 178it [00:40, 4.54it/s] 179it [00:41, 4.59it/s] 180it [00:41, 4.58it/s] 181it [00:41, 4.42it/s] 182it [00:41, 4.34it/s] 183it [00:42, 4.28it/s] 184it [00:42, 4.40it/s] 185it [00:42, 4.50it/s] 186it [00:42, 4.55it/s] 187it [00:42, 4.40it/s] 188it [00:43, 4.32it/s] 189it [00:43, 4.27it/s] 190it [00:43, 4.38it/s] 191it [00:43, 4.47it/s] 192it [00:44, 4.36it/s] 193it [00:44, 4.35it/s] 194it [00:44, 4.31it/s] 195it [00:44, 4.30it/s] 196it [00:45, 4.18it/s] 196it [00:45, 4.34it/s] +2025-05-25 23:11:49,385 - INFO - Epoch: 22, Objective: tensor([2321.2053], device='cuda:0', grad_fn=), Loss: 0.0126264663413167, KL/n: 37.90328598022461 + 0it [00:00, ?it/s]2025-05-25 23:11:49,971 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 2031.7919 | mean log_px -0.0048 | KL -1857.27 + 1it [00:00, 3.02it/s] 2it [00:00, 3.78it/s] 3it [00:00, 4.15it/s] 4it [00:00, 4.17it/s] 5it [00:01, 4.37it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.55it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.55it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.62it/s] 13it [00:02, 4.65it/s] 14it [00:03, 4.65it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.66it/s] 17it [00:03, 4.68it/s] 18it [00:04, 4.52it/s] 19it [00:04, 4.59it/s] 20it [00:04, 4.61it/s] 21it [00:04, 4.64it/s] 22it [00:04, 4.65it/s] 23it [00:05, 4.51it/s] 24it [00:05, 4.57it/s] 25it [00:05, 4.61it/s] 26it [00:05, 4.48it/s] 27it [00:05, 4.56it/s] 28it [00:06, 4.59it/s] 29it [00:06, 4.62it/s] 30it [00:06, 4.63it/s] 31it [00:06, 4.50it/s] 32it [00:07, 4.57it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.46it/s] 36it [00:07, 4.54it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.50it/s] 40it [00:08, 4.56it/s] 41it [00:09, 4.60it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.63it/s] 44it [00:09, 4.65it/s] 45it [00:09, 4.51it/s] 46it [00:10, 4.57it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.61it/s] 49it [00:10, 4.64it/s] 50it [00:11, 4.64it/s]2025-05-25 23:12:00,857 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 2093.6794 | mean log_px -0.0058 | KL -1840.02 + 51it [00:11, 4.51it/s] 52it [00:11, 4.57it/s] 53it [00:11, 4.51it/s] 54it [00:11, 4.54it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.65it/s] 59it [00:12, 4.67it/s] 60it [00:13, 4.51it/s] 61it [00:13, 4.58it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.64it/s] 64it [00:14, 4.63it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.66it/s] 67it [00:14, 4.67it/s] 68it [00:14, 4.67it/s] 69it [00:15, 4.53it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.63it/s] 73it [00:15, 4.64it/s] 74it [00:16, 4.65it/s] 75it [00:16, 4.66it/s] 76it [00:16, 4.44it/s] 77it [00:16, 4.47it/s] 78it [00:17, 4.53it/s] 79it [00:17, 4.53it/s] 80it [00:17, 4.59it/s] 81it [00:17, 4.62it/s] 82it [00:17, 4.47it/s] 83it [00:18, 4.55it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.58it/s] 86it [00:18, 4.62it/s] 87it [00:19, 4.64it/s] 88it [00:19, 4.50it/s] 89it [00:19, 4.57it/s] 90it [00:19, 4.60it/s] 91it [00:19, 4.62it/s] 92it [00:20, 4.64it/s] 93it [00:20, 4.65it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.66it/s] 96it [00:21, 4.66it/s] 97it [00:21, 4.53it/s] 98it [00:21, 4.43it/s] 99it [00:21, 4.34it/s] 100it [00:21, 4.42it/s]2025-05-25 23:12:11,817 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 2605.1060 | mean log_px -0.0202 | KL -1829.09 + 101it [00:22, 4.35it/s] 102it [00:22, 4.30it/s] 103it [00:22, 4.26it/s] 104it [00:22, 4.23it/s] 105it [00:23, 4.33it/s] 106it [00:23, 4.43it/s] 107it [00:23, 4.49it/s] 108it [00:23, 4.36it/s] 109it [00:24, 4.44it/s] 110it [00:24, 4.50it/s] 111it [00:24, 4.40it/s] 112it [00:24, 4.48it/s] 113it [00:24, 4.48it/s] 114it [00:25, 4.53it/s] 115it [00:25, 4.58it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.60it/s] 118it [00:25, 4.48it/s] 119it [00:26, 4.55it/s] 120it [00:26, 4.58it/s] 121it [00:26, 4.61it/s] 122it [00:26, 4.62it/s] 123it [00:27, 4.49it/s] 124it [00:27, 4.56it/s] 125it [00:27, 4.58it/s] 126it [00:27, 4.46it/s] 127it [00:27, 4.54it/s] 128it [00:28, 4.57it/s] 129it [00:28, 4.60it/s] 130it [00:28, 4.62it/s] 131it [00:28, 4.64it/s] 132it [00:29, 4.50it/s] 133it [00:29, 4.56it/s] 134it [00:29, 4.59it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.63it/s] 137it [00:30, 4.62it/s] 138it [00:30, 4.55it/s] 139it [00:30, 4.61it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.64it/s] 142it [00:31, 4.50it/s] 143it [00:31, 4.56it/s] 144it [00:31, 4.59it/s] 145it [00:31, 4.63it/s] 146it [00:32, 4.64it/s] 147it [00:32, 4.64it/s] 148it [00:32, 4.66it/s] 149it [00:32, 4.57it/s] 150it [00:32, 4.61it/s]2025-05-25 23:12:22,811 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 2053.4185 | mean log_px -0.0083 | KL -1817.16 + 151it [00:33, 4.63it/s] 152it [00:33, 4.64it/s] 153it [00:33, 4.66it/s] 154it [00:33, 4.64it/s] 155it [00:34, 4.68it/s] 156it [00:34, 4.68it/s] 157it [00:34, 4.69it/s] 158it [00:34, 4.53it/s] 159it [00:34, 4.59it/s] 160it [00:35, 4.62it/s] 161it [00:35, 4.64it/s] 162it [00:35, 4.65it/s] 163it [00:35, 4.51it/s] 164it [00:35, 4.56it/s] 165it [00:36, 4.60it/s] 166it [00:36, 4.63it/s] 167it [00:36, 4.65it/s] 168it [00:36, 4.65it/s] 169it [00:37, 4.55it/s] 170it [00:37, 4.59it/s] 171it [00:37, 4.49it/s] 172it [00:37, 4.54it/s] 173it [00:37, 4.60it/s] 174it [00:38, 4.62it/s] 175it [00:38, 4.65it/s] 176it [00:38, 4.66it/s] 177it [00:38, 4.66it/s] 178it [00:39, 4.67it/s] 179it [00:39, 4.51it/s] 180it [00:39, 4.57it/s] 181it [00:39, 4.61it/s] 182it [00:39, 4.62it/s] 183it [00:40, 4.64it/s] 184it [00:40, 4.66it/s] 185it [00:40, 4.64it/s] 186it [00:40, 4.67it/s] 187it [00:40, 4.68it/s] 188it [00:41, 4.52it/s] 189it [00:41, 4.54it/s] 190it [00:41, 4.59it/s] 191it [00:41, 4.62it/s] 192it [00:42, 4.63it/s] 193it [00:42, 4.65it/s] 194it [00:42, 4.65it/s] 195it [00:42, 4.27it/s] 196it [00:42, 4.42it/s] 196it [00:43, 4.55it/s] +2025-05-25 23:12:32,731 - INFO - Epoch: 23, Objective: tensor([2333.9048], device='cuda:0', grad_fn=), Loss: 0.009835069067776203, KL/n: 36.8824462890625 + 0it [00:00, ?it/s]2025-05-25 23:12:33,141 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 2042.8802 | mean log_px -0.0088 | KL -1806.51 + 1it [00:00, 2.95it/s] 2it [00:00, 3.74it/s] 3it [00:00, 3.95it/s] 4it [00:01, 3.85it/s] 5it [00:01, 4.00it/s] 6it [00:01, 4.03it/s] 7it [00:01, 4.08it/s] 8it [00:02, 4.14it/s] 9it [00:02, 4.31it/s] 10it [00:02, 4.41it/s] 11it [00:02, 4.48it/s] 12it [00:02, 4.39it/s] 13it [00:03, 4.38it/s] 14it [00:03, 4.46it/s] 15it [00:03, 4.38it/s] 16it [00:03, 4.32it/s] 17it [00:04, 4.33it/s] 18it [00:04, 4.42it/s] 19it [00:04, 4.48it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.27it/s] 22it [00:05, 4.19it/s] 23it [00:05, 4.30it/s] 24it [00:05, 4.39it/s] 25it [00:05, 4.32it/s] 26it [00:06, 4.38it/s] 27it [00:06, 4.45it/s] 28it [00:06, 4.52it/s] 29it [00:06, 4.36it/s] 30it [00:06, 4.46it/s] 31it [00:07, 4.53it/s] 32it [00:07, 4.43it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.55it/s] 35it [00:08, 4.41it/s] 36it [00:08, 4.49it/s] 37it [00:08, 4.55it/s] 38it [00:08, 4.59it/s] 39it [00:08, 4.62it/s] 40it [00:09, 4.62it/s] 41it [00:09, 4.48it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.25it/s] 44it [00:10, 4.26it/s] 45it [00:10, 4.36it/s] 46it [00:10, 4.32it/s] 47it [00:10, 4.28it/s] 48it [00:11, 4.26it/s] 49it [00:11, 4.30it/s] 50it [00:11, 4.26it/s]2025-05-25 23:12:44,575 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 1896.7238 | mean log_px -0.0014 | KL -1796.85 + 51it [00:11, 4.24it/s] 52it [00:12, 4.23it/s] 53it [00:12, 3.42it/s] 54it [00:12, 3.71it/s] 55it [00:12, 3.84it/s] 56it [00:13, 3.95it/s] 57it [00:13, 4.12it/s] 58it [00:13, 4.14it/s] 59it [00:13, 4.28it/s] 60it [00:14, 4.41it/s] 61it [00:14, 4.49it/s] 62it [00:14, 4.54it/s] 63it [00:14, 4.43it/s] 64it [00:14, 4.48it/s] 65it [00:15, 4.46it/s] 66it [00:15, 4.52it/s] 67it [00:15, 4.57it/s] 68it [00:15, 4.61it/s] 69it [00:15, 4.48it/s] 70it [00:16, 4.41it/s] 71it [00:16, 4.48it/s] 72it [00:16, 4.54it/s] 73it [00:16, 4.59it/s] 74it [00:17, 4.45it/s] 75it [00:17, 4.43it/s] 76it [00:17, 4.22it/s] 77it [00:17, 4.30it/s] 78it [00:18, 4.25it/s] 79it [00:18, 4.29it/s] 80it [00:18, 4.39it/s] 81it [00:18, 4.48it/s] 82it [00:18, 4.54it/s] 83it [00:19, 4.44it/s] 84it [00:19, 4.52it/s] 85it [00:19, 4.58it/s] 86it [00:19, 4.60it/s] 87it [00:20, 4.47it/s] 88it [00:20, 4.51it/s] 89it [00:20, 4.41it/s] 90it [00:20, 4.33it/s] 91it [00:21, 4.18it/s] 92it [00:21, 4.15it/s] 93it [00:21, 4.15it/s] 94it [00:21, 4.17it/s] 95it [00:21, 4.18it/s] 96it [00:22, 4.32it/s] 97it [00:22, 4.27it/s] 98it [00:22, 4.38it/s] 99it [00:22, 4.30it/s] 100it [00:23, 4.42it/s]2025-05-25 23:12:56,110 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 2474.6335 | mean log_px -0.0208 | KL -1782.80 + 101it [00:23, 4.50it/s] 102it [00:23, 4.50it/s] 103it [00:23, 4.39it/s] 104it [00:24, 4.33it/s] 105it [00:24, 4.28it/s] 106it [00:24, 4.25it/s] 107it [00:24, 4.16it/s] 108it [00:24, 4.30it/s] 109it [00:25, 4.40it/s] 110it [00:25, 4.34it/s] 111it [00:25, 4.42it/s] 112it [00:25, 4.50it/s] 113it [00:26, 4.40it/s] 114it [00:26, 4.49it/s] 115it [00:26, 4.54it/s] 116it [00:26, 4.59it/s] 117it [00:26, 4.57it/s] 118it [00:27, 4.60it/s] 119it [00:27, 4.62it/s] 120it [00:27, 4.51it/s] 121it [00:27, 4.59it/s] 122it [00:28, 4.61it/s] 123it [00:28, 4.44it/s] 124it [00:28, 4.51it/s] 125it [00:28, 4.54it/s] 126it [00:28, 4.58it/s] 127it [00:29, 4.43it/s] 128it [00:29, 4.49it/s] 129it [00:29, 4.36it/s] 130it [00:29, 4.45it/s] 131it [00:30, 4.52it/s] 132it [00:30, 4.36it/s] 133it [00:30, 4.33it/s] 134it [00:30, 4.27it/s] 135it [00:31, 4.10it/s] 136it [00:31, 4.16it/s] 137it [00:31, 4.30it/s] 138it [00:31, 4.23it/s] 139it [00:31, 4.20it/s] 140it [00:32, 4.20it/s] 141it [00:32, 4.18it/s] 142it [00:32, 4.31it/s] 143it [00:32, 4.16it/s] 144it [00:33, 4.31it/s] 145it [00:33, 4.41it/s] 146it [00:33, 4.48it/s] 147it [00:33, 4.54it/s] 148it [00:34, 4.37it/s] 149it [00:34, 4.34it/s] 150it [00:34, 4.42it/s]2025-05-25 23:13:07,516 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 2033.4376 | mean log_px -0.0059 | KL -1774.52 + 151it [00:34, 4.19it/s] 152it [00:34, 4.18it/s] 153it [00:35, 4.31it/s] 154it [00:35, 4.42it/s] 155it [00:35, 4.34it/s] 156it [00:35, 4.27it/s] 157it [00:36, 4.11it/s] 158it [00:36, 4.23it/s] 159it [00:36, 4.30it/s] 160it [00:36, 4.41it/s] 161it [00:37, 4.36it/s] 162it [00:37, 4.45it/s] 163it [00:37, 4.29it/s] 164it [00:37, 4.41it/s] 165it [00:37, 4.41it/s] 166it [00:38, 4.49it/s] 167it [00:38, 4.34it/s] 168it [00:38, 4.31it/s] 169it [00:38, 4.42it/s] 170it [00:39, 4.32it/s] 171it [00:39, 4.42it/s] 172it [00:39, 4.32it/s] 173it [00:39, 4.27it/s] 174it [00:40, 4.21it/s] 175it [00:40, 4.22it/s] 176it [00:40, 4.19it/s] 177it [00:40, 4.32it/s] 178it [00:40, 4.24it/s] 179it [00:41, 4.36it/s] 180it [00:41, 4.44it/s] 181it [00:41, 4.43it/s] 182it [00:41, 4.32it/s] 183it [00:42, 4.43it/s] 184it [00:42, 4.47it/s] 185it [00:42, 4.40it/s] 186it [00:42, 4.46it/s] 187it [00:43, 4.37it/s] 188it [00:43, 4.29it/s] 189it [00:43, 4.10it/s] 190it [00:43, 4.26it/s] 191it [00:43, 4.36it/s] 192it [00:44, 4.27it/s] 193it [00:44, 4.23it/s] 194it [00:44, 4.20it/s] 195it [00:44, 4.07it/s] 196it [00:45, 4.12it/s] 196it [00:45, 4.33it/s] +2025-05-25 23:13:18,127 - INFO - Epoch: 24, Objective: tensor([2720.5593], device='cuda:0', grad_fn=), Loss: 0.01608070731163025, KL/n: 36.15454864501953 + 0it [00:00, ?it/s]2025-05-25 23:13:18,526 - INFO - [Epoch 025 | Batch 0000] IWAE-loss 2173.3323 | mean log_px -0.0057 | KL -1770.69 + 1it [00:00, 3.03it/s] 2it [00:00, 3.75it/s] 3it [00:00, 4.08it/s] 4it [00:01, 4.10it/s] 5it [00:01, 4.29it/s] 6it [00:01, 4.18it/s] 7it [00:01, 4.20it/s] 8it [00:01, 4.32it/s] 9it [00:02, 4.41it/s] 10it [00:02, 4.46it/s] 11it [00:02, 4.55it/s] 12it [00:02, 4.46it/s] 13it [00:03, 4.43it/s] 14it [00:03, 4.49it/s] 15it [00:03, 4.53it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.61it/s] 18it [00:04, 4.46it/s] 19it [00:04, 4.44it/s] 20it [00:04, 4.35it/s] 21it [00:04, 4.46it/s] 22it [00:05, 4.50it/s] 23it [00:05, 4.56it/s] 24it [00:05, 4.59it/s] 25it [00:05, 4.62it/s] 26it [00:05, 4.60it/s] 27it [00:06, 4.34it/s] 28it [00:06, 4.26it/s] 29it [00:06, 4.29it/s] 30it [00:06, 4.38it/s] 31it [00:07, 4.46it/s] 32it [00:07, 4.50it/s] 33it [00:07, 4.38it/s] 34it [00:07, 4.17it/s] 35it [00:08, 4.30it/s] 36it [00:08, 4.36it/s] 37it [00:08, 4.37it/s] 38it [00:08, 4.43it/s] 39it [00:08, 4.47it/s] 40it [00:09, 4.51it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.55it/s] 43it [00:09, 4.42it/s] 44it [00:10, 4.47it/s] 45it [00:10, 4.43it/s] 46it [00:10, 4.46it/s] 47it [00:10, 4.45it/s] 48it [00:10, 4.48it/s] 49it [00:11, 4.34it/s] 50it [00:11, 4.39it/s]2025-05-25 23:13:29,795 - INFO - [Epoch 025 | Batch 0050] IWAE-loss 1950.6661 | mean log_px -0.0028 | KL -1755.02 + 51it [00:11, 4.40it/s] 52it [00:11, 4.33it/s] 53it [00:12, 4.26it/s] 54it [00:12, 4.36it/s] 55it [00:12, 4.27it/s] 56it [00:12, 4.34it/s] 57it [00:13, 4.27it/s] 58it [00:13, 4.37it/s] 59it [00:13, 4.42it/s] 60it [00:13, 4.46it/s] 61it [00:13, 4.49it/s] 62it [00:14, 4.38it/s] 63it [00:14, 4.47it/s] 64it [00:14, 4.33it/s] 65it [00:14, 4.27it/s] 66it [00:15, 4.36it/s] 67it [00:15, 4.44it/s] 68it [00:15, 4.47it/s] 69it [00:15, 4.53it/s] 70it [00:15, 4.56it/s] 71it [00:16, 4.44it/s] 72it [00:16, 4.50it/s] 73it [00:16, 4.55it/s] 74it [00:16, 4.38it/s] 75it [00:17, 4.44it/s] 76it [00:17, 4.32it/s] 77it [00:17, 4.38it/s] 78it [00:17, 4.28it/s] 79it [00:17, 4.31it/s] 80it [00:18, 4.39it/s] 81it [00:18, 4.30it/s] 82it [00:18, 4.11it/s] 83it [00:18, 4.11it/s] 84it [00:19, 4.11it/s] 85it [00:19, 4.01it/s] 86it [00:19, 4.17it/s] 87it [00:19, 4.29it/s] 88it [00:20, 4.38it/s] 89it [00:20, 4.45it/s] 90it [00:20, 4.32it/s] 91it [00:20, 4.42it/s] 92it [00:21, 4.47it/s] 93it [00:21, 4.52it/s] 94it [00:21, 4.52it/s] 95it [00:21, 4.48it/s] 96it [00:21, 4.53it/s] 97it [00:22, 4.55it/s] 98it [00:22, 4.39it/s] 99it [00:22, 4.40it/s] 100it [00:22, 4.44it/s]2025-05-25 23:13:41,254 - INFO - [Epoch 025 | Batch 0100] IWAE-loss 1830.5348 | mean log_px -0.0022 | KL -1743.90 + 101it [00:23, 4.29it/s] 102it [00:23, 4.34it/s] 103it [00:23, 4.37it/s] 104it [00:23, 4.43it/s] 105it [00:23, 4.33it/s] 106it [00:24, 4.27it/s] 107it [00:24, 4.38it/s] 108it [00:24, 4.45it/s] 109it [00:24, 4.52it/s] 110it [00:25, 4.35it/s] 111it [00:25, 4.34it/s] 112it [00:25, 4.40it/s] 113it [00:25, 4.46it/s] 114it [00:25, 4.51it/s] 115it [00:26, 4.39it/s] 116it [00:26, 4.15it/s] 117it [00:26, 4.18it/s] 118it [00:26, 4.29it/s] 119it [00:27, 4.39it/s] 120it [00:27, 4.27it/s] 121it [00:27, 4.26it/s] 122it [00:27, 4.22it/s] 123it [00:28, 4.09it/s] 124it [00:28, 4.24it/s] 125it [00:28, 4.35it/s] 126it [00:28, 4.43it/s] 127it [00:29, 4.47it/s] 128it [00:29, 4.38it/s] 129it [00:29, 4.47it/s] 130it [00:29, 4.35it/s] 131it [00:29, 4.43it/s] 132it [00:30, 4.47it/s] 133it [00:30, 4.37it/s] 134it [00:30, 4.43it/s] 135it [00:30, 4.48it/s] 136it [00:31, 4.33it/s] 137it [00:31, 4.42it/s] 138it [00:31, 4.48it/s] 139it [00:31, 4.53it/s] 140it [00:31, 4.52it/s] 141it [00:32, 4.42it/s] 142it [00:32, 4.17it/s] 143it [00:32, 4.14it/s] 144it [00:32, 4.10it/s] 145it [00:33, 4.24it/s] 146it [00:33, 4.19it/s] 147it [00:33, 4.17it/s] 148it [00:33, 4.27it/s] 149it [00:34, 4.35it/s] 150it [00:34, 4.19it/s]2025-05-25 23:13:52,778 - INFO - [Epoch 025 | Batch 0150] IWAE-loss 2106.1345 | mean log_px -0.0053 | KL -1734.84 + 151it [00:34, 4.31it/s] 152it [00:34, 4.37it/s] 153it [00:35, 4.46it/s] 154it [00:35, 4.51it/s] 155it [00:35, 4.56it/s] 156it [00:35, 4.58it/s] 157it [00:35, 4.45it/s] 158it [00:36, 4.31it/s] 159it [00:36, 4.26it/s] 160it [00:36, 4.37it/s] 161it [00:36, 4.31it/s] 162it [00:37, 4.23it/s] 163it [00:37, 4.29it/s] 164it [00:37, 4.22it/s] 165it [00:37, 4.20it/s] 166it [00:38, 4.34it/s] 167it [00:38, 4.42it/s] 168it [00:38, 4.48it/s] 169it [00:38, 4.45it/s] 170it [00:38, 4.45it/s] 171it [00:39, 4.49it/s] 172it [00:39, 4.53it/s] 173it [00:39, 4.54it/s] 174it [00:39, 4.57it/s] 175it [00:39, 4.59it/s] 176it [00:40, 4.61it/s] 177it [00:40, 4.62it/s] 178it [00:40, 4.62it/s] 179it [00:40, 4.45it/s] 180it [00:41, 4.36it/s] 181it [00:41, 4.29it/s] 182it [00:41, 4.21it/s] 183it [00:41, 4.23it/s] 184it [00:42, 4.33it/s] 185it [00:42, 4.42it/s] 186it [00:42, 4.29it/s] 187it [00:42, 4.39it/s] 188it [00:42, 4.46it/s] 189it [00:43, 4.40it/s] 190it [00:43, 4.33it/s] 191it [00:43, 4.40it/s] 192it [00:43, 4.47it/s] 193it [00:44, 4.39it/s] 194it [00:44, 4.43it/s] 195it [00:44, 4.21it/s] 196it [00:44, 4.21it/s] 196it [00:44, 4.37it/s] +2025-05-25 23:14:03,146 - INFO - Epoch: 25, Objective: tensor([2120.1199], device='cuda:0', grad_fn=), Loss: 0.009839070029556751, KL/n: 35.31795120239258 + 0it [00:00, ?it/s]2025-05-25 23:14:03,719 - INFO - [Epoch 026 | Batch 0000] IWAE-loss 2901.0183 | mean log_px -0.0300 | KL -1724.86 + 1it [00:00, 3.12it/s] 2it [00:00, 3.84it/s] 3it [00:00, 4.17it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.29it/s] 7it [00:01, 4.33it/s] 8it [00:01, 4.29it/s] 9it [00:02, 4.24it/s] 10it [00:02, 4.21it/s] 11it [00:02, 4.32it/s] 12it [00:02, 4.28it/s] 13it [00:03, 4.23it/s] 14it [00:03, 4.21it/s] 15it [00:03, 4.21it/s] 16it [00:03, 4.21it/s] 17it [00:04, 4.23it/s] 18it [00:04, 4.19it/s] 19it [00:04, 4.23it/s] 20it [00:04, 4.33it/s] 21it [00:04, 4.42it/s] 22it [00:05, 4.24it/s] 23it [00:05, 4.26it/s] 24it [00:05, 4.34it/s] 25it [00:05, 4.36it/s] 26it [00:06, 4.44it/s] 27it [00:06, 4.36it/s] 28it [00:06, 4.46it/s] 29it [00:06, 4.49it/s] 30it [00:06, 4.46it/s] 31it [00:07, 4.40it/s] 32it [00:07, 4.37it/s] 33it [00:07, 4.22it/s] 34it [00:07, 4.26it/s] 35it [00:08, 4.37it/s] 36it [00:08, 4.46it/s] 37it [00:08, 4.31it/s] 38it [00:08, 4.37it/s] 39it [00:09, 4.44it/s] 40it [00:09, 4.49it/s] 41it [00:09, 4.51it/s] 42it [00:09, 4.43it/s] 43it [00:09, 4.50it/s] 44it [00:10, 4.23it/s] 45it [00:10, 4.34it/s] 46it [00:10, 4.27it/s] 47it [00:10, 4.24it/s] 48it [00:11, 4.37it/s] 49it [00:11, 4.35it/s] 50it [00:11, 4.40it/s]2025-05-25 23:14:15,199 - INFO - [Epoch 026 | Batch 0050] IWAE-loss 2016.3051 | mean log_px -0.0103 | KL -1714.56 + 51it [00:11, 4.38it/s] 52it [00:12, 4.48it/s] 53it [00:12, 4.54it/s] 54it [00:12, 4.55it/s] 55it [00:12, 4.49it/s] 56it [00:12, 4.38it/s] 57it [00:13, 4.47it/s] 58it [00:13, 4.49it/s] 59it [00:13, 4.43it/s] 60it [00:13, 4.49it/s] 61it [00:14, 4.40it/s] 62it [00:14, 4.36it/s] 63it [00:14, 4.36it/s] 64it [00:14, 4.45it/s] 65it [00:14, 4.38it/s] 66it [00:15, 4.45it/s] 67it [00:15, 4.39it/s] 68it [00:15, 4.47it/s] 69it [00:15, 4.36it/s] 70it [00:16, 4.25it/s] 71it [00:16, 4.24it/s] 72it [00:16, 4.37it/s] 73it [00:16, 4.35it/s] 74it [00:17, 4.29it/s] 75it [00:17, 4.29it/s] 76it [00:17, 4.40it/s] 77it [00:17, 4.35it/s] 78it [00:17, 4.30it/s] 79it [00:18, 4.27it/s] 80it [00:18, 4.28it/s] 81it [00:18, 4.27it/s] 82it [00:18, 4.27it/s] 83it [00:19, 4.28it/s] 84it [00:19, 4.27it/s] 85it [00:19, 4.39it/s] 86it [00:19, 4.33it/s] 87it [00:20, 4.32it/s] 88it [00:20, 4.25it/s] 89it [00:20, 4.34it/s] 90it [00:20, 4.22it/s] 91it [00:20, 4.35it/s] 92it [00:21, 4.44it/s] 93it [00:21, 4.47it/s] 94it [00:21, 4.36it/s] 95it [00:21, 4.34it/s] 96it [00:22, 4.26it/s] 97it [00:22, 4.38it/s] 98it [00:22, 4.29it/s] 99it [00:22, 4.29it/s] 100it [00:23, 4.37it/s]2025-05-25 23:14:26,684 - INFO - [Epoch 026 | Batch 0100] IWAE-loss 2671.4316 | mean log_px -0.0232 | KL -1705.30 + 101it [00:23, 4.32it/s] 102it [00:23, 4.30it/s] 103it [00:23, 4.30it/s] 104it [00:23, 4.35it/s] 105it [00:24, 4.32it/s] 106it [00:24, 4.13it/s] 107it [00:24, 4.15it/s] 108it [00:24, 4.17it/s] 109it [00:25, 4.19it/s] 110it [00:25, 4.17it/s] 111it [00:25, 4.19it/s] 112it [00:25, 4.21it/s] 113it [00:26, 4.26it/s] 114it [00:26, 4.35it/s] 115it [00:26, 4.32it/s] 116it [00:26, 4.28it/s] 117it [00:27, 4.22it/s] 118it [00:27, 4.10it/s] 119it [00:27, 4.27it/s] 120it [00:27, 4.37it/s] 121it [00:27, 4.44it/s] 122it [00:28, 4.50it/s] 123it [00:28, 4.42it/s] 124it [00:28, 4.46it/s] 125it [00:28, 4.42it/s] 126it [00:29, 4.36it/s] 127it [00:29, 4.32it/s] 128it [00:29, 4.40it/s] 129it [00:29, 4.47it/s] 130it [00:30, 4.51it/s] 131it [00:30, 4.52it/s] 132it [00:30, 4.41it/s] 133it [00:30, 4.36it/s] 134it [00:30, 4.31it/s] 135it [00:31, 4.27it/s] 136it [00:31, 4.25it/s] 137it [00:31, 4.24it/s] 138it [00:31, 4.20it/s] 139it [00:32, 4.23it/s] 140it [00:32, 4.32it/s] 141it [00:32, 4.41it/s] 142it [00:32, 4.34it/s] 143it [00:33, 4.35it/s] 144it [00:33, 4.42it/s] 145it [00:33, 4.46it/s] 146it [00:33, 4.49it/s] 147it [00:33, 4.53it/s] 148it [00:34, 4.39it/s] 149it [00:34, 4.37it/s] 150it [00:34, 4.30it/s]2025-05-25 23:14:38,240 - INFO - [Epoch 026 | Batch 0150] IWAE-loss 3300.8362 | mean log_px -0.0360 | KL -1700.18 + 151it [00:34, 4.34it/s] 152it [00:35, 4.43it/s] 153it [00:35, 4.49it/s] 154it [00:35, 4.53it/s] 155it [00:35, 4.56it/s] 156it [00:35, 4.41it/s] 157it [00:36, 4.39it/s] 158it [00:36, 4.33it/s] 159it [00:36, 4.30it/s] 160it [00:36, 4.25it/s] 161it [00:37, 4.37it/s] 162it [00:37, 4.28it/s] 163it [00:37, 4.29it/s] 164it [00:37, 4.37it/s] 165it [00:38, 4.45it/s] 166it [00:38, 4.35it/s] 167it [00:38, 4.35it/s] 168it [00:38, 4.30it/s] 169it [00:38, 4.29it/s] 170it [00:39, 4.36it/s] 171it [00:39, 4.33it/s] 172it [00:39, 4.39it/s] 173it [00:39, 4.46it/s] 174it [00:40, 4.30it/s] 175it [00:40, 4.33it/s] 176it [00:40, 4.28it/s] 177it [00:40, 4.31it/s] 178it [00:41, 4.23it/s] 179it [00:41, 4.24it/s] 180it [00:41, 4.19it/s] 181it [00:41, 4.21it/s] 182it [00:41, 4.30it/s] 183it [00:42, 4.30it/s] 184it [00:42, 4.29it/s] 185it [00:42, 4.39it/s] 186it [00:42, 4.32it/s] 187it [00:43, 4.31it/s] 188it [00:43, 4.38it/s] 189it [00:43, 4.33it/s] 190it [00:43, 4.40it/s] 191it [00:44, 4.36it/s] 192it [00:44, 4.46it/s] 193it [00:44, 4.39it/s] 194it [00:44, 4.41it/s] 195it [00:44, 4.38it/s] 196it [00:45, 4.47it/s] 196it [00:45, 4.33it/s] +2025-05-25 23:14:48,704 - INFO - Epoch: 26, Objective: tensor([2170.3135], device='cuda:0', grad_fn=), Loss: 0.008433881215751171, KL/n: 34.64965057373047 + 0it [00:00, ?it/s]2025-05-25 23:14:49,108 - INFO - [Epoch 027 | Batch 0000] IWAE-loss 1838.5685 | mean log_px -0.0048 | KL -1699.11 + 1it [00:00, 3.00it/s] 2it [00:00, 3.74it/s] 3it [00:00, 3.94it/s] 4it [00:01, 4.00it/s] 5it [00:01, 4.24it/s] 6it [00:01, 4.21it/s] 7it [00:01, 4.21it/s] 8it [00:01, 4.32it/s] 9it [00:02, 4.35it/s] 10it [00:02, 4.42it/s] 11it [00:02, 4.49it/s] 12it [00:02, 4.54it/s] 13it [00:03, 4.56it/s] 14it [00:03, 4.59it/s] 15it [00:03, 4.62it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.64it/s] 18it [00:04, 4.39it/s] 19it [00:04, 4.45it/s] 20it [00:04, 4.35it/s] 21it [00:04, 4.42it/s] 22it [00:05, 4.48it/s] 23it [00:05, 4.46it/s] 24it [00:05, 4.50it/s] 25it [00:05, 4.55it/s] 26it [00:05, 4.54it/s] 27it [00:06, 4.32it/s] 28it [00:06, 4.28it/s] 29it [00:06, 4.24it/s] 30it [00:06, 4.33it/s] 31it [00:07, 4.43it/s] 32it [00:07, 4.34it/s] 33it [00:07, 4.30it/s] 34it [00:07, 4.24it/s] 35it [00:08, 4.21it/s] 36it [00:08, 4.20it/s] 37it [00:08, 4.20it/s] 38it [00:08, 4.17it/s] 39it [00:09, 4.19it/s] 40it [00:09, 4.18it/s] 41it [00:09, 4.19it/s] 42it [00:09, 4.15it/s] 43it [00:09, 4.07it/s] 44it [00:10, 4.21it/s] 45it [00:10, 4.33it/s] 46it [00:10, 4.42it/s] 47it [00:10, 4.45it/s] 48it [00:11, 4.34it/s] 49it [00:11, 4.16it/s] 50it [00:11, 4.17it/s]2025-05-25 23:15:00,604 - INFO - [Epoch 027 | Batch 0050] IWAE-loss 2172.3386 | mean log_px -0.0069 | KL -1685.88 + 51it [00:11, 4.29it/s] 52it [00:12, 4.38it/s] 53it [00:12, 4.46it/s] 54it [00:12, 4.26it/s] 55it [00:12, 4.34it/s] 56it [00:12, 4.39it/s] 57it [00:13, 4.30it/s] 58it [00:13, 4.08it/s] 59it [00:13, 4.22it/s] 60it [00:13, 4.26it/s] 61it [00:14, 4.24it/s] 62it [00:14, 4.31it/s] 63it [00:14, 4.39it/s] 64it [00:15, 3.37it/s] 65it [00:15, 3.65it/s] 66it [00:15, 3.79it/s] 67it [00:15, 4.00it/s] 68it [00:15, 4.15it/s] 69it [00:16, 4.28it/s] 70it [00:16, 4.23it/s] 71it [00:16, 4.34it/s] 72it [00:16, 4.23it/s] 73it [00:17, 4.24it/s] 74it [00:17, 4.21it/s] 75it [00:17, 4.32it/s] 76it [00:17, 4.39it/s] 77it [00:18, 4.30it/s] 78it [00:18, 4.25it/s] 79it [00:18, 4.36it/s] 80it [00:18, 4.40it/s] 81it [00:18, 4.47it/s] 82it [00:19, 4.51it/s] 83it [00:19, 4.27it/s] 84it [00:19, 4.23it/s] 85it [00:19, 4.27it/s] 86it [00:20, 4.35it/s] 87it [00:20, 4.35it/s] 88it [00:20, 4.27it/s] 89it [00:20, 4.23it/s] 90it [00:21, 4.17it/s] 91it [00:21, 4.24it/s] 92it [00:21, 4.36it/s] 93it [00:21, 4.35it/s] 94it [00:21, 4.42it/s] 95it [00:22, 4.32it/s] 96it [00:22, 4.33it/s] 97it [00:22, 4.15it/s] 98it [00:22, 4.15it/s] 99it [00:23, 4.28it/s] 100it [00:23, 4.27it/s]2025-05-25 23:15:12,389 - INFO - [Epoch 027 | Batch 0100] IWAE-loss 2017.5281 | mean log_px -0.0098 | KL -1670.65 + 101it [00:23, 4.36it/s] 102it [00:23, 4.43it/s] 103it [00:24, 4.30it/s] 104it [00:24, 4.10it/s] 105it [00:24, 4.14it/s] 106it [00:24, 4.13it/s] 107it [00:25, 4.26it/s] 108it [00:25, 4.20it/s] 109it [00:25, 4.19it/s] 110it [00:25, 4.16it/s] 111it [00:26, 4.10it/s] 112it [00:26, 4.09it/s] 113it [00:26, 4.11it/s] 114it [00:26, 4.10it/s] 115it [00:26, 4.24it/s] 116it [00:27, 4.16it/s] 117it [00:27, 4.15it/s] 118it [00:27, 4.22it/s] 119it [00:27, 4.35it/s] 120it [00:28, 4.34it/s] 121it [00:28, 4.41it/s] 122it [00:28, 4.31it/s] 123it [00:28, 4.40it/s] 124it [00:29, 4.28it/s] 125it [00:29, 4.29it/s] 126it [00:29, 4.36it/s] 127it [00:29, 4.43it/s] 128it [00:29, 4.30it/s] 129it [00:30, 4.19it/s] 130it [00:30, 4.15it/s] 131it [00:30, 4.15it/s] 132it [00:30, 4.20it/s] 133it [00:31, 4.32it/s] 134it [00:31, 4.40it/s] 135it [00:31, 4.31it/s] 136it [00:31, 4.23it/s] 137it [00:32, 4.34it/s] 138it [00:32, 4.41it/s] 139it [00:32, 4.46it/s] 140it [00:32, 4.35it/s] 141it [00:33, 4.20it/s] 142it [00:33, 4.29it/s] 143it [00:33, 4.15it/s] 144it [00:33, 4.23it/s] 145it [00:33, 4.32it/s] 146it [00:34, 4.38it/s] 147it [00:34, 4.39it/s] 148it [00:34, 4.44it/s] 149it [00:34, 4.27it/s] 150it [00:35, 4.33it/s]2025-05-25 23:15:24,127 - INFO - [Epoch 027 | Batch 0150] IWAE-loss 2334.5696 | mean log_px -0.0127 | KL -1661.62 + 151it [00:35, 4.26it/s] 152it [00:35, 4.32it/s] 153it [00:35, 4.32it/s] 154it [00:36, 4.21it/s] 155it [00:36, 4.20it/s] 156it [00:36, 4.15it/s] 157it [00:36, 4.09it/s] 158it [00:37, 4.09it/s] 159it [00:37, 4.09it/s] 160it [00:37, 4.13it/s] 161it [00:37, 4.14it/s] 162it [00:37, 4.23it/s] 163it [00:38, 4.22it/s] 164it [00:38, 4.32it/s] 165it [00:38, 4.40it/s] 166it [00:38, 4.44it/s] 167it [00:39, 4.43it/s] 168it [00:39, 4.49it/s] 169it [00:39, 4.40it/s] 170it [00:39, 4.31it/s] 171it [00:40, 4.26it/s] 172it [00:40, 4.22it/s] 173it [00:40, 4.32it/s] 174it [00:40, 4.33it/s] 175it [00:40, 4.28it/s] 176it [00:41, 4.37it/s] 177it [00:41, 4.44it/s] 178it [00:41, 4.31it/s] 179it [00:41, 4.29it/s] 180it [00:42, 4.23it/s] 181it [00:42, 4.18it/s] 182it [00:42, 4.29it/s] 183it [00:42, 4.30it/s] 184it [00:43, 4.37it/s] 185it [00:43, 4.30it/s] 186it [00:43, 4.35it/s] 187it [00:43, 4.29it/s] 188it [00:44, 4.21it/s] 189it [00:44, 4.22it/s] 190it [00:44, 4.30it/s] 191it [00:44, 4.35it/s] 192it [00:44, 4.41it/s] 193it [00:45, 4.31it/s] 194it [00:45, 4.11it/s] 195it [00:45, 3.98it/s] 196it [00:45, 4.06it/s] 196it [00:46, 4.26it/s] +2025-05-25 23:15:34,845 - INFO - Epoch: 27, Objective: tensor([2400.2996], device='cuda:0', grad_fn=), Loss: 0.009168989956378937, KL/n: 33.872135162353516 + 0it [00:00, ?it/s]2025-05-25 23:15:35,228 - INFO - [Epoch 028 | Batch 0000] IWAE-loss 1821.6100 | mean log_px -0.0041 | KL -1660.52 + 1it [00:00, 3.20it/s] 2it [00:00, 3.65it/s] 3it [00:00, 3.98it/s] 4it [00:01, 4.19it/s] 5it [00:01, 4.18it/s] 6it [00:01, 4.27it/s] 7it [00:01, 4.22it/s] 8it [00:01, 4.00it/s] 9it [00:02, 4.18it/s] 10it [00:02, 4.29it/s] 11it [00:02, 4.31it/s] 12it [00:02, 4.37it/s] 13it [00:03, 4.31it/s] 14it [00:03, 4.25it/s] 15it [00:03, 4.33it/s] 16it [00:03, 4.41it/s] 17it [00:04, 4.47it/s] 18it [00:04, 4.36it/s] 19it [00:04, 4.43it/s] 20it [00:04, 4.25it/s] 21it [00:04, 4.21it/s] 22it [00:05, 4.33it/s] 23it [00:05, 4.28it/s] 24it [00:05, 4.23it/s] 25it [00:05, 4.23it/s] 26it [00:06, 4.34it/s] 27it [00:06, 4.39it/s] 28it [00:06, 4.44it/s] 29it [00:06, 4.50it/s] 30it [00:06, 4.52it/s] 31it [00:07, 4.49it/s] 32it [00:07, 4.50it/s] 33it [00:07, 4.25it/s] 34it [00:07, 4.32it/s] 35it [00:08, 4.24it/s] 36it [00:08, 4.19it/s] 37it [00:08, 4.32it/s] 38it [00:08, 4.25it/s] 39it [00:09, 4.37it/s] 40it [00:09, 4.22it/s] 41it [00:09, 4.16it/s] 42it [00:09, 4.16it/s] 43it [00:10, 4.22it/s] 44it [00:10, 4.16it/s] 45it [00:10, 4.14it/s] 46it [00:10, 4.13it/s] 47it [00:11, 4.15it/s] 48it [00:11, 3.98it/s] 49it [00:11, 4.15it/s] 50it [00:11, 4.12it/s]2025-05-25 23:15:46,919 - INFO - [Epoch 028 | Batch 0050] IWAE-loss 1886.0216 | mean log_px -0.0034 | KL -1643.58 + 51it [00:12, 4.25it/s] 52it [00:12, 4.30it/s] 53it [00:12, 4.24it/s] 54it [00:12, 4.19it/s] 55it [00:12, 4.30it/s] 56it [00:13, 4.37it/s] 57it [00:13, 4.35it/s] 58it [00:13, 4.29it/s] 59it [00:13, 4.39it/s] 60it [00:14, 4.41it/s] 61it [00:14, 4.48it/s] 62it [00:14, 4.36it/s] 63it [00:14, 4.44it/s] 64it [00:14, 4.48it/s] 65it [00:15, 4.45it/s] 66it [00:15, 4.51it/s] 67it [00:15, 4.40it/s] 68it [00:15, 4.33it/s] 69it [00:16, 4.29it/s] 70it [00:16, 4.34it/s] 71it [00:16, 4.43it/s] 72it [00:16, 4.37it/s] 73it [00:17, 4.45it/s] 74it [00:17, 4.36it/s] 75it [00:17, 4.31it/s] 76it [00:17, 4.37it/s] 77it [00:17, 4.30it/s] 78it [00:18, 4.25it/s] 79it [00:18, 4.36it/s] 80it [00:18, 4.27it/s] 81it [00:18, 4.38it/s] 82it [00:19, 4.30it/s] 83it [00:19, 4.35it/s] 84it [00:19, 4.38it/s] 85it [00:19, 4.46it/s] 86it [00:20, 4.45it/s] 87it [00:20, 4.37it/s] 88it [00:20, 4.19it/s] 89it [00:20, 4.33it/s] 90it [00:20, 4.26it/s] 91it [00:21, 4.35it/s] 92it [00:21, 4.28it/s] 93it [00:21, 4.24it/s] 94it [00:21, 4.19it/s] 95it [00:22, 4.30it/s] 96it [00:22, 4.24it/s] 97it [00:22, 4.32it/s] 98it [00:22, 4.25it/s] 99it [00:23, 4.35it/s] 100it [00:23, 4.28it/s]2025-05-25 23:15:58,425 - INFO - [Epoch 028 | Batch 0100] IWAE-loss 1992.9895 | mean log_px -0.0080 | KL -1643.61 + 101it [00:23, 4.37it/s] 102it [00:23, 4.40it/s] 103it [00:23, 4.49it/s] 104it [00:24, 4.53it/s] 105it [00:24, 4.56it/s] 106it [00:24, 4.42it/s] 107it [00:24, 4.51it/s] 108it [00:25, 4.55it/s] 109it [00:25, 4.58it/s] 110it [00:25, 4.54it/s] 111it [00:25, 4.58it/s] 112it [00:25, 4.43it/s] 113it [00:26, 4.51it/s] 114it [00:26, 4.40it/s] 115it [00:26, 4.31it/s] 116it [00:26, 4.24it/s] 117it [00:27, 4.35it/s] 118it [00:27, 4.42it/s] 119it [00:27, 4.50it/s] 120it [00:27, 4.55it/s] 121it [00:27, 4.59it/s] 122it [00:28, 4.45it/s] 123it [00:28, 4.29it/s] 124it [00:28, 4.39it/s] 125it [00:28, 4.47it/s] 126it [00:29, 4.37it/s] 127it [00:29, 4.45it/s] 128it [00:29, 4.52it/s] 129it [00:29, 4.49it/s] 130it [00:29, 4.53it/s] 131it [00:30, 4.59it/s] 132it [00:30, 4.45it/s] 133it [00:30, 4.38it/s] 134it [00:30, 4.44it/s] 135it [00:31, 4.52it/s] 136it [00:31, 4.57it/s] 137it [00:31, 4.61it/s] 138it [00:31, 4.63it/s] 139it [00:31, 4.66it/s] 140it [00:32, 4.64it/s] 141it [00:32, 4.52it/s] 142it [00:32, 4.55it/s] 143it [00:32, 4.59it/s] 144it [00:33, 4.59it/s] 145it [00:33, 4.49it/s] 146it [00:33, 4.37it/s] 147it [00:33, 4.32it/s] 148it [00:33, 4.40it/s] 149it [00:34, 4.29it/s] 150it [00:34, 4.37it/s]2025-05-25 23:16:09,611 - INFO - [Epoch 028 | Batch 0150] IWAE-loss 1948.8407 | mean log_px -0.0090 | KL -1636.46 + 151it [00:34, 4.32it/s] 152it [00:34, 4.27it/s] 153it [00:35, 4.26it/s] 154it [00:35, 4.35it/s] 155it [00:35, 4.43it/s] 156it [00:35, 4.51it/s] 157it [00:36, 4.57it/s] 158it [00:36, 4.61it/s] 159it [00:36, 4.48it/s] 160it [00:36, 4.51it/s] 161it [00:36, 4.56it/s] 162it [00:37, 4.47it/s] 163it [00:37, 4.54it/s] 164it [00:37, 4.58it/s] 165it [00:37, 4.46it/s] 166it [00:38, 4.35it/s] 167it [00:38, 4.33it/s] 168it [00:38, 4.40it/s] 169it [00:38, 4.49it/s] 170it [00:38, 4.55it/s] 171it [00:39, 4.60it/s] 172it [00:39, 4.62it/s] 173it [00:39, 4.65it/s] 174it [00:39, 4.65it/s] 175it [00:39, 4.67it/s] 176it [00:40, 4.68it/s] 177it [00:40, 4.53it/s] 178it [00:40, 4.54it/s] 179it [00:40, 4.59it/s] 180it [00:41, 4.62it/s] 181it [00:41, 4.49it/s] 182it [00:41, 4.52it/s] 183it [00:41, 4.57it/s] 184it [00:42, 4.42it/s] 185it [00:42, 4.38it/s] 186it [00:42, 4.30it/s] 187it [00:42, 4.19it/s] 188it [00:42, 4.18it/s] 189it [00:43, 4.32it/s] 190it [00:43, 4.41it/s] 191it [00:43, 4.36it/s] 192it [00:43, 4.41it/s] 193it [00:44, 4.50it/s] 194it [00:44, 4.56it/s] 195it [00:44, 4.30it/s] 196it [00:44, 4.40it/s] 196it [00:44, 4.37it/s] +2025-05-25 23:16:19,806 - INFO - Epoch: 28, Objective: tensor([2206.5891], device='cuda:0', grad_fn=), Loss: 0.015577034093439579, KL/n: 33.273502349853516 + 0it [00:00, ?it/s]2025-05-25 23:16:20,382 - INFO - [Epoch 029 | Batch 0000] IWAE-loss 1807.6621 | mean log_px -0.0057 | KL -1630.16 + 1it [00:00, 3.03it/s] 2it [00:00, 3.81it/s] 3it [00:00, 4.19it/s] 4it [00:00, 4.38it/s] 5it [00:01, 4.50it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.60it/s] 8it [00:01, 4.63it/s] 9it [00:02, 4.64it/s] 10it [00:02, 4.67it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.64it/s] 14it [00:03, 4.65it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.52it/s] 17it [00:03, 4.55it/s] 18it [00:03, 4.58it/s] 19it [00:04, 4.60it/s] 20it [00:04, 4.48it/s] 21it [00:04, 4.56it/s] 22it [00:04, 4.60it/s] 23it [00:05, 4.48it/s] 24it [00:05, 4.56it/s] 25it [00:05, 4.61it/s] 26it [00:05, 4.60it/s] 27it [00:05, 4.63it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.48it/s] 30it [00:06, 4.57it/s] 31it [00:06, 4.61it/s] 32it [00:07, 4.63it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.49it/s] 35it [00:07, 4.58it/s] 36it [00:07, 4.62it/s] 37it [00:08, 4.65it/s] 38it [00:08, 4.67it/s] 39it [00:08, 4.52it/s] 40it [00:08, 4.59it/s] 41it [00:09, 4.63it/s] 42it [00:09, 4.65it/s] 43it [00:09, 4.68it/s] 44it [00:09, 4.52it/s] 45it [00:09, 4.59it/s] 46it [00:10, 4.61it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.57it/s] 50it [00:10, 4.60it/s]2025-05-25 23:16:31,237 - INFO - [Epoch 029 | Batch 0050] IWAE-loss 1674.5372 | mean log_px -0.0011 | KL -1614.30 + 51it [00:11, 4.64it/s] 52it [00:11, 4.65it/s] 53it [00:11, 4.68it/s] 54it [00:11, 4.69it/s] 55it [00:12, 4.70it/s] 56it [00:12, 4.69it/s] 57it [00:12, 4.70it/s] 58it [00:12, 4.66it/s] 59it [00:12, 4.68it/s] 60it [00:13, 4.69it/s] 61it [00:13, 4.70it/s] 62it [00:13, 4.69it/s] 63it [00:13, 4.70it/s] 64it [00:13, 4.70it/s] 65it [00:14, 4.70it/s] 66it [00:14, 4.54it/s] 67it [00:14, 4.59it/s] 68it [00:14, 4.61it/s] 69it [00:15, 4.54it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.41it/s] 72it [00:15, 4.51it/s] 73it [00:15, 4.56it/s] 74it [00:16, 4.58it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.62it/s] 77it [00:16, 4.65it/s] 78it [00:17, 4.53it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.63it/s] 81it [00:17, 4.65it/s] 82it [00:17, 4.67it/s] 83it [00:18, 4.69it/s] 84it [00:18, 4.53it/s] 85it [00:18, 4.60it/s] 86it [00:18, 4.63it/s] 87it [00:18, 4.64it/s] 88it [00:19, 4.66it/s] 89it [00:19, 4.66it/s] 90it [00:19, 4.51it/s] 91it [00:19, 4.59it/s] 92it [00:20, 4.62it/s] 93it [00:20, 4.64it/s] 94it [00:20, 4.63it/s] 95it [00:20, 4.67it/s] 96it [00:20, 4.68it/s] 97it [00:21, 4.53it/s] 98it [00:21, 4.55it/s] 99it [00:21, 4.58it/s] 100it [00:21, 4.61it/s]2025-05-25 23:16:42,056 - INFO - [Epoch 029 | Batch 0100] IWAE-loss 1752.5222 | mean log_px -0.0047 | KL -1603.06 + 101it [00:21, 4.63it/s] 102it [00:22, 4.48it/s] 103it [00:22, 4.46it/s] 104it [00:22, 4.52it/s] 105it [00:22, 4.57it/s] 106it [00:23, 4.61it/s] 107it [00:23, 4.64it/s] 108it [00:23, 4.65it/s] 109it [00:23, 4.66it/s] 110it [00:23, 4.68it/s] 111it [00:24, 4.70it/s] 112it [00:24, 4.52it/s] 113it [00:24, 4.60it/s] 114it [00:24, 4.63it/s] 115it [00:25, 4.66it/s] 116it [00:25, 4.66it/s] 117it [00:25, 4.68it/s] 118it [00:25, 4.52it/s] 119it [00:25, 4.60it/s] 120it [00:26, 4.63it/s] 121it [00:26, 4.65it/s] 122it [00:26, 4.65it/s] 123it [00:26, 4.51it/s] 124it [00:27, 4.58it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.63it/s] 127it [00:27, 4.67it/s] 128it [00:27, 4.68it/s] 129it [00:28, 4.53it/s] 130it [00:28, 4.58it/s] 131it [00:28, 4.62it/s] 132it [00:28, 4.64it/s] 133it [00:28, 4.57it/s] 134it [00:29, 4.57it/s] 135it [00:29, 4.44it/s] 136it [00:29, 4.52it/s] 137it [00:29, 4.57it/s] 138it [00:30, 4.57it/s] 139it [00:30, 4.61it/s] 140it [00:30, 4.39it/s] 141it [00:30, 4.42it/s] 142it [00:30, 4.50it/s] 143it [00:31, 4.57it/s] 144it [00:31, 4.60it/s] 145it [00:31, 4.63it/s] 146it [00:31, 4.48it/s] 147it [00:32, 4.56it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.63it/s] 150it [00:32, 4.65it/s]2025-05-25 23:16:52,956 - INFO - [Epoch 029 | Batch 0150] IWAE-loss 1698.8661 | mean log_px -0.0024 | KL -1595.82 + 151it [00:32, 4.66it/s] 152it [00:33, 4.67it/s] 153it [00:33, 4.69it/s] 154it [00:33, 4.58it/s] 155it [00:33, 4.62it/s] 156it [00:33, 4.62it/s] 157it [00:34, 4.67it/s] 158it [00:34, 4.68it/s] 159it [00:34, 4.69it/s] 160it [00:34, 4.70it/s] 161it [00:35, 4.71it/s] 162it [00:35, 4.70it/s] 163it [00:35, 4.71it/s] 164it [00:35, 4.70it/s] 165it [00:35, 4.71it/s] 166it [00:36, 4.70it/s] 167it [00:36, 4.66it/s] 168it [00:36, 4.65it/s] 169it [00:36, 4.61it/s] 170it [00:36, 4.62it/s] 171it [00:37, 4.59it/s] 172it [00:37, 4.59it/s] 173it [00:37, 4.60it/s] 174it [00:37, 4.58it/s] 175it [00:38, 4.58it/s] 176it [00:38, 4.59it/s] 177it [00:38, 4.59it/s] 178it [00:38, 4.59it/s] 179it [00:38, 4.61it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.62it/s] 182it [00:39, 4.60it/s] 183it [00:39, 4.62it/s] 184it [00:40, 4.63it/s] 185it [00:40, 4.63it/s] 186it [00:40, 4.62it/s] 187it [00:40, 4.63it/s] 188it [00:40, 4.62it/s] 189it [00:41, 4.62it/s] 190it [00:41, 4.61it/s] 191it [00:41, 4.60it/s] 192it [00:41, 4.59it/s] 193it [00:41, 4.58it/s] 194it [00:42, 4.27it/s] 195it [00:42, 4.26it/s] 196it [00:42, 4.38it/s] 196it [00:42, 4.58it/s] +2025-05-25 23:17:02,887 - INFO - Epoch: 29, Objective: tensor([2066.5352], device='cuda:0', grad_fn=), Loss: 0.007869544439017773, KL/n: 32.472476959228516 + 0it [00:00, ?it/s]2025-05-25 23:17:03,312 - INFO - [Epoch 030 | Batch 0000] IWAE-loss 1742.8804 | mean log_px -0.0048 | KL -1591.28 + 1it [00:00, 2.79it/s] 2it [00:00, 3.64it/s] 3it [00:00, 4.00it/s] 4it [00:01, 4.16it/s] 5it [00:01, 4.33it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.49it/s] 8it [00:01, 4.36it/s] 9it [00:02, 4.42it/s] 10it [00:02, 4.47it/s] 11it [00:02, 4.52it/s] 12it [00:02, 4.54it/s] 13it [00:02, 4.57it/s] 14it [00:03, 4.59it/s] 15it [00:03, 3.67it/s] 16it [00:03, 3.91it/s] 17it [00:04, 3.99it/s] 18it [00:04, 4.17it/s] 19it [00:04, 4.30it/s] 20it [00:04, 4.39it/s] 21it [00:04, 4.46it/s] 22it [00:05, 4.52it/s] 23it [00:05, 4.41it/s] 24it [00:05, 4.49it/s] 25it [00:05, 4.54it/s] 26it [00:06, 4.56it/s] 27it [00:06, 4.57it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.58it/s] 30it [00:06, 4.59it/s] 31it [00:07, 4.61it/s] 32it [00:07, 4.62it/s] 33it [00:07, 4.62it/s] 34it [00:07, 4.62it/s] 35it [00:08, 4.48it/s] 36it [00:08, 4.53it/s] 37it [00:08, 4.56it/s] 38it [00:08, 4.58it/s] 39it [00:08, 4.59it/s] 40it [00:09, 4.60it/s] 41it [00:09, 4.60it/s] 42it [00:09, 4.59it/s] 43it [00:09, 4.59it/s] 44it [00:09, 4.46it/s] 45it [00:10, 4.52it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.58it/s] 49it [00:11, 4.59it/s] 50it [00:11, 4.60it/s]2025-05-25 23:17:14,451 - INFO - [Epoch 030 | Batch 0050] IWAE-loss 1974.8240 | mean log_px -0.0085 | KL -1577.82 + 51it [00:11, 4.60it/s] 52it [00:11, 4.43it/s] 53it [00:11, 4.50it/s] 54it [00:12, 4.53it/s] 55it [00:12, 4.55it/s] 56it [00:12, 4.57it/s] 57it [00:12, 4.44it/s] 58it [00:13, 4.50it/s] 59it [00:13, 4.50it/s] 60it [00:13, 4.53it/s] 61it [00:13, 4.56it/s] 62it [00:13, 4.58it/s] 63it [00:14, 4.60it/s] 64it [00:14, 4.48it/s] 65it [00:14, 4.54it/s] 66it [00:14, 4.55it/s] 67it [00:15, 4.57it/s] 68it [00:15, 4.56it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.60it/s] 72it [00:16, 4.59it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.60it/s] 75it [00:16, 4.47it/s] 76it [00:17, 4.51it/s] 77it [00:17, 4.54it/s] 78it [00:17, 4.45it/s] 79it [00:17, 4.52it/s] 80it [00:17, 4.55it/s] 81it [00:18, 4.58it/s] 82it [00:18, 4.59it/s] 83it [00:18, 4.43it/s] 84it [00:18, 4.49it/s] 85it [00:18, 4.53it/s] 86it [00:19, 4.55it/s] 87it [00:19, 4.57it/s] 88it [00:19, 4.58it/s] 89it [00:19, 4.59it/s] 90it [00:20, 4.59it/s] 91it [00:20, 4.61it/s] 92it [00:20, 4.61it/s] 93it [00:20, 4.61it/s] 94it [00:20, 4.60it/s] 95it [00:21, 4.60it/s] 96it [00:21, 4.47it/s] 97it [00:21, 4.53it/s] 98it [00:21, 4.55it/s] 99it [00:22, 4.57it/s] 100it [00:22, 4.59it/s]2025-05-25 23:17:25,447 - INFO - [Epoch 030 | Batch 0100] IWAE-loss 1863.1838 | mean log_px -0.0062 | KL -1573.59 + 101it [00:22, 4.59it/s] 102it [00:22, 4.44it/s] 103it [00:22, 4.44it/s] 104it [00:23, 4.48it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.59it/s] 107it [00:23, 4.63it/s] 108it [00:24, 4.53it/s] 109it [00:24, 4.60it/s] 110it [00:24, 4.62it/s] 111it [00:24, 4.62it/s] 112it [00:24, 4.66it/s] 113it [00:25, 4.68it/s] 114it [00:25, 4.52it/s] 115it [00:25, 4.59it/s] 116it [00:25, 4.63it/s] 117it [00:25, 4.66it/s] 118it [00:26, 4.67it/s] 119it [00:26, 4.69it/s] 120it [00:26, 4.69it/s] 121it [00:26, 4.54it/s] 122it [00:27, 4.60it/s] 123it [00:27, 4.64it/s] 124it [00:27, 4.65it/s] 125it [00:27, 4.67it/s] 126it [00:27, 4.68it/s] 127it [00:28, 4.70it/s] 128it [00:28, 4.70it/s] 129it [00:28, 4.71it/s] 130it [00:28, 4.54it/s] 131it [00:28, 4.61it/s] 132it [00:29, 4.63it/s] 133it [00:29, 4.54it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.64it/s] 136it [00:30, 4.65it/s] 137it [00:30, 4.67it/s] 138it [00:30, 4.68it/s] 139it [00:30, 4.69it/s] 140it [00:30, 4.57it/s] 141it [00:31, 4.63it/s] 142it [00:31, 4.65it/s] 143it [00:31, 4.66it/s] 144it [00:31, 4.67it/s] 145it [00:32, 4.69it/s] 146it [00:32, 4.69it/s] 147it [00:32, 4.71it/s] 148it [00:32, 4.71it/s] 149it [00:32, 4.54it/s] 150it [00:33, 4.61it/s]2025-05-25 23:17:36,261 - INFO - [Epoch 030 | Batch 0150] IWAE-loss 2044.0123 | mean log_px -0.0121 | KL -1569.41 + 151it [00:33, 4.63it/s] 152it [00:33, 4.65it/s] 153it [00:33, 4.67it/s] 154it [00:33, 4.68it/s] 155it [00:34, 4.52it/s] 156it [00:34, 4.59it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.64it/s] 159it [00:35, 4.67it/s] 160it [00:35, 4.67it/s] 161it [00:35, 4.68it/s] 162it [00:35, 4.68it/s] 163it [00:35, 4.70it/s] 164it [00:36, 4.69it/s] 165it [00:36, 4.68it/s] 166it [00:36, 4.67it/s] 167it [00:36, 4.52it/s] 168it [00:36, 4.59it/s] 169it [00:37, 4.62it/s] 170it [00:37, 4.65it/s] 171it [00:37, 4.67it/s] 172it [00:37, 4.67it/s] 173it [00:38, 4.69it/s] 174it [00:38, 4.69it/s] 175it [00:38, 4.70it/s] 176it [00:38, 4.69it/s] 177it [00:38, 4.70it/s] 178it [00:39, 4.69it/s] 179it [00:39, 4.70it/s] 180it [00:39, 4.70it/s] 181it [00:39, 4.70it/s] 182it [00:39, 4.70it/s] 183it [00:40, 4.71it/s] 184it [00:40, 4.71it/s] 185it [00:40, 4.71it/s] 186it [00:40, 4.71it/s] 187it [00:41, 4.71it/s] 188it [00:41, 4.71it/s] 189it [00:41, 4.72it/s] 190it [00:41, 4.71it/s] 191it [00:41, 4.71it/s] 192it [00:42, 4.71it/s] 193it [00:42, 4.71it/s] 194it [00:42, 4.71it/s] 195it [00:42, 4.60it/s] 196it [00:42, 4.64it/s] 196it [00:43, 4.56it/s] +2025-05-25 23:17:46,023 - INFO - Epoch: 30, Objective: tensor([1660.5792], device='cuda:0', grad_fn=), Loss: 0.002282704459503293, KL/n: 31.856414794921875 + 0it [00:00, ?it/s]2025-05-25 23:17:46,439 - INFO - [Epoch 031 | Batch 0000] IWAE-loss 1722.8004 | mean log_px -0.0030 | KL -1562.43 + 1it [00:00, 2.72it/s] 2it [00:00, 3.65it/s] 3it [00:00, 4.08it/s] 4it [00:00, 4.31it/s] 5it [00:01, 4.46it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.61it/s] 8it [00:01, 4.64it/s] 9it [00:02, 4.67it/s] 10it [00:02, 4.68it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.66it/s] 15it [00:03, 4.68it/s] 16it [00:03, 4.70it/s] 17it [00:03, 4.72it/s] 18it [00:03, 4.72it/s] 19it [00:04, 4.73it/s] 20it [00:04, 4.73it/s] 21it [00:04, 4.66it/s] 22it [00:04, 4.69it/s] 23it [00:05, 4.71it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.61it/s] 26it [00:05, 4.54it/s] 27it [00:05, 4.61it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.62it/s] 30it [00:06, 4.64it/s] 31it [00:06, 4.66it/s] 32it [00:07, 4.50it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.62it/s] 36it [00:07, 4.64it/s] 37it [00:08, 4.66it/s] 38it [00:08, 4.67it/s] 39it [00:08, 4.64it/s] 40it [00:08, 4.64it/s] 41it [00:08, 4.64it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.64it/s] 44it [00:09, 4.63it/s] 45it [00:09, 4.64it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.63it/s] 50it [00:10, 4.61it/s]2025-05-25 23:17:57,222 - INFO - [Epoch 031 | Batch 0050] IWAE-loss 1696.5232 | mean log_px -0.0034 | KL -1540.58 + 51it [00:11, 4.45it/s] 52it [00:11, 4.49it/s] 53it [00:11, 4.53it/s] 54it [00:11, 4.56it/s] 55it [00:12, 4.58it/s] 56it [00:12, 4.58it/s] 57it [00:12, 4.59it/s] 58it [00:12, 4.60it/s] 59it [00:12, 4.60it/s] 60it [00:13, 4.47it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.54it/s] 63it [00:13, 4.57it/s] 64it [00:13, 4.58it/s] 65it [00:14, 4.61it/s] 66it [00:14, 4.40it/s] 67it [00:14, 4.48it/s] 68it [00:14, 4.52it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.58it/s] 71it [00:15, 4.60it/s] 72it [00:15, 4.60it/s] 73it [00:15, 4.59it/s] 74it [00:16, 4.62it/s] 75it [00:16, 4.65it/s] 76it [00:16, 4.65it/s] 77it [00:16, 4.68it/s] 78it [00:17, 4.68it/s] 79it [00:17, 4.69it/s] 80it [00:17, 4.68it/s] 81it [00:17, 4.69it/s] 82it [00:17, 4.68it/s] 83it [00:18, 4.68it/s] 84it [00:18, 4.52it/s] 85it [00:18, 4.56it/s] 86it [00:18, 4.60it/s] 87it [00:18, 4.62it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.66it/s] 90it [00:19, 4.51it/s] 91it [00:19, 4.59it/s] 92it [00:20, 4.61it/s] 93it [00:20, 4.62it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.66it/s] 96it [00:20, 4.50it/s] 97it [00:21, 4.57it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.63it/s] 100it [00:21, 4.66it/s]2025-05-25 23:18:08,119 - INFO - [Epoch 031 | Batch 0100] IWAE-loss 1671.5338 | mean log_px -0.0022 | KL -1533.55 + 101it [00:22, 4.56it/s] 102it [00:22, 4.51it/s] 103it [00:22, 4.48it/s] 104it [00:22, 4.53it/s] 105it [00:22, 4.43it/s] 106it [00:23, 4.50it/s] 107it [00:23, 4.56it/s] 108it [00:23, 4.60it/s] 109it [00:23, 4.63it/s] 110it [00:23, 4.64it/s] 111it [00:24, 4.50it/s] 112it [00:24, 4.58it/s] 113it [00:24, 4.60it/s] 114it [00:24, 4.62it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.65it/s] 117it [00:25, 4.60it/s] 118it [00:25, 4.46it/s] 119it [00:25, 4.54it/s] 120it [00:26, 4.57it/s] 121it [00:26, 4.59it/s] 122it [00:26, 4.61it/s] 123it [00:26, 4.64it/s] 124it [00:27, 4.65it/s] 125it [00:27, 4.66it/s] 126it [00:27, 4.47it/s] 127it [00:27, 4.51it/s] 128it [00:27, 4.56it/s] 129it [00:28, 4.60it/s] 130it [00:28, 4.60it/s] 131it [00:28, 4.64it/s] 132it [00:28, 4.66it/s] 133it [00:29, 4.50it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.48it/s] 137it [00:29, 4.56it/s] 138it [00:30, 4.59it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.65it/s] 142it [00:30, 4.50it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.57it/s] 145it [00:31, 4.60it/s] 146it [00:31, 4.62it/s] 147it [00:32, 4.63it/s] 148it [00:32, 4.64it/s] 149it [00:32, 4.64it/s] 150it [00:32, 4.65it/s]2025-05-25 23:18:19,029 - INFO - [Epoch 031 | Batch 0150] IWAE-loss 1709.1289 | mean log_px -0.0036 | KL -1533.10 + 151it [00:32, 4.49it/s] 152it [00:33, 4.54it/s] 153it [00:33, 4.58it/s] 154it [00:33, 4.61it/s] 155it [00:33, 4.61it/s] 156it [00:34, 4.56it/s] 157it [00:34, 4.44it/s] 158it [00:34, 4.52it/s] 159it [00:34, 4.57it/s] 160it [00:34, 4.61it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.65it/s] 163it [00:35, 4.67it/s] 164it [00:35, 4.50it/s] 165it [00:36, 4.58it/s] 166it [00:36, 4.61it/s] 167it [00:36, 4.63it/s] 168it [00:36, 4.64it/s] 169it [00:36, 4.59it/s] 170it [00:37, 4.40it/s] 171it [00:37, 4.49it/s] 172it [00:37, 4.55it/s] 173it [00:37, 4.59it/s] 174it [00:37, 4.62it/s] 175it [00:38, 4.46it/s] 176it [00:38, 4.50it/s] 177it [00:38, 4.56it/s] 178it [00:38, 4.55it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.48it/s] 182it [00:39, 4.54it/s] 183it [00:39, 4.58it/s] 184it [00:40, 4.60it/s] 185it [00:40, 4.63it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.65it/s] 188it [00:41, 4.62it/s] 189it [00:41, 4.48it/s] 190it [00:41, 4.54it/s] 191it [00:41, 4.57it/s] 192it [00:41, 4.60it/s] 193it [00:42, 4.63it/s] 194it [00:42, 4.63it/s] 195it [00:42, 4.50it/s] 196it [00:42, 4.54it/s] 196it [00:42, 4.57it/s] +2025-05-25 23:18:29,026 - INFO - Epoch: 31, Objective: tensor([1998.8662], device='cuda:0', grad_fn=), Loss: 0.011031880974769592, KL/n: 31.218055725097656 + 0it [00:00, ?it/s]2025-05-25 23:18:29,614 - INFO - [Epoch 032 | Batch 0000] IWAE-loss 1605.7083 | mean log_px -0.0011 | KL -1530.47 + 1it [00:00, 2.91it/s] 2it [00:00, 3.53it/s] 3it [00:00, 3.98it/s] 4it [00:01, 4.22it/s] 5it [00:01, 4.37it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.41it/s] 10it [00:02, 4.49it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.57it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.61it/s] 15it [00:03, 4.63it/s] 16it [00:03, 4.61it/s] 17it [00:03, 4.64it/s] 18it [00:04, 4.65it/s] 19it [00:04, 4.64it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.64it/s] 23it [00:05, 4.65it/s] 24it [00:05, 4.65it/s] 25it [00:05, 4.64it/s] 26it [00:05, 4.49it/s] 27it [00:06, 4.55it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.61it/s] 31it [00:06, 4.63it/s] 32it [00:07, 4.60it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.63it/s] 35it [00:07, 4.63it/s] 36it [00:07, 4.47it/s] 37it [00:08, 4.53it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.59it/s] 40it [00:08, 4.61it/s] 41it [00:09, 4.63it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.64it/s] 44it [00:09, 4.48it/s] 45it [00:09, 4.55it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.63it/s] 50it [00:11, 4.49it/s]2025-05-25 23:18:40,533 - INFO - [Epoch 032 | Batch 0050] IWAE-loss 1871.9933 | mean log_px -0.0139 | KL -1516.54 + 51it [00:11, 4.53it/s] 52it [00:11, 4.55it/s] 53it [00:11, 4.57it/s] 54it [00:11, 4.59it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.61it/s] 57it [00:12, 4.47it/s] 58it [00:12, 4.54it/s] 59it [00:13, 4.57it/s] 60it [00:13, 4.59it/s] 61it [00:13, 4.61it/s] 62it [00:13, 4.62it/s] 63it [00:13, 4.63it/s] 64it [00:14, 4.63it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.64it/s] 68it [00:14, 4.65it/s] 69it [00:15, 4.65it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.63it/s] 72it [00:15, 4.48it/s] 73it [00:16, 4.55it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.60it/s] 77it [00:16, 4.63it/s] 78it [00:17, 4.61it/s] 79it [00:17, 4.48it/s] 80it [00:17, 4.53it/s] 81it [00:17, 4.57it/s] 82it [00:18, 4.58it/s] 83it [00:18, 4.60it/s] 84it [00:18, 4.57it/s] 85it [00:18, 4.59it/s] 86it [00:18, 4.61it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.62it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.49it/s] 91it [00:19, 4.56it/s] 92it [00:20, 4.58it/s] 93it [00:20, 4.60it/s] 94it [00:20, 4.61it/s] 95it [00:20, 4.62it/s] 96it [00:21, 4.63it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.64it/s] 99it [00:21, 4.49it/s] 100it [00:21, 4.54it/s]2025-05-25 23:18:51,424 - INFO - [Epoch 032 | Batch 0100] IWAE-loss 2199.9558 | mean log_px -0.0137 | KL -1505.77 + 101it [00:22, 4.57it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.61it/s] 104it [00:22, 4.61it/s] 105it [00:23, 4.63it/s] 106it [00:23, 4.63it/s] 107it [00:23, 4.65it/s] 108it [00:23, 4.64it/s] 109it [00:23, 4.53it/s] 110it [00:24, 4.56it/s] 111it [00:24, 4.60it/s] 112it [00:24, 4.61it/s] 113it [00:24, 4.63it/s] 114it [00:24, 4.62it/s] 115it [00:25, 4.60it/s] 116it [00:25, 4.46it/s] 117it [00:25, 4.53it/s] 118it [00:25, 4.57it/s] 119it [00:26, 4.61it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.64it/s] 122it [00:26, 4.60it/s] 123it [00:26, 4.56it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.63it/s] 126it [00:27, 4.63it/s] 127it [00:27, 4.49it/s] 128it [00:28, 4.54it/s] 129it [00:28, 4.56it/s] 130it [00:28, 4.59it/s] 131it [00:28, 4.61it/s] 132it [00:28, 4.62it/s] 133it [00:29, 4.63it/s] 134it [00:29, 4.63it/s] 135it [00:29, 4.49it/s] 136it [00:29, 4.56it/s] 137it [00:29, 4.59it/s] 138it [00:30, 4.61it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.64it/s] 142it [00:31, 4.50it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.57it/s] 145it [00:31, 4.59it/s] 146it [00:31, 4.60it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.62it/s] 149it [00:32, 4.63it/s] 150it [00:32, 4.63it/s]2025-05-25 23:19:02,301 - INFO - [Epoch 032 | Batch 0150] IWAE-loss 1934.8878 | mean log_px -0.0096 | KL -1507.10 + 151it [00:33, 4.50it/s] 152it [00:33, 4.50it/s] 153it [00:33, 4.34it/s] 154it [00:33, 4.43it/s] 155it [00:33, 4.50it/s] 156it [00:34, 4.54it/s] 157it [00:34, 4.57it/s] 158it [00:34, 4.58it/s] 159it [00:34, 4.61it/s] 160it [00:35, 4.52it/s] 161it [00:35, 4.58it/s] 162it [00:35, 4.59it/s] 163it [00:35, 4.62it/s] 164it [00:35, 4.63it/s] 165it [00:36, 4.64it/s] 166it [00:36, 4.50it/s] 167it [00:36, 4.55it/s] 168it [00:36, 4.57it/s] 169it [00:36, 4.60it/s] 170it [00:37, 4.53it/s] 171it [00:37, 4.58it/s] 172it [00:37, 4.59it/s] 173it [00:37, 4.61it/s] 174it [00:38, 4.61it/s] 175it [00:38, 4.62it/s] 176it [00:38, 4.49it/s] 177it [00:38, 4.55it/s] 178it [00:38, 4.58it/s] 179it [00:39, 4.61it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.63it/s] 182it [00:39, 4.54it/s] 183it [00:40, 4.59it/s] 184it [00:40, 4.61it/s] 185it [00:40, 4.63it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.64it/s] 188it [00:41, 4.61it/s] 189it [00:41, 4.59it/s] 190it [00:41, 4.44it/s] 191it [00:41, 4.49it/s] 192it [00:42, 4.54it/s] 193it [00:42, 4.57it/s] 194it [00:42, 4.59it/s] 195it [00:42, 4.47it/s] 196it [00:42, 4.40it/s] 196it [00:43, 4.56it/s] +2025-05-25 23:19:12,343 - INFO - Epoch: 32, Objective: tensor([1967.3446], device='cuda:0', grad_fn=), Loss: 0.012947743758559227, KL/n: 30.607524871826172 + 0it [00:00, ?it/s]2025-05-25 23:19:12,764 - INFO - [Epoch 033 | Batch 0000] IWAE-loss 1662.4415 | mean log_px -0.0023 | KL -1498.38 + 1it [00:00, 2.93it/s] 2it [00:00, 3.73it/s] 3it [00:00, 4.11it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.42it/s] 6it [00:01, 4.49it/s] 7it [00:01, 4.55it/s] 8it [00:01, 4.58it/s] 9it [00:02, 4.61it/s] 10it [00:02, 4.62it/s] 11it [00:02, 4.61it/s] 12it [00:02, 3.57it/s] 13it [00:03, 3.77it/s] 14it [00:03, 3.99it/s] 15it [00:03, 4.18it/s] 16it [00:03, 4.31it/s] 17it [00:04, 4.41it/s] 18it [00:04, 4.34it/s] 19it [00:04, 4.44it/s] 20it [00:04, 4.31it/s] 21it [00:04, 4.42it/s] 22it [00:05, 4.49it/s] 23it [00:05, 4.53it/s] 24it [00:05, 4.44it/s] 25it [00:05, 4.39it/s] 26it [00:06, 4.44it/s] 27it [00:06, 4.49it/s] 28it [00:06, 4.52it/s] 29it [00:06, 4.39it/s] 30it [00:06, 4.46it/s] 31it [00:07, 4.49it/s] 32it [00:07, 4.49it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.58it/s] 35it [00:08, 4.61it/s] 36it [00:08, 4.62it/s] 37it [00:08, 4.58it/s] 38it [00:08, 4.46it/s] 39it [00:08, 4.53it/s] 40it [00:09, 4.55it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.55it/s] 43it [00:09, 4.54it/s] 44it [00:10, 4.55it/s] 45it [00:10, 4.59it/s] 46it [00:10, 4.60it/s] 47it [00:10, 4.61it/s] 48it [00:10, 4.62it/s] 49it [00:11, 4.63it/s] 50it [00:11, 4.62it/s]2025-05-25 23:19:23,943 - INFO - [Epoch 033 | Batch 0050] IWAE-loss 1766.8324 | mean log_px -0.0126 | KL -1488.90 + 51it [00:11, 4.62it/s] 52it [00:11, 4.62it/s] 53it [00:11, 4.47it/s] 54it [00:12, 4.53it/s] 55it [00:12, 4.57it/s] 56it [00:12, 4.45it/s] 57it [00:12, 4.51it/s] 58it [00:13, 4.55it/s] 59it [00:13, 4.53it/s] 60it [00:13, 4.47it/s] 61it [00:13, 4.49it/s] 62it [00:13, 4.35it/s] 63it [00:14, 4.42it/s] 64it [00:14, 4.47it/s] 65it [00:14, 4.47it/s] 66it [00:14, 4.51it/s] 67it [00:15, 4.53it/s] 68it [00:15, 4.42it/s] 69it [00:15, 4.48it/s] 70it [00:15, 4.49it/s] 71it [00:15, 4.49it/s] 72it [00:16, 4.51it/s] 73it [00:16, 4.55it/s] 74it [00:16, 4.53it/s] 75it [00:16, 4.58it/s] 76it [00:17, 4.56it/s] 77it [00:17, 4.46it/s] 78it [00:17, 4.51it/s] 79it [00:17, 4.55it/s] 80it [00:17, 4.56it/s] 81it [00:18, 4.58it/s] 82it [00:18, 4.59it/s] 83it [00:18, 4.60it/s] 84it [00:18, 4.60it/s] 85it [00:19, 4.62it/s] 86it [00:19, 4.52it/s] 87it [00:19, 4.55it/s] 88it [00:19, 4.50it/s] 89it [00:19, 4.48it/s] 90it [00:20, 4.53it/s] 91it [00:20, 4.46it/s] 92it [00:20, 4.51it/s] 93it [00:20, 4.36it/s] 94it [00:21, 4.44it/s] 95it [00:21, 4.39it/s] 96it [00:21, 4.48it/s] 97it [00:21, 4.52it/s] 98it [00:21, 4.42it/s] 99it [00:22, 4.50it/s] 100it [00:22, 4.53it/s]2025-05-25 23:19:35,043 - INFO - [Epoch 033 | Batch 0100] IWAE-loss 1801.3687 | mean log_px -0.0054 | KL -1479.41 + 101it [00:22, 4.56it/s] 102it [00:22, 4.51it/s] 103it [00:23, 4.55it/s] 104it [00:23, 4.41it/s] 105it [00:23, 4.49it/s] 106it [00:23, 4.54it/s] 107it [00:23, 4.57it/s] 108it [00:24, 4.59it/s] 109it [00:24, 4.61it/s] 110it [00:24, 4.61it/s] 111it [00:24, 4.63it/s] 112it [00:25, 4.62it/s] 113it [00:25, 4.47it/s] 114it [00:25, 4.54it/s] 115it [00:25, 4.49it/s] 116it [00:25, 4.52it/s] 117it [00:26, 4.57it/s] 118it [00:26, 4.57it/s] 119it [00:26, 4.60it/s] 120it [00:26, 4.48it/s] 121it [00:27, 4.54it/s] 122it [00:27, 4.60it/s] 123it [00:27, 4.46it/s] 124it [00:27, 4.52it/s] 125it [00:27, 4.58it/s] 126it [00:28, 4.58it/s] 127it [00:28, 4.60it/s] 128it [00:28, 4.54it/s] 129it [00:28, 4.57it/s] 130it [00:28, 4.60it/s] 131it [00:29, 4.63it/s] 132it [00:29, 4.60it/s] 133it [00:29, 4.63it/s] 134it [00:29, 4.64it/s] 135it [00:30, 4.65it/s] 136it [00:30, 4.52it/s] 137it [00:30, 4.58it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.63it/s] 140it [00:31, 4.64it/s] 141it [00:31, 4.66it/s] 142it [00:31, 4.67it/s] 143it [00:31, 4.67it/s] 144it [00:32, 4.67it/s] 145it [00:32, 4.55it/s] 146it [00:32, 4.56it/s] 147it [00:32, 4.60it/s] 148it [00:32, 4.49it/s] 149it [00:33, 4.56it/s] 150it [00:33, 4.45it/s]2025-05-25 23:19:45,995 - INFO - [Epoch 033 | Batch 0150] IWAE-loss 1976.7753 | mean log_px -0.0103 | KL -1475.10 + 151it [00:33, 4.51it/s] 152it [00:33, 4.55it/s] 153it [00:33, 4.60it/s] 154it [00:34, 4.61it/s] 155it [00:34, 4.64it/s] 156it [00:34, 4.64it/s] 157it [00:34, 4.52it/s] 158it [00:35, 4.51it/s] 159it [00:35, 4.50it/s] 160it [00:35, 4.50it/s] 161it [00:35, 4.54it/s] 162it [00:35, 4.58it/s] 163it [00:36, 4.60it/s] 164it [00:36, 4.59it/s] 165it [00:36, 4.61it/s] 166it [00:36, 4.41it/s] 167it [00:37, 4.51it/s] 168it [00:37, 4.56it/s] 169it [00:37, 4.60it/s] 170it [00:37, 4.59it/s] 171it [00:37, 4.62it/s] 172it [00:38, 4.63it/s] 173it [00:38, 4.66it/s] 174it [00:38, 4.66it/s] 175it [00:38, 4.67it/s] 176it [00:39, 4.62it/s] 177it [00:39, 4.65it/s] 178it [00:39, 4.50it/s] 179it [00:39, 4.56it/s] 180it [00:39, 4.59it/s] 181it [00:40, 4.63it/s] 182it [00:40, 4.64it/s] 183it [00:40, 4.66it/s] 184it [00:40, 4.52it/s] 185it [00:40, 4.59it/s] 186it [00:41, 4.43it/s] 187it [00:41, 4.52it/s] 188it [00:41, 4.56it/s] 189it [00:41, 4.60it/s] 190it [00:42, 4.63it/s] 191it [00:42, 4.65it/s] 192it [00:42, 4.66it/s] 193it [00:42, 4.67it/s] 194it [00:42, 4.40it/s] 195it [00:43, 4.37it/s] 196it [00:43, 4.47it/s] 196it [00:43, 4.51it/s] +2025-05-25 23:19:55,977 - INFO - Epoch: 33, Objective: tensor([2188.4385], device='cuda:0', grad_fn=), Loss: 0.011592795141041279, KL/n: 29.990604400634766 + 0it [00:00, ?it/s]2025-05-25 23:19:56,405 - INFO - [Epoch 034 | Batch 0000] IWAE-loss 1666.0902 | mean log_px -0.0050 | KL -1469.55 + 1it [00:00, 2.80it/s] 2it [00:00, 3.62it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.26it/s] 5it [00:01, 4.18it/s] 6it [00:01, 4.23it/s] 7it [00:01, 4.36it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.53it/s] 10it [00:02, 4.54it/s] 11it [00:02, 4.60it/s] 12it [00:02, 4.62it/s] 13it [00:02, 4.65it/s] 14it [00:03, 4.65it/s] 15it [00:03, 4.51it/s] 16it [00:03, 4.56it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.62it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.65it/s] 22it [00:04, 4.51it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.58it/s] 25it [00:05, 4.56it/s] 26it [00:05, 4.56it/s] 27it [00:06, 4.59it/s] 28it [00:06, 4.39it/s] 29it [00:06, 4.43it/s] 30it [00:06, 4.52it/s] 31it [00:06, 4.57it/s] 32it [00:07, 4.60it/s] 33it [00:07, 4.60it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.46it/s] 36it [00:08, 4.50it/s] 37it [00:08, 4.54it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.53it/s] 40it [00:08, 4.54it/s] 41it [00:09, 4.42it/s] 42it [00:09, 4.49it/s] 43it [00:09, 4.53it/s] 44it [00:09, 4.56it/s] 45it [00:10, 4.58it/s] 46it [00:10, 4.60it/s] 47it [00:10, 4.61it/s] 48it [00:10, 4.47it/s] 49it [00:10, 4.53it/s] 50it [00:11, 4.55it/s]2025-05-25 23:20:07,393 - INFO - [Epoch 034 | Batch 0050] IWAE-loss 1685.5781 | mean log_px -0.0031 | KL -1466.24 + 51it [00:11, 4.44it/s] 52it [00:11, 4.47it/s] 53it [00:11, 4.51it/s] 54it [00:12, 4.40it/s] 55it [00:12, 4.48it/s] 56it [00:12, 4.52it/s] 57it [00:12, 4.56it/s] 58it [00:12, 4.57it/s] 59it [00:13, 4.58it/s] 60it [00:13, 4.50it/s] 61it [00:13, 4.50it/s] 62it [00:13, 4.53it/s] 63it [00:14, 4.55it/s] 64it [00:14, 4.56it/s] 65it [00:14, 4.43it/s] 66it [00:14, 4.49it/s] 67it [00:14, 4.53it/s] 68it [00:15, 4.55it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.58it/s] 71it [00:15, 4.61it/s] 72it [00:16, 4.47it/s] 73it [00:16, 4.51it/s] 74it [00:16, 4.54it/s] 75it [00:16, 4.56it/s] 76it [00:16, 4.59it/s] 77it [00:17, 4.59it/s] 78it [00:17, 4.61it/s] 79it [00:17, 4.62it/s] 80it [00:17, 4.61it/s] 81it [00:17, 4.48it/s] 82it [00:18, 4.52it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.60it/s] 86it [00:19, 4.60it/s] 87it [00:19, 4.61it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.49it/s] 90it [00:19, 4.54it/s] 91it [00:20, 4.56it/s] 92it [00:20, 4.57it/s] 93it [00:20, 4.59it/s] 94it [00:20, 4.60it/s] 95it [00:21, 4.46it/s] 96it [00:21, 4.52it/s] 97it [00:21, 4.55it/s] 98it [00:21, 4.57it/s] 99it [00:21, 4.59it/s] 100it [00:22, 4.61it/s]2025-05-25 23:20:18,389 - INFO - [Epoch 034 | Batch 0100] IWAE-loss 4595.9902 | mean log_px -0.0572 | KL -1454.45 + 101it [00:22, 4.60it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.62it/s] 104it [00:23, 4.43it/s] 105it [00:23, 4.50it/s] 106it [00:23, 4.53it/s] 107it [00:23, 4.57it/s] 108it [00:23, 4.58it/s] 109it [00:24, 4.60it/s] 110it [00:24, 4.60it/s] 111it [00:24, 4.61it/s] 112it [00:24, 4.61it/s] 113it [00:24, 4.48it/s] 114it [00:25, 4.52it/s] 115it [00:25, 4.56it/s] 116it [00:25, 4.57it/s] 117it [00:25, 4.59it/s] 118it [00:26, 4.60it/s] 119it [00:26, 4.46it/s] 120it [00:26, 4.51it/s] 121it [00:26, 4.56it/s] 122it [00:26, 4.57it/s] 123it [00:27, 4.59it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.59it/s] 127it [00:28, 4.47it/s] 128it [00:28, 4.52it/s] 129it [00:28, 4.55it/s] 130it [00:28, 4.57it/s] 131it [00:28, 4.59it/s] 132it [00:29, 4.46it/s] 133it [00:29, 4.52it/s] 134it [00:29, 4.54it/s] 135it [00:29, 4.58it/s] 136it [00:30, 4.59it/s] 137it [00:30, 4.60it/s] 138it [00:30, 4.61it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.60it/s] 141it [00:31, 4.47it/s] 142it [00:31, 4.51it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.55it/s] 145it [00:31, 4.57it/s] 146it [00:32, 4.56it/s] 147it [00:32, 4.57it/s] 148it [00:32, 4.52it/s] 149it [00:32, 4.36it/s] 150it [00:33, 4.45it/s]2025-05-25 23:20:29,392 - INFO - [Epoch 034 | Batch 0150] IWAE-loss 1796.6715 | mean log_px -0.0049 | KL -1448.83 + 151it [00:33, 4.50it/s] 152it [00:33, 4.54it/s] 153it [00:33, 4.55it/s] 154it [00:33, 4.59it/s] 155it [00:34, 4.46it/s] 156it [00:34, 4.48it/s] 157it [00:34, 4.53it/s] 158it [00:34, 4.57it/s] 159it [00:35, 4.60it/s] 160it [00:35, 4.59it/s] 161it [00:35, 4.51it/s] 162it [00:35, 4.56it/s] 163it [00:35, 4.58it/s] 164it [00:36, 4.59it/s] 165it [00:36, 4.58it/s] 166it [00:36, 4.59it/s] 167it [00:36, 4.62it/s] 168it [00:37, 4.62it/s] 169it [00:37, 4.48it/s] 170it [00:37, 4.52it/s] 171it [00:37, 4.56it/s] 172it [00:37, 4.56it/s] 173it [00:38, 4.58it/s] 174it [00:38, 4.59it/s] 175it [00:38, 4.42it/s] 176it [00:38, 4.48it/s] 177it [00:39, 4.52it/s] 178it [00:39, 4.55it/s] 179it [00:39, 4.57it/s] 180it [00:39, 4.57it/s] 181it [00:39, 4.59it/s] 182it [00:40, 4.60it/s] 183it [00:40, 4.47it/s] 184it [00:40, 4.51it/s] 185it [00:40, 4.56it/s] 186it [00:41, 4.57it/s] 187it [00:41, 4.58it/s] 188it [00:41, 4.57it/s] 189it [00:41, 4.49it/s] 190it [00:41, 4.54it/s] 191it [00:42, 4.56it/s] 192it [00:42, 4.57it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.59it/s] 195it [00:43, 4.48it/s] 196it [00:43, 4.55it/s] 196it [00:43, 4.53it/s] +2025-05-25 23:20:39,408 - INFO - Epoch: 34, Objective: tensor([1598.8741], device='cuda:0', grad_fn=), Loss: 0.003922741860151291, KL/n: 29.56195640563965 + 0it [00:00, ?it/s]2025-05-25 23:20:39,963 - INFO - [Epoch 035 | Batch 0000] IWAE-loss 1601.3729 | mean log_px -0.0040 | KL -1447.12 + 1it [00:00, 3.31it/s] 2it [00:00, 3.80it/s] 3it [00:00, 4.17it/s] 4it [00:01, 4.04it/s] 5it [00:01, 4.25it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.58it/s] 11it [00:02, 4.45it/s] 12it [00:02, 4.51it/s] 13it [00:02, 4.55it/s] 14it [00:03, 4.58it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.63it/s] 18it [00:04, 4.62it/s] 19it [00:04, 4.64it/s] 20it [00:04, 4.65it/s] 21it [00:04, 4.65it/s] 22it [00:04, 4.63it/s] 23it [00:05, 4.64it/s] 24it [00:05, 4.66it/s] 25it [00:05, 4.65it/s] 26it [00:05, 4.65it/s] 27it [00:06, 4.51it/s] 28it [00:06, 4.56it/s] 29it [00:06, 4.59it/s] 30it [00:06, 4.62it/s] 31it [00:06, 4.64it/s] 32it [00:07, 4.65it/s] 33it [00:07, 4.66it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.67it/s] 36it [00:07, 4.66it/s] 37it [00:08, 4.66it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.65it/s] 40it [00:08, 4.64it/s] 41it [00:09, 4.51it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.60it/s] 45it [00:09, 4.62it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.65it/s] 48it [00:10, 4.64it/s] 49it [00:10, 4.66it/s] 50it [00:10, 4.65it/s]2025-05-25 23:20:50,843 - INFO - [Epoch 035 | Batch 0050] IWAE-loss 1802.3173 | mean log_px -0.0079 | KL -1440.26 + 51it [00:11, 4.64it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.65it/s] 54it [00:11, 4.66it/s] 55it [00:12, 4.65it/s] 56it [00:12, 4.65it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.65it/s] 59it [00:12, 4.65it/s] 60it [00:13, 4.66it/s] 61it [00:13, 4.66it/s] 62it [00:13, 4.63it/s] 63it [00:13, 4.66it/s] 64it [00:13, 4.65it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.66it/s] 67it [00:14, 4.65it/s] 68it [00:14, 4.65it/s] 69it [00:15, 4.51it/s] 70it [00:15, 4.57it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.50it/s] 73it [00:15, 4.54it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.50it/s] 76it [00:16, 4.54it/s] 77it [00:16, 4.44it/s] 78it [00:17, 4.50it/s] 79it [00:17, 4.53it/s] 80it [00:17, 4.55it/s] 81it [00:17, 4.56it/s] 82it [00:17, 4.44it/s] 83it [00:18, 4.51it/s] 84it [00:18, 4.54it/s] 85it [00:18, 4.57it/s] 86it [00:18, 4.59it/s] 87it [00:19, 4.62it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.65it/s] 90it [00:19, 4.65it/s] 91it [00:19, 4.48it/s] 92it [00:20, 4.54it/s] 93it [00:20, 4.56it/s] 94it [00:20, 4.44it/s] 95it [00:20, 4.40it/s] 96it [00:21, 4.47it/s] 97it [00:21, 4.51it/s] 98it [00:21, 4.55it/s] 99it [00:21, 4.58it/s] 100it [00:21, 4.60it/s]2025-05-25 23:21:01,768 - INFO - [Epoch 035 | Batch 0100] IWAE-loss 1988.3760 | mean log_px -0.0165 | KL -1428.70 + 101it [00:22, 4.62it/s] 102it [00:22, 4.63it/s] 103it [00:22, 4.64it/s] 104it [00:22, 4.49it/s] 105it [00:22, 4.55it/s] 106it [00:23, 4.58it/s] 107it [00:23, 4.59it/s] 108it [00:23, 4.60it/s] 109it [00:23, 4.62it/s] 110it [00:24, 4.49it/s] 111it [00:24, 4.53it/s] 112it [00:24, 4.58it/s] 113it [00:24, 4.61it/s] 114it [00:24, 4.60it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.63it/s] 117it [00:25, 4.51it/s] 118it [00:25, 4.56it/s] 119it [00:26, 4.59it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.63it/s] 122it [00:26, 4.64it/s] 123it [00:26, 4.51it/s] 124it [00:27, 4.55it/s] 125it [00:27, 4.58it/s] 126it [00:27, 4.59it/s] 127it [00:27, 4.62it/s] 128it [00:27, 4.64it/s] 129it [00:28, 4.51it/s] 130it [00:28, 4.57it/s] 131it [00:28, 4.60it/s] 132it [00:28, 4.61it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.63it/s] 136it [00:29, 4.63it/s] 137it [00:29, 4.51it/s] 138it [00:30, 4.56it/s] 139it [00:30, 4.59it/s] 140it [00:30, 4.60it/s] 141it [00:30, 4.63it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.64it/s] 144it [00:31, 4.55it/s] 145it [00:31, 4.60it/s] 146it [00:31, 4.61it/s] 147it [00:32, 4.58it/s] 148it [00:32, 4.59it/s] 149it [00:32, 4.47it/s] 150it [00:32, 4.53it/s]2025-05-25 23:21:12,678 - INFO - [Epoch 035 | Batch 0150] IWAE-loss 1613.8336 | mean log_px -0.0041 | KL -1433.86 + 151it [00:33, 4.57it/s] 152it [00:33, 4.52it/s] 153it [00:33, 4.55it/s] 154it [00:33, 4.59it/s] 155it [00:33, 4.62it/s] 156it [00:34, 4.48it/s] 157it [00:34, 4.54it/s] 158it [00:34, 4.57it/s] 159it [00:34, 4.60it/s] 160it [00:34, 4.60it/s] 161it [00:35, 4.60it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.63it/s] 164it [00:35, 4.64it/s] 165it [00:36, 4.51it/s] 166it [00:36, 4.53it/s] 167it [00:36, 4.57it/s] 168it [00:36, 4.57it/s] 169it [00:36, 4.61it/s] 170it [00:37, 4.63it/s] 171it [00:37, 4.64it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.64it/s] 174it [00:38, 4.64it/s] 175it [00:38, 4.66it/s] 176it [00:38, 4.66it/s] 177it [00:38, 4.67it/s] 178it [00:38, 4.53it/s] 179it [00:39, 4.58it/s] 180it [00:39, 4.59it/s] 181it [00:39, 4.61it/s] 182it [00:39, 4.62it/s] 183it [00:39, 4.65it/s] 184it [00:40, 4.66it/s] 185it [00:40, 4.52it/s] 186it [00:40, 4.58it/s] 187it [00:40, 4.62it/s] 188it [00:41, 4.63it/s] 189it [00:41, 4.66it/s] 190it [00:41, 4.65it/s] 191it [00:41, 4.66it/s] 192it [00:41, 4.66it/s] 193it [00:42, 4.67it/s] 194it [00:42, 4.68it/s] 195it [00:42, 4.55it/s] 196it [00:42, 4.59it/s] 196it [00:42, 4.57it/s] +2025-05-25 23:21:22,584 - INFO - Epoch: 35, Objective: tensor([2143.9568], device='cuda:0', grad_fn=), Loss: 0.021683480590581894, KL/n: 29.22657012939453 + 0it [00:00, ?it/s]2025-05-25 23:21:22,961 - INFO - [Epoch 036 | Batch 0000] IWAE-loss 1631.0413 | mean log_px -0.0034 | KL -1429.53 + 1it [00:00, 3.33it/s] 2it [00:00, 3.88it/s] 3it [00:00, 4.22it/s] 4it [00:00, 4.09it/s] 5it [00:01, 4.26it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.42it/s] 8it [00:02, 3.41it/s] 9it [00:02, 3.73it/s] 10it [00:02, 3.94it/s] 11it [00:02, 4.14it/s] 12it [00:02, 4.27it/s] 13it [00:03, 4.40it/s] 14it [00:03, 4.48it/s] 15it [00:03, 4.55it/s] 16it [00:03, 4.58it/s] 17it [00:04, 4.61it/s] 18it [00:04, 4.60it/s] 19it [00:04, 4.60it/s] 20it [00:04, 4.56it/s] 21it [00:04, 4.60it/s] 22it [00:05, 4.62it/s] 23it [00:05, 4.64it/s] 24it [00:05, 4.50it/s] 25it [00:05, 4.56it/s] 26it [00:05, 4.58it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.65it/s] 31it [00:07, 4.67it/s] 32it [00:07, 4.66it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.68it/s] 36it [00:08, 4.53it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.50it/s] 40it [00:09, 4.51it/s] 41it [00:09, 4.56it/s] 42it [00:09, 4.59it/s] 43it [00:09, 4.47it/s] 44it [00:09, 4.52it/s] 45it [00:10, 4.58it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.61it/s] 49it [00:10, 4.64it/s] 50it [00:11, 4.64it/s]2025-05-25 23:21:34,076 - INFO - [Epoch 036 | Batch 0050] IWAE-loss 1841.2819 | mean log_px -0.0059 | KL -1423.28 + 51it [00:11, 4.66it/s] 52it [00:11, 4.66it/s] 53it [00:11, 4.67it/s] 54it [00:12, 4.67it/s] 55it [00:12, 4.68it/s] 56it [00:12, 4.67it/s] 57it [00:12, 4.68it/s] 58it [00:12, 4.68it/s] 59it [00:13, 4.53it/s] 60it [00:13, 4.58it/s] 61it [00:13, 4.61it/s] 62it [00:13, 4.62it/s] 63it [00:14, 4.64it/s] 64it [00:14, 4.64it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.67it/s] 68it [00:15, 4.52it/s] 69it [00:15, 4.58it/s] 70it [00:15, 4.61it/s] 71it [00:15, 4.63it/s] 72it [00:15, 4.58it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.63it/s] 75it [00:16, 4.64it/s] 76it [00:16, 4.50it/s] 77it [00:17, 4.57it/s] 78it [00:17, 4.60it/s] 79it [00:17, 4.63it/s] 80it [00:17, 4.64it/s] 81it [00:17, 4.50it/s] 82it [00:18, 4.56it/s] 83it [00:18, 4.60it/s] 84it [00:18, 4.62it/s] 85it [00:18, 4.64it/s] 86it [00:18, 4.64it/s] 87it [00:19, 4.51it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.59it/s] 90it [00:19, 4.60it/s] 91it [00:20, 4.56it/s] 92it [00:20, 4.59it/s] 93it [00:20, 4.62it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.50it/s] 96it [00:21, 4.55it/s] 97it [00:21, 4.59it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.63it/s] 100it [00:22, 4.63it/s]2025-05-25 23:21:44,928 - INFO - [Epoch 036 | Batch 0100] IWAE-loss 1601.9835 | mean log_px -0.0026 | KL -1416.70 + 101it [00:22, 4.65it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.46it/s] 104it [00:22, 4.50it/s] 105it [00:23, 4.51it/s] 106it [00:23, 4.53it/s] 107it [00:23, 4.55it/s] 108it [00:23, 4.55it/s] 109it [00:24, 4.58it/s] 110it [00:24, 4.59it/s] 111it [00:24, 4.58it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.60it/s] 114it [00:25, 4.62it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.62it/s] 117it [00:25, 4.62it/s] 118it [00:25, 4.63it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.64it/s] 122it [00:26, 4.48it/s] 123it [00:27, 4.52it/s] 124it [00:27, 4.51it/s] 125it [00:27, 4.54it/s] 126it [00:27, 4.55it/s] 127it [00:27, 4.56it/s] 128it [00:28, 4.58it/s] 129it [00:28, 4.45it/s] 130it [00:28, 4.49it/s] 131it [00:28, 4.48it/s] 132it [00:29, 4.51it/s] 133it [00:29, 4.51it/s] 134it [00:29, 4.52it/s] 135it [00:29, 4.54it/s] 136it [00:29, 4.38it/s] 137it [00:30, 4.46it/s] 138it [00:30, 4.49it/s] 139it [00:30, 4.55it/s] 140it [00:30, 4.59it/s] 141it [00:31, 4.62it/s] 142it [00:31, 4.49it/s] 143it [00:31, 4.56it/s] 144it [00:31, 4.59it/s] 145it [00:31, 4.63it/s] 146it [00:32, 4.65it/s] 147it [00:32, 4.51it/s] 148it [00:32, 4.57it/s] 149it [00:32, 4.61it/s] 150it [00:33, 4.63it/s]2025-05-25 23:21:55,899 - INFO - [Epoch 036 | Batch 0150] IWAE-loss 1938.5652 | mean log_px -0.0120 | KL -1410.55 + 151it [00:33, 4.65it/s] 152it [00:33, 4.51it/s] 153it [00:33, 4.58it/s] 154it [00:33, 4.61it/s] 155it [00:34, 4.65it/s] 156it [00:34, 4.64it/s] 157it [00:34, 4.51it/s] 158it [00:34, 4.57it/s] 159it [00:34, 4.61it/s] 160it [00:35, 4.49it/s] 161it [00:35, 4.57it/s] 162it [00:35, 4.60it/s] 163it [00:35, 4.63it/s] 164it [00:36, 4.64it/s] 165it [00:36, 4.51it/s] 166it [00:36, 4.57it/s] 167it [00:36, 4.61it/s] 168it [00:36, 4.62it/s] 169it [00:37, 4.64it/s] 170it [00:37, 4.65it/s] 171it [00:37, 4.52it/s] 172it [00:37, 4.58it/s] 173it [00:38, 4.62it/s] 174it [00:38, 4.64it/s] 175it [00:38, 4.65it/s] 176it [00:38, 4.65it/s] 177it [00:38, 4.47it/s] 178it [00:39, 4.54it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.61it/s] 181it [00:39, 4.61it/s] 182it [00:39, 4.60it/s] 183it [00:40, 4.55it/s] 184it [00:40, 4.58it/s] 185it [00:40, 4.61it/s] 186it [00:40, 4.63it/s] 187it [00:41, 4.49it/s] 188it [00:41, 4.54it/s] 189it [00:41, 4.57it/s] 190it [00:41, 4.58it/s] 191it [00:41, 4.60it/s] 192it [00:42, 4.46it/s] 193it [00:42, 4.53it/s] 194it [00:42, 4.55it/s] 195it [00:42, 4.45it/s] 196it [00:43, 4.51it/s] 196it [00:43, 4.54it/s] +2025-05-25 23:22:05,884 - INFO - Epoch: 36, Objective: tensor([1572.9171], device='cuda:0', grad_fn=), Loss: 0.004463386721909046, KL/n: 28.696121215820312 + 0it [00:00, ?it/s]2025-05-25 23:22:06,295 - INFO - [Epoch 037 | Batch 0000] IWAE-loss 1712.1151 | mean log_px -0.0071 | KL -1405.82 + 1it [00:00, 2.92it/s] 2it [00:00, 3.72it/s] 3it [00:00, 4.09it/s] 4it [00:00, 4.25it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.49it/s] 8it [00:01, 4.54it/s] 9it [00:02, 4.42it/s] 10it [00:02, 4.45it/s] 11it [00:02, 4.49it/s] 12it [00:02, 4.53it/s] 13it [00:02, 4.56it/s] 14it [00:03, 4.50it/s] 15it [00:03, 4.53it/s] 16it [00:03, 4.54it/s] 17it [00:03, 4.40it/s] 18it [00:04, 4.47it/s] 19it [00:04, 4.53it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.56it/s] 22it [00:04, 4.54it/s] 23it [00:05, 4.55it/s] 24it [00:05, 4.36it/s] 25it [00:05, 4.40it/s] 26it [00:05, 4.44it/s] 27it [00:06, 4.29it/s] 28it [00:06, 4.32it/s] 29it [00:06, 4.30it/s] 30it [00:06, 4.28it/s] 31it [00:07, 4.34it/s] 32it [00:07, 4.35it/s] 33it [00:07, 4.40it/s] 34it [00:07, 4.44it/s] 35it [00:07, 4.44it/s] 36it [00:08, 4.34it/s] 37it [00:08, 4.44it/s] 38it [00:08, 4.42it/s] 39it [00:08, 4.49it/s] 40it [00:09, 4.53it/s] 41it [00:09, 4.57it/s] 42it [00:09, 4.48it/s] 43it [00:09, 4.53it/s] 44it [00:09, 4.40it/s] 45it [00:10, 4.48it/s] 46it [00:10, 4.53it/s] 47it [00:10, 4.51it/s] 48it [00:10, 4.48it/s] 49it [00:11, 4.45it/s] 50it [00:11, 4.50it/s]2025-05-25 23:22:17,475 - INFO - [Epoch 037 | Batch 0050] IWAE-loss 1829.0848 | mean log_px -0.0077 | KL -1399.44 + 51it [00:11, 4.52it/s] 52it [00:11, 4.40it/s] 53it [00:11, 4.46it/s] 54it [00:12, 4.50it/s] 55it [00:12, 4.49it/s] 56it [00:12, 4.54it/s] 57it [00:12, 4.56it/s] 58it [00:13, 4.57it/s] 59it [00:13, 4.53it/s] 60it [00:13, 4.56it/s] 61it [00:13, 4.58it/s] 62it [00:13, 4.59it/s] 63it [00:14, 4.61it/s] 64it [00:14, 4.55it/s] 65it [00:14, 4.39it/s] 66it [00:14, 4.46it/s] 67it [00:15, 4.43it/s] 68it [00:15, 4.48it/s] 69it [00:15, 4.45it/s] 70it [00:15, 4.47it/s] 71it [00:15, 4.52it/s] 72it [00:16, 4.53it/s] 73it [00:16, 4.31it/s] 74it [00:16, 4.40it/s] 75it [00:16, 4.46it/s] 76it [00:17, 4.51it/s] 77it [00:17, 4.54it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.57it/s] 81it [00:18, 4.42it/s] 82it [00:18, 4.48it/s] 83it [00:18, 4.50it/s] 84it [00:18, 4.54it/s] 85it [00:19, 4.57it/s] 86it [00:19, 4.56it/s] 87it [00:19, 4.53it/s] 88it [00:19, 4.39it/s] 89it [00:19, 4.47it/s] 90it [00:20, 4.48it/s] 91it [00:20, 4.52it/s] 92it [00:20, 4.54it/s] 93it [00:20, 4.54it/s] 94it [00:21, 4.56it/s] 95it [00:21, 4.55it/s] 96it [00:21, 4.42it/s] 97it [00:21, 4.44it/s] 98it [00:21, 4.50it/s] 99it [00:22, 4.54it/s] 100it [00:22, 4.54it/s]2025-05-25 23:22:28,572 - INFO - [Epoch 037 | Batch 0100] IWAE-loss 1828.0680 | mean log_px -0.0090 | KL -1395.64 + 101it [00:22, 4.54it/s] 102it [00:22, 4.40it/s] 103it [00:23, 4.48it/s] 104it [00:23, 4.49it/s] 105it [00:23, 4.52it/s] 106it [00:23, 4.37it/s] 107it [00:23, 4.38it/s] 108it [00:24, 4.37it/s] 109it [00:24, 4.46it/s] 110it [00:24, 4.47it/s] 111it [00:24, 4.46it/s] 112it [00:25, 4.50it/s] 113it [00:25, 4.46it/s] 114it [00:25, 4.50it/s] 115it [00:25, 4.56it/s] 116it [00:25, 4.58it/s] 117it [00:26, 4.48it/s] 118it [00:26, 4.38it/s] 119it [00:26, 4.45it/s] 120it [00:26, 4.50it/s] 121it [00:27, 4.54it/s] 122it [00:27, 4.55it/s] 123it [00:27, 4.57it/s] 124it [00:27, 4.56it/s] 125it [00:27, 4.57it/s] 126it [00:28, 4.54it/s] 127it [00:28, 4.44it/s] 128it [00:28, 4.46it/s] 129it [00:28, 4.52it/s] 130it [00:29, 4.55it/s] 131it [00:29, 4.43it/s] 132it [00:29, 4.39it/s] 133it [00:29, 4.44it/s] 134it [00:30, 4.37it/s] 135it [00:30, 4.47it/s] 136it [00:30, 4.51it/s] 137it [00:30, 4.28it/s] 138it [00:30, 4.36it/s] 139it [00:31, 4.37it/s] 140it [00:31, 4.41it/s] 141it [00:31, 4.48it/s] 142it [00:31, 4.51it/s] 143it [00:32, 4.54it/s] 144it [00:32, 4.42it/s] 145it [00:32, 4.36it/s] 146it [00:32, 4.45it/s] 147it [00:32, 4.47it/s] 148it [00:33, 4.47it/s] 149it [00:33, 4.52it/s] 150it [00:33, 4.50it/s]2025-05-25 23:22:39,768 - INFO - [Epoch 037 | Batch 0150] IWAE-loss 2035.0342 | mean log_px -0.0140 | KL -1391.93 + 151it [00:33, 4.48it/s] 152it [00:34, 4.35it/s] 153it [00:34, 4.41it/s] 154it [00:34, 4.45it/s] 155it [00:34, 4.50it/s] 156it [00:34, 4.40it/s] 157it [00:35, 4.48it/s] 158it [00:35, 4.48it/s] 159it [00:35, 4.51it/s] 160it [00:35, 4.52it/s] 161it [00:36, 4.54it/s] 162it [00:36, 4.54it/s] 163it [00:36, 4.56it/s] 164it [00:36, 4.38it/s] 165it [00:36, 4.46it/s] 166it [00:37, 4.48it/s] 167it [00:37, 4.49it/s] 168it [00:37, 4.46it/s] 169it [00:37, 4.52it/s] 170it [00:38, 4.53it/s] 171it [00:38, 4.40it/s] 172it [00:38, 4.46it/s] 173it [00:38, 4.50it/s] 174it [00:38, 4.43it/s] 175it [00:39, 4.45it/s] 176it [00:39, 4.50it/s] 177it [00:39, 4.50it/s] 178it [00:39, 4.53it/s] 179it [00:40, 4.56it/s] 180it [00:40, 4.54it/s] 181it [00:40, 4.55it/s] 182it [00:40, 4.57it/s] 183it [00:40, 4.56it/s] 184it [00:41, 4.56it/s] 185it [00:41, 4.57it/s] 186it [00:41, 4.56it/s] 187it [00:41, 4.42it/s] 188it [00:42, 4.47it/s] 189it [00:42, 4.50it/s] 190it [00:42, 4.40it/s] 191it [00:42, 4.44it/s] 192it [00:42, 4.37it/s] 193it [00:43, 4.42it/s] 194it [00:43, 4.40it/s] 195it [00:43, 4.32it/s] 196it [00:43, 4.21it/s] 196it [00:43, 4.46it/s] +2025-05-25 23:22:50,008 - INFO - Epoch: 37, Objective: tensor([1723.5656], device='cuda:0', grad_fn=), Loss: 0.004755986854434013, KL/n: 28.372997283935547 + 0it [00:00, ?it/s]2025-05-25 23:22:50,605 - INFO - [Epoch 038 | Batch 0000] IWAE-loss 1650.8577 | mean log_px -0.0084 | KL -1389.24 + 1it [00:00, 2.92it/s] 2it [00:00, 3.65it/s] 3it [00:00, 4.04it/s] 4it [00:01, 4.22it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.35it/s] 8it [00:01, 4.44it/s] 9it [00:02, 4.48it/s] 10it [00:02, 4.51it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.55it/s] 13it [00:02, 4.59it/s] 14it [00:03, 4.60it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.45it/s] 17it [00:03, 4.50it/s] 18it [00:04, 4.52it/s] 19it [00:04, 4.55it/s] 20it [00:04, 4.55it/s] 21it [00:04, 4.57it/s] 22it [00:04, 4.56it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.58it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.51it/s] 27it [00:06, 4.51it/s] 28it [00:06, 4.54it/s] 29it [00:06, 4.56it/s] 30it [00:06, 4.41it/s] 31it [00:06, 4.48it/s] 32it [00:07, 4.47it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.48it/s] 35it [00:07, 4.52it/s] 36it [00:08, 4.53it/s] 37it [00:08, 4.57it/s] 38it [00:08, 4.57it/s] 39it [00:08, 4.43it/s] 40it [00:08, 4.50it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.51it/s] 44it [00:09, 4.54it/s] 45it [00:10, 4.56it/s] 46it [00:10, 4.56it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.58it/s] 49it [00:10, 4.59it/s] 50it [00:11, 4.43it/s]2025-05-25 23:23:01,653 - INFO - [Epoch 038 | Batch 0050] IWAE-loss 1416.7461 | mean log_px -0.0029 | KL -1381.36 + 51it [00:11, 4.49it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.53it/s] 54it [00:12, 4.55it/s] 55it [00:12, 4.55it/s] 56it [00:12, 4.56it/s] 57it [00:12, 4.56it/s] 58it [00:12, 4.56it/s] 59it [00:13, 4.59it/s] 60it [00:13, 4.59it/s] 61it [00:13, 4.60it/s] 62it [00:13, 4.61it/s] 63it [00:14, 4.45it/s] 64it [00:14, 4.48it/s] 65it [00:14, 4.53it/s] 66it [00:14, 4.56it/s] 67it [00:14, 4.58it/s] 68it [00:15, 4.58it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.33it/s] 71it [00:15, 4.43it/s] 72it [00:16, 4.49it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.56it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.62it/s] 77it [00:17, 4.63it/s] 78it [00:17, 4.63it/s] 79it [00:17, 4.48it/s] 80it [00:17, 4.53it/s] 81it [00:17, 4.57it/s] 82it [00:18, 4.61it/s] 83it [00:18, 4.61it/s] 84it [00:18, 4.62it/s] 85it [00:18, 4.63it/s] 86it [00:19, 4.63it/s] 87it [00:19, 4.62it/s] 88it [00:19, 4.62it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.49it/s] 91it [00:20, 4.54it/s] 92it [00:20, 4.55it/s] 93it [00:20, 4.59it/s] 94it [00:20, 4.61it/s] 95it [00:21, 4.60it/s] 96it [00:21, 4.60it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.60it/s] 99it [00:21, 4.60it/s] 100it [00:22, 4.59it/s]2025-05-25 23:23:12,588 - INFO - [Epoch 038 | Batch 0100] IWAE-loss 1494.8090 | mean log_px -0.0030 | KL -1374.98 + 101it [00:22, 4.61it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.62it/s] 105it [00:23, 4.62it/s] 106it [00:23, 4.62it/s] 107it [00:23, 4.62it/s] 108it [00:23, 4.62it/s] 109it [00:24, 4.49it/s] 110it [00:24, 4.53it/s] 111it [00:24, 4.54it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.60it/s] 114it [00:25, 4.60it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.62it/s] 117it [00:25, 4.61it/s] 118it [00:26, 4.49it/s] 119it [00:26, 4.55it/s] 120it [00:26, 4.57it/s] 121it [00:26, 4.59it/s] 122it [00:26, 4.59it/s] 123it [00:27, 4.61it/s] 124it [00:27, 4.62it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.63it/s] 128it [00:28, 4.63it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.58it/s] 131it [00:28, 4.59it/s] 132it [00:29, 4.60it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.63it/s] 135it [00:29, 4.47it/s] 136it [00:29, 4.52it/s] 137it [00:30, 4.55it/s] 138it [00:30, 4.57it/s] 139it [00:30, 4.59it/s] 140it [00:30, 4.60it/s] 141it [00:31, 4.62it/s] 142it [00:31, 4.61it/s] 143it [00:31, 4.47it/s] 144it [00:31, 4.52it/s] 145it [00:31, 4.56it/s] 146it [00:32, 4.58it/s] 147it [00:32, 4.55it/s] 148it [00:32, 4.58it/s] 149it [00:32, 4.60it/s] 150it [00:33, 4.60it/s]2025-05-25 23:23:23,499 - INFO - [Epoch 038 | Batch 0150] IWAE-loss 2008.2279 | mean log_px -0.0121 | KL -1368.49 + 151it [00:33, 4.62it/s] 152it [00:33, 4.50it/s] 153it [00:33, 4.56it/s] 154it [00:33, 4.57it/s] 155it [00:34, 4.59it/s] 156it [00:34, 4.60it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.63it/s] 160it [00:35, 4.63it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.63it/s] 164it [00:36, 4.48it/s] 165it [00:36, 4.53it/s] 166it [00:36, 4.56it/s] 167it [00:36, 4.58it/s] 168it [00:36, 4.57it/s] 169it [00:37, 4.44it/s] 170it [00:37, 4.50it/s] 171it [00:37, 4.55it/s] 172it [00:37, 4.56it/s] 173it [00:38, 4.58it/s] 174it [00:38, 4.57it/s] 175it [00:38, 4.59it/s] 176it [00:38, 4.45it/s] 177it [00:38, 4.51it/s] 178it [00:39, 4.52it/s] 179it [00:39, 4.53it/s] 180it [00:39, 4.54it/s] 181it [00:39, 4.57it/s] 182it [00:40, 4.59it/s] 183it [00:40, 4.46it/s] 184it [00:40, 4.51it/s] 185it [00:40, 4.55it/s] 186it [00:40, 4.56it/s] 187it [00:41, 4.59it/s] 188it [00:41, 4.60it/s] 189it [00:41, 4.60it/s] 190it [00:41, 4.61it/s] 191it [00:42, 4.47it/s] 192it [00:42, 4.53it/s] 193it [00:42, 4.55it/s] 194it [00:42, 4.57it/s] 195it [00:42, 4.46it/s] 196it [00:43, 4.53it/s] 196it [00:43, 4.54it/s] +2025-05-25 23:23:33,521 - INFO - Epoch: 38, Objective: tensor([1541.9781], device='cuda:0', grad_fn=), Loss: 0.006994233466684818, KL/n: 27.92793846130371 + 0it [00:00, ?it/s]2025-05-25 23:23:33,938 - INFO - [Epoch 039 | Batch 0000] IWAE-loss 2019.2355 | mean log_px -0.0157 | KL -1369.24 + 1it [00:00, 2.94it/s] 2it [00:00, 3.74it/s] 3it [00:00, 3.93it/s] 4it [00:01, 4.20it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.48it/s] 8it [00:01, 4.40it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.43it/s] 13it [00:03, 4.44it/s] 14it [00:03, 4.52it/s] 15it [00:03, 4.49it/s] 16it [00:03, 4.44it/s] 17it [00:03, 4.49it/s] 18it [00:04, 4.52it/s] 19it [00:04, 4.55it/s] 20it [00:04, 4.56it/s] 21it [00:04, 4.46it/s] 22it [00:04, 4.52it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.57it/s] 25it [00:05, 4.60it/s] 26it [00:05, 4.61it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.64it/s] 30it [00:06, 4.63it/s] 31it [00:06, 4.64it/s] 32it [00:07, 4.66it/s] 33it [00:07, 4.66it/s] 34it [00:07, 4.64it/s] 35it [00:07, 4.65it/s] 36it [00:08, 4.64it/s] 37it [00:08, 4.63it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.46it/s] 40it [00:08, 4.51it/s] 41it [00:09, 4.56it/s] 42it [00:09, 4.58it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.61it/s] 45it [00:09, 4.64it/s] 46it [00:10, 4.64it/s] 47it [00:10, 4.65it/s] 48it [00:10, 4.65it/s] 49it [00:10, 4.61it/s] 50it [00:11, 4.61it/s]2025-05-25 23:23:44,871 - INFO - [Epoch 039 | Batch 0050] IWAE-loss 1660.3208 | mean log_px -0.0043 | KL -1355.90 + 51it [00:11, 4.63it/s] 52it [00:11, 4.61it/s] 53it [00:11, 4.61it/s] 54it [00:11, 4.64it/s] 55it [00:12, 4.50it/s] 56it [00:12, 4.53it/s] 57it [00:12, 4.57it/s] 58it [00:12, 4.59it/s] 59it [00:13, 4.62it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.63it/s] 63it [00:13, 4.63it/s] 64it [00:14, 4.49it/s] 65it [00:14, 4.54it/s] 66it [00:14, 4.57it/s] 67it [00:14, 4.59it/s] 68it [00:14, 4.62it/s] 69it [00:15, 4.61it/s] 70it [00:15, 4.61it/s] 71it [00:15, 4.65it/s] 72it [00:15, 4.64it/s] 73it [00:16, 4.53it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.62it/s] 77it [00:16, 4.62it/s] 78it [00:17, 4.62it/s] 79it [00:17, 3.68it/s] 80it [00:17, 3.93it/s] 81it [00:17, 4.12it/s] 82it [00:18, 4.24it/s] 83it [00:18, 4.34it/s] 84it [00:18, 4.42it/s] 85it [00:18, 4.50it/s] 86it [00:19, 4.53it/s] 87it [00:19, 4.42it/s] 88it [00:19, 4.51it/s] 89it [00:19, 4.55it/s] 90it [00:19, 4.58it/s] 91it [00:20, 4.60it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.62it/s] 94it [00:20, 4.62it/s] 95it [00:21, 4.43it/s] 96it [00:21, 4.49it/s] 97it [00:21, 4.54it/s] 98it [00:21, 4.57it/s] 99it [00:21, 4.59it/s] 100it [00:22, 4.60it/s]2025-05-25 23:23:55,949 - INFO - [Epoch 039 | Batch 0100] IWAE-loss 2246.3765 | mean log_px -0.0212 | KL -1355.14 + 101it [00:22, 4.58it/s] 102it [00:22, 4.59it/s] 103it [00:22, 4.61it/s] 104it [00:23, 4.60it/s] 105it [00:23, 4.35it/s] 106it [00:23, 4.44it/s] 107it [00:23, 4.50it/s] 108it [00:23, 4.53it/s] 109it [00:24, 4.56it/s] 110it [00:24, 4.59it/s] 111it [00:24, 4.62it/s] 112it [00:24, 4.63it/s] 113it [00:24, 4.65it/s] 114it [00:25, 4.50it/s] 115it [00:25, 4.55it/s] 116it [00:25, 4.58it/s] 117it [00:25, 4.59it/s] 118it [00:26, 4.60it/s] 119it [00:26, 4.62it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.64it/s] 122it [00:26, 4.64it/s] 123it [00:27, 4.60it/s] 124it [00:27, 4.63it/s] 125it [00:27, 4.64it/s] 126it [00:27, 4.63it/s] 127it [00:28, 4.62it/s] 128it [00:28, 4.62it/s] 129it [00:28, 4.63it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.66it/s] 132it [00:29, 4.49it/s] 133it [00:29, 4.55it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.61it/s] 137it [00:30, 4.63it/s] 138it [00:30, 4.50it/s] 139it [00:30, 4.57it/s] 140it [00:30, 4.43it/s] 141it [00:31, 4.50it/s] 142it [00:31, 4.54it/s] 143it [00:31, 4.58it/s] 144it [00:31, 4.60it/s] 145it [00:31, 4.61it/s] 146it [00:32, 4.47it/s] 147it [00:32, 4.53it/s] 148it [00:32, 4.57it/s] 149it [00:32, 4.59it/s] 150it [00:33, 4.60it/s]2025-05-25 23:24:06,876 - INFO - [Epoch 039 | Batch 0150] IWAE-loss 1432.8291 | mean log_px -0.0022 | KL -1358.02 + 151it [00:33, 4.61it/s] 152it [00:33, 4.63it/s] 153it [00:33, 4.62it/s] 154it [00:33, 4.63it/s] 155it [00:34, 4.50it/s] 156it [00:34, 4.54it/s] 157it [00:34, 4.51it/s] 158it [00:34, 4.46it/s] 159it [00:35, 4.51it/s] 160it [00:35, 4.56it/s] 161it [00:35, 4.60it/s] 162it [00:35, 4.62it/s] 163it [00:35, 4.54it/s] 164it [00:36, 4.43it/s] 165it [00:36, 4.39it/s] 166it [00:36, 4.46it/s] 167it [00:36, 4.53it/s] 168it [00:37, 4.55it/s] 169it [00:37, 4.58it/s] 170it [00:37, 4.59it/s] 171it [00:37, 4.61it/s] 172it [00:37, 4.62it/s] 173it [00:38, 4.63it/s] 174it [00:38, 4.50it/s] 175it [00:38, 4.40it/s] 176it [00:38, 4.44it/s] 177it [00:39, 4.49it/s] 178it [00:39, 4.53it/s] 179it [00:39, 4.56it/s] 180it [00:39, 4.59it/s] 181it [00:39, 4.61it/s] 182it [00:40, 4.62it/s] 183it [00:40, 4.62it/s] 184it [00:40, 4.63it/s] 185it [00:40, 4.49it/s] 186it [00:40, 4.54it/s] 187it [00:41, 4.58it/s] 188it [00:41, 4.59it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.62it/s] 191it [00:42, 4.64it/s] 192it [00:42, 4.63it/s] 193it [00:42, 4.49it/s] 194it [00:42, 4.41it/s] 195it [00:42, 4.30it/s] 196it [00:43, 4.38it/s] 196it [00:43, 4.53it/s] +2025-05-25 23:24:16,934 - INFO - Epoch: 39, Objective: tensor([1496.1766], device='cuda:0', grad_fn=), Loss: 0.00248352880589664, KL/n: 27.671977996826172 + 0it [00:00, ?it/s]2025-05-25 23:24:17,313 - INFO - [Epoch 040 | Batch 0000] IWAE-loss 1431.6737 | mean log_px -0.0017 | KL -1354.64 + 1it [00:00, 3.28it/s] 2it [00:00, 3.97it/s] 3it [00:00, 4.26it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.49it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.54it/s] 8it [00:01, 4.57it/s] 9it [00:02, 4.60it/s] 10it [00:02, 4.61it/s] 11it [00:02, 4.64it/s] 12it [00:02, 4.46it/s] 13it [00:02, 4.53it/s] 14it [00:03, 4.56it/s] 15it [00:03, 4.61it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.65it/s] 18it [00:03, 4.66it/s] 19it [00:04, 4.68it/s] 20it [00:04, 4.69it/s] 21it [00:04, 4.66it/s] 22it [00:04, 4.66it/s] 23it [00:05, 4.68it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.59it/s] 26it [00:05, 4.60it/s] 27it [00:05, 4.63it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.63it/s] 31it [00:06, 4.64it/s] 32it [00:07, 4.64it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.66it/s] 36it [00:07, 4.66it/s] 37it [00:08, 4.66it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.66it/s] 41it [00:08, 4.67it/s] 42it [00:09, 4.66it/s] 43it [00:09, 4.67it/s] 44it [00:09, 4.66it/s] 45it [00:09, 4.66it/s] 46it [00:10, 4.65it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.48it/s] 49it [00:10, 4.56it/s] 50it [00:10, 4.58it/s]2025-05-25 23:24:28,119 - INFO - [Epoch 040 | Batch 0050] IWAE-loss 1473.0669 | mean log_px -0.0033 | KL -1345.21 + 51it [00:11, 4.61it/s] 52it [00:11, 4.56it/s] 53it [00:11, 4.58it/s] 54it [00:11, 4.59it/s] 55it [00:11, 4.62it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.64it/s] 58it [00:12, 4.63it/s] 59it [00:12, 4.64it/s] 60it [00:13, 4.64it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.65it/s] 63it [00:13, 4.65it/s] 64it [00:13, 4.65it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.49it/s] 67it [00:14, 4.55it/s] 68it [00:14, 4.57it/s] 69it [00:15, 4.61it/s] 70it [00:15, 4.61it/s] 71it [00:15, 4.62it/s] 72it [00:15, 4.61it/s] 73it [00:15, 4.62it/s] 74it [00:16, 4.64it/s] 75it [00:16, 4.64it/s] 76it [00:16, 4.64it/s] 77it [00:16, 4.64it/s] 78it [00:16, 4.64it/s] 79it [00:17, 4.65it/s] 80it [00:17, 4.63it/s] 81it [00:17, 4.63it/s] 82it [00:17, 4.64it/s] 83it [00:18, 4.65it/s] 84it [00:18, 4.64it/s] 85it [00:18, 4.65it/s] 86it [00:18, 4.64it/s] 87it [00:18, 4.61it/s] 88it [00:19, 4.62it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.63it/s] 91it [00:19, 4.64it/s] 92it [00:19, 4.53it/s] 93it [00:20, 4.58it/s] 94it [00:20, 4.60it/s] 95it [00:20, 4.62it/s] 96it [00:20, 4.63it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.51it/s] 99it [00:21, 4.56it/s] 100it [00:21, 4.60it/s]2025-05-25 23:24:38,950 - INFO - [Epoch 040 | Batch 0100] IWAE-loss 1605.0006 | mean log_px -0.0037 | KL -1343.43 + 101it [00:21, 4.63it/s] 102it [00:22, 4.63it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.63it/s] 105it [00:22, 4.44it/s] 106it [00:23, 4.46it/s] 107it [00:23, 4.48it/s] 108it [00:23, 4.48it/s] 109it [00:23, 4.49it/s] 110it [00:23, 4.49it/s] 111it [00:24, 4.53it/s] 112it [00:24, 4.56it/s] 113it [00:24, 4.46it/s] 114it [00:24, 4.51it/s] 115it [00:25, 4.57it/s] 116it [00:25, 4.59it/s] 117it [00:25, 4.60it/s] 118it [00:25, 4.57it/s] 119it [00:25, 4.61it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.63it/s] 122it [00:26, 4.64it/s] 123it [00:26, 4.65it/s] 124it [00:26, 4.64it/s] 125it [00:27, 4.64it/s] 126it [00:27, 4.64it/s] 127it [00:27, 4.62it/s] 128it [00:27, 4.64it/s] 129it [00:28, 4.65it/s] 130it [00:28, 4.65it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.52it/s] 133it [00:28, 4.58it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.63it/s] 136it [00:29, 4.63it/s] 137it [00:29, 4.65it/s] 138it [00:30, 4.64it/s] 139it [00:30, 4.64it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.55it/s] 142it [00:30, 4.60it/s] 143it [00:31, 4.62it/s] 144it [00:31, 4.62it/s] 145it [00:31, 4.63it/s] 146it [00:31, 4.48it/s] 147it [00:31, 4.53it/s] 148it [00:32, 4.56it/s] 149it [00:32, 4.60it/s] 150it [00:32, 4.61it/s]2025-05-25 23:24:49,849 - INFO - [Epoch 040 | Batch 0150] IWAE-loss 1694.4125 | mean log_px -0.0137 | KL -1343.96 + 151it [00:32, 4.62it/s] 152it [00:33, 4.62it/s] 153it [00:33, 4.63it/s] 154it [00:33, 4.64it/s] 155it [00:33, 4.55it/s] 156it [00:33, 4.60it/s] 157it [00:34, 4.61it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.63it/s] 160it [00:34, 4.63it/s] 161it [00:35, 4.65it/s] 162it [00:35, 4.55it/s] 163it [00:35, 4.59it/s] 164it [00:35, 4.60it/s] 165it [00:35, 4.63it/s] 166it [00:36, 4.65it/s] 167it [00:36, 4.55it/s] 168it [00:36, 4.59it/s] 169it [00:36, 4.61it/s] 170it [00:36, 4.57it/s] 171it [00:37, 4.54it/s] 172it [00:37, 4.58it/s] 173it [00:37, 4.45it/s] 174it [00:37, 4.52it/s] 175it [00:38, 4.56it/s] 176it [00:38, 4.58it/s] 177it [00:38, 4.61it/s] 178it [00:38, 4.61it/s] 179it [00:38, 4.62it/s] 180it [00:39, 4.49it/s] 181it [00:39, 4.55it/s] 182it [00:39, 4.58it/s] 183it [00:39, 4.60it/s] 184it [00:40, 4.60it/s] 185it [00:40, 4.62it/s] 186it [00:40, 4.48it/s] 187it [00:40, 4.53it/s] 188it [00:40, 4.55it/s] 189it [00:41, 4.59it/s] 190it [00:41, 4.60it/s] 191it [00:41, 4.61it/s] 192it [00:41, 4.62it/s] 193it [00:42, 4.50it/s] 194it [00:42, 4.54it/s] 195it [00:42, 4.24it/s] 196it [00:42, 4.36it/s] 196it [00:42, 4.58it/s] +2025-05-25 23:24:59,859 - INFO - Epoch: 40, Objective: tensor([1448.3232], device='cuda:0', grad_fn=), Loss: 0.0037635706830769777, KL/n: 27.25246238708496 + 0it [00:00, ?it/s]2025-05-25 23:25:00,450 - INFO - [Epoch 041 | Batch 0000] IWAE-loss 1551.8910 | mean log_px -0.0058 | KL -1334.23 + 1it [00:00, 2.93it/s] 2it [00:00, 3.72it/s] 3it [00:00, 4.10it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.42it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.38it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.45it/s] 10it [00:02, 4.32it/s] 11it [00:02, 4.16it/s] 12it [00:02, 4.19it/s] 13it [00:03, 4.21it/s] 14it [00:03, 4.29it/s] 15it [00:03, 4.34it/s] 16it [00:03, 4.34it/s] 17it [00:03, 4.34it/s] 18it [00:04, 4.36it/s] 19it [00:04, 4.37it/s] 20it [00:04, 4.26it/s] 21it [00:04, 4.37it/s] 22it [00:05, 4.44it/s] 23it [00:05, 4.50it/s] 24it [00:05, 4.52it/s] 25it [00:05, 4.53it/s] 26it [00:05, 4.57it/s] 27it [00:06, 4.61it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.67it/s] 31it [00:07, 4.52it/s] 32it [00:07, 4.59it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.65it/s] 36it [00:08, 4.66it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.66it/s] 40it [00:09, 4.68it/s] 41it [00:09, 4.52it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.58it/s] 45it [00:10, 4.60it/s] 46it [00:10, 4.61it/s] 47it [00:10, 4.62it/s] 48it [00:10, 4.59it/s] 49it [00:11, 4.31it/s] 50it [00:11, 4.36it/s]2025-05-25 23:25:11,577 - INFO - [Epoch 041 | Batch 0050] IWAE-loss 1382.9540 | mean log_px -0.0018 | KL -1326.47 + 51it [00:11, 4.42it/s] 52it [00:11, 4.46it/s] 53it [00:11, 4.51it/s] 54it [00:12, 4.52it/s] 55it [00:12, 4.55it/s] 56it [00:12, 4.52it/s] 57it [00:12, 4.54it/s] 58it [00:12, 4.56it/s] 59it [00:13, 4.58it/s] 60it [00:13, 4.58it/s] 61it [00:13, 4.60it/s] 62it [00:13, 4.60it/s] 63it [00:14, 4.62it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.62it/s] 67it [00:14, 4.61it/s] 68it [00:15, 4.60it/s] 69it [00:15, 4.60it/s] 70it [00:15, 4.47it/s] 71it [00:15, 4.53it/s] 72it [00:16, 4.56it/s] 73it [00:16, 4.58it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.60it/s] 77it [00:17, 4.58it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.60it/s] 81it [00:18, 4.61it/s] 82it [00:18, 4.60it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.48it/s] 85it [00:18, 4.53it/s] 86it [00:19, 4.56it/s] 87it [00:19, 4.58it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.61it/s] 90it [00:19, 4.62it/s] 91it [00:20, 4.62it/s] 92it [00:20, 4.58it/s] 93it [00:20, 4.45it/s] 94it [00:20, 4.51it/s] 95it [00:21, 4.55it/s] 96it [00:21, 4.56it/s] 97it [00:21, 4.57it/s] 98it [00:21, 4.58it/s] 99it [00:21, 4.58it/s] 100it [00:22, 4.54it/s]2025-05-25 23:25:22,502 - INFO - [Epoch 041 | Batch 0100] IWAE-loss 1411.5579 | mean log_px -0.0019 | KL -1321.44 + 101it [00:22, 4.56it/s] 102it [00:22, 4.44it/s] 103it [00:22, 4.50it/s] 104it [00:23, 4.51it/s] 105it [00:23, 4.56it/s] 106it [00:23, 4.57it/s] 107it [00:23, 4.58it/s] 108it [00:23, 4.59it/s] 109it [00:24, 4.47it/s] 110it [00:24, 4.53it/s] 111it [00:24, 4.58it/s] 112it [00:24, 4.60it/s] 113it [00:25, 4.62it/s] 114it [00:25, 4.63it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.48it/s] 117it [00:25, 4.55it/s] 118it [00:26, 4.57it/s] 119it [00:26, 4.61it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.63it/s] 122it [00:27, 4.46it/s] 123it [00:27, 4.54it/s] 124it [00:27, 4.56it/s] 125it [00:27, 4.58it/s] 126it [00:27, 4.60it/s] 127it [00:28, 4.61it/s] 128it [00:28, 4.59it/s] 129it [00:28, 4.56it/s] 130it [00:28, 4.58it/s] 131it [00:28, 4.61it/s] 132it [00:29, 4.62it/s] 133it [00:29, 4.64it/s] 134it [00:29, 4.52it/s] 135it [00:29, 4.58it/s] 136it [00:30, 4.60it/s] 137it [00:30, 4.60it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.63it/s] 140it [00:30, 4.64it/s] 141it [00:31, 4.48it/s] 142it [00:31, 4.53it/s] 143it [00:31, 4.57it/s] 144it [00:31, 4.60it/s] 145it [00:32, 4.62it/s] 146it [00:32, 4.62it/s] 147it [00:32, 4.64it/s] 148it [00:32, 4.64it/s] 149it [00:32, 4.65it/s] 150it [00:33, 4.49it/s]2025-05-25 23:25:33,435 - INFO - [Epoch 041 | Batch 0150] IWAE-loss 1899.3881 | mean log_px -0.0105 | KL -1315.73 + 151it [00:33, 4.55it/s] 152it [00:33, 4.58it/s] 153it [00:33, 4.59it/s] 154it [00:33, 4.57it/s] 155it [00:34, 4.59it/s] 156it [00:34, 4.61it/s] 157it [00:34, 4.57it/s] 158it [00:34, 4.60it/s] 159it [00:35, 4.47it/s] 160it [00:35, 4.52it/s] 161it [00:35, 4.56it/s] 162it [00:35, 4.58it/s] 163it [00:35, 4.56it/s] 164it [00:36, 4.57it/s] 165it [00:36, 4.61it/s] 166it [00:36, 4.61it/s] 167it [00:36, 4.64it/s] 168it [00:37, 4.64it/s] 169it [00:37, 4.48it/s] 170it [00:37, 4.53it/s] 171it [00:37, 4.56it/s] 172it [00:37, 4.52it/s] 173it [00:38, 4.58it/s] 174it [00:38, 4.60it/s] 175it [00:38, 4.62it/s] 176it [00:38, 4.48it/s] 177it [00:39, 4.53it/s] 178it [00:39, 4.58it/s] 179it [00:39, 4.58it/s] 180it [00:39, 4.59it/s] 181it [00:39, 4.58it/s] 182it [00:40, 4.62it/s] 183it [00:40, 4.65it/s] 184it [00:40, 4.66it/s] 185it [00:40, 4.67it/s] 186it [00:40, 4.67it/s] 187it [00:41, 4.68it/s] 188it [00:41, 4.51it/s] 189it [00:41, 4.58it/s] 190it [00:41, 4.55it/s] 191it [00:42, 4.46it/s] 192it [00:42, 4.46it/s] 193it [00:42, 4.51it/s] 194it [00:42, 4.56it/s] 195it [00:42, 4.49it/s] 196it [00:43, 4.56it/s] 196it [00:43, 4.53it/s] +2025-05-25 23:25:43,411 - INFO - Epoch: 41, Objective: tensor([1496.4008], device='cuda:0', grad_fn=), Loss: 0.004434915725141764, KL/n: 26.789295196533203 + 0it [00:00, ?it/s]2025-05-25 23:25:43,792 - INFO - [Epoch 042 | Batch 0000] IWAE-loss 1575.5166 | mean log_px -0.0100 | KL -1312.57 + 1it [00:00, 3.04it/s] 2it [00:00, 3.81it/s] 3it [00:00, 4.17it/s] 4it [00:00, 4.35it/s] 5it [00:01, 4.47it/s] 6it [00:01, 4.54it/s] 7it [00:01, 4.59it/s] 8it [00:01, 4.62it/s] 9it [00:02, 4.65it/s] 10it [00:02, 4.49it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.48it/s] 15it [00:03, 4.56it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.62it/s] 18it [00:04, 4.64it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.65it/s] 21it [00:04, 4.50it/s] 22it [00:04, 4.57it/s] 23it [00:05, 4.61it/s] 24it [00:05, 4.63it/s] 25it [00:05, 4.65it/s] 26it [00:05, 4.66it/s] 27it [00:05, 4.67it/s] 28it [00:06, 4.50it/s] 29it [00:06, 4.58it/s] 30it [00:06, 4.60it/s] 31it [00:06, 4.64it/s] 32it [00:07, 4.65it/s] 33it [00:07, 4.67it/s] 34it [00:07, 4.67it/s] 35it [00:07, 4.68it/s] 36it [00:07, 4.64it/s] 37it [00:08, 4.50it/s] 38it [00:08, 4.57it/s] 39it [00:08, 3.65it/s] 40it [00:08, 3.90it/s] 41it [00:09, 4.12it/s] 42it [00:09, 4.13it/s] 43it [00:09, 4.30it/s] 44it [00:09, 4.41it/s] 45it [00:10, 4.50it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.44it/s] 49it [00:10, 4.53it/s] 50it [00:11, 4.57it/s]2025-05-25 23:25:54,850 - INFO - [Epoch 042 | Batch 0050] IWAE-loss 1876.5878 | mean log_px -0.0155 | KL -1306.35 + 51it [00:11, 4.60it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.49it/s] 54it [00:12, 4.56it/s] 55it [00:12, 4.60it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.64it/s] 58it [00:12, 4.46it/s] 59it [00:13, 4.55it/s] 60it [00:13, 4.58it/s] 61it [00:13, 4.62it/s] 62it [00:13, 4.63it/s] 63it [00:13, 4.64it/s] 64it [00:14, 4.49it/s] 65it [00:14, 4.57it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.63it/s] 68it [00:15, 4.65it/s] 69it [00:15, 4.67it/s] 70it [00:15, 4.67it/s] 71it [00:15, 4.69it/s] 72it [00:15, 4.69it/s] 73it [00:16, 4.50it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.62it/s] 77it [00:17, 4.64it/s] 78it [00:17, 4.66it/s] 79it [00:17, 4.68it/s] 80it [00:17, 4.67it/s] 81it [00:17, 4.52it/s] 82it [00:18, 4.59it/s] 83it [00:18, 4.62it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.65it/s] 86it [00:18, 4.66it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.65it/s] 89it [00:19, 4.67it/s] 90it [00:19, 4.50it/s] 91it [00:20, 4.56it/s] 92it [00:20, 4.59it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.66it/s] 96it [00:21, 4.67it/s] 97it [00:21, 4.68it/s] 98it [00:21, 4.67it/s] 99it [00:21, 4.69it/s] 100it [00:21, 4.68it/s]2025-05-25 23:26:05,670 - INFO - [Epoch 042 | Batch 0100] IWAE-loss 1476.0132 | mean log_px -0.0030 | KL -1307.70 + 101it [00:22, 4.52it/s] 102it [00:22, 4.58it/s] 103it [00:22, 4.60it/s] 104it [00:22, 4.61it/s] 105it [00:23, 4.64it/s] 106it [00:23, 4.64it/s] 107it [00:23, 4.60it/s] 108it [00:23, 4.64it/s] 109it [00:23, 4.65it/s] 110it [00:24, 4.50it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.62it/s] 114it [00:25, 4.63it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.65it/s] 117it [00:25, 4.67it/s] 118it [00:25, 4.66it/s] 119it [00:26, 4.68it/s] 120it [00:26, 4.52it/s] 121it [00:26, 4.56it/s] 122it [00:26, 4.60it/s] 123it [00:26, 4.63it/s] 124it [00:27, 4.64it/s] 125it [00:27, 4.67it/s] 126it [00:27, 4.67it/s] 127it [00:27, 4.51it/s] 128it [00:28, 4.57it/s] 129it [00:28, 4.58it/s] 130it [00:28, 4.57it/s] 131it [00:28, 4.61it/s] 132it [00:28, 4.62it/s] 133it [00:29, 4.48it/s] 134it [00:29, 4.55it/s] 135it [00:29, 4.59it/s] 136it [00:29, 4.62it/s] 137it [00:30, 4.64it/s] 138it [00:30, 4.59it/s] 139it [00:30, 4.55it/s] 140it [00:30, 4.42it/s] 141it [00:30, 4.51it/s] 142it [00:31, 4.56it/s] 143it [00:31, 4.60it/s] 144it [00:31, 4.61it/s] 145it [00:31, 4.63it/s] 146it [00:32, 4.47it/s] 147it [00:32, 4.54it/s] 148it [00:32, 4.58it/s] 149it [00:32, 4.60it/s] 150it [00:32, 4.62it/s]2025-05-25 23:26:16,567 - INFO - [Epoch 042 | Batch 0150] IWAE-loss 1960.0638 | mean log_px -0.0210 | KL -1302.23 + 151it [00:33, 4.48it/s] 152it [00:33, 4.53it/s] 153it [00:33, 4.41it/s] 154it [00:33, 4.40it/s] 155it [00:33, 4.48it/s] 156it [00:34, 4.54it/s] 157it [00:34, 4.58it/s] 158it [00:34, 4.45it/s] 159it [00:34, 4.52it/s] 160it [00:35, 4.57it/s] 161it [00:35, 4.61it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.67it/s] 164it [00:35, 4.67it/s] 165it [00:36, 4.67it/s] 166it [00:36, 4.68it/s] 167it [00:36, 4.52it/s] 168it [00:36, 4.57it/s] 169it [00:37, 4.54it/s] 170it [00:37, 4.59it/s] 171it [00:37, 4.61it/s] 172it [00:37, 4.63it/s] 173it [00:37, 4.49it/s] 174it [00:38, 4.56it/s] 175it [00:38, 4.60it/s] 176it [00:38, 4.62it/s] 177it [00:38, 4.63it/s] 178it [00:38, 4.64it/s] 179it [00:39, 4.67it/s] 180it [00:39, 4.67it/s] 181it [00:39, 4.68it/s] 182it [00:39, 4.67it/s] 183it [00:40, 4.51it/s] 184it [00:40, 4.57it/s] 185it [00:40, 4.60it/s] 186it [00:40, 4.42it/s] 187it [00:40, 4.47it/s] 188it [00:41, 4.47it/s] 189it [00:41, 4.48it/s] 190it [00:41, 4.48it/s] 191it [00:41, 4.50it/s] 192it [00:42, 4.39it/s] 193it [00:42, 4.45it/s] 194it [00:42, 4.48it/s] 195it [00:42, 4.26it/s] 196it [00:43, 4.36it/s] 196it [00:43, 4.55it/s] +2025-05-25 23:26:26,643 - INFO - Epoch: 42, Objective: tensor([1482.2252], device='cuda:0', grad_fn=), Loss: 0.007103536278009415, KL/n: 26.547670364379883 + 0it [00:00, ?it/s]2025-05-25 23:26:27,061 - INFO - [Epoch 043 | Batch 0000] IWAE-loss 1369.3737 | mean log_px -0.0017 | KL -1301.93 + 1it [00:00, 2.93it/s] 2it [00:00, 3.71it/s] 3it [00:00, 4.05it/s] 4it [00:01, 4.11it/s] 5it [00:01, 4.30it/s] 6it [00:01, 4.40it/s] 7it [00:01, 4.48it/s] 8it [00:01, 4.38it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.51it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.57it/s] 13it [00:02, 4.57it/s] 14it [00:03, 4.58it/s] 15it [00:03, 4.58it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.59it/s] 18it [00:04, 4.44it/s] 19it [00:04, 4.50it/s] 20it [00:04, 4.52it/s] 21it [00:04, 4.54it/s] 22it [00:04, 4.56it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.51it/s] 25it [00:05, 4.56it/s] 26it [00:05, 4.57it/s] 27it [00:06, 4.57it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.45it/s] 30it [00:06, 4.50it/s] 31it [00:06, 4.50it/s] 32it [00:07, 4.54it/s] 33it [00:07, 4.48it/s] 34it [00:07, 4.52it/s] 35it [00:07, 4.55it/s] 36it [00:08, 4.42it/s] 37it [00:08, 4.49it/s] 38it [00:08, 4.53it/s] 39it [00:08, 4.53it/s] 40it [00:08, 4.56it/s] 41it [00:09, 4.57it/s] 42it [00:09, 4.57it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.59it/s] 45it [00:10, 4.60it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.56it/s] 48it [00:10, 4.57it/s] 49it [00:10, 4.57it/s] 50it [00:11, 4.58it/s]2025-05-25 23:26:38,069 - INFO - [Epoch 043 | Batch 0050] IWAE-loss 1440.7559 | mean log_px -0.0027 | KL -1296.14 + 51it [00:11, 4.44it/s] 52it [00:11, 4.46it/s] 53it [00:11, 4.52it/s] 54it [00:12, 4.55it/s] 55it [00:12, 4.58it/s] 56it [00:12, 4.61it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.63it/s] 59it [00:13, 4.65it/s] 60it [00:13, 4.64it/s] 61it [00:13, 4.61it/s] 62it [00:13, 4.61it/s] 63it [00:13, 4.62it/s] 64it [00:14, 4.63it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.64it/s] 67it [00:14, 4.64it/s] 68it [00:15, 4.64it/s] 69it [00:15, 4.64it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.62it/s] 72it [00:15, 4.63it/s] 73it [00:16, 4.65it/s] 74it [00:16, 4.65it/s] 75it [00:16, 4.65it/s] 76it [00:16, 4.65it/s] 77it [00:16, 4.64it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.65it/s] 80it [00:17, 4.65it/s] 81it [00:17, 4.65it/s] 82it [00:18, 4.64it/s] 83it [00:18, 4.65it/s] 84it [00:18, 4.42it/s] 85it [00:18, 4.50it/s] 86it [00:18, 4.55it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.61it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.49it/s] 91it [00:20, 4.55it/s] 92it [00:20, 4.57it/s] 93it [00:20, 4.50it/s] 94it [00:20, 4.55it/s] 95it [00:20, 4.58it/s] 96it [00:21, 4.60it/s] 97it [00:21, 4.63it/s] 98it [00:21, 4.50it/s] 99it [00:21, 4.55it/s] 100it [00:22, 4.57it/s]2025-05-25 23:26:48,949 - INFO - [Epoch 043 | Batch 0100] IWAE-loss 1553.6163 | mean log_px -0.0052 | KL -1291.85 + 101it [00:22, 4.61it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.48it/s] 105it [00:23, 4.51it/s] 106it [00:23, 4.53it/s] 107it [00:23, 4.56it/s] 108it [00:23, 4.60it/s] 109it [00:23, 4.64it/s] 110it [00:24, 4.65it/s] 111it [00:24, 4.68it/s] 112it [00:24, 4.53it/s] 113it [00:24, 4.60it/s] 114it [00:25, 4.64it/s] 115it [00:25, 4.66it/s] 116it [00:25, 4.67it/s] 117it [00:25, 4.70it/s] 118it [00:25, 4.70it/s] 119it [00:26, 4.54it/s] 120it [00:26, 4.61it/s] 121it [00:26, 4.64it/s] 122it [00:26, 4.66it/s] 123it [00:26, 4.68it/s] 124it [00:27, 4.69it/s] 125it [00:27, 4.69it/s] 126it [00:27, 4.52it/s] 127it [00:27, 4.60it/s] 128it [00:28, 4.63it/s] 129it [00:28, 4.63it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.63it/s] 132it [00:28, 4.66it/s] 133it [00:29, 4.68it/s] 134it [00:29, 4.53it/s] 135it [00:29, 4.59it/s] 136it [00:29, 4.63it/s] 137it [00:30, 4.65it/s] 138it [00:30, 4.66it/s] 139it [00:30, 4.68it/s] 140it [00:30, 4.53it/s] 141it [00:30, 4.59it/s] 142it [00:31, 4.63it/s] 143it [00:31, 4.65it/s] 144it [00:31, 4.65it/s] 145it [00:31, 4.51it/s] 146it [00:31, 4.58it/s] 147it [00:32, 4.62it/s] 148it [00:32, 4.64it/s] 149it [00:32, 4.67it/s] 150it [00:32, 4.68it/s]2025-05-25 23:26:59,763 - INFO - [Epoch 043 | Batch 0150] IWAE-loss 2060.3196 | mean log_px -0.0110 | KL -1286.15 + 151it [00:33, 4.52it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.63it/s] 154it [00:33, 4.66it/s] 155it [00:33, 4.67it/s] 156it [00:34, 4.52it/s] 157it [00:34, 4.58it/s] 158it [00:34, 4.61it/s] 159it [00:34, 4.63it/s] 160it [00:34, 4.66it/s] 161it [00:35, 4.67it/s] 162it [00:35, 4.69it/s] 163it [00:35, 4.70it/s] 164it [00:35, 4.70it/s] 165it [00:36, 4.71it/s] 166it [00:36, 4.72it/s] 167it [00:36, 4.72it/s] 168it [00:36, 4.72it/s] 169it [00:36, 4.72it/s] 170it [00:37, 4.72it/s] 171it [00:37, 4.72it/s] 172it [00:37, 4.55it/s] 173it [00:37, 4.62it/s] 174it [00:37, 4.64it/s] 175it [00:38, 4.67it/s] 176it [00:38, 4.68it/s] 177it [00:38, 4.70it/s] 178it [00:38, 4.70it/s] 179it [00:39, 4.71it/s] 180it [00:39, 4.70it/s] 181it [00:39, 4.54it/s] 182it [00:39, 4.61it/s] 183it [00:39, 4.65it/s] 184it [00:40, 4.66it/s] 185it [00:40, 4.68it/s] 186it [00:40, 4.67it/s] 187it [00:40, 4.69it/s] 188it [00:41, 4.54it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.64it/s] 191it [00:41, 4.66it/s] 192it [00:41, 4.67it/s] 193it [00:42, 4.52it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.45it/s] 196it [00:42, 4.52it/s] 196it [00:42, 4.58it/s] +2025-05-25 23:27:09,606 - INFO - Epoch: 43, Objective: tensor([1422.8802], device='cuda:0', grad_fn=), Loss: 0.004217221401631832, KL/n: 26.26324462890625 + 0it [00:00, ?it/s]2025-05-25 23:27:10,206 - INFO - [Epoch 044 | Batch 0000] IWAE-loss 1640.3896 | mean log_px -0.0097 | KL -1284.26 + 1it [00:00, 2.94it/s] 2it [00:00, 3.52it/s] 3it [00:00, 4.01it/s] 4it [00:01, 4.25it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.58it/s] 8it [00:01, 4.61it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.54it/s] 11it [00:02, 4.47it/s] 12it [00:02, 4.56it/s] 13it [00:02, 4.58it/s] 14it [00:03, 4.60it/s] 15it [00:03, 4.63it/s] 16it [00:03, 4.52it/s] 17it [00:03, 4.59it/s] 18it [00:04, 4.61it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.50it/s] 22it [00:04, 4.53it/s] 23it [00:05, 4.56it/s] 24it [00:05, 4.58it/s] 25it [00:05, 4.60it/s] 26it [00:05, 4.60it/s] 27it [00:06, 4.61it/s] 28it [00:06, 4.46it/s] 29it [00:06, 4.52it/s] 30it [00:06, 4.44it/s] 31it [00:06, 4.46it/s] 32it [00:07, 4.48it/s] 33it [00:07, 4.52it/s] 34it [00:07, 4.53it/s] 35it [00:07, 4.42it/s] 36it [00:08, 4.47it/s] 37it [00:08, 4.52it/s] 38it [00:08, 4.54it/s] 39it [00:08, 4.57it/s] 40it [00:08, 4.58it/s] 41it [00:09, 4.60it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.47it/s] 44it [00:09, 4.53it/s] 45it [00:10, 4.56it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.61it/s] 49it [00:10, 4.62it/s] 50it [00:11, 4.62it/s]2025-05-25 23:27:21,168 - INFO - [Epoch 044 | Batch 0050] IWAE-loss 1426.9062 | mean log_px -0.0024 | KL -1280.41 + 51it [00:11, 4.64it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.56it/s] 54it [00:11, 4.57it/s] 55it [00:12, 4.60it/s] 56it [00:12, 4.58it/s] 57it [00:12, 4.61it/s] 58it [00:12, 4.62it/s] 59it [00:13, 4.63it/s] 60it [00:13, 4.63it/s] 61it [00:13, 4.48it/s] 62it [00:13, 4.53it/s] 63it [00:13, 4.56it/s] 64it [00:14, 4.58it/s] 65it [00:14, 4.57it/s] 66it [00:14, 4.59it/s] 67it [00:14, 4.58it/s] 68it [00:15, 4.58it/s] 69it [00:15, 4.59it/s] 70it [00:15, 4.44it/s] 71it [00:15, 4.50it/s] 72it [00:15, 4.51it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.55it/s] 75it [00:16, 4.54it/s] 76it [00:16, 4.55it/s] 77it [00:17, 4.44it/s] 78it [00:17, 4.48it/s] 79it [00:17, 4.49it/s] 80it [00:17, 4.51it/s] 81it [00:17, 4.50it/s] 82it [00:18, 4.53it/s] 83it [00:18, 4.52it/s] 84it [00:18, 4.50it/s] 85it [00:18, 4.50it/s] 86it [00:19, 4.49it/s] 87it [00:19, 4.49it/s] 88it [00:19, 4.35it/s] 89it [00:19, 4.43it/s] 90it [00:19, 4.48it/s] 91it [00:20, 4.44it/s] 92it [00:20, 4.48it/s] 93it [00:20, 4.52it/s] 94it [00:20, 4.51it/s] 95it [00:21, 4.49it/s] 96it [00:21, 4.50it/s] 97it [00:21, 4.36it/s] 98it [00:21, 4.39it/s] 99it [00:21, 4.45it/s] 100it [00:22, 4.50it/s]2025-05-25 23:27:32,249 - INFO - [Epoch 044 | Batch 0100] IWAE-loss 1384.5699 | mean log_px -0.0015 | KL -1274.65 + 101it [00:22, 4.52it/s] 102it [00:22, 4.55it/s] 103it [00:22, 4.56it/s] 104it [00:23, 4.56it/s] 105it [00:23, 4.54it/s] 106it [00:23, 4.40it/s] 107it [00:23, 4.38it/s] 108it [00:23, 4.43it/s] 109it [00:24, 4.45it/s] 110it [00:24, 4.48it/s] 111it [00:24, 4.51it/s] 112it [00:24, 4.50it/s] 113it [00:25, 4.54it/s] 114it [00:25, 4.55it/s] 115it [00:25, 4.41it/s] 116it [00:25, 4.46it/s] 117it [00:25, 4.50it/s] 118it [00:26, 4.49it/s] 119it [00:26, 4.52it/s] 120it [00:26, 4.54it/s] 121it [00:26, 4.56it/s] 122it [00:27, 4.57it/s] 123it [00:27, 4.58it/s] 124it [00:27, 4.40it/s] 125it [00:27, 4.46it/s] 126it [00:27, 4.42it/s] 127it [00:28, 4.44it/s] 128it [00:28, 4.47it/s] 129it [00:28, 4.49it/s] 130it [00:28, 4.54it/s] 131it [00:29, 4.53it/s] 132it [00:29, 4.47it/s] 133it [00:29, 4.36it/s] 134it [00:29, 4.41it/s] 135it [00:29, 4.46it/s] 136it [00:30, 4.49it/s] 137it [00:30, 4.52it/s] 138it [00:30, 4.54it/s] 139it [00:30, 4.56it/s] 140it [00:31, 4.52it/s] 141it [00:31, 4.53it/s] 142it [00:31, 4.35it/s] 143it [00:31, 4.43it/s] 144it [00:31, 4.44it/s] 145it [00:32, 4.46it/s] 146it [00:32, 4.49it/s] 147it [00:32, 4.51it/s] 148it [00:32, 4.45it/s] 149it [00:33, 4.50it/s] 150it [00:33, 4.47it/s]2025-05-25 23:27:43,399 - INFO - [Epoch 044 | Batch 0150] IWAE-loss 1477.1619 | mean log_px -0.0045 | KL -1270.62 + 151it [00:33, 4.51it/s] 152it [00:33, 4.48it/s] 153it [00:33, 4.50it/s] 154it [00:34, 4.52it/s] 155it [00:34, 4.40it/s] 156it [00:34, 4.43it/s] 157it [00:34, 4.49it/s] 158it [00:35, 4.51it/s] 159it [00:35, 4.54it/s] 160it [00:35, 4.50it/s] 161it [00:35, 4.52it/s] 162it [00:35, 4.54it/s] 163it [00:36, 4.54it/s] 164it [00:36, 4.42it/s] 165it [00:36, 4.48it/s] 166it [00:36, 4.51it/s] 167it [00:37, 4.54it/s] 168it [00:37, 4.54it/s] 169it [00:37, 4.39it/s] 170it [00:37, 4.44it/s] 171it [00:37, 4.44it/s] 172it [00:38, 4.42it/s] 173it [00:38, 4.44it/s] 174it [00:38, 4.47it/s] 175it [00:38, 4.48it/s] 176it [00:39, 4.50it/s] 177it [00:39, 4.53it/s] 178it [00:39, 4.35it/s] 179it [00:39, 4.29it/s] 180it [00:40, 4.33it/s] 181it [00:40, 4.41it/s] 182it [00:40, 4.45it/s] 183it [00:40, 4.50it/s] 184it [00:40, 4.53it/s] 185it [00:41, 4.56it/s] 186it [00:41, 4.55it/s] 187it [00:41, 4.58it/s] 188it [00:41, 4.55it/s] 189it [00:42, 4.57it/s] 190it [00:42, 4.43it/s] 191it [00:42, 4.49it/s] 192it [00:42, 4.52it/s] 193it [00:42, 4.52it/s] 194it [00:43, 4.53it/s] 195it [00:43, 4.43it/s] 196it [00:43, 4.41it/s] 196it [00:43, 4.49it/s] +2025-05-25 23:27:53,593 - INFO - Epoch: 44, Objective: tensor([1421.5844], device='cuda:0', grad_fn=), Loss: 0.0031296706292778254, KL/n: 25.87446403503418 + 0it [00:00, ?it/s]2025-05-25 23:27:53,989 - INFO - [Epoch 045 | Batch 0000] IWAE-loss 1360.7262 | mean log_px -0.0022 | KL -1263.72 + 1it [00:00, 3.07it/s] 2it [00:00, 3.81it/s] 3it [00:00, 4.12it/s] 4it [00:00, 4.26it/s] 5it [00:01, 4.38it/s] 6it [00:01, 4.30it/s] 7it [00:01, 4.39it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.52it/s] 12it [00:02, 3.58it/s] 13it [00:03, 3.84it/s] 14it [00:03, 4.05it/s] 15it [00:03, 4.19it/s] 16it [00:03, 4.16it/s] 17it [00:04, 4.30it/s] 18it [00:04, 4.27it/s] 19it [00:04, 4.11it/s] 20it [00:04, 4.17it/s] 21it [00:05, 4.26it/s] 22it [00:05, 4.32it/s] 23it [00:05, 4.35it/s] 24it [00:05, 4.37it/s] 25it [00:05, 4.40it/s] 26it [00:06, 4.45it/s] 27it [00:06, 4.35it/s] 28it [00:06, 4.29it/s] 29it [00:06, 4.35it/s] 30it [00:07, 4.40it/s] 31it [00:07, 4.46it/s] 32it [00:07, 4.47it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.30it/s] 35it [00:08, 4.38it/s] 36it [00:08, 4.45it/s] 37it [00:08, 4.50it/s] 38it [00:08, 4.53it/s] 39it [00:09, 4.56it/s] 40it [00:09, 4.58it/s] 41it [00:09, 4.62it/s] 42it [00:09, 4.40it/s] 43it [00:09, 4.48it/s] 44it [00:10, 4.53it/s] 45it [00:10, 4.56it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.45it/s] 48it [00:11, 4.47it/s] 49it [00:11, 4.53it/s] 50it [00:11, 4.56it/s]2025-05-25 23:28:05,379 - INFO - [Epoch 045 | Batch 0050] IWAE-loss 1378.6949 | mean log_px -0.0038 | KL -1256.42 + 51it [00:11, 4.58it/s] 52it [00:11, 4.59it/s] 53it [00:12, 4.60it/s] 54it [00:12, 4.49it/s] 55it [00:12, 4.55it/s] 56it [00:12, 4.59it/s] 57it [00:13, 4.61it/s] 58it [00:13, 4.62it/s] 59it [00:13, 4.63it/s] 60it [00:13, 4.64it/s] 61it [00:13, 4.51it/s] 62it [00:14, 4.52it/s] 63it [00:14, 4.52it/s] 64it [00:14, 4.55it/s] 65it [00:14, 4.54it/s] 66it [00:14, 4.58it/s] 67it [00:15, 4.61it/s] 68it [00:15, 4.60it/s] 69it [00:15, 4.62it/s] 70it [00:15, 4.61it/s] 71it [00:16, 4.63it/s] 72it [00:16, 4.65it/s] 73it [00:16, 4.65it/s] 74it [00:16, 4.63it/s] 75it [00:16, 4.62it/s] 76it [00:17, 4.62it/s] 77it [00:17, 4.63it/s] 78it [00:17, 4.63it/s] 79it [00:17, 4.64it/s] 80it [00:18, 4.64it/s] 81it [00:18, 4.65it/s] 82it [00:18, 4.64it/s] 83it [00:18, 4.59it/s] 84it [00:18, 4.57it/s] 85it [00:19, 4.57it/s] 86it [00:19, 4.57it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.62it/s] 90it [00:20, 4.62it/s] 91it [00:20, 4.63it/s] 92it [00:20, 4.46it/s] 93it [00:20, 4.53it/s] 94it [00:21, 4.55it/s] 95it [00:21, 4.58it/s] 96it [00:21, 4.54it/s] 97it [00:21, 4.57it/s] 98it [00:21, 4.59it/s] 99it [00:22, 4.61it/s] 100it [00:22, 4.61it/s]2025-05-25 23:28:16,261 - INFO - [Epoch 045 | Batch 0100] IWAE-loss 1430.3690 | mean log_px -0.0046 | KL -1253.53 + 101it [00:22, 4.49it/s] 102it [00:22, 4.55it/s] 103it [00:23, 4.59it/s] 104it [00:23, 4.49it/s] 105it [00:23, 4.53it/s] 106it [00:23, 4.56it/s] 107it [00:23, 4.59it/s] 108it [00:24, 4.61it/s] 109it [00:24, 4.61it/s] 110it [00:24, 4.62it/s] 111it [00:24, 4.64it/s] 112it [00:24, 4.64it/s] 113it [00:25, 4.64it/s] 114it [00:25, 4.64it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.43it/s] 117it [00:26, 4.51it/s] 118it [00:26, 4.55it/s] 119it [00:26, 4.59it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.62it/s] 122it [00:27, 4.48it/s] 123it [00:27, 4.55it/s] 124it [00:27, 4.58it/s] 125it [00:27, 4.60it/s] 126it [00:28, 4.61it/s] 127it [00:28, 4.63it/s] 128it [00:28, 4.45it/s] 129it [00:28, 4.51it/s] 130it [00:28, 4.54it/s] 131it [00:29, 4.58it/s] 132it [00:29, 4.60it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.62it/s] 135it [00:30, 4.63it/s] 136it [00:30, 4.64it/s] 137it [00:30, 4.48it/s] 138it [00:30, 4.54it/s] 139it [00:30, 4.57it/s] 140it [00:31, 4.59it/s] 141it [00:31, 4.61it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.63it/s] 144it [00:32, 4.46it/s] 145it [00:32, 4.53it/s] 146it [00:32, 4.56it/s] 147it [00:32, 4.59it/s] 148it [00:32, 4.60it/s] 149it [00:33, 4.61it/s] 150it [00:33, 4.56it/s]2025-05-25 23:28:27,197 - INFO - [Epoch 045 | Batch 0150] IWAE-loss 1851.1366 | mean log_px -0.0243 | KL -1258.04 + 151it [00:33, 4.59it/s] 152it [00:33, 4.60it/s] 153it [00:33, 4.62it/s] 154it [00:34, 4.63it/s] 155it [00:34, 4.50it/s] 156it [00:34, 4.55it/s] 157it [00:34, 4.58it/s] 158it [00:35, 4.60it/s] 159it [00:35, 4.62it/s] 160it [00:35, 4.63it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.58it/s] 163it [00:36, 4.59it/s] 164it [00:36, 4.59it/s] 165it [00:36, 4.61it/s] 166it [00:36, 4.48it/s] 167it [00:37, 4.53it/s] 168it [00:37, 4.56it/s] 169it [00:37, 4.58it/s] 170it [00:37, 4.60it/s] 171it [00:37, 4.61it/s] 172it [00:38, 4.61it/s] 173it [00:38, 4.62it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.64it/s] 176it [00:38, 4.57it/s] 177it [00:39, 4.52it/s] 178it [00:39, 4.57it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.49it/s] 181it [00:40, 4.49it/s] 182it [00:40, 4.51it/s] 183it [00:40, 4.55it/s] 184it [00:40, 4.58it/s] 185it [00:40, 4.60it/s] 186it [00:41, 4.61it/s] 187it [00:41, 4.63it/s] 188it [00:41, 4.57it/s] 189it [00:41, 4.57it/s] 190it [00:42, 4.60it/s] 191it [00:42, 4.60it/s] 192it [00:42, 4.63it/s] 193it [00:42, 4.49it/s] 194it [00:42, 4.55it/s] 195it [00:43, 4.44it/s] 196it [00:43, 4.49it/s] 196it [00:43, 4.51it/s] +2025-05-25 23:28:37,187 - INFO - Epoch: 45, Objective: tensor([1544.8090], device='cuda:0', grad_fn=), Loss: 0.005014732480049133, KL/n: 25.61770248413086 + 0it [00:00, ?it/s]2025-05-25 23:28:37,608 - INFO - [Epoch 046 | Batch 0000] IWAE-loss 1496.1056 | mean log_px -0.0046 | KL -1254.61 + 1it [00:00, 2.95it/s] 2it [00:00, 3.75it/s] 3it [00:00, 3.91it/s] 4it [00:01, 4.19it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.44it/s] 7it [00:01, 4.49it/s] 8it [00:01, 4.54it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.46it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.59it/s] 19it [00:04, 4.60it/s] 20it [00:04, 4.61it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.50it/s] 23it [00:05, 4.54it/s] 24it [00:05, 4.57it/s] 25it [00:05, 4.59it/s] 26it [00:05, 4.61it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.54it/s] 31it [00:06, 4.58it/s] 32it [00:07, 4.58it/s] 33it [00:07, 4.57it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.55it/s] 36it [00:07, 4.57it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.58it/s] 39it [00:08, 4.60it/s] 40it [00:08, 4.47it/s] 41it [00:09, 4.53it/s] 42it [00:09, 4.56it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.60it/s] 45it [00:09, 4.61it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.64it/s] 49it [00:10, 4.49it/s] 50it [00:11, 4.54it/s]2025-05-25 23:28:48,537 - INFO - [Epoch 046 | Batch 0050] IWAE-loss 1504.4362 | mean log_px -0.0047 | KL -1249.88 + 51it [00:11, 4.57it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.61it/s] 54it [00:11, 4.47it/s] 55it [00:12, 4.52it/s] 56it [00:12, 4.56it/s] 57it [00:12, 4.56it/s] 58it [00:12, 4.58it/s] 59it [00:13, 4.61it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.62it/s] 62it [00:13, 4.35it/s] 63it [00:13, 4.45it/s] 64it [00:14, 4.51it/s] 65it [00:14, 4.56it/s] 66it [00:14, 4.59it/s] 67it [00:14, 4.61it/s] 68it [00:15, 4.48it/s] 69it [00:15, 4.50it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.57it/s] 72it [00:15, 4.59it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.62it/s] 75it [00:16, 4.64it/s] 76it [00:16, 4.64it/s] 77it [00:16, 4.65it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.59it/s] 81it [00:17, 4.56it/s] 82it [00:18, 4.59it/s] 83it [00:18, 4.61it/s] 84it [00:18, 4.62it/s] 85it [00:18, 4.45it/s] 86it [00:18, 4.48it/s] 87it [00:19, 4.53it/s] 88it [00:19, 4.56it/s] 89it [00:19, 4.58it/s] 90it [00:19, 4.60it/s] 91it [00:20, 4.61it/s] 92it [00:20, 4.47it/s] 93it [00:20, 4.54it/s] 94it [00:20, 4.54it/s] 95it [00:20, 4.59it/s] 96it [00:21, 4.60it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.62it/s] 100it [00:21, 4.62it/s]2025-05-25 23:28:59,475 - INFO - [Epoch 046 | Batch 0100] IWAE-loss 2131.2534 | mean log_px -0.0194 | KL -1246.14 + 101it [00:22, 4.62it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.48it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.57it/s] 107it [00:23, 4.59it/s] 108it [00:23, 4.61it/s] 109it [00:23, 4.61it/s] 110it [00:24, 4.62it/s] 111it [00:24, 4.64it/s] 112it [00:24, 4.64it/s] 113it [00:24, 4.50it/s] 114it [00:25, 4.54it/s] 115it [00:25, 4.57it/s] 116it [00:25, 4.58it/s] 117it [00:25, 4.57it/s] 118it [00:25, 4.58it/s] 119it [00:26, 4.56it/s] 120it [00:26, 4.56it/s] 121it [00:26, 4.59it/s] 122it [00:26, 4.60it/s] 123it [00:27, 4.47it/s] 124it [00:27, 4.52it/s] 125it [00:27, 4.56it/s] 126it [00:27, 4.58it/s] 127it [00:27, 4.60it/s] 128it [00:28, 4.62it/s] 129it [00:28, 4.63it/s] 130it [00:28, 4.46it/s] 131it [00:28, 4.52it/s] 132it [00:28, 4.54it/s] 133it [00:29, 4.58it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.62it/s] 137it [00:30, 4.63it/s] 138it [00:30, 4.61it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.65it/s] 142it [00:31, 4.64it/s] 143it [00:31, 4.65it/s] 144it [00:31, 4.52it/s] 145it [00:31, 4.58it/s] 146it [00:32, 4.60it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.62it/s] 149it [00:32, 4.62it/s] 150it [00:32, 4.48it/s]2025-05-25 23:29:10,396 - INFO - [Epoch 046 | Batch 0150] IWAE-loss 1519.1067 | mean log_px -0.0050 | KL -1243.51 + 151it [00:33, 4.55it/s] 152it [00:33, 4.57it/s] 153it [00:33, 4.60it/s] 154it [00:33, 4.61it/s] 155it [00:33, 4.62it/s] 156it [00:34, 4.64it/s] 157it [00:34, 4.64it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.48it/s] 160it [00:35, 4.53it/s] 161it [00:35, 4.55it/s] 162it [00:35, 4.58it/s] 163it [00:35, 4.61it/s] 164it [00:35, 4.61it/s] 165it [00:36, 4.62it/s] 166it [00:36, 4.48it/s] 167it [00:36, 4.54it/s] 168it [00:36, 4.57it/s] 169it [00:37, 4.60it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.62it/s] 172it [00:37, 4.62it/s] 173it [00:37, 4.64it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.63it/s] 176it [00:38, 4.63it/s] 177it [00:38, 4.48it/s] 178it [00:39, 4.53it/s] 179it [00:39, 4.56it/s] 180it [00:39, 4.58it/s] 181it [00:39, 4.60it/s] 182it [00:39, 4.60it/s] 183it [00:40, 4.62it/s] 184it [00:40, 4.63it/s] 185it [00:40, 4.65it/s] 186it [00:40, 4.64it/s] 187it [00:40, 4.49it/s] 188it [00:41, 4.55it/s] 189it [00:41, 4.58it/s] 190it [00:41, 4.59it/s] 191it [00:41, 4.57it/s] 192it [00:42, 4.58it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.39it/s] 195it [00:42, 4.36it/s] 196it [00:42, 4.44it/s] 196it [00:43, 4.55it/s] +2025-05-25 23:29:20,378 - INFO - Epoch: 46, Objective: tensor([1405.0212], device='cuda:0', grad_fn=), Loss: 0.008077585138380527, KL/n: 25.350950241088867 + 0it [00:00, ?it/s]2025-05-25 23:29:20,969 - INFO - [Epoch 047 | Batch 0000] IWAE-loss 1908.2433 | mean log_px -0.0132 | KL -1241.40 + 1it [00:00, 2.94it/s] 2it [00:00, 3.73it/s] 3it [00:00, 4.00it/s] 4it [00:01, 4.07it/s] 5it [00:01, 4.26it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.41it/s] 8it [00:01, 4.36it/s] 9it [00:02, 4.41it/s] 10it [00:02, 4.48it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.34it/s] 13it [00:03, 4.41it/s] 14it [00:03, 4.47it/s] 15it [00:03, 4.51it/s] 16it [00:03, 4.54it/s] 17it [00:03, 4.58it/s] 18it [00:04, 4.30it/s] 19it [00:04, 4.41it/s] 20it [00:04, 4.36it/s] 21it [00:04, 4.45it/s] 22it [00:05, 4.49it/s] 23it [00:05, 4.52it/s] 24it [00:05, 4.27it/s] 25it [00:05, 4.39it/s] 26it [00:05, 4.46it/s] 27it [00:06, 4.50it/s] 28it [00:06, 4.51it/s] 29it [00:06, 4.53it/s] 30it [00:06, 4.54it/s] 31it [00:07, 4.51it/s] 32it [00:07, 4.54it/s] 33it [00:07, 4.42it/s] 34it [00:07, 4.46it/s] 35it [00:07, 4.50it/s] 36it [00:08, 4.42it/s] 37it [00:08, 4.50it/s] 38it [00:08, 4.54it/s] 39it [00:08, 4.57it/s] 40it [00:09, 4.44it/s] 41it [00:09, 4.51it/s] 42it [00:09, 4.55it/s] 43it [00:09, 4.56it/s] 44it [00:09, 4.51it/s] 45it [00:10, 4.47it/s] 46it [00:10, 4.46it/s] 47it [00:10, 4.43it/s] 48it [00:10, 4.47it/s] 49it [00:11, 4.52it/s] 50it [00:11, 4.55it/s]2025-05-25 23:29:32,130 - INFO - [Epoch 047 | Batch 0050] IWAE-loss 1597.2115 | mean log_px -0.0160 | KL -1236.86 + 51it [00:11, 4.43it/s] 52it [00:11, 4.45it/s] 53it [00:11, 4.51it/s] 54it [00:12, 4.40it/s] 55it [00:12, 4.40it/s] 56it [00:12, 4.49it/s] 57it [00:12, 4.50it/s] 58it [00:13, 4.54it/s] 59it [00:13, 4.59it/s] 60it [00:13, 4.41it/s] 61it [00:13, 4.38it/s] 62it [00:13, 4.47it/s] 63it [00:14, 4.42it/s] 64it [00:14, 4.48it/s] 65it [00:14, 4.42it/s] 66it [00:14, 4.45it/s] 67it [00:15, 4.43it/s] 68it [00:15, 4.49it/s] 69it [00:15, 4.31it/s] 70it [00:15, 4.40it/s] 71it [00:16, 4.38it/s] 72it [00:16, 4.43it/s] 73it [00:16, 4.49it/s] 74it [00:16, 4.52it/s] 75it [00:16, 4.52it/s] 76it [00:17, 4.48it/s] 77it [00:17, 4.52it/s] 78it [00:17, 4.38it/s] 79it [00:17, 4.43it/s] 80it [00:18, 4.47it/s] 81it [00:18, 4.52it/s] 82it [00:18, 4.54it/s] 83it [00:18, 4.45it/s] 84it [00:18, 4.52it/s] 85it [00:19, 4.55it/s] 86it [00:19, 4.56it/s] 87it [00:19, 4.57it/s] 88it [00:19, 4.58it/s] 89it [00:20, 4.57it/s] 90it [00:20, 4.42it/s] 91it [00:20, 4.50it/s] 92it [00:20, 4.53it/s] 93it [00:20, 4.50it/s] 94it [00:21, 4.48it/s] 95it [00:21, 4.52it/s] 96it [00:21, 4.36it/s] 97it [00:21, 4.44it/s] 98it [00:22, 4.43it/s] 99it [00:22, 4.47it/s] 100it [00:22, 4.51it/s]2025-05-25 23:29:43,329 - INFO - [Epoch 047 | Batch 0100] IWAE-loss 2198.4983 | mean log_px -0.0194 | KL -1234.72 + 101it [00:22, 4.46it/s] 102it [00:22, 4.36it/s] 103it [00:23, 4.45it/s] 104it [00:23, 4.50it/s] 105it [00:23, 4.53it/s] 106it [00:23, 4.55it/s] 107it [00:24, 4.40it/s] 108it [00:24, 4.30it/s] 109it [00:24, 4.38it/s] 110it [00:24, 4.43it/s] 111it [00:24, 4.42it/s] 112it [00:25, 4.48it/s] 113it [00:25, 4.40it/s] 114it [00:25, 4.46it/s] 115it [00:25, 4.41it/s] 116it [00:26, 4.47it/s] 117it [00:26, 4.44it/s] 118it [00:26, 4.47it/s] 119it [00:26, 4.49it/s] 120it [00:26, 4.36it/s] 121it [00:27, 4.41it/s] 122it [00:27, 4.45it/s] 123it [00:27, 4.48it/s] 124it [00:27, 4.41it/s] 125it [00:28, 4.49it/s] 126it [00:28, 4.48it/s] 127it [00:28, 4.48it/s] 128it [00:28, 4.52it/s] 129it [00:29, 4.44it/s] 130it [00:29, 4.49it/s] 131it [00:29, 4.47it/s] 132it [00:29, 4.52it/s] 133it [00:29, 4.49it/s] 134it [00:30, 4.52it/s] 135it [00:30, 4.52it/s] 136it [00:30, 4.52it/s] 137it [00:30, 4.34it/s] 138it [00:31, 4.40it/s] 139it [00:31, 4.47it/s] 140it [00:31, 4.52it/s] 141it [00:31, 4.55it/s] 142it [00:31, 4.58it/s] 143it [00:32, 4.53it/s] 144it [00:32, 4.52it/s] 145it [00:32, 4.42it/s] 146it [00:32, 4.31it/s] 147it [00:33, 4.35it/s] 148it [00:33, 4.37it/s] 149it [00:33, 4.46it/s] 150it [00:33, 4.52it/s]2025-05-25 23:29:54,538 - INFO - [Epoch 047 | Batch 0150] IWAE-loss 1541.9181 | mean log_px -0.0085 | KL -1228.83 + 151it [00:33, 4.56it/s] 152it [00:34, 4.59it/s] 153it [00:34, 4.45it/s] 154it [00:34, 4.34it/s] 155it [00:34, 4.38it/s] 156it [00:35, 4.45it/s] 157it [00:35, 4.52it/s] 158it [00:35, 4.56it/s] 159it [00:35, 4.58it/s] 160it [00:35, 4.56it/s] 161it [00:36, 4.56it/s] 162it [00:36, 4.56it/s] 163it [00:36, 4.57it/s] 164it [00:36, 4.44it/s] 165it [00:37, 4.37it/s] 166it [00:37, 4.46it/s] 167it [00:37, 4.51it/s] 168it [00:37, 4.54it/s] 169it [00:37, 4.41it/s] 170it [00:38, 4.46it/s] 171it [00:38, 4.45it/s] 172it [00:38, 4.49it/s] 173it [00:38, 4.52it/s] 174it [00:39, 4.42it/s] 175it [00:39, 4.49it/s] 176it [00:39, 4.53it/s] 177it [00:39, 4.49it/s] 178it [00:39, 4.40it/s] 179it [00:40, 4.37it/s] 180it [00:40, 4.46it/s] 181it [00:40, 4.39it/s] 182it [00:40, 4.42it/s] 183it [00:41, 4.47it/s] 184it [00:41, 4.50it/s] 185it [00:41, 4.49it/s] 186it [00:41, 4.52it/s] 187it [00:41, 4.44it/s] 188it [00:42, 4.48it/s] 189it [00:42, 4.53it/s] 190it [00:42, 4.50it/s] 191it [00:42, 4.55it/s] 192it [00:43, 4.57it/s] 193it [00:43, 4.59it/s] 194it [00:43, 4.60it/s] 195it [00:43, 4.40it/s] 196it [00:43, 4.47it/s] 196it [00:44, 4.45it/s] +2025-05-25 23:30:04,720 - INFO - Epoch: 47, Objective: tensor([1696.6771], device='cuda:0', grad_fn=), Loss: 0.011943808756768703, KL/n: 25.065183639526367 + 0it [00:00, ?it/s]2025-05-25 23:30:05,142 - INFO - [Epoch 048 | Batch 0000] IWAE-loss 2080.8501 | mean log_px -0.0122 | KL -1227.69 + 1it [00:00, 2.87it/s] 2it [00:00, 3.62it/s] 3it [00:00, 3.85it/s] 4it [00:01, 4.14it/s] 5it [00:01, 4.31it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.43it/s] 8it [00:01, 4.49it/s] 9it [00:02, 4.53it/s] 10it [00:02, 4.53it/s] 11it [00:02, 3.61it/s] 12it [00:02, 3.86it/s] 13it [00:03, 4.06it/s] 14it [00:03, 4.10it/s] 15it [00:03, 4.26it/s] 16it [00:03, 4.32it/s] 17it [00:04, 4.38it/s] 18it [00:04, 4.43it/s] 19it [00:04, 4.48it/s] 20it [00:04, 4.49it/s] 21it [00:04, 4.40it/s] 22it [00:05, 4.46it/s] 23it [00:05, 4.50it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.47it/s] 26it [00:06, 4.49it/s] 27it [00:06, 4.49it/s] 28it [00:06, 4.50it/s] 29it [00:06, 4.54it/s] 30it [00:06, 4.51it/s] 31it [00:07, 4.54it/s] 32it [00:07, 4.57it/s] 33it [00:07, 4.45it/s] 34it [00:07, 4.51it/s] 35it [00:08, 4.50it/s] 36it [00:08, 4.52it/s] 37it [00:08, 4.51it/s] 38it [00:08, 4.51it/s] 39it [00:08, 4.48it/s] 40it [00:09, 4.51it/s] 41it [00:09, 4.56it/s] 42it [00:09, 4.44it/s] 43it [00:09, 4.51it/s] 44it [00:10, 4.54it/s] 45it [00:10, 4.57it/s] 46it [00:10, 4.59it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.57it/s] 49it [00:11, 4.53it/s] 50it [00:11, 4.50it/s]2025-05-25 23:30:16,398 - INFO - [Epoch 048 | Batch 0050] IWAE-loss 1285.0804 | mean log_px -0.0012 | KL -1222.04 + 51it [00:11, 4.52it/s] 52it [00:11, 4.47it/s] 53it [00:12, 4.34it/s] 54it [00:12, 4.40it/s] 55it [00:12, 4.43it/s] 56it [00:12, 4.46it/s] 57it [00:12, 4.46it/s] 58it [00:13, 4.48it/s] 59it [00:13, 4.39it/s] 60it [00:13, 4.47it/s] 61it [00:13, 4.49it/s] 62it [00:14, 4.51it/s] 63it [00:14, 4.53it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.57it/s] 66it [00:14, 4.59it/s] 67it [00:15, 4.61it/s] 68it [00:15, 4.42it/s] 69it [00:15, 4.52it/s] 70it [00:15, 4.53it/s] 71it [00:16, 4.55it/s] 72it [00:16, 4.56it/s] 73it [00:16, 4.59it/s] 74it [00:16, 4.58it/s] 75it [00:16, 4.59it/s] 76it [00:17, 4.59it/s] 77it [00:17, 4.57it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.54it/s] 80it [00:18, 4.57it/s] 81it [00:18, 4.60it/s] 82it [00:18, 4.60it/s] 83it [00:18, 4.61it/s] 84it [00:18, 4.56it/s] 85it [00:19, 4.58it/s] 86it [00:19, 4.59it/s] 87it [00:19, 4.44it/s] 88it [00:19, 4.48it/s] 89it [00:20, 4.49it/s] 90it [00:20, 4.52it/s] 91it [00:20, 4.44it/s] 92it [00:20, 4.52it/s] 93it [00:20, 4.50it/s] 94it [00:21, 4.53it/s] 95it [00:21, 4.41it/s] 96it [00:21, 4.39it/s] 97it [00:21, 4.40it/s] 98it [00:22, 4.44it/s] 99it [00:22, 4.49it/s] 100it [00:22, 4.48it/s]2025-05-25 23:30:27,486 - INFO - [Epoch 048 | Batch 0100] IWAE-loss 1300.4762 | mean log_px -0.0050 | KL -1212.15 + 101it [00:22, 4.53it/s] 102it [00:22, 4.41it/s] 103it [00:23, 4.45it/s] 104it [00:23, 4.50it/s] 105it [00:23, 4.50it/s] 106it [00:23, 4.54it/s] 107it [00:24, 4.56it/s] 108it [00:24, 4.57it/s] 109it [00:24, 4.59it/s] 110it [00:24, 4.45it/s] 111it [00:24, 4.52it/s] 112it [00:25, 4.53it/s] 113it [00:25, 4.56it/s] 114it [00:25, 4.47it/s] 115it [00:25, 4.48it/s] 116it [00:26, 4.50it/s] 117it [00:26, 4.50it/s] 118it [00:26, 4.50it/s] 119it [00:26, 4.38it/s] 120it [00:26, 4.44it/s] 121it [00:27, 4.43it/s] 122it [00:27, 4.48it/s] 123it [00:27, 4.43it/s] 124it [00:27, 4.47it/s] 125it [00:28, 4.49it/s] 126it [00:28, 4.53it/s] 127it [00:28, 4.42it/s] 128it [00:28, 4.50it/s] 129it [00:28, 4.53it/s] 130it [00:29, 4.56it/s] 131it [00:29, 4.47it/s] 132it [00:29, 4.52it/s] 133it [00:29, 4.29it/s] 134it [00:30, 4.38it/s] 135it [00:30, 4.44it/s] 136it [00:30, 4.46it/s] 137it [00:30, 4.42it/s] 138it [00:30, 4.43it/s] 139it [00:31, 4.42it/s] 140it [00:31, 4.44it/s] 141it [00:31, 4.44it/s] 142it [00:31, 4.30it/s] 143it [00:32, 4.40it/s] 144it [00:32, 4.47it/s] 145it [00:32, 4.51it/s] 146it [00:32, 4.54it/s] 147it [00:32, 4.56it/s] 148it [00:33, 4.54it/s] 149it [00:33, 4.57it/s] 150it [00:33, 4.57it/s]2025-05-25 23:30:38,638 - INFO - [Epoch 048 | Batch 0150] IWAE-loss 1771.9763 | mean log_px -0.0080 | KL -1212.38 + 151it [00:33, 4.61it/s] 152it [00:34, 4.53it/s] 153it [00:34, 4.55it/s] 154it [00:34, 4.57it/s] 155it [00:34, 4.56it/s] 156it [00:34, 4.58it/s] 157it [00:35, 4.53it/s] 158it [00:35, 4.56it/s] 159it [00:35, 4.42it/s] 160it [00:35, 4.45it/s] 161it [00:36, 4.51it/s] 162it [00:36, 4.53it/s] 163it [00:36, 4.57it/s] 164it [00:36, 4.60it/s] 165it [00:36, 4.63it/s] 166it [00:37, 4.62it/s] 167it [00:37, 4.54it/s] 168it [00:37, 4.55it/s] 169it [00:37, 4.48it/s] 170it [00:38, 4.53it/s] 171it [00:38, 4.54it/s] 172it [00:38, 4.57it/s] 173it [00:38, 4.46it/s] 174it [00:38, 4.51it/s] 175it [00:39, 4.51it/s] 176it [00:39, 4.52it/s] 177it [00:39, 4.41it/s] 178it [00:39, 4.48it/s] 179it [00:40, 4.47it/s] 180it [00:40, 4.50it/s] 181it [00:40, 4.45it/s] 182it [00:40, 4.50it/s] 183it [00:40, 4.51it/s] 184it [00:41, 4.52it/s] 185it [00:41, 4.40it/s] 186it [00:41, 4.48it/s] 187it [00:41, 4.52it/s] 188it [00:42, 4.55it/s] 189it [00:42, 4.44it/s] 190it [00:42, 4.45it/s] 191it [00:42, 4.53it/s] 192it [00:42, 4.56it/s] 193it [00:43, 4.46it/s] 194it [00:43, 4.53it/s] 195it [00:43, 4.45it/s] 196it [00:43, 4.48it/s] 196it [00:43, 4.46it/s] +2025-05-25 23:30:48,759 - INFO - Epoch: 48, Objective: tensor([1534.0585], device='cuda:0', grad_fn=), Loss: 0.016182228922843933, KL/n: 24.804851531982422 + 0it [00:00, ?it/s]2025-05-25 23:30:49,138 - INFO - [Epoch 049 | Batch 0000] IWAE-loss 1611.0990 | mean log_px -0.0056 | KL -1216.53 + 1it [00:00, 3.28it/s] 2it [00:00, 3.97it/s] 3it [00:00, 4.08it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.44it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.56it/s] 8it [00:01, 4.59it/s] 9it [00:02, 4.46it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.50it/s] 13it [00:02, 4.55it/s] 14it [00:03, 4.59it/s] 15it [00:03, 4.48it/s] 16it [00:03, 4.54it/s] 17it [00:03, 4.59it/s] 18it [00:04, 4.61it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.65it/s] 21it [00:04, 4.51it/s] 22it [00:04, 4.56it/s] 23it [00:05, 4.61it/s] 24it [00:05, 4.62it/s] 25it [00:05, 4.63it/s] 26it [00:05, 4.64it/s] 27it [00:06, 4.50it/s] 28it [00:06, 4.56it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.61it/s] 31it [00:06, 4.63it/s] 32it [00:07, 4.65it/s] 33it [00:07, 4.51it/s] 34it [00:07, 4.55it/s] 35it [00:07, 4.55it/s] 36it [00:07, 4.43it/s] 37it [00:08, 4.51it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.59it/s] 40it [00:08, 4.47it/s] 41it [00:09, 4.53it/s] 42it [00:09, 4.57it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.60it/s] 45it [00:09, 4.63it/s] 46it [00:10, 4.49it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.59it/s] 49it [00:10, 4.57it/s] 50it [00:11, 4.58it/s]2025-05-25 23:31:00,083 - INFO - [Epoch 049 | Batch 0050] IWAE-loss 1382.5945 | mean log_px -0.0030 | KL -1212.96 + 51it [00:11, 4.60it/s] 52it [00:11, 4.49it/s] 53it [00:11, 4.55it/s] 54it [00:11, 4.58it/s] 55it [00:12, 4.62it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.47it/s] 59it [00:13, 4.54it/s] 60it [00:13, 4.58it/s] 61it [00:13, 4.61it/s] 62it [00:13, 4.62it/s] 63it [00:13, 4.64it/s] 64it [00:14, 4.50it/s] 65it [00:14, 4.57it/s] 66it [00:14, 4.59it/s] 67it [00:14, 4.62it/s] 68it [00:14, 4.63it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.61it/s] 71it [00:15, 4.63it/s] 72it [00:15, 4.49it/s] 73it [00:16, 4.55it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.63it/s] 77it [00:16, 4.65it/s] 78it [00:17, 4.50it/s] 79it [00:17, 4.57it/s] 80it [00:17, 4.59it/s] 81it [00:17, 4.47it/s] 82it [00:18, 4.54it/s] 83it [00:18, 4.58it/s] 84it [00:18, 4.60it/s] 85it [00:18, 4.63it/s] 86it [00:18, 4.63it/s] 87it [00:19, 4.51it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.60it/s] 90it [00:19, 4.62it/s] 91it [00:19, 4.65it/s] 92it [00:20, 4.65it/s] 93it [00:20, 4.51it/s] 94it [00:20, 4.57it/s] 95it [00:20, 4.60it/s] 96it [00:21, 4.62it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.51it/s] 100it [00:21, 4.57it/s]2025-05-25 23:31:10,992 - INFO - [Epoch 049 | Batch 0100] IWAE-loss 1519.3214 | mean log_px -0.0086 | KL -1206.96 + 101it [00:22, 4.60it/s] 102it [00:22, 4.47it/s] 103it [00:22, 4.55it/s] 104it [00:22, 4.58it/s] 105it [00:23, 4.60it/s] 106it [00:23, 4.62it/s] 107it [00:23, 4.63it/s] 108it [00:23, 4.49it/s] 109it [00:23, 4.56it/s] 110it [00:24, 4.59it/s] 111it [00:24, 4.56it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.62it/s] 114it [00:25, 4.48it/s] 115it [00:25, 4.55it/s] 116it [00:25, 4.58it/s] 117it [00:25, 4.61it/s] 118it [00:25, 4.62it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.50it/s] 121it [00:26, 4.56it/s] 122it [00:26, 4.59it/s] 123it [00:26, 4.62it/s] 124it [00:27, 4.63it/s] 125it [00:27, 4.64it/s] 126it [00:27, 4.50it/s] 127it [00:27, 4.57it/s] 128it [00:28, 4.59it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.64it/s] 132it [00:28, 4.50it/s] 133it [00:29, 4.56it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.62it/s] 137it [00:30, 4.64it/s] 138it [00:30, 4.50it/s] 139it [00:30, 4.56it/s] 140it [00:30, 4.58it/s] 141it [00:30, 4.61it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.64it/s] 144it [00:31, 4.50it/s] 145it [00:31, 4.57it/s] 146it [00:31, 4.59it/s] 147it [00:32, 4.62it/s] 148it [00:32, 4.64it/s] 149it [00:32, 4.65it/s] 150it [00:32, 4.50it/s]2025-05-25 23:31:21,908 - INFO - [Epoch 049 | Batch 0150] IWAE-loss 1296.9624 | mean log_px -0.0015 | KL -1203.38 + 151it [00:33, 4.57it/s] 152it [00:33, 4.60it/s] 153it [00:33, 4.56it/s] 154it [00:33, 4.60it/s] 155it [00:33, 4.61it/s] 156it [00:34, 4.63it/s] 157it [00:34, 4.65it/s] 158it [00:34, 4.66it/s] 159it [00:34, 4.52it/s] 160it [00:35, 4.58it/s] 161it [00:35, 4.61it/s] 162it [00:35, 4.62it/s] 163it [00:35, 4.58it/s] 164it [00:35, 4.59it/s] 165it [00:36, 4.63it/s] 166it [00:36, 4.49it/s] 167it [00:36, 4.54it/s] 168it [00:36, 4.57it/s] 169it [00:36, 4.60it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.63it/s] 172it [00:37, 4.63it/s] 173it [00:37, 4.50it/s] 174it [00:38, 4.55it/s] 175it [00:38, 4.58it/s] 176it [00:38, 4.61it/s] 177it [00:38, 4.48it/s] 178it [00:38, 4.54it/s] 179it [00:39, 4.52it/s] 180it [00:39, 4.52it/s] 181it [00:39, 4.57it/s] 182it [00:39, 4.59it/s] 183it [00:40, 4.48it/s] 184it [00:40, 4.51it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.60it/s] 187it [00:40, 4.63it/s] 188it [00:41, 4.63it/s] 189it [00:41, 4.49it/s] 190it [00:41, 4.55it/s] 191it [00:41, 4.56it/s] 192it [00:42, 4.60it/s] 193it [00:42, 4.62it/s] 194it [00:42, 4.63it/s] 195it [00:42, 4.32it/s] 196it [00:42, 4.37it/s] 196it [00:43, 4.56it/s] +2025-05-25 23:31:31,915 - INFO - Epoch: 49, Objective: tensor([1426.3483], device='cuda:0', grad_fn=), Loss: 0.002869151998311281, KL/n: 24.51639175415039 + 0it [00:00, ?it/s]2025-05-25 23:31:32,509 - INFO - [Epoch 050 | Batch 0000] IWAE-loss 1417.0724 | mean log_px -0.0090 | KL -1203.12 + 1it [00:00, 2.76it/s] 2it [00:00, 3.65it/s] 3it [00:00, 4.05it/s] 4it [00:01, 4.26it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.44it/s] 7it [00:01, 4.51it/s] 8it [00:01, 4.47it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.56it/s] 13it [00:02, 4.45it/s] 14it [00:03, 4.51it/s] 15it [00:03, 4.55it/s] 16it [00:03, 4.48it/s] 17it [00:03, 4.53it/s] 18it [00:04, 4.40it/s] 19it [00:04, 4.44it/s] 20it [00:04, 4.41it/s] 21it [00:04, 4.45it/s] 22it [00:05, 4.42it/s] 23it [00:05, 4.51it/s] 24it [00:05, 4.55it/s] 25it [00:05, 4.55it/s] 26it [00:05, 4.56it/s] 27it [00:06, 4.55it/s] 28it [00:06, 4.50it/s] 29it [00:06, 4.52it/s] 30it [00:06, 4.52it/s] 31it [00:07, 4.42it/s] 32it [00:07, 4.45it/s] 33it [00:07, 4.51it/s] 34it [00:07, 4.47it/s] 35it [00:07, 4.49it/s] 36it [00:08, 4.52it/s] 37it [00:08, 4.55it/s] 38it [00:08, 4.43it/s] 39it [00:08, 4.47it/s] 40it [00:09, 4.43it/s] 41it [00:09, 4.49it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.56it/s] 44it [00:09, 4.58it/s] 45it [00:10, 4.46it/s] 46it [00:10, 4.50it/s] 47it [00:10, 4.50it/s] 48it [00:10, 4.52it/s] 49it [00:10, 4.56it/s] 50it [00:11, 4.49it/s]2025-05-25 23:31:43,601 - INFO - [Epoch 050 | Batch 0050] IWAE-loss 1422.3885 | mean log_px -0.0056 | KL -1198.54 + 51it [00:11, 4.55it/s] 52it [00:11, 4.58it/s] 53it [00:11, 4.47it/s] 54it [00:12, 4.53it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.58it/s] 57it [00:12, 4.61it/s] 58it [00:12, 4.62it/s] 59it [00:13, 4.61it/s] 60it [00:13, 4.58it/s] 61it [00:13, 4.61it/s] 62it [00:13, 4.61it/s] 63it [00:14, 4.47it/s] 64it [00:14, 4.51it/s] 65it [00:14, 4.53it/s] 66it [00:14, 4.57it/s] 67it [00:14, 4.54it/s] 68it [00:15, 4.57it/s] 69it [00:15, 4.45it/s] 70it [00:15, 4.47it/s] 71it [00:15, 4.48it/s] 72it [00:16, 4.53it/s] 73it [00:16, 4.58it/s] 74it [00:16, 4.56it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.63it/s] 77it [00:17, 4.55it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.46it/s] 80it [00:17, 4.50it/s] 81it [00:18, 4.42it/s] 82it [00:18, 4.50it/s] 83it [00:18, 4.56it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.62it/s] 86it [00:19, 4.49it/s] 87it [00:19, 4.56it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.62it/s] 90it [00:19, 4.63it/s] 91it [00:20, 4.65it/s] 92it [00:20, 4.65it/s] 93it [00:20, 4.67it/s] 94it [00:20, 4.65it/s] 95it [00:21, 4.51it/s] 96it [00:21, 4.55it/s] 97it [00:21, 4.57it/s] 98it [00:21, 4.59it/s] 99it [00:21, 4.59it/s] 100it [00:22, 4.46it/s]2025-05-25 23:31:54,575 - INFO - [Epoch 050 | Batch 0100] IWAE-loss 1353.2869 | mean log_px -0.0037 | KL -1194.16 + 101it [00:22, 4.52it/s] 102it [00:22, 4.53it/s] 103it [00:22, 4.54it/s] 104it [00:23, 4.55it/s] 105it [00:23, 4.49it/s] 106it [00:23, 4.50it/s] 107it [00:23, 4.48it/s] 108it [00:23, 4.40it/s] 109it [00:24, 4.46it/s] 110it [00:24, 4.51it/s] 111it [00:24, 4.55it/s] 112it [00:24, 4.56it/s] 113it [00:25, 4.58it/s] 114it [00:25, 4.44it/s] 115it [00:25, 4.52it/s] 116it [00:25, 4.55it/s] 117it [00:25, 4.58it/s] 118it [00:26, 4.59it/s] 119it [00:26, 4.62it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.63it/s] 122it [00:27, 4.59it/s] 123it [00:27, 4.37it/s] 124it [00:27, 4.43it/s] 125it [00:27, 4.48it/s] 126it [00:27, 4.50it/s] 127it [00:28, 4.50it/s] 128it [00:28, 4.52it/s] 129it [00:28, 4.56it/s] 130it [00:28, 4.59it/s] 131it [00:29, 4.61it/s] 132it [00:29, 4.47it/s] 133it [00:29, 4.53it/s] 134it [00:29, 4.56it/s] 135it [00:29, 4.59it/s] 136it [00:30, 4.60it/s] 137it [00:30, 4.63it/s] 138it [00:30, 4.48it/s] 139it [00:30, 4.48it/s] 140it [00:31, 4.49it/s] 141it [00:31, 4.46it/s] 142it [00:31, 4.52it/s] 143it [00:31, 4.44it/s] 144it [00:31, 4.52it/s] 145it [00:32, 4.56it/s] 146it [00:32, 4.49it/s] 147it [00:32, 4.49it/s] 148it [00:32, 4.54it/s] 149it [00:33, 4.56it/s] 150it [00:33, 4.58it/s]2025-05-25 23:32:05,608 - INFO - [Epoch 050 | Batch 0150] IWAE-loss 1559.9613 | mean log_px -0.0173 | KL -1188.04 + 151it [00:33, 4.46it/s] 152it [00:33, 4.52it/s] 153it [00:33, 4.56it/s] 154it [00:34, 4.50it/s] 155it [00:34, 4.56it/s] 156it [00:34, 4.59it/s] 157it [00:34, 4.57it/s] 158it [00:34, 4.59it/s] 159it [00:35, 4.61it/s] 160it [00:35, 4.48it/s] 161it [00:35, 4.53it/s] 162it [00:35, 4.54it/s] 163it [00:36, 4.59it/s] 164it [00:36, 4.60it/s] 165it [00:36, 4.59it/s] 166it [00:36, 4.41it/s] 167it [00:36, 4.49it/s] 168it [00:37, 4.51it/s] 169it [00:37, 4.55it/s] 170it [00:37, 4.57it/s] 171it [00:37, 4.60it/s] 172it [00:38, 4.61it/s] 173it [00:38, 4.62it/s] 174it [00:38, 4.45it/s] 175it [00:38, 4.52it/s] 176it [00:38, 4.55it/s] 177it [00:39, 4.58it/s] 178it [00:39, 4.51it/s] 179it [00:39, 4.51it/s] 180it [00:39, 4.41it/s] 181it [00:40, 4.50it/s] 182it [00:40, 4.53it/s] 183it [00:40, 4.56it/s] 184it [00:40, 4.57it/s] 185it [00:40, 4.48it/s] 186it [00:41, 4.54it/s] 187it [00:41, 4.57it/s] 188it [00:41, 4.42it/s] 189it [00:41, 4.47it/s] 190it [00:42, 4.51it/s] 191it [00:42, 4.49it/s] 192it [00:42, 4.48it/s] 193it [00:42, 4.54it/s] 194it [00:42, 4.57it/s] 195it [00:43, 4.47it/s] 196it [00:43, 4.54it/s] 196it [00:43, 4.51it/s] +2025-05-25 23:32:15,688 - INFO - Epoch: 50, Objective: tensor([1407.9646], device='cuda:0', grad_fn=), Loss: 0.00830838456749916, KL/n: 24.236207962036133 + 0it [00:00, ?it/s]2025-05-25 23:32:16,068 - INFO - [Epoch 051 | Batch 0000] IWAE-loss 1334.0294 | mean log_px -0.0045 | KL -1185.92 + 1it [00:00, 3.01it/s] 2it [00:00, 3.81it/s] 3it [00:00, 3.96it/s] 4it [00:01, 4.10it/s] 5it [00:01, 4.06it/s] 6it [00:01, 4.21it/s] 7it [00:01, 3.40it/s] 8it [00:02, 3.61it/s] 9it [00:02, 3.89it/s] 10it [00:02, 3.99it/s] 11it [00:02, 4.18it/s] 12it [00:03, 4.30it/s] 13it [00:03, 4.35it/s] 14it [00:03, 4.41it/s] 15it [00:03, 4.45it/s] 16it [00:03, 4.49it/s] 17it [00:04, 4.33it/s] 18it [00:04, 4.42it/s] 19it [00:04, 4.41it/s] 20it [00:04, 4.45it/s] 21it [00:05, 4.40it/s] 22it [00:05, 4.45it/s] 23it [00:05, 4.34it/s] 24it [00:05, 4.40it/s] 25it [00:05, 4.46it/s] 26it [00:06, 4.43it/s] 27it [00:06, 4.47it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.51it/s] 30it [00:07, 4.55it/s] 31it [00:07, 4.37it/s] 32it [00:07, 4.46it/s] 33it [00:07, 4.45it/s] 34it [00:07, 4.52it/s] 35it [00:08, 4.49it/s] 36it [00:08, 4.52it/s] 37it [00:08, 4.41it/s] 38it [00:08, 4.50it/s] 39it [00:09, 4.48it/s] 40it [00:09, 4.51it/s] 41it [00:09, 4.49it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.55it/s] 44it [00:10, 4.57it/s] 45it [00:10, 4.39it/s] 46it [00:10, 4.44it/s] 47it [00:10, 4.48it/s] 48it [00:11, 4.52it/s] 49it [00:11, 4.45it/s] 50it [00:11, 4.49it/s]2025-05-25 23:32:27,505 - INFO - [Epoch 051 | Batch 0050] IWAE-loss 1236.7412 | mean log_px -0.0013 | KL -1183.91 + 51it [00:11, 4.48it/s] 52it [00:11, 4.52it/s] 53it [00:12, 4.55it/s] 54it [00:12, 4.58it/s] 55it [00:12, 4.44it/s] 56it [00:12, 4.47it/s] 57it [00:13, 4.44it/s] 58it [00:13, 4.49it/s] 59it [00:13, 4.46it/s] 60it [00:13, 4.38it/s] 61it [00:13, 4.47it/s] 62it [00:14, 4.52it/s] 63it [00:14, 4.54it/s] 64it [00:14, 4.50it/s] 65it [00:14, 4.44it/s] 66it [00:15, 4.41it/s] 67it [00:15, 4.41it/s] 68it [00:15, 4.45it/s] 69it [00:15, 4.39it/s] 70it [00:15, 4.47it/s] 71it [00:16, 4.47it/s] 72it [00:16, 4.50it/s] 73it [00:16, 4.27it/s] 74it [00:16, 4.39it/s] 75it [00:17, 4.45it/s] 76it [00:17, 4.50it/s] 77it [00:17, 4.42it/s] 78it [00:17, 4.47it/s] 79it [00:18, 4.46it/s] 80it [00:18, 4.50it/s] 81it [00:18, 4.55it/s] 82it [00:18, 4.55it/s] 83it [00:18, 4.41it/s] 84it [00:19, 4.47it/s] 85it [00:19, 4.52it/s] 86it [00:19, 4.55it/s] 87it [00:19, 4.54it/s] 88it [00:20, 4.55it/s] 89it [00:20, 4.51it/s] 90it [00:20, 4.46it/s] 91it [00:20, 4.40it/s] 92it [00:20, 4.32it/s] 93it [00:21, 4.39it/s] 94it [00:21, 4.45it/s] 95it [00:21, 4.46it/s] 96it [00:21, 4.51it/s] 97it [00:22, 4.52it/s] 98it [00:22, 4.57it/s] 99it [00:22, 4.60it/s] 100it [00:22, 4.57it/s]2025-05-25 23:32:38,667 - INFO - [Epoch 051 | Batch 0100] IWAE-loss 1498.0203 | mean log_px -0.0071 | KL -1184.13 + 101it [00:22, 4.57it/s] 102it [00:23, 4.51it/s] 103it [00:23, 4.54it/s] 104it [00:23, 4.55it/s] 105it [00:23, 4.53it/s] 106it [00:24, 4.37it/s] 107it [00:24, 4.46it/s] 108it [00:24, 4.50it/s] 109it [00:24, 4.53it/s] 110it [00:24, 4.53it/s] 111it [00:25, 4.56it/s] 112it [00:25, 4.38it/s] 113it [00:25, 4.44it/s] 114it [00:25, 4.40it/s] 115it [00:26, 4.43it/s] 116it [00:26, 4.46it/s] 117it [00:26, 4.49it/s] 118it [00:26, 4.53it/s] 119it [00:26, 4.50it/s] 120it [00:27, 4.35it/s] 121it [00:27, 4.44it/s] 122it [00:27, 4.51it/s] 123it [00:27, 4.50it/s] 124it [00:28, 4.53it/s] 125it [00:28, 4.50it/s] 126it [00:28, 4.54it/s] 127it [00:28, 4.57it/s] 128it [00:28, 4.61it/s] 129it [00:29, 4.34it/s] 130it [00:29, 4.44it/s] 131it [00:29, 4.46it/s] 132it [00:29, 4.53it/s] 133it [00:30, 4.58it/s] 134it [00:30, 4.58it/s] 135it [00:30, 4.62it/s] 136it [00:30, 4.63it/s] 137it [00:30, 4.65it/s] 138it [00:31, 4.66it/s] 139it [00:31, 4.56it/s] 140it [00:31, 4.59it/s] 141it [00:31, 4.61it/s] 142it [00:31, 4.63it/s] 143it [00:32, 4.63it/s] 144it [00:32, 4.65it/s] 145it [00:32, 4.58it/s] 146it [00:32, 4.58it/s] 147it [00:33, 4.56it/s] 148it [00:33, 4.58it/s] 149it [00:33, 4.54it/s] 150it [00:33, 4.56it/s]2025-05-25 23:32:49,729 - INFO - [Epoch 051 | Batch 0150] IWAE-loss 1679.6946 | mean log_px -0.0117 | KL -1184.98 + 151it [00:33, 4.48it/s] 152it [00:34, 4.55it/s] 153it [00:34, 4.54it/s] 154it [00:34, 4.42it/s] 155it [00:34, 4.49it/s] 156it [00:35, 4.54it/s] 157it [00:35, 4.58it/s] 158it [00:35, 4.61it/s] 159it [00:35, 4.59it/s] 160it [00:35, 4.58it/s] 161it [00:36, 4.58it/s] 162it [00:36, 4.58it/s] 163it [00:36, 4.37it/s] 164it [00:36, 4.43it/s] 165it [00:37, 4.41it/s] 166it [00:37, 4.51it/s] 167it [00:37, 4.53it/s] 168it [00:37, 4.58it/s] 169it [00:37, 4.60it/s] 170it [00:38, 4.59it/s] 171it [00:38, 4.49it/s] 172it [00:38, 4.40it/s] 173it [00:38, 4.49it/s] 174it [00:39, 4.54it/s] 175it [00:39, 4.49it/s] 176it [00:39, 4.56it/s] 177it [00:39, 4.56it/s] 178it [00:39, 4.57it/s] 179it [00:40, 4.54it/s] 180it [00:40, 4.56it/s] 181it [00:40, 4.53it/s] 182it [00:40, 4.56it/s] 183it [00:41, 4.38it/s] 184it [00:41, 4.44it/s] 185it [00:41, 4.48it/s] 186it [00:41, 4.49it/s] 187it [00:41, 4.51it/s] 188it [00:42, 4.52it/s] 189it [00:42, 4.49it/s] 190it [00:42, 4.53it/s] 191it [00:42, 4.55it/s] 192it [00:43, 4.58it/s] 193it [00:43, 4.61it/s] 194it [00:43, 4.60it/s] 195it [00:43, 4.41it/s] 196it [00:43, 4.52it/s] 196it [00:43, 4.46it/s] +2025-05-25 23:32:59,815 - INFO - Epoch: 51, Objective: tensor([1720.4115], device='cuda:0', grad_fn=), Loss: 0.011251946911215782, KL/n: 24.17317771911621 + 0it [00:00, ?it/s]2025-05-25 23:33:00,221 - INFO - [Epoch 052 | Batch 0000] IWAE-loss 1308.6581 | mean log_px -0.0024 | KL -1183.32 + 1it [00:00, 2.82it/s] 2it [00:00, 3.70it/s] 3it [00:00, 4.09it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.44it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.56it/s] 8it [00:01, 4.44it/s] 9it [00:02, 4.53it/s] 10it [00:02, 4.43it/s] 11it [00:02, 4.51it/s] 12it [00:02, 4.55it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.62it/s] 15it [00:03, 4.63it/s] 16it [00:03, 4.65it/s] 17it [00:03, 4.66it/s] 18it [00:04, 4.66it/s] 19it [00:04, 4.68it/s] 20it [00:04, 4.67it/s] 21it [00:04, 4.68it/s] 22it [00:04, 4.65it/s] 23it [00:05, 4.67it/s] 24it [00:05, 4.67it/s] 25it [00:05, 4.68it/s] 26it [00:05, 4.67it/s] 27it [00:05, 4.68it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.69it/s] 30it [00:06, 4.69it/s] 31it [00:06, 4.68it/s] 32it [00:07, 4.68it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.53it/s] 35it [00:07, 4.57it/s] 36it [00:07, 4.56it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.64it/s] 40it [00:08, 4.65it/s] 41it [00:08, 4.66it/s] 42it [00:09, 4.67it/s] 43it [00:09, 4.68it/s] 44it [00:09, 4.67it/s] 45it [00:09, 4.68it/s] 46it [00:10, 4.68it/s] 47it [00:10, 4.68it/s] 48it [00:10, 4.68it/s] 49it [00:10, 4.53it/s] 50it [00:10, 4.59it/s]2025-05-25 23:33:11,022 - INFO - [Epoch 052 | Batch 0050] IWAE-loss 1253.5378 | mean log_px -0.0022 | KL -1182.44 + 51it [00:11, 4.62it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.66it/s] 54it [00:11, 4.66it/s] 55it [00:11, 4.66it/s] 56it [00:12, 4.66it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.51it/s] 59it [00:12, 4.58it/s] 60it [00:13, 4.60it/s] 61it [00:13, 4.63it/s] 62it [00:13, 4.64it/s] 63it [00:13, 4.66it/s] 64it [00:13, 4.67it/s] 65it [00:14, 4.68it/s] 66it [00:14, 4.67it/s] 67it [00:14, 4.68it/s] 68it [00:14, 4.68it/s] 69it [00:14, 4.69it/s] 70it [00:15, 4.69it/s] 71it [00:15, 4.69it/s] 72it [00:15, 4.68it/s] 73it [00:15, 4.69it/s] 74it [00:16, 4.68it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.65it/s] 77it [00:16, 4.66it/s] 78it [00:16, 4.66it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.67it/s] 81it [00:17, 4.68it/s] 82it [00:17, 4.52it/s] 83it [00:18, 4.59it/s] 84it [00:18, 4.61it/s] 85it [00:18, 4.63it/s] 86it [00:18, 4.64it/s] 87it [00:18, 4.66it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.65it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.68it/s] 92it [00:19, 4.67it/s] 93it [00:20, 4.68it/s] 94it [00:20, 4.68it/s] 95it [00:20, 4.69it/s] 96it [00:20, 4.68it/s] 97it [00:21, 4.69it/s] 98it [00:21, 4.68it/s] 99it [00:21, 4.69it/s] 100it [00:21, 4.67it/s]2025-05-25 23:33:21,758 - INFO - [Epoch 052 | Batch 0100] IWAE-loss 1299.2296 | mean log_px -0.0027 | KL -1181.27 + 101it [00:21, 4.68it/s] 102it [00:22, 4.53it/s] 103it [00:22, 4.58it/s] 104it [00:22, 4.60it/s] 105it [00:22, 4.61it/s] 106it [00:22, 4.64it/s] 107it [00:23, 4.66it/s] 108it [00:23, 4.67it/s] 109it [00:23, 4.67it/s] 110it [00:23, 4.67it/s] 111it [00:24, 4.67it/s] 112it [00:24, 4.67it/s] 113it [00:24, 4.68it/s] 114it [00:24, 4.67it/s] 115it [00:24, 4.68it/s] 116it [00:25, 4.67it/s] 117it [00:25, 4.68it/s] 118it [00:25, 4.68it/s] 119it [00:25, 4.54it/s] 120it [00:25, 4.59it/s] 121it [00:26, 4.62it/s] 122it [00:26, 4.63it/s] 123it [00:26, 4.65it/s] 124it [00:26, 4.66it/s] 125it [00:27, 4.66it/s] 126it [00:27, 4.56it/s] 127it [00:27, 4.61it/s] 128it [00:27, 4.62it/s] 129it [00:27, 4.65it/s] 130it [00:28, 4.66it/s] 131it [00:28, 4.52it/s] 132it [00:28, 4.58it/s] 133it [00:28, 4.62it/s] 134it [00:28, 4.63it/s] 135it [00:29, 4.65it/s] 136it [00:29, 4.59it/s] 137it [00:29, 4.58it/s] 138it [00:29, 4.59it/s] 139it [00:30, 4.46it/s] 140it [00:30, 4.54it/s] 141it [00:30, 4.55it/s] 142it [00:30, 4.58it/s] 143it [00:30, 4.62it/s] 144it [00:31, 4.63it/s] 145it [00:31, 4.65it/s] 146it [00:31, 4.66it/s] 147it [00:31, 4.67it/s] 148it [00:32, 4.67it/s] 149it [00:32, 4.64it/s] 150it [00:32, 4.46it/s]2025-05-25 23:33:32,612 - INFO - [Epoch 052 | Batch 0150] IWAE-loss 1224.5007 | mean log_px -0.0009 | KL -1180.44 + 151it [00:32, 4.48it/s] 152it [00:32, 4.52it/s] 153it [00:33, 4.57it/s] 154it [00:33, 4.40it/s] 155it [00:33, 4.47it/s] 156it [00:33, 4.41it/s] 157it [00:34, 4.50it/s] 158it [00:34, 4.55it/s] 159it [00:34, 4.58it/s] 160it [00:34, 4.62it/s] 161it [00:34, 4.63it/s] 162it [00:35, 4.65it/s] 163it [00:35, 4.68it/s] 164it [00:35, 4.48it/s] 165it [00:35, 4.53it/s] 166it [00:36, 4.55it/s] 167it [00:36, 4.58it/s] 168it [00:36, 4.60it/s] 169it [00:36, 4.62it/s] 170it [00:36, 4.62it/s] 171it [00:37, 4.49it/s] 172it [00:37, 4.53it/s] 173it [00:37, 4.42it/s] 174it [00:37, 4.51it/s] 175it [00:38, 4.41it/s] 176it [00:38, 4.48it/s] 177it [00:38, 4.54it/s] 178it [00:38, 4.57it/s] 179it [00:38, 4.59it/s] 180it [00:39, 4.60it/s] 181it [00:39, 4.63it/s] 182it [00:39, 4.50it/s] 183it [00:39, 4.56it/s] 184it [00:39, 4.59it/s] 185it [00:40, 4.60it/s] 186it [00:40, 4.62it/s] 187it [00:40, 4.64it/s] 188it [00:40, 4.49it/s] 189it [00:41, 4.54it/s] 190it [00:41, 4.58it/s] 191it [00:41, 4.61it/s] 192it [00:41, 4.62it/s] 193it [00:41, 4.61it/s] 194it [00:42, 4.64it/s] 195it [00:42, 4.52it/s] 196it [00:42, 4.45it/s] 196it [00:42, 4.59it/s] +2025-05-25 23:33:42,629 - INFO - Epoch: 52, Objective: tensor([1489.6241], device='cuda:0', grad_fn=), Loss: 0.0029403548687696457, KL/n: 23.974336624145508 + 0it [00:00, ?it/s]2025-05-25 23:33:43,218 - INFO - [Epoch 053 | Batch 0000] IWAE-loss 1426.3737 | mean log_px -0.0070 | KL -1176.55 + 1it [00:00, 3.07it/s] 2it [00:00, 3.60it/s] 3it [00:00, 4.04it/s] 4it [00:00, 4.24it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.46it/s] 7it [00:01, 4.52it/s] 8it [00:01, 4.31it/s] 9it [00:02, 4.41it/s] 10it [00:02, 4.46it/s] 11it [00:02, 4.50it/s] 12it [00:02, 4.53it/s] 13it [00:02, 4.54it/s] 14it [00:03, 4.56it/s] 15it [00:03, 4.59it/s] 16it [00:03, 4.61it/s] 17it [00:03, 4.63it/s] 18it [00:04, 4.64it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.48it/s] 21it [00:04, 4.53it/s] 22it [00:04, 4.56it/s] 23it [00:05, 4.59it/s] 24it [00:05, 4.60it/s] 25it [00:05, 4.62it/s] 26it [00:05, 4.62it/s] 27it [00:06, 4.64it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.66it/s] 31it [00:06, 4.66it/s] 32it [00:07, 4.64it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.65it/s] 36it [00:07, 4.66it/s] 37it [00:08, 4.66it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.54it/s] 40it [00:08, 4.58it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.62it/s] 43it [00:09, 4.63it/s] 44it [00:09, 4.48it/s] 45it [00:09, 4.54it/s] 46it [00:10, 4.57it/s] 47it [00:10, 4.55it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.64it/s] 50it [00:11, 4.65it/s]2025-05-25 23:33:54,117 - INFO - [Epoch 053 | Batch 0050] IWAE-loss 1257.6678 | mean log_px -0.0016 | KL -1169.34 + 51it [00:11, 4.50it/s] 52it [00:11, 4.57it/s] 53it [00:11, 4.57it/s] 54it [00:11, 4.59it/s] 55it [00:12, 4.62it/s] 56it [00:12, 4.64it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.67it/s] 59it [00:12, 4.68it/s] 60it [00:13, 4.68it/s] 61it [00:13, 4.67it/s] 62it [00:13, 4.69it/s] 63it [00:13, 4.69it/s] 64it [00:14, 4.52it/s] 65it [00:14, 4.57it/s] 66it [00:14, 4.44it/s] 67it [00:14, 4.53it/s] 68it [00:14, 4.57it/s] 69it [00:15, 4.61it/s] 70it [00:15, 4.62it/s] 71it [00:15, 4.67it/s] 72it [00:15, 4.67it/s] 73it [00:15, 4.68it/s] 74it [00:16, 4.68it/s] 75it [00:16, 4.69it/s] 76it [00:16, 4.52it/s] 77it [00:16, 4.59it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.62it/s] 81it [00:17, 4.64it/s] 82it [00:17, 4.49it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.61it/s] 85it [00:18, 4.62it/s] 86it [00:18, 4.64it/s] 87it [00:19, 4.67it/s] 88it [00:19, 4.67it/s] 89it [00:19, 4.51it/s] 90it [00:19, 4.57it/s] 91it [00:19, 4.61it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.64it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.65it/s] 96it [00:20, 4.67it/s] 97it [00:21, 4.68it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.67it/s] 100it [00:21, 4.64it/s]2025-05-25 23:34:04,950 - INFO - [Epoch 053 | Batch 0100] IWAE-loss 1240.2892 | mean log_px -0.0014 | KL -1168.91 + 101it [00:22, 4.62it/s] 102it [00:22, 4.42it/s] 103it [00:22, 4.49it/s] 104it [00:22, 4.54it/s] 105it [00:22, 4.58it/s] 106it [00:23, 4.61it/s] 107it [00:23, 4.61it/s] 108it [00:23, 4.62it/s] 109it [00:23, 4.62it/s] 110it [00:24, 4.62it/s] 111it [00:24, 4.63it/s] 112it [00:24, 4.62it/s] 113it [00:24, 4.64it/s] 114it [00:24, 4.64it/s] 115it [00:25, 4.65it/s] 116it [00:25, 4.66it/s] 117it [00:25, 4.67it/s] 118it [00:25, 4.66it/s] 119it [00:25, 4.66it/s] 120it [00:26, 4.66it/s] 121it [00:26, 4.67it/s] 122it [00:26, 4.66it/s] 123it [00:26, 4.67it/s] 124it [00:27, 4.67it/s] 125it [00:27, 4.68it/s] 126it [00:27, 4.67it/s] 127it [00:27, 4.69it/s] 128it [00:27, 4.66it/s] 129it [00:28, 4.68it/s] 130it [00:28, 4.69it/s] 131it [00:28, 4.70it/s] 132it [00:28, 4.68it/s] 133it [00:28, 4.68it/s] 134it [00:29, 4.55it/s] 135it [00:29, 4.60it/s] 136it [00:29, 4.62it/s] 137it [00:29, 4.64it/s] 138it [00:30, 4.65it/s] 139it [00:30, 4.67it/s] 140it [00:30, 4.67it/s] 141it [00:30, 4.67it/s] 142it [00:30, 4.68it/s] 143it [00:31, 4.68it/s] 144it [00:31, 4.68it/s] 145it [00:31, 4.68it/s] 146it [00:31, 4.52it/s] 147it [00:31, 4.58it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.62it/s] 150it [00:32, 4.62it/s]2025-05-25 23:34:15,740 - INFO - [Epoch 053 | Batch 0150] IWAE-loss 1517.0568 | mean log_px -0.0129 | KL -1162.64 + 151it [00:32, 4.63it/s] 152it [00:33, 4.47it/s] 153it [00:33, 4.51it/s] 154it [00:33, 4.54it/s] 155it [00:33, 4.58it/s] 156it [00:33, 4.60it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.47it/s] 159it [00:34, 4.54it/s] 160it [00:34, 4.57it/s] 161it [00:35, 4.59it/s] 162it [00:35, 4.60it/s] 163it [00:35, 4.62it/s] 164it [00:35, 4.51it/s] 165it [00:35, 4.57it/s] 166it [00:36, 4.58it/s] 167it [00:36, 4.60it/s] 168it [00:36, 4.59it/s] 169it [00:36, 4.59it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.63it/s] 172it [00:37, 4.63it/s] 173it [00:37, 4.52it/s] 174it [00:37, 4.57it/s] 175it [00:38, 4.60it/s] 176it [00:38, 4.61it/s] 177it [00:38, 4.63it/s] 178it [00:38, 4.64it/s] 179it [00:38, 4.65it/s] 180it [00:39, 4.64it/s] 181it [00:39, 4.65it/s] 182it [00:39, 4.66it/s] 183it [00:39, 4.66it/s] 184it [00:40, 4.66it/s] 185it [00:40, 4.66it/s] 186it [00:40, 4.65it/s] 187it [00:40, 4.65it/s] 188it [00:40, 4.65it/s] 189it [00:41, 4.66it/s] 190it [00:41, 4.65it/s] 191it [00:41, 4.67it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.66it/s] 194it [00:42, 4.66it/s] 195it [00:42, 4.55it/s] 196it [00:42, 4.60it/s] 196it [00:42, 4.59it/s] +2025-05-25 23:34:25,649 - INFO - Epoch: 53, Objective: tensor([1300.9849], device='cuda:0', grad_fn=), Loss: 0.0023734073620289564, KL/n: 23.757631301879883 + 0it [00:00, ?it/s]2025-05-25 23:34:26,056 - INFO - [Epoch 054 | Batch 0000] IWAE-loss 1428.1246 | mean log_px -0.0070 | KL -1163.56 + 1it [00:00, 2.78it/s] 2it [00:00, 3.66it/s] 3it [00:00, 3.96it/s] 4it [00:01, 4.21it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.43it/s] 8it [00:01, 4.37it/s] 9it [00:02, 4.48it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.58it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.63it/s] 15it [00:03, 4.64it/s] 16it [00:03, 4.65it/s] 17it [00:03, 4.66it/s] 18it [00:04, 4.64it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.66it/s] 22it [00:04, 4.66it/s] 23it [00:05, 4.67it/s] 24it [00:05, 4.57it/s] 25it [00:05, 4.62it/s] 26it [00:05, 4.62it/s] 27it [00:05, 4.64it/s] 28it [00:06, 4.65it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.51it/s] 31it [00:06, 4.57it/s] 32it [00:07, 4.59it/s] 33it [00:07, 4.62it/s] 34it [00:07, 4.62it/s] 35it [00:07, 4.65it/s] 36it [00:07, 4.65it/s] 37it [00:08, 4.66it/s] 38it [00:08, 4.66it/s] 39it [00:08, 4.65it/s] 40it [00:08, 4.63it/s] 41it [00:09, 4.64it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.59it/s] 44it [00:09, 4.61it/s] 45it [00:09, 4.63it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.64it/s] 49it [00:10, 4.65it/s] 50it [00:11, 4.43it/s]2025-05-25 23:34:36,941 - INFO - [Epoch 054 | Batch 0050] IWAE-loss 1222.4982 | mean log_px -0.0012 | KL -1156.77 + 51it [00:11, 4.51it/s] 52it [00:11, 4.55it/s] 53it [00:11, 4.58it/s] 54it [00:11, 4.61it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.64it/s] 57it [00:12, 4.64it/s] 58it [00:12, 4.63it/s] 59it [00:12, 4.64it/s] 60it [00:13, 4.60it/s] 61it [00:13, 4.47it/s] 62it [00:13, 4.51it/s] 63it [00:13, 4.54it/s] 64it [00:14, 4.59it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.52it/s] 67it [00:14, 4.60it/s] 68it [00:14, 4.63it/s] 69it [00:15, 4.66it/s] 70it [00:15, 4.67it/s] 71it [00:15, 4.69it/s] 72it [00:15, 4.53it/s] 73it [00:15, 4.59it/s] 74it [00:16, 4.62it/s] 75it [00:16, 4.65it/s] 76it [00:16, 4.67it/s] 77it [00:16, 4.49it/s] 78it [00:17, 4.57it/s] 79it [00:17, 4.61it/s] 80it [00:17, 4.64it/s] 81it [00:17, 4.67it/s] 82it [00:17, 4.49it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.56it/s] 85it [00:18, 4.60it/s] 86it [00:18, 4.59it/s] 87it [00:19, 4.65it/s] 88it [00:19, 4.65it/s] 89it [00:19, 4.68it/s] 90it [00:19, 3.68it/s] 91it [00:20, 3.94it/s] 92it [00:20, 4.14it/s] 93it [00:20, 4.16it/s] 94it [00:20, 4.32it/s] 95it [00:20, 4.44it/s] 96it [00:21, 4.42it/s] 97it [00:21, 4.47it/s] 98it [00:21, 4.52it/s] 99it [00:21, 4.42it/s] 100it [00:22, 4.50it/s]2025-05-25 23:34:48,003 - INFO - [Epoch 054 | Batch 0100] IWAE-loss 1336.7174 | mean log_px -0.0042 | KL -1150.52 + 101it [00:22, 4.54it/s] 102it [00:22, 4.58it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.65it/s] 105it [00:23, 4.67it/s] 106it [00:23, 4.68it/s] 107it [00:23, 4.70it/s] 108it [00:23, 4.70it/s] 109it [00:23, 4.70it/s] 110it [00:24, 4.70it/s] 111it [00:24, 4.71it/s] 112it [00:24, 4.49it/s] 113it [00:24, 4.57it/s] 114it [00:25, 4.61it/s] 115it [00:25, 4.65it/s] 116it [00:25, 4.67it/s] 117it [00:25, 4.68it/s] 118it [00:25, 4.70it/s] 119it [00:26, 4.71it/s] 120it [00:26, 4.71it/s] 121it [00:26, 4.72it/s] 122it [00:26, 4.72it/s] 123it [00:26, 4.72it/s] 124it [00:27, 4.55it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.64it/s] 127it [00:27, 4.66it/s] 128it [00:28, 4.68it/s] 129it [00:28, 4.70it/s] 130it [00:28, 4.70it/s] 131it [00:28, 4.72it/s] 132it [00:28, 4.71it/s] 133it [00:29, 4.71it/s] 134it [00:29, 4.70it/s] 135it [00:29, 4.70it/s] 136it [00:29, 4.70it/s] 137it [00:29, 4.54it/s] 138it [00:30, 4.59it/s] 139it [00:30, 4.63it/s] 140it [00:30, 4.65it/s] 141it [00:30, 4.67it/s] 142it [00:31, 4.68it/s] 143it [00:31, 4.52it/s] 144it [00:31, 4.58it/s] 145it [00:31, 4.61it/s] 146it [00:31, 4.63it/s] 147it [00:32, 4.65it/s] 148it [00:32, 4.66it/s] 149it [00:32, 4.68it/s] 150it [00:32, 4.68it/s]2025-05-25 23:34:58,724 - INFO - [Epoch 054 | Batch 0150] IWAE-loss 1233.8479 | mean log_px -0.0012 | KL -1151.34 + 151it [00:32, 4.69it/s] 152it [00:33, 4.70it/s] 153it [00:33, 4.71it/s] 154it [00:33, 4.72it/s] 155it [00:33, 4.72it/s] 156it [00:34, 4.72it/s] 157it [00:34, 4.72it/s] 158it [00:34, 4.71it/s] 159it [00:34, 4.72it/s] 160it [00:34, 4.72it/s] 161it [00:35, 4.72it/s] 162it [00:35, 4.71it/s] 163it [00:35, 4.72it/s] 164it [00:35, 4.71it/s] 165it [00:35, 4.64it/s] 166it [00:36, 4.67it/s] 167it [00:36, 4.69it/s] 168it [00:36, 4.63it/s] 169it [00:36, 4.48it/s] 170it [00:37, 4.55it/s] 171it [00:37, 4.60it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.67it/s] 174it [00:37, 4.68it/s] 175it [00:38, 4.69it/s] 176it [00:38, 4.70it/s] 177it [00:38, 4.54it/s] 178it [00:38, 4.61it/s] 179it [00:39, 4.64it/s] 180it [00:39, 4.66it/s] 181it [00:39, 4.68it/s] 182it [00:39, 4.68it/s] 183it [00:39, 4.70it/s] 184it [00:40, 4.70it/s] 185it [00:40, 4.71it/s] 186it [00:40, 4.71it/s] 187it [00:40, 4.71it/s] 188it [00:40, 4.71it/s] 189it [00:41, 4.72it/s] 190it [00:41, 4.71it/s] 191it [00:41, 4.72it/s] 192it [00:41, 4.72it/s] 193it [00:41, 4.55it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.40it/s] 196it [00:42, 4.49it/s] 196it [00:42, 4.59it/s] +2025-05-25 23:35:08,530 - INFO - Epoch: 54, Objective: tensor([1524.9691], device='cuda:0', grad_fn=), Loss: 0.006559988018125296, KL/n: 23.41026496887207 + 0it [00:00, ?it/s]2025-05-25 23:35:08,909 - INFO - [Epoch 055 | Batch 0000] IWAE-loss 1968.7968 | mean log_px -0.0207 | KL -1144.99 + 1it [00:00, 3.30it/s] 2it [00:00, 3.98it/s] 3it [00:00, 4.25it/s] 4it [00:01, 3.99it/s] 5it [00:01, 4.23it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.48it/s] 8it [00:01, 4.55it/s] 9it [00:02, 4.60it/s] 10it [00:02, 4.63it/s] 11it [00:02, 4.50it/s] 12it [00:02, 4.57it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.65it/s] 15it [00:03, 4.67it/s] 16it [00:03, 4.50it/s] 17it [00:03, 4.58it/s] 18it [00:04, 4.61it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.66it/s] 21it [00:04, 4.64it/s] 22it [00:04, 4.49it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.61it/s] 25it [00:05, 4.64it/s] 26it [00:05, 4.65it/s] 27it [00:05, 4.67it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.53it/s] 30it [00:06, 4.59it/s] 31it [00:06, 4.64it/s] 32it [00:07, 4.66it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.69it/s] 35it [00:07, 4.53it/s] 36it [00:07, 4.59it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.67it/s] 40it [00:08, 4.68it/s] 41it [00:08, 4.70it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.62it/s] 44it [00:09, 4.65it/s] 45it [00:09, 4.67it/s] 46it [00:10, 4.68it/s] 47it [00:10, 4.70it/s] 48it [00:10, 4.54it/s] 49it [00:10, 4.61it/s] 50it [00:10, 4.63it/s]2025-05-25 23:35:19,758 - INFO - [Epoch 055 | Batch 0050] IWAE-loss 1384.5171 | mean log_px -0.0034 | KL -1144.44 + 51it [00:11, 4.66it/s] 52it [00:11, 4.67it/s] 53it [00:11, 4.68it/s] 54it [00:11, 4.53it/s] 55it [00:12, 4.60it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.66it/s] 58it [00:12, 4.67it/s] 59it [00:12, 4.69it/s] 60it [00:13, 4.69it/s] 61it [00:13, 4.71it/s] 62it [00:13, 4.71it/s] 63it [00:13, 4.55it/s] 64it [00:13, 4.61it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.66it/s] 67it [00:14, 4.68it/s] 68it [00:14, 4.69it/s] 69it [00:15, 4.54it/s] 70it [00:15, 4.61it/s] 71it [00:15, 4.64it/s] 72it [00:15, 4.64it/s] 73it [00:15, 4.67it/s] 74it [00:16, 4.49it/s] 75it [00:16, 4.57it/s] 76it [00:16, 4.61it/s] 77it [00:16, 4.64it/s] 78it [00:16, 4.66it/s] 79it [00:17, 4.69it/s] 80it [00:17, 4.70it/s] 81it [00:17, 4.54it/s] 82it [00:17, 4.61it/s] 83it [00:18, 4.64it/s] 84it [00:18, 4.66it/s] 85it [00:18, 4.67it/s] 86it [00:18, 4.68it/s] 87it [00:18, 4.66it/s] 88it [00:19, 4.52it/s] 89it [00:19, 4.60it/s] 90it [00:19, 4.63it/s] 91it [00:19, 4.65it/s] 92it [00:19, 4.67it/s] 93it [00:20, 4.69it/s] 94it [00:20, 4.69it/s] 95it [00:20, 4.72it/s] 96it [00:20, 4.71it/s] 97it [00:21, 4.72it/s] 98it [00:21, 4.71it/s] 99it [00:21, 4.72it/s] 100it [00:21, 4.55it/s]2025-05-25 23:35:30,530 - INFO - [Epoch 055 | Batch 0100] IWAE-loss 1683.7357 | mean log_px -0.0097 | KL -1142.95 + 101it [00:21, 4.61it/s] 102it [00:22, 4.64it/s] 103it [00:22, 4.67it/s] 104it [00:22, 4.69it/s] 105it [00:22, 4.70it/s] 106it [00:22, 4.71it/s] 107it [00:23, 4.72it/s] 108it [00:23, 4.71it/s] 109it [00:23, 4.55it/s] 110it [00:23, 4.61it/s] 111it [00:24, 4.64it/s] 112it [00:24, 4.66it/s] 113it [00:24, 4.69it/s] 114it [00:24, 4.69it/s] 115it [00:24, 4.70it/s] 116it [00:25, 4.71it/s] 117it [00:25, 4.71it/s] 118it [00:25, 4.71it/s] 119it [00:25, 4.55it/s] 120it [00:25, 4.58it/s] 121it [00:26, 4.63it/s] 122it [00:26, 4.65it/s] 123it [00:26, 4.67it/s] 124it [00:26, 4.52it/s] 125it [00:27, 4.59it/s] 126it [00:27, 4.62it/s] 127it [00:27, 4.60it/s] 128it [00:27, 4.62it/s] 129it [00:27, 4.59it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.61it/s] 132it [00:28, 4.45it/s] 133it [00:28, 4.54it/s] 134it [00:29, 4.59it/s] 135it [00:29, 4.63it/s] 136it [00:29, 4.65it/s] 137it [00:29, 4.51it/s] 138it [00:29, 4.58it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.67it/s] 142it [00:30, 4.46it/s] 143it [00:31, 4.52it/s] 144it [00:31, 4.57it/s] 145it [00:31, 4.62it/s] 146it [00:31, 4.63it/s] 147it [00:31, 4.65it/s] 148it [00:32, 4.67it/s] 149it [00:32, 4.69it/s] 150it [00:32, 4.69it/s]2025-05-25 23:35:41,328 - INFO - [Epoch 055 | Batch 0150] IWAE-loss 1441.7352 | mean log_px -0.0088 | KL -1140.60 + 151it [00:32, 4.69it/s] 152it [00:32, 4.69it/s] 153it [00:33, 4.70it/s] 154it [00:33, 4.70it/s] 155it [00:33, 4.71it/s] 156it [00:33, 4.59it/s] 157it [00:34, 4.64it/s] 158it [00:34, 4.66it/s] 159it [00:34, 4.67it/s] 160it [00:34, 4.68it/s] 161it [00:34, 4.69it/s] 162it [00:35, 4.70it/s] 163it [00:35, 4.71it/s] 164it [00:35, 4.71it/s] 165it [00:35, 4.72it/s] 166it [00:35, 4.72it/s] 167it [00:36, 4.72it/s] 168it [00:36, 4.72it/s] 169it [00:36, 4.72it/s] 170it [00:36, 4.71it/s] 171it [00:36, 4.72it/s] 172it [00:37, 4.72it/s] 173it [00:37, 4.72it/s] 174it [00:37, 4.72it/s] 175it [00:37, 4.72it/s] 176it [00:38, 4.71it/s] 177it [00:38, 4.72it/s] 178it [00:38, 4.71it/s] 179it [00:38, 4.71it/s] 180it [00:38, 4.69it/s] 181it [00:39, 4.69it/s] 182it [00:39, 4.68it/s] 183it [00:39, 4.71it/s] 184it [00:39, 4.70it/s] 185it [00:39, 4.71it/s] 186it [00:40, 4.71it/s] 187it [00:40, 4.71it/s] 188it [00:40, 4.71it/s] 189it [00:40, 4.71it/s] 190it [00:41, 4.72it/s] 191it [00:41, 4.72it/s] 192it [00:41, 4.72it/s] 193it [00:41, 4.72it/s] 194it [00:41, 4.72it/s] 195it [00:42, 4.63it/s] 196it [00:42, 4.49it/s] 196it [00:42, 4.62it/s] +2025-05-25 23:35:51,059 - INFO - Epoch: 55, Objective: tensor([2532.4099], device='cuda:0', grad_fn=), Loss: 0.026845891028642654, KL/n: 23.29350471496582 + 0it [00:00, ?it/s]2025-05-25 23:35:51,652 - INFO - [Epoch 056 | Batch 0000] IWAE-loss 1829.8907 | mean log_px -0.0137 | KL -1141.24 + 1it [00:00, 2.75it/s] 2it [00:00, 3.63it/s] 3it [00:00, 4.05it/s] 4it [00:01, 4.29it/s] 5it [00:01, 4.43it/s] 6it [00:01, 4.52it/s] 7it [00:01, 4.42it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.58it/s] 10it [00:02, 4.62it/s] 11it [00:02, 4.65it/s] 12it [00:02, 4.66it/s] 13it [00:02, 4.68it/s] 14it [00:03, 4.57it/s] 15it [00:03, 4.63it/s] 16it [00:03, 4.65it/s] 17it [00:03, 4.67it/s] 18it [00:04, 4.68it/s] 19it [00:04, 4.70it/s] 20it [00:04, 4.70it/s] 21it [00:04, 4.71it/s] 22it [00:04, 4.71it/s] 23it [00:05, 4.71it/s] 24it [00:05, 4.71it/s] 25it [00:05, 4.71it/s] 26it [00:05, 4.57it/s] 27it [00:05, 4.63it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.67it/s] 31it [00:06, 4.70it/s] 32it [00:07, 4.70it/s] 33it [00:07, 4.71it/s] 34it [00:07, 4.68it/s] 35it [00:07, 4.53it/s] 36it [00:07, 4.60it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.67it/s] 40it [00:08, 4.68it/s] 41it [00:08, 4.70it/s] 42it [00:09, 4.70it/s] 43it [00:09, 4.71it/s] 44it [00:09, 4.70it/s] 45it [00:09, 4.55it/s] 46it [00:10, 4.61it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.63it/s] 49it [00:10, 4.66it/s] 50it [00:10, 4.67it/s]2025-05-25 23:36:02,407 - INFO - [Epoch 056 | Batch 0050] IWAE-loss 1205.6969 | mean log_px -0.0039 | KL -1133.87 + 51it [00:11, 4.69it/s] 52it [00:11, 4.69it/s] 53it [00:11, 4.70it/s] 54it [00:11, 4.55it/s] 55it [00:11, 4.62it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.67it/s] 59it [00:12, 4.68it/s] 60it [00:13, 4.69it/s] 61it [00:13, 4.54it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.64it/s] 64it [00:13, 4.66it/s] 65it [00:14, 4.67it/s] 66it [00:14, 4.68it/s] 67it [00:14, 4.70it/s] 68it [00:14, 4.53it/s] 69it [00:14, 4.61it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.66it/s] 72it [00:15, 4.68it/s] 73it [00:15, 4.69it/s] 74it [00:16, 4.69it/s] 75it [00:16, 4.71it/s] 76it [00:16, 4.54it/s] 77it [00:16, 4.61it/s] 78it [00:16, 4.65it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.68it/s] 81it [00:17, 4.70it/s] 82it [00:17, 4.70it/s] 83it [00:17, 4.70it/s] 84it [00:18, 4.71it/s] 85it [00:18, 4.72it/s] 86it [00:18, 4.72it/s] 87it [00:18, 4.68it/s] 88it [00:19, 4.69it/s] 89it [00:19, 4.70it/s] 90it [00:19, 4.65it/s] 91it [00:19, 4.43it/s] 92it [00:19, 4.51it/s] 93it [00:20, 4.57it/s] 94it [00:20, 4.61it/s] 95it [00:20, 4.62it/s] 96it [00:20, 4.64it/s] 97it [00:20, 4.64it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.68it/s] 100it [00:21, 4.52it/s]2025-05-25 23:36:13,189 - INFO - [Epoch 056 | Batch 0100] IWAE-loss 1527.7909 | mean log_px -0.0108 | KL -1131.17 + 101it [00:21, 4.59it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.65it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.52it/s] 106it [00:22, 4.58it/s] 107it [00:23, 4.63it/s] 108it [00:23, 4.65it/s] 109it [00:23, 4.67it/s] 110it [00:23, 4.68it/s] 111it [00:24, 4.69it/s] 112it [00:24, 4.69it/s] 113it [00:24, 4.71it/s] 114it [00:24, 4.71it/s] 115it [00:24, 4.71it/s] 116it [00:25, 4.72it/s] 117it [00:25, 4.72it/s] 118it [00:25, 4.72it/s] 119it [00:25, 4.72it/s] 120it [00:25, 4.72it/s] 121it [00:26, 4.72it/s] 122it [00:26, 4.63it/s] 123it [00:26, 4.68it/s] 124it [00:26, 4.68it/s] 125it [00:26, 4.68it/s] 126it [00:27, 4.69it/s] 127it [00:27, 4.70it/s] 128it [00:27, 4.70it/s] 129it [00:27, 4.70it/s] 130it [00:28, 4.70it/s] 131it [00:28, 4.71it/s] 132it [00:28, 4.66it/s] 133it [00:28, 4.68it/s] 134it [00:28, 4.68it/s] 135it [00:29, 4.53it/s] 136it [00:29, 4.60it/s] 137it [00:29, 4.63it/s] 138it [00:29, 4.66it/s] 139it [00:29, 4.69it/s] 140it [00:30, 4.64it/s] 141it [00:30, 4.68it/s] 142it [00:30, 4.69it/s] 143it [00:30, 4.57it/s] 144it [00:31, 4.62it/s] 145it [00:31, 4.66it/s] 146it [00:31, 4.67it/s] 147it [00:31, 4.68it/s] 148it [00:31, 4.69it/s] 149it [00:32, 4.70it/s] 150it [00:32, 4.70it/s]2025-05-25 23:36:23,884 - INFO - [Epoch 056 | Batch 0150] IWAE-loss 1384.1519 | mean log_px -0.0041 | KL -1127.91 + 151it [00:32, 4.72it/s] 152it [00:32, 4.71it/s] 153it [00:32, 4.71it/s] 154it [00:33, 4.69it/s] 155it [00:33, 4.73it/s] 156it [00:33, 4.71it/s] 157it [00:33, 4.56it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.63it/s] 160it [00:34, 4.66it/s] 161it [00:34, 4.69it/s] 162it [00:34, 4.69it/s] 163it [00:35, 4.70it/s] 164it [00:35, 4.70it/s] 165it [00:35, 4.71it/s] 166it [00:35, 4.70it/s] 167it [00:36, 4.57it/s] 168it [00:36, 4.62it/s] 169it [00:36, 4.66it/s] 170it [00:36, 4.67it/s] 171it [00:36, 4.69it/s] 172it [00:37, 4.70it/s] 173it [00:37, 4.71it/s] 174it [00:37, 4.71it/s] 175it [00:37, 4.72it/s] 176it [00:37, 4.72it/s] 177it [00:38, 4.72it/s] 178it [00:38, 4.72it/s] 179it [00:38, 4.73it/s] 180it [00:38, 4.72it/s] 181it [00:38, 4.73it/s] 182it [00:39, 4.72it/s] 183it [00:39, 4.72it/s] 184it [00:39, 4.73it/s] 185it [00:39, 4.73it/s] 186it [00:40, 4.72it/s] 187it [00:40, 4.73it/s] 188it [00:40, 4.73it/s] 189it [00:40, 4.73it/s] 190it [00:40, 4.72it/s] 191it [00:41, 4.72it/s] 192it [00:41, 4.72it/s] 193it [00:41, 4.73it/s] 194it [00:41, 4.52it/s] 195it [00:41, 4.48it/s] 196it [00:42, 4.56it/s] 196it [00:42, 4.64it/s] +2025-05-25 23:36:33,640 - INFO - Epoch: 56, Objective: tensor([1635.1464], device='cuda:0', grad_fn=), Loss: 0.0118552902713418, KL/n: 23.14141273498535 + 0it [00:00, ?it/s]2025-05-25 23:36:34,057 - INFO - [Epoch 057 | Batch 0000] IWAE-loss 1257.1718 | mean log_px -0.0018 | KL -1129.48 + 1it [00:00, 2.93it/s] 2it [00:00, 3.70it/s] 3it [00:00, 4.06it/s] 4it [00:00, 4.28it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.46it/s] 7it [00:01, 4.33it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.48it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.62it/s] 15it [00:03, 4.61it/s] 16it [00:03, 4.45it/s] 17it [00:03, 4.54it/s] 18it [00:04, 4.58it/s] 19it [00:04, 4.57it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.55it/s] 22it [00:04, 4.57it/s] 23it [00:05, 4.60it/s] 24it [00:05, 4.59it/s] 25it [00:05, 4.46it/s] 26it [00:06, 3.58it/s] 27it [00:06, 3.81it/s] 28it [00:06, 4.03it/s] 29it [00:06, 4.20it/s] 30it [00:06, 4.18it/s] 31it [00:07, 4.32it/s] 32it [00:07, 4.37it/s] 33it [00:07, 4.46it/s] 34it [00:07, 4.47it/s] 35it [00:08, 4.53it/s] 36it [00:08, 4.58it/s] 37it [00:08, 4.40it/s] 38it [00:08, 4.48it/s] 39it [00:08, 4.55it/s] 40it [00:09, 4.59it/s] 41it [00:09, 4.63it/s] 42it [00:09, 4.51it/s] 43it [00:09, 4.59it/s] 44it [00:09, 4.62it/s] 45it [00:10, 4.65it/s] 46it [00:10, 4.67it/s] 47it [00:10, 4.69it/s] 48it [00:10, 4.45it/s] 49it [00:11, 4.55it/s] 50it [00:11, 4.59it/s]2025-05-25 23:36:45,213 - INFO - [Epoch 057 | Batch 0050] IWAE-loss 1460.0142 | mean log_px -0.0058 | KL -1131.17 + 51it [00:11, 4.63it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.49it/s] 54it [00:12, 4.57it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.64it/s] 57it [00:12, 4.65it/s] 58it [00:13, 4.65it/s] 59it [00:13, 4.67it/s] 60it [00:13, 4.68it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.56it/s] 63it [00:14, 4.58it/s] 64it [00:14, 4.59it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.68it/s] 68it [00:15, 4.67it/s] 69it [00:15, 4.69it/s] 70it [00:15, 4.68it/s] 71it [00:15, 4.63it/s] 72it [00:16, 4.45it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.43it/s] 75it [00:16, 4.52it/s] 76it [00:16, 4.56it/s] 77it [00:17, 4.61it/s] 78it [00:17, 4.58it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.60it/s] 81it [00:18, 4.62it/s] 82it [00:18, 4.63it/s] 83it [00:18, 4.47it/s] 84it [00:18, 4.56it/s] 85it [00:18, 4.59it/s] 86it [00:19, 4.60it/s] 87it [00:19, 4.64it/s] 88it [00:19, 4.66it/s] 89it [00:19, 4.67it/s] 90it [00:19, 4.68it/s] 91it [00:20, 4.69it/s] 92it [00:20, 4.69it/s] 93it [00:20, 4.53it/s] 94it [00:20, 4.59it/s] 95it [00:21, 4.63it/s] 96it [00:21, 4.66it/s] 97it [00:21, 4.66it/s] 98it [00:21, 4.68it/s] 99it [00:21, 4.62it/s] 100it [00:22, 4.44it/s]2025-05-25 23:36:56,088 - INFO - [Epoch 057 | Batch 0100] IWAE-loss 1242.8251 | mean log_px -0.0040 | KL -1129.03 + 101it [00:22, 4.50it/s] 102it [00:22, 4.46it/s] 103it [00:22, 4.50it/s] 104it [00:23, 4.53it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.40it/s] 107it [00:23, 4.43it/s] 108it [00:23, 4.49it/s] 109it [00:24, 4.52it/s] 110it [00:24, 4.53it/s] 111it [00:24, 4.43it/s] 112it [00:24, 4.49it/s] 113it [00:25, 4.53it/s] 114it [00:25, 4.55it/s] 115it [00:25, 4.56it/s] 116it [00:25, 4.57it/s] 117it [00:25, 4.53it/s] 118it [00:26, 4.41it/s] 119it [00:26, 4.50it/s] 120it [00:26, 4.49it/s] 121it [00:26, 4.50it/s] 122it [00:27, 4.53it/s] 123it [00:27, 4.51it/s] 124it [00:27, 4.53it/s] 125it [00:27, 4.52it/s] 126it [00:27, 4.53it/s] 127it [00:28, 4.55it/s] 128it [00:28, 4.41it/s] 129it [00:28, 4.46it/s] 130it [00:28, 4.50it/s] 131it [00:29, 4.53it/s] 132it [00:29, 4.56it/s] 133it [00:29, 4.58it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.57it/s] 136it [00:30, 4.41it/s] 137it [00:30, 4.45it/s] 138it [00:30, 4.50it/s] 139it [00:30, 4.53it/s] 140it [00:31, 4.55it/s] 141it [00:31, 4.57it/s] 142it [00:31, 4.53it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.53it/s] 145it [00:32, 4.55it/s] 146it [00:32, 4.54it/s] 147it [00:32, 4.54it/s] 148it [00:32, 4.55it/s] 149it [00:33, 4.44it/s] 150it [00:33, 4.51it/s]2025-05-25 23:37:07,173 - INFO - [Epoch 057 | Batch 0150] IWAE-loss 1292.4027 | mean log_px -0.0033 | KL -1125.85 + 151it [00:33, 4.49it/s] 152it [00:33, 4.52it/s] 153it [00:33, 4.55it/s] 154it [00:34, 4.55it/s] 155it [00:34, 4.56it/s] 156it [00:34, 4.57it/s] 157it [00:34, 4.51it/s] 158it [00:34, 4.51it/s] 159it [00:35, 4.53it/s] 160it [00:35, 4.53it/s] 161it [00:35, 4.34it/s] 162it [00:35, 4.22it/s] 163it [00:36, 4.27it/s] 164it [00:36, 4.34it/s] 165it [00:36, 4.43it/s] 166it [00:36, 4.47it/s] 167it [00:37, 4.52it/s] 168it [00:37, 4.55it/s] 169it [00:37, 4.57it/s] 170it [00:37, 4.57it/s] 171it [00:37, 4.59it/s] 172it [00:38, 4.58it/s] 173it [00:38, 4.57it/s] 174it [00:38, 4.59it/s] 175it [00:38, 4.55it/s] 176it [00:39, 4.53it/s] 177it [00:39, 4.55it/s] 178it [00:39, 4.39it/s] 179it [00:39, 4.39it/s] 180it [00:39, 4.27it/s] 181it [00:40, 4.34it/s] 182it [00:40, 4.39it/s] 183it [00:40, 4.43it/s] 184it [00:40, 4.39it/s] 185it [00:41, 4.39it/s] 186it [00:41, 4.39it/s] 187it [00:41, 4.41it/s] 188it [00:41, 4.29it/s] 189it [00:42, 4.33it/s] 190it [00:42, 4.36it/s] 191it [00:42, 4.41it/s] 192it [00:42, 4.40it/s] 193it [00:42, 4.39it/s] 194it [00:43, 4.44it/s] 195it [00:43, 4.36it/s] 196it [00:43, 4.36it/s] 196it [00:43, 4.49it/s] +2025-05-25 23:37:17,443 - INFO - Epoch: 57, Objective: tensor([1774.2374], device='cuda:0', grad_fn=), Loss: 0.010805794037878513, KL/n: 22.974790573120117 + 0it [00:00, ?it/s]2025-05-25 23:37:17,854 - INFO - [Epoch 058 | Batch 0000] IWAE-loss 1154.4401 | mean log_px -0.0014 | KL -1126.00 + 1it [00:00, 2.96it/s] 2it [00:00, 3.69it/s] 3it [00:00, 3.95it/s] 4it [00:01, 4.17it/s] 5it [00:01, 4.11it/s] 6it [00:01, 4.31it/s] 7it [00:01, 4.41it/s] 8it [00:01, 4.48it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.51it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.57it/s] 13it [00:03, 4.35it/s] 14it [00:03, 4.43it/s] 15it [00:03, 4.49it/s] 16it [00:03, 4.55it/s] 17it [00:03, 4.51it/s] 18it [00:04, 4.51it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.43it/s] 21it [00:04, 4.44it/s] 22it [00:05, 4.46it/s] 23it [00:05, 4.50it/s] 24it [00:05, 4.50it/s] 25it [00:05, 4.55it/s] 26it [00:05, 4.54it/s] 27it [00:06, 4.57it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.64it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.57it/s] 32it [00:07, 4.49it/s] 33it [00:07, 4.51it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.53it/s] 36it [00:08, 4.58it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.60it/s] 39it [00:08, 4.61it/s] 40it [00:08, 4.49it/s] 41it [00:09, 4.55it/s] 42it [00:09, 4.59it/s] 43it [00:09, 4.55it/s] 44it [00:09, 4.50it/s] 45it [00:10, 4.56it/s] 46it [00:10, 4.56it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.41it/s] 50it [00:11, 4.45it/s]2025-05-25 23:37:28,913 - INFO - [Epoch 058 | Batch 0050] IWAE-loss 1403.6750 | mean log_px -0.0124 | KL -1118.93 + 51it [00:11, 4.51it/s] 52it [00:11, 4.56it/s] 53it [00:11, 4.60it/s] 54it [00:12, 4.49it/s] 55it [00:12, 4.40it/s] 56it [00:12, 4.50it/s] 57it [00:12, 4.51it/s] 58it [00:12, 4.47it/s] 59it [00:13, 4.49it/s] 60it [00:13, 4.48it/s] 61it [00:13, 4.55it/s] 62it [00:13, 4.57it/s] 63it [00:14, 4.62it/s] 64it [00:14, 4.64it/s] 65it [00:14, 4.61it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.54it/s] 68it [00:15, 4.60it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.58it/s] 71it [00:15, 4.55it/s] 72it [00:16, 4.36it/s] 73it [00:16, 4.45it/s] 74it [00:16, 4.50it/s] 75it [00:16, 4.55it/s] 76it [00:16, 4.50it/s] 77it [00:17, 4.52it/s] 78it [00:17, 4.56it/s] 79it [00:17, 4.55it/s] 80it [00:17, 4.43it/s] 81it [00:18, 4.46it/s] 82it [00:18, 4.50it/s] 83it [00:18, 4.56it/s] 84it [00:18, 4.55it/s] 85it [00:18, 4.43it/s] 86it [00:19, 4.48it/s] 87it [00:19, 4.55it/s] 88it [00:19, 4.55it/s] 89it [00:19, 4.60it/s] 90it [00:20, 4.46it/s] 91it [00:20, 4.49it/s] 92it [00:20, 4.54it/s] 93it [00:20, 4.51it/s] 94it [00:20, 4.49it/s] 95it [00:21, 4.52it/s] 96it [00:21, 4.53it/s] 97it [00:21, 4.58it/s] 98it [00:21, 4.59it/s] 99it [00:22, 4.53it/s] 100it [00:22, 4.55it/s]2025-05-25 23:37:39,958 - INFO - [Epoch 058 | Batch 0100] IWAE-loss 1223.3649 | mean log_px -0.0015 | KL -1114.54 + 101it [00:22, 4.52it/s] 102it [00:22, 4.45it/s] 103it [00:22, 4.38it/s] 104it [00:23, 4.40it/s] 105it [00:23, 4.44it/s] 106it [00:23, 4.48it/s] 107it [00:23, 4.54it/s] 108it [00:24, 4.30it/s] 109it [00:24, 4.34it/s] 110it [00:24, 4.44it/s] 111it [00:24, 4.50it/s] 112it [00:24, 4.39it/s] 113it [00:25, 4.43it/s] 114it [00:25, 4.48it/s] 115it [00:25, 4.51it/s] 116it [00:25, 4.53it/s] 117it [00:26, 4.54it/s] 118it [00:26, 4.54it/s] 119it [00:26, 4.56it/s] 120it [00:26, 4.56it/s] 121it [00:26, 4.42it/s] 122it [00:27, 4.45it/s] 123it [00:27, 4.46it/s] 124it [00:27, 4.44it/s] 125it [00:27, 4.46it/s] 126it [00:28, 4.42it/s] 127it [00:28, 4.41it/s] 128it [00:28, 4.40it/s] 129it [00:28, 4.43it/s] 130it [00:28, 4.46it/s] 131it [00:29, 4.46it/s] 132it [00:29, 4.46it/s] 133it [00:29, 4.37it/s] 134it [00:29, 4.38it/s] 135it [00:30, 4.38it/s] 136it [00:30, 4.44it/s] 137it [00:30, 4.48it/s] 138it [00:30, 4.52it/s] 139it [00:30, 4.51it/s] 140it [00:31, 4.50it/s] 141it [00:31, 4.54it/s] 142it [00:31, 4.51it/s] 143it [00:31, 4.49it/s] 144it [00:32, 4.52it/s] 145it [00:32, 4.54it/s] 146it [00:32, 4.56it/s] 147it [00:32, 4.56it/s] 148it [00:32, 4.39it/s] 149it [00:33, 4.43it/s] 150it [00:33, 4.45it/s]2025-05-25 23:37:51,175 - INFO - [Epoch 058 | Batch 0150] IWAE-loss 1539.7325 | mean log_px -0.0100 | KL -1111.33 + 151it [00:33, 4.44it/s] 152it [00:33, 4.46it/s] 153it [00:34, 4.48it/s] 154it [00:34, 4.48it/s] 155it [00:34, 4.49it/s] 156it [00:34, 4.36it/s] 157it [00:35, 4.43it/s] 158it [00:35, 4.47it/s] 159it [00:35, 4.42it/s] 160it [00:35, 4.29it/s] 161it [00:35, 4.38it/s] 162it [00:36, 4.44it/s] 163it [00:36, 4.44it/s] 164it [00:36, 4.49it/s] 165it [00:36, 4.50it/s] 166it [00:37, 4.53it/s] 167it [00:37, 4.48it/s] 168it [00:37, 4.50it/s] 169it [00:37, 4.51it/s] 170it [00:37, 4.48it/s] 171it [00:38, 4.51it/s] 172it [00:38, 4.48it/s] 173it [00:38, 4.52it/s] 174it [00:38, 4.45it/s] 175it [00:39, 4.46it/s] 176it [00:39, 4.48it/s] 177it [00:39, 4.50it/s] 178it [00:39, 4.40it/s] 179it [00:39, 4.47it/s] 180it [00:40, 4.50it/s] 181it [00:40, 4.52it/s] 182it [00:40, 4.55it/s] 183it [00:40, 4.47it/s] 184it [00:41, 4.49it/s] 185it [00:41, 4.52it/s] 186it [00:41, 4.53it/s] 187it [00:41, 4.54it/s] 188it [00:41, 4.53it/s] 189it [00:42, 4.54it/s] 190it [00:42, 4.51it/s] 191it [00:42, 4.50it/s] 192it [00:42, 4.48it/s] 193it [00:43, 4.51it/s] 194it [00:43, 4.53it/s] 195it [00:43, 4.38it/s] 196it [00:43, 4.43it/s] 196it [00:43, 4.48it/s] +2025-05-25 23:38:01,366 - INFO - Epoch: 58, Objective: tensor([1163.4995], device='cuda:0', grad_fn=), Loss: 0.0014143032021820545, KL/n: 22.712282180786133 + 0it [00:00, ?it/s]2025-05-25 23:38:01,952 - INFO - [Epoch 059 | Batch 0000] IWAE-loss 1306.7094 | mean log_px -0.0034 | KL -1115.00 + 1it [00:00, 2.98it/s] 2it [00:00, 3.77it/s] 3it [00:00, 3.94it/s] 4it [00:01, 4.19it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.32it/s] 7it [00:01, 4.37it/s] 8it [00:01, 4.32it/s] 9it [00:02, 4.39it/s] 10it [00:02, 4.40it/s] 11it [00:02, 4.46it/s] 12it [00:02, 4.30it/s] 13it [00:03, 4.39it/s] 14it [00:03, 4.40it/s] 15it [00:03, 4.46it/s] 16it [00:03, 4.47it/s] 17it [00:03, 4.49it/s] 18it [00:04, 4.44it/s] 19it [00:04, 4.46it/s] 20it [00:04, 4.47it/s] 21it [00:04, 4.45it/s] 22it [00:05, 4.41it/s] 23it [00:05, 4.42it/s] 24it [00:05, 4.44it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.48it/s] 27it [00:06, 4.49it/s] 28it [00:06, 4.52it/s] 29it [00:06, 4.47it/s] 30it [00:06, 4.48it/s] 31it [00:07, 4.50it/s] 32it [00:07, 4.48it/s] 33it [00:07, 4.36it/s] 34it [00:07, 4.42it/s] 35it [00:07, 4.44it/s] 36it [00:08, 4.44it/s] 37it [00:08, 4.48it/s] 38it [00:08, 4.50it/s] 39it [00:08, 4.39it/s] 40it [00:09, 4.47it/s] 41it [00:09, 4.45it/s] 42it [00:09, 4.51it/s] 43it [00:09, 4.53it/s] 44it [00:09, 4.47it/s] 45it [00:10, 4.51it/s] 46it [00:10, 4.53it/s] 47it [00:10, 4.55it/s] 48it [00:10, 4.55it/s] 49it [00:11, 4.35it/s] 50it [00:11, 4.44it/s]2025-05-25 23:38:13,173 - INFO - [Epoch 059 | Batch 0050] IWAE-loss 1501.0148 | mean log_px -0.0083 | KL -1108.41 + 51it [00:11, 4.44it/s] 52it [00:11, 4.46it/s] 53it [00:11, 4.48it/s] 54it [00:12, 4.52it/s] 55it [00:12, 4.53it/s] 56it [00:12, 4.46it/s] 57it [00:12, 4.49it/s] 58it [00:13, 4.50it/s] 59it [00:13, 4.52it/s] 60it [00:13, 4.55it/s] 61it [00:13, 4.55it/s] 62it [00:13, 4.51it/s] 63it [00:14, 4.53it/s] 64it [00:14, 4.46it/s] 65it [00:14, 4.37it/s] 66it [00:14, 4.35it/s] 67it [00:15, 4.44it/s] 68it [00:15, 4.50it/s] 69it [00:15, 4.55it/s] 70it [00:15, 4.57it/s] 71it [00:15, 4.56it/s] 72it [00:16, 4.45it/s] 73it [00:16, 4.53it/s] 74it [00:16, 4.55it/s] 75it [00:16, 4.43it/s] 76it [00:17, 4.49it/s] 77it [00:17, 4.38it/s] 78it [00:17, 4.30it/s] 79it [00:17, 4.33it/s] 80it [00:18, 4.39it/s] 81it [00:18, 4.45it/s] 82it [00:18, 4.49it/s] 83it [00:18, 4.53it/s] 84it [00:18, 4.51it/s] 85it [00:19, 4.54it/s] 86it [00:19, 4.56it/s] 87it [00:19, 4.58it/s] 88it [00:19, 4.46it/s] 89it [00:20, 4.51it/s] 90it [00:20, 4.47it/s] 91it [00:20, 4.37it/s] 92it [00:20, 4.33it/s] 93it [00:20, 4.42it/s] 94it [00:21, 4.44it/s] 95it [00:21, 4.45it/s] 96it [00:21, 4.46it/s] 97it [00:21, 4.44it/s] 98it [00:22, 4.34it/s] 99it [00:22, 4.33it/s] 100it [00:22, 4.36it/s]2025-05-25 23:38:24,384 - INFO - [Epoch 059 | Batch 0100] IWAE-loss 1170.6613 | mean log_px -0.0009 | KL -1106.82 + 101it [00:22, 4.40it/s] 102it [00:22, 4.44it/s] 103it [00:23, 4.39it/s] 104it [00:23, 4.49it/s] 105it [00:23, 4.53it/s] 106it [00:23, 4.59it/s] 107it [00:24, 4.62it/s] 108it [00:24, 4.64it/s] 109it [00:24, 4.67it/s] 110it [00:24, 4.65it/s] 111it [00:24, 4.62it/s] 112it [00:25, 4.64it/s] 113it [00:25, 4.51it/s] 114it [00:25, 4.54it/s] 115it [00:25, 4.51it/s] 116it [00:26, 4.55it/s] 117it [00:26, 4.55it/s] 118it [00:26, 4.58it/s] 119it [00:26, 4.56it/s] 120it [00:26, 4.58it/s] 121it [00:27, 4.60it/s] 122it [00:27, 4.62it/s] 123it [00:27, 4.57it/s] 124it [00:27, 4.62it/s] 125it [00:27, 4.60it/s] 126it [00:28, 4.63it/s] 127it [00:28, 4.57it/s] 128it [00:28, 4.54it/s] 129it [00:28, 4.60it/s] 130it [00:29, 4.63it/s] 131it [00:29, 4.62it/s] 132it [00:29, 4.64it/s] 133it [00:29, 4.67it/s] 134it [00:29, 4.64it/s] 135it [00:30, 4.66it/s] 136it [00:30, 4.65it/s] 137it [00:30, 4.63it/s] 138it [00:30, 4.57it/s] 139it [00:31, 4.59it/s] 140it [00:31, 4.61it/s] 141it [00:31, 4.58it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.66it/s] 144it [00:32, 4.68it/s] 145it [00:32, 4.68it/s] 146it [00:32, 4.67it/s] 147it [00:32, 4.59it/s] 148it [00:32, 4.50it/s] 149it [00:33, 4.52it/s] 150it [00:33, 4.57it/s]2025-05-25 23:38:35,261 - INFO - [Epoch 059 | Batch 0150] IWAE-loss 1656.5128 | mean log_px -0.0145 | KL -1106.05 + 151it [00:33, 4.54it/s] 152it [00:33, 4.49it/s] 153it [00:34, 4.54it/s] 154it [00:34, 4.50it/s] 155it [00:34, 4.51it/s] 156it [00:34, 4.49it/s] 157it [00:34, 4.51it/s] 158it [00:35, 4.53it/s] 159it [00:35, 4.59it/s] 160it [00:35, 4.63it/s] 161it [00:35, 4.64it/s] 162it [00:36, 4.54it/s] 163it [00:36, 4.58it/s] 164it [00:36, 4.56it/s] 165it [00:36, 4.57it/s] 166it [00:36, 4.46it/s] 167it [00:37, 4.52it/s] 168it [00:37, 4.53it/s] 169it [00:37, 4.56it/s] 170it [00:37, 4.56it/s] 171it [00:38, 4.57it/s] 172it [00:38, 4.58it/s] 173it [00:38, 4.56it/s] 174it [00:38, 4.57it/s] 175it [00:38, 4.53it/s] 176it [00:39, 4.53it/s] 177it [00:39, 4.53it/s] 178it [00:39, 4.52it/s] 179it [00:39, 4.54it/s] 180it [00:40, 4.56it/s] 181it [00:40, 4.57it/s] 182it [00:40, 4.57it/s] 183it [00:40, 4.62it/s] 184it [00:40, 4.48it/s] 185it [00:41, 4.56it/s] 186it [00:41, 4.52it/s] 187it [00:41, 4.56it/s] 188it [00:41, 4.56it/s] 189it [00:41, 4.57it/s] 190it [00:42, 4.50it/s] 191it [00:42, 4.56it/s] 192it [00:42, 4.47it/s] 193it [00:42, 4.54it/s] 194it [00:43, 4.55it/s] 195it [00:43, 4.47it/s] 196it [00:43, 4.54it/s] 196it [00:43, 4.49it/s] +2025-05-25 23:38:45,301 - INFO - Epoch: 59, Objective: tensor([1502.0814], device='cuda:0', grad_fn=), Loss: 0.015234545804560184, KL/n: 22.524457931518555 + 0it [00:00, ?it/s]2025-05-25 23:38:45,677 - INFO - [Epoch 060 | Batch 0000] IWAE-loss 1251.1169 | mean log_px -0.0041 | KL -1102.64 + 1it [00:00, 3.30it/s] 2it [00:00, 4.01it/s] 3it [00:00, 4.36it/s] 4it [00:00, 4.47it/s] 5it [00:01, 4.57it/s] 6it [00:01, 4.61it/s] 7it [00:01, 4.66it/s] 8it [00:01, 4.66it/s] 9it [00:01, 4.69it/s] 10it [00:02, 4.69it/s] 11it [00:02, 3.59it/s] 12it [00:02, 3.86it/s] 13it [00:03, 4.08it/s] 14it [00:03, 4.24it/s] 15it [00:03, 4.35it/s] 16it [00:03, 4.45it/s] 17it [00:03, 4.54it/s] 18it [00:04, 4.59it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.62it/s] 21it [00:04, 4.66it/s] 22it [00:04, 4.67it/s] 23it [00:05, 4.70it/s] 24it [00:05, 4.71it/s] 25it [00:05, 4.72it/s] 26it [00:05, 4.72it/s] 27it [00:06, 4.73it/s] 28it [00:06, 4.72it/s] 29it [00:06, 4.72it/s] 30it [00:06, 4.72it/s] 31it [00:06, 4.72it/s] 32it [00:07, 4.72it/s] 33it [00:07, 4.73it/s] 34it [00:07, 4.72it/s] 35it [00:07, 4.73it/s] 36it [00:07, 4.72it/s] 37it [00:08, 4.73it/s] 38it [00:08, 4.73it/s] 39it [00:08, 4.73it/s] 40it [00:08, 4.72it/s] 41it [00:08, 4.73it/s] 42it [00:09, 4.69it/s] 43it [00:09, 4.71it/s] 44it [00:09, 4.71it/s] 45it [00:09, 4.72it/s] 46it [00:10, 4.72it/s] 47it [00:10, 4.72it/s] 48it [00:10, 4.72it/s] 49it [00:10, 4.73it/s] 50it [00:10, 4.72it/s]2025-05-25 23:38:56,493 - INFO - [Epoch 060 | Batch 0050] IWAE-loss 1318.0186 | mean log_px -0.0060 | KL -1099.36 + 51it [00:11, 4.70it/s] 52it [00:11, 4.70it/s] 53it [00:11, 4.72it/s] 54it [00:11, 4.70it/s] 55it [00:11, 4.71it/s] 56it [00:12, 4.72it/s] 57it [00:12, 4.72it/s] 58it [00:12, 4.72it/s] 59it [00:12, 4.68it/s] 60it [00:13, 4.59it/s] 61it [00:13, 4.63it/s] 62it [00:13, 4.67it/s] 63it [00:13, 4.70it/s] 64it [00:13, 4.71it/s] 65it [00:14, 4.71it/s] 66it [00:14, 4.71it/s] 67it [00:14, 4.72it/s] 68it [00:14, 4.72it/s] 69it [00:14, 4.72it/s] 70it [00:15, 4.72it/s] 71it [00:15, 4.72it/s] 72it [00:15, 4.72it/s] 73it [00:15, 4.71it/s] 74it [00:16, 4.69it/s] 75it [00:16, 4.71it/s] 76it [00:16, 4.71it/s] 77it [00:16, 4.72it/s] 78it [00:16, 4.65it/s] 79it [00:17, 4.68it/s] 80it [00:17, 4.69it/s] 81it [00:17, 4.71it/s] 82it [00:17, 4.71it/s] 83it [00:17, 4.72it/s] 84it [00:18, 4.71it/s] 85it [00:18, 4.72it/s] 86it [00:18, 4.72it/s] 87it [00:18, 4.73it/s] 88it [00:18, 4.72it/s] 89it [00:19, 4.73it/s] 90it [00:19, 4.72it/s] 91it [00:19, 4.73it/s] 92it [00:19, 4.72it/s] 93it [00:20, 4.73it/s] 94it [00:20, 4.72it/s] 95it [00:20, 4.72it/s] 96it [00:20, 4.71it/s] 97it [00:20, 4.72it/s] 98it [00:21, 4.72it/s] 99it [00:21, 4.73it/s] 100it [00:21, 4.72it/s]2025-05-25 23:39:07,114 - INFO - [Epoch 060 | Batch 0100] IWAE-loss 1443.9005 | mean log_px -0.0049 | KL -1095.84 + 101it [00:21, 4.72it/s] 102it [00:21, 4.72it/s] 103it [00:22, 4.73it/s] 104it [00:22, 4.69it/s] 105it [00:22, 4.70it/s] 106it [00:22, 4.70it/s] 107it [00:23, 4.71it/s] 108it [00:23, 4.69it/s] 109it [00:23, 4.71it/s] 110it [00:23, 4.71it/s] 111it [00:23, 4.73it/s] 112it [00:24, 4.73it/s] 113it [00:24, 4.74it/s] 114it [00:24, 4.74it/s] 115it [00:24, 4.75it/s] 116it [00:24, 4.74it/s] 117it [00:25, 4.75it/s] 118it [00:25, 4.75it/s] 119it [00:25, 4.75it/s] 120it [00:25, 4.74it/s] 121it [00:25, 4.75it/s] 122it [00:26, 4.76it/s] 123it [00:26, 4.75it/s] 124it [00:26, 4.74it/s] 125it [00:26, 4.75it/s] 126it [00:27, 4.74it/s] 127it [00:27, 4.71it/s] 128it [00:27, 4.71it/s] 129it [00:27, 4.72it/s] 130it [00:27, 4.73it/s] 131it [00:28, 4.74it/s] 132it [00:28, 4.74it/s] 133it [00:28, 4.75it/s] 134it [00:28, 4.74it/s] 135it [00:28, 4.73it/s] 136it [00:29, 4.72it/s] 137it [00:29, 4.72it/s] 138it [00:29, 4.71it/s] 139it [00:29, 4.56it/s] 140it [00:30, 4.60it/s] 141it [00:30, 4.64it/s] 142it [00:30, 4.50it/s] 143it [00:30, 4.58it/s] 144it [00:30, 4.61it/s] 145it [00:31, 4.64it/s] 146it [00:31, 4.66it/s] 147it [00:31, 4.67it/s] 148it [00:31, 4.67it/s] 149it [00:31, 4.68it/s] 150it [00:32, 4.68it/s]2025-05-25 23:39:17,752 - INFO - [Epoch 060 | Batch 0150] IWAE-loss 1876.3032 | mean log_px -0.0125 | KL -1099.04 + 151it [00:32, 4.52it/s] 152it [00:32, 4.60it/s] 153it [00:32, 4.65it/s] 154it [00:33, 4.67it/s] 155it [00:33, 4.69it/s] 156it [00:33, 4.70it/s] 157it [00:33, 4.49it/s] 158it [00:33, 4.45it/s] 159it [00:34, 4.46it/s] 160it [00:34, 4.48it/s] 161it [00:34, 4.49it/s] 162it [00:34, 4.45it/s] 163it [00:35, 4.49it/s] 164it [00:35, 4.34it/s] 165it [00:35, 4.43it/s] 166it [00:35, 4.47it/s] 167it [00:35, 4.51it/s] 168it [00:36, 4.53it/s] 169it [00:36, 4.56it/s] 170it [00:36, 4.57it/s] 171it [00:36, 4.58it/s] 172it [00:37, 4.45it/s] 173it [00:37, 4.50it/s] 174it [00:37, 4.54it/s] 175it [00:37, 4.56it/s] 176it [00:37, 4.57it/s] 177it [00:38, 4.57it/s] 178it [00:38, 4.44it/s] 179it [00:38, 4.47it/s] 180it [00:38, 4.50it/s] 181it [00:39, 4.53it/s] 182it [00:39, 4.57it/s] 183it [00:39, 4.59it/s] 184it [00:39, 4.63it/s] 185it [00:39, 4.50it/s] 186it [00:40, 4.58it/s] 187it [00:40, 4.62it/s] 188it [00:40, 4.65it/s] 189it [00:40, 4.68it/s] 190it [00:40, 4.56it/s] 191it [00:41, 4.63it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.68it/s] 194it [00:41, 4.53it/s] 195it [00:42, 4.33it/s] 196it [00:42, 4.32it/s] 196it [00:42, 4.62it/s] +2025-05-25 23:39:27,853 - INFO - Epoch: 60, Objective: tensor([1335.1680], device='cuda:0', grad_fn=), Loss: 0.0030267671681940556, KL/n: 22.3603515625 + 0it [00:00, ?it/s]2025-05-25 23:39:28,205 - INFO - [Epoch 061 | Batch 0000] IWAE-loss 1409.4937 | mean log_px -0.0081 | KL -1098.50 + 1it [00:00, 3.65it/s] 2it [00:00, 3.82it/s] 3it [00:00, 4.13it/s] 4it [00:00, 4.31it/s] 5it [00:01, 4.26it/s] 6it [00:01, 4.40it/s] 7it [00:01, 4.49it/s] 8it [00:01, 4.54it/s] 9it [00:02, 4.62it/s] 10it [00:02, 4.62it/s] 11it [00:02, 4.65it/s] 12it [00:02, 4.67it/s] 13it [00:02, 4.49it/s] 14it [00:03, 4.57it/s] 15it [00:03, 4.61it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.43it/s] 18it [00:04, 4.50it/s] 19it [00:04, 4.38it/s] 20it [00:04, 4.48it/s] 21it [00:04, 4.55it/s] 22it [00:04, 4.58it/s] 23it [00:05, 4.61it/s] 24it [00:05, 4.63it/s] 25it [00:05, 4.65it/s] 26it [00:05, 4.63it/s] 27it [00:05, 4.67it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.69it/s] 30it [00:06, 4.51it/s] 31it [00:06, 4.58it/s] 32it [00:07, 4.62it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.62it/s] 36it [00:07, 4.63it/s] 37it [00:08, 4.66it/s] 38it [00:08, 4.54it/s] 39it [00:08, 4.61it/s] 40it [00:08, 4.63it/s] 41it [00:09, 4.66it/s] 42it [00:09, 4.66it/s] 43it [00:09, 4.67it/s] 44it [00:09, 4.67it/s] 45it [00:09, 4.68it/s] 46it [00:10, 4.56it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.59it/s] 50it [00:10, 4.60it/s]2025-05-25 23:39:39,114 - INFO - [Epoch 061 | Batch 0050] IWAE-loss 1398.4414 | mean log_px -0.0127 | KL -1090.44 + 51it [00:11, 4.61it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.67it/s] 54it [00:11, 4.68it/s] 55it [00:12, 4.68it/s] 56it [00:12, 4.67it/s] 57it [00:12, 4.69it/s] 58it [00:12, 4.51it/s] 59it [00:12, 4.55it/s] 60it [00:13, 4.60it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.63it/s] 63it [00:13, 4.64it/s] 64it [00:13, 4.66it/s] 65it [00:14, 4.66it/s] 66it [00:14, 4.67it/s] 67it [00:14, 4.67it/s] 68it [00:14, 4.51it/s] 69it [00:15, 4.59it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.65it/s] 72it [00:15, 4.66it/s] 73it [00:15, 4.66it/s] 74it [00:16, 4.68it/s] 75it [00:16, 4.65it/s] 76it [00:16, 4.67it/s] 77it [00:16, 4.47it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.63it/s] 81it [00:17, 4.66it/s] 82it [00:17, 4.65it/s] 83it [00:18, 4.64it/s] 84it [00:18, 4.66it/s] 85it [00:18, 4.52it/s] 86it [00:18, 4.59it/s] 87it [00:18, 4.56it/s] 88it [00:19, 4.62it/s] 89it [00:19, 4.65it/s] 90it [00:19, 4.67it/s] 91it [00:19, 4.69it/s] 92it [00:20, 4.69it/s] 93it [00:20, 4.52it/s] 94it [00:20, 4.56it/s] 95it [00:20, 4.58it/s] 96it [00:20, 4.62it/s] 97it [00:21, 4.66it/s] 98it [00:21, 4.67it/s] 99it [00:21, 4.68it/s] 100it [00:21, 4.66it/s]2025-05-25 23:39:49,917 - INFO - [Epoch 061 | Batch 0100] IWAE-loss 1398.7993 | mean log_px -0.0086 | KL -1086.49 + 101it [00:21, 4.63it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.41it/s] 104it [00:22, 4.32it/s] 105it [00:22, 4.43it/s] 106it [00:23, 4.51it/s] 107it [00:23, 4.56it/s] 108it [00:23, 4.57it/s] 109it [00:23, 4.60it/s] 110it [00:23, 4.63it/s] 111it [00:24, 4.63it/s] 112it [00:24, 4.53it/s] 113it [00:24, 4.60it/s] 114it [00:24, 4.63it/s] 115it [00:25, 4.66it/s] 116it [00:25, 4.64it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.62it/s] 119it [00:25, 4.65it/s] 120it [00:26, 4.67it/s] 121it [00:26, 4.66it/s] 122it [00:26, 4.65it/s] 123it [00:26, 4.51it/s] 124it [00:27, 4.58it/s] 125it [00:27, 4.63it/s] 126it [00:27, 4.65it/s] 127it [00:27, 4.67it/s] 128it [00:27, 4.69it/s] 129it [00:28, 4.71it/s] 130it [00:28, 4.70it/s] 131it [00:28, 4.54it/s] 132it [00:28, 4.61it/s] 133it [00:28, 4.64it/s] 134it [00:29, 4.66it/s] 135it [00:29, 4.68it/s] 136it [00:29, 4.52it/s] 137it [00:29, 4.59it/s] 138it [00:30, 4.62it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.66it/s] 142it [00:30, 4.68it/s] 143it [00:31, 4.70it/s] 144it [00:31, 4.70it/s] 145it [00:31, 4.71it/s] 146it [00:31, 4.71it/s] 147it [00:31, 4.72it/s] 148it [00:32, 4.72it/s] 149it [00:32, 4.72it/s] 150it [00:32, 4.71it/s]2025-05-25 23:40:00,726 - INFO - [Epoch 061 | Batch 0150] IWAE-loss 1164.0669 | mean log_px -0.0021 | KL -1089.75 + 151it [00:32, 4.54it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.57it/s] 154it [00:33, 4.57it/s] 155it [00:33, 4.63it/s] 156it [00:33, 4.64it/s] 157it [00:34, 4.59it/s] 158it [00:34, 4.58it/s] 159it [00:34, 4.60it/s] 160it [00:34, 4.61it/s] 161it [00:34, 4.65it/s] 162it [00:35, 4.67it/s] 163it [00:35, 4.69it/s] 164it [00:35, 4.70it/s] 165it [00:35, 4.54it/s] 166it [00:36, 4.61it/s] 167it [00:36, 4.64it/s] 168it [00:36, 4.64it/s] 169it [00:36, 4.67it/s] 170it [00:36, 4.67it/s] 171it [00:37, 4.69it/s] 172it [00:37, 4.52it/s] 173it [00:37, 4.58it/s] 174it [00:37, 4.61it/s] 175it [00:38, 4.65it/s] 176it [00:38, 4.67it/s] 177it [00:38, 4.69it/s] 178it [00:38, 4.69it/s] 179it [00:38, 4.70it/s] 180it [00:39, 4.63it/s] 181it [00:39, 4.68it/s] 182it [00:39, 4.69it/s] 183it [00:39, 4.71it/s] 184it [00:39, 4.71it/s] 185it [00:40, 4.72it/s] 186it [00:40, 4.71it/s] 187it [00:40, 4.71it/s] 188it [00:40, 4.71it/s] 189it [00:40, 4.72it/s] 190it [00:41, 4.71it/s] 191it [00:41, 4.72it/s] 192it [00:41, 4.72it/s] 193it [00:41, 4.51it/s] 194it [00:42, 4.55it/s] 195it [00:42, 4.52it/s] 196it [00:42, 4.58it/s] 196it [00:42, 4.60it/s] +2025-05-25 23:40:10,566 - INFO - Epoch: 61, Objective: tensor([2204.2148], device='cuda:0', grad_fn=), Loss: 0.01952478662133217, KL/n: 22.221717834472656 + 0it [00:00, ?it/s]2025-05-25 23:40:11,163 - INFO - [Epoch 062 | Batch 0000] IWAE-loss 1198.3219 | mean log_px -0.0081 | KL -1089.96 + 1it [00:00, 2.94it/s] 2it [00:00, 3.77it/s] 3it [00:00, 4.13it/s] 4it [00:00, 4.34it/s] 5it [00:01, 4.46it/s] 6it [00:01, 4.54it/s] 7it [00:01, 4.58it/s] 8it [00:01, 4.62it/s] 9it [00:02, 4.48it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.61it/s] 12it [00:02, 4.65it/s] 13it [00:02, 4.68it/s] 14it [00:03, 4.69it/s] 15it [00:03, 4.71it/s] 16it [00:03, 4.71it/s] 17it [00:03, 4.72it/s] 18it [00:03, 4.71it/s] 19it [00:04, 4.73it/s] 20it [00:04, 4.72it/s] 21it [00:04, 4.72it/s] 22it [00:04, 4.73it/s] 23it [00:05, 4.73it/s] 24it [00:05, 4.73it/s] 25it [00:05, 4.74it/s] 26it [00:05, 4.72it/s] 27it [00:05, 4.72it/s] 28it [00:06, 4.72it/s] 29it [00:06, 4.56it/s] 30it [00:06, 4.62it/s] 31it [00:06, 4.66it/s] 32it [00:06, 4.67it/s] 33it [00:07, 4.66it/s] 34it [00:07, 4.68it/s] 35it [00:07, 4.70it/s] 36it [00:07, 4.71it/s] 37it [00:08, 4.72it/s] 38it [00:08, 4.72it/s] 39it [00:08, 4.73it/s] 40it [00:08, 4.73it/s] 41it [00:08, 4.73it/s] 42it [00:09, 4.74it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.62it/s] 45it [00:09, 4.66it/s] 46it [00:09, 4.68it/s] 47it [00:10, 4.69it/s] 48it [00:10, 4.65it/s] 49it [00:10, 4.69it/s] 50it [00:10, 4.66it/s]2025-05-25 23:40:21,847 - INFO - [Epoch 062 | Batch 0050] IWAE-loss 1275.6980 | mean log_px -0.0043 | KL -1085.77 + 51it [00:11, 4.43it/s] 52it [00:11, 4.53it/s] 53it [00:11, 4.59it/s] 54it [00:11, 4.62it/s] 55it [00:11, 4.66it/s] 56it [00:12, 4.66it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.68it/s] 59it [00:12, 4.70it/s] 60it [00:12, 4.71it/s] 61it [00:13, 4.72it/s] 62it [00:13, 4.55it/s] 63it [00:13, 4.63it/s] 64it [00:13, 4.65it/s] 65it [00:14, 4.68it/s] 66it [00:14, 4.69it/s] 67it [00:14, 4.70it/s] 68it [00:14, 4.71it/s] 69it [00:14, 4.55it/s] 70it [00:15, 4.62it/s] 71it [00:15, 4.65it/s] 72it [00:15, 4.67it/s] 73it [00:15, 4.70it/s] 74it [00:15, 4.70it/s] 75it [00:16, 4.71it/s] 76it [00:16, 4.70it/s] 77it [00:16, 4.70it/s] 78it [00:16, 4.71it/s] 79it [00:17, 4.55it/s] 80it [00:17, 4.61it/s] 81it [00:17, 4.65it/s] 82it [00:17, 4.68it/s] 83it [00:17, 4.69it/s] 84it [00:18, 4.70it/s] 85it [00:18, 4.71it/s] 86it [00:18, 4.72it/s] 87it [00:18, 4.73it/s] 88it [00:18, 4.72it/s] 89it [00:19, 4.73it/s] 90it [00:19, 4.72it/s] 91it [00:19, 4.62it/s] 92it [00:19, 4.67it/s] 93it [00:20, 4.68it/s] 94it [00:20, 4.70it/s] 95it [00:20, 4.71it/s] 96it [00:20, 4.71it/s] 97it [00:20, 4.73it/s] 98it [00:21, 4.72it/s] 99it [00:21, 4.73it/s] 100it [00:21, 4.73it/s]2025-05-25 23:40:32,540 - INFO - [Epoch 062 | Batch 0100] IWAE-loss 1882.4122 | mean log_px -0.0167 | KL -1085.27 + 101it [00:21, 4.73it/s] 102it [00:21, 4.52it/s] 103it [00:22, 4.60it/s] 104it [00:22, 4.64it/s] 105it [00:22, 4.66it/s] 106it [00:22, 4.68it/s] 107it [00:23, 4.71it/s] 108it [00:23, 4.70it/s] 109it [00:23, 4.71it/s] 110it [00:23, 4.70it/s] 111it [00:23, 4.53it/s] 112it [00:24, 4.60it/s] 113it [00:24, 4.64it/s] 114it [00:24, 4.66it/s] 115it [00:24, 4.68it/s] 116it [00:24, 4.68it/s] 117it [00:25, 4.68it/s] 118it [00:25, 4.52it/s] 119it [00:25, 4.60it/s] 120it [00:25, 4.64it/s] 121it [00:26, 4.67it/s] 122it [00:26, 4.68it/s] 123it [00:26, 4.70it/s] 124it [00:26, 4.70it/s] 125it [00:26, 4.72it/s] 126it [00:27, 4.72it/s] 127it [00:27, 4.73it/s] 128it [00:27, 4.72it/s] 129it [00:27, 4.73it/s] 130it [00:27, 4.73it/s] 131it [00:28, 4.73it/s] 132it [00:28, 4.72it/s] 133it [00:28, 4.73it/s] 134it [00:28, 4.72it/s] 135it [00:28, 4.74it/s] 136it [00:29, 4.73it/s] 137it [00:29, 4.73it/s] 138it [00:29, 4.73it/s] 139it [00:29, 4.73it/s] 140it [00:30, 4.73it/s] 141it [00:30, 4.72it/s] 142it [00:30, 4.72it/s] 143it [00:30, 4.73it/s] 144it [00:30, 4.72it/s] 145it [00:31, 4.73it/s] 146it [00:31, 4.72it/s] 147it [00:31, 4.59it/s] 148it [00:31, 4.64it/s] 149it [00:31, 4.66it/s] 150it [00:32, 4.67it/s]2025-05-25 23:40:43,225 - INFO - [Epoch 062 | Batch 0150] IWAE-loss 1197.9325 | mean log_px -0.0030 | KL -1087.20 + 151it [00:32, 4.69it/s] 152it [00:32, 4.70it/s] 153it [00:32, 4.70it/s] 154it [00:33, 4.72it/s] 155it [00:33, 4.67it/s] 156it [00:33, 4.68it/s] 157it [00:33, 4.70it/s] 158it [00:33, 4.54it/s] 159it [00:34, 4.61it/s] 160it [00:34, 4.63it/s] 161it [00:34, 4.66it/s] 162it [00:34, 4.68it/s] 163it [00:34, 4.69it/s] 164it [00:35, 4.70it/s] 165it [00:35, 4.71it/s] 166it [00:35, 4.53it/s] 167it [00:35, 4.44it/s] 168it [00:36, 4.47it/s] 169it [00:36, 4.54it/s] 170it [00:36, 4.58it/s] 171it [00:36, 4.63it/s] 172it [00:36, 4.66it/s] 173it [00:37, 4.68it/s] 174it [00:37, 4.69it/s] 175it [00:37, 4.70it/s] 176it [00:37, 4.70it/s] 177it [00:37, 4.72it/s] 178it [00:38, 4.72it/s] 179it [00:38, 4.72it/s] 180it [00:38, 4.72it/s] 181it [00:38, 4.72it/s] 182it [00:39, 4.70it/s] 183it [00:39, 4.71it/s] 184it [00:39, 4.72it/s] 185it [00:39, 4.49it/s] 186it [00:39, 4.57it/s] 187it [00:40, 4.62it/s] 188it [00:40, 4.65it/s] 189it [00:40, 4.67it/s] 190it [00:40, 4.68it/s] 191it [00:41, 4.53it/s] 192it [00:41, 4.61it/s] 193it [00:41, 4.64it/s] 194it [00:41, 4.66it/s] 195it [00:41, 4.56it/s] 196it [00:42, 4.62it/s] 196it [00:42, 4.65it/s] +2025-05-25 23:40:53,055 - INFO - Epoch: 62, Objective: tensor([1330.0718], device='cuda:0', grad_fn=), Loss: 0.0047620623372495174, KL/n: 22.193544387817383 + 0it [00:00, ?it/s]2025-05-25 23:40:53,472 - INFO - [Epoch 063 | Batch 0000] IWAE-loss 1133.7760 | mean log_px -0.0013 | KL -1085.79 + 1it [00:00, 2.71it/s] 2it [00:00, 3.62it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.22it/s] 5it [00:01, 4.33it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.52it/s] 8it [00:01, 4.56it/s] 9it [00:02, 4.59it/s] 10it [00:02, 3.51it/s] 11it [00:02, 3.82it/s] 12it [00:02, 4.05it/s] 13it [00:03, 4.20it/s] 14it [00:03, 4.34it/s] 15it [00:03, 4.28it/s] 16it [00:03, 4.37it/s] 17it [00:04, 4.44it/s] 18it [00:04, 4.51it/s] 19it [00:04, 4.37it/s] 20it [00:04, 4.46it/s] 21it [00:04, 4.42it/s] 22it [00:05, 4.50it/s] 23it [00:05, 4.42it/s] 24it [00:05, 4.51it/s] 25it [00:05, 4.34it/s] 26it [00:06, 4.41it/s] 27it [00:06, 4.45it/s] 28it [00:06, 4.45it/s] 29it [00:06, 4.50it/s] 30it [00:06, 4.50it/s] 31it [00:07, 4.34it/s] 32it [00:07, 4.42it/s] 33it [00:07, 4.43it/s] 34it [00:07, 4.49it/s] 35it [00:08, 4.48it/s] 36it [00:08, 4.50it/s] 37it [00:08, 4.39it/s] 38it [00:08, 4.48it/s] 39it [00:08, 4.50it/s] 40it [00:09, 4.54it/s] 41it [00:09, 4.51it/s] 42it [00:09, 4.42it/s] 43it [00:09, 4.50it/s] 44it [00:10, 4.54it/s] 45it [00:10, 4.49it/s] 46it [00:10, 4.53it/s] 47it [00:10, 4.47it/s] 48it [00:11, 4.35it/s] 49it [00:11, 4.39it/s] 50it [00:11, 4.45it/s]2025-05-25 23:41:04,812 - INFO - [Epoch 063 | Batch 0050] IWAE-loss 1150.0118 | mean log_px -0.0013 | KL -1081.11 + 51it [00:11, 4.47it/s] 52it [00:11, 4.52it/s] 53it [00:12, 4.55it/s] 54it [00:12, 4.46it/s] 55it [00:12, 4.51it/s] 56it [00:12, 4.53it/s] 57it [00:12, 4.55it/s] 58it [00:13, 4.57it/s] 59it [00:13, 4.59it/s] 60it [00:13, 4.40it/s] 61it [00:13, 4.37it/s] 62it [00:14, 4.47it/s] 63it [00:14, 4.49it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.46it/s] 66it [00:15, 4.50it/s] 67it [00:15, 4.50it/s] 68it [00:15, 4.56it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.50it/s] 71it [00:16, 4.55it/s] 72it [00:16, 4.59it/s] 73it [00:16, 4.58it/s] 74it [00:16, 4.58it/s] 75it [00:16, 4.48it/s] 76it [00:17, 4.55it/s] 77it [00:17, 4.50it/s] 78it [00:17, 4.56it/s] 79it [00:17, 4.60it/s] 80it [00:18, 4.60it/s] 81it [00:18, 4.63it/s] 82it [00:18, 4.57it/s] 83it [00:18, 4.43it/s] 84it [00:18, 4.47it/s] 85it [00:19, 4.44it/s] 86it [00:19, 4.47it/s] 87it [00:19, 4.46it/s] 88it [00:19, 4.50it/s] 89it [00:20, 4.52it/s] 90it [00:20, 4.55it/s] 91it [00:20, 4.54it/s] 92it [00:20, 4.58it/s] 93it [00:20, 4.58it/s] 94it [00:21, 4.45it/s] 95it [00:21, 4.51it/s] 96it [00:21, 4.54it/s] 97it [00:21, 4.51it/s] 98it [00:22, 4.54it/s] 99it [00:22, 4.45it/s] 100it [00:22, 4.52it/s]2025-05-25 23:41:15,874 - INFO - [Epoch 063 | Batch 0100] IWAE-loss 1351.5203 | mean log_px -0.0092 | KL -1081.81 + 101it [00:22, 4.50it/s] 102it [00:22, 4.54it/s] 103it [00:23, 4.57it/s] 104it [00:23, 4.60it/s] 105it [00:23, 4.35it/s] 106it [00:23, 4.45it/s] 107it [00:24, 4.38it/s] 108it [00:24, 4.45it/s] 109it [00:24, 4.40it/s] 110it [00:24, 4.46it/s] 111it [00:24, 4.50it/s] 112it [00:25, 4.34it/s] 113it [00:25, 4.42it/s] 114it [00:25, 4.49it/s] 115it [00:25, 4.50it/s] 116it [00:26, 4.54it/s] 117it [00:26, 4.48it/s] 118it [00:26, 4.51it/s] 119it [00:26, 4.41it/s] 120it [00:26, 4.50it/s] 121it [00:27, 4.45it/s] 122it [00:27, 4.50it/s] 123it [00:27, 4.49it/s] 124it [00:27, 4.53it/s] 125it [00:28, 4.54it/s] 126it [00:28, 4.34it/s] 127it [00:28, 4.40it/s] 128it [00:28, 4.39it/s] 129it [00:29, 4.47it/s] 130it [00:29, 4.42it/s] 131it [00:29, 4.48it/s] 132it [00:29, 4.29it/s] 133it [00:29, 4.38it/s] 134it [00:30, 4.46it/s] 135it [00:30, 4.50it/s] 136it [00:30, 4.46it/s] 137it [00:30, 4.51it/s] 138it [00:31, 4.38it/s] 139it [00:31, 4.45it/s] 140it [00:31, 4.47it/s] 141it [00:31, 4.44it/s] 142it [00:31, 4.51it/s] 143it [00:32, 4.48it/s] 144it [00:32, 4.39it/s] 145it [00:32, 4.41it/s] 146it [00:32, 4.45it/s] 147it [00:33, 4.50it/s] 148it [00:33, 4.36it/s] 149it [00:33, 4.47it/s] 150it [00:33, 4.44it/s]2025-05-25 23:41:27,107 - INFO - [Epoch 063 | Batch 0150] IWAE-loss 1242.8817 | mean log_px -0.0063 | KL -1077.83 + 151it [00:33, 4.48it/s] 152it [00:34, 4.48it/s] 153it [00:34, 4.38it/s] 154it [00:34, 4.45it/s] 155it [00:34, 4.43it/s] 156it [00:35, 4.46it/s] 157it [00:35, 4.47it/s] 158it [00:35, 4.50it/s] 159it [00:35, 4.37it/s] 160it [00:36, 4.43it/s] 161it [00:36, 4.50it/s] 162it [00:36, 4.55it/s] 163it [00:36, 4.53it/s] 164it [00:36, 4.58it/s] 165it [00:37, 4.45it/s] 166it [00:37, 4.44it/s] 167it [00:37, 4.47it/s] 168it [00:37, 4.41it/s] 169it [00:38, 4.45it/s] 170it [00:38, 4.46it/s] 171it [00:38, 4.29it/s] 172it [00:38, 4.39it/s] 173it [00:38, 4.43it/s] 174it [00:39, 4.48it/s] 175it [00:39, 4.49it/s] 176it [00:39, 4.52it/s] 177it [00:39, 4.43it/s] 178it [00:40, 4.50it/s] 179it [00:40, 4.56it/s] 180it [00:40, 4.57it/s] 181it [00:40, 4.58it/s] 182it [00:40, 4.43it/s] 183it [00:41, 4.43it/s] 184it [00:41, 4.46it/s] 185it [00:41, 4.49it/s] 186it [00:41, 4.51it/s] 187it [00:42, 4.56it/s] 188it [00:42, 4.42it/s] 189it [00:42, 4.48it/s] 190it [00:42, 4.53it/s] 191it [00:42, 4.50it/s] 192it [00:43, 4.52it/s] 193it [00:43, 4.48it/s] 194it [00:43, 4.38it/s] 195it [00:43, 4.32it/s] 196it [00:44, 4.43it/s] 196it [00:44, 4.44it/s] +2025-05-25 23:41:37,305 - INFO - Epoch: 63, Objective: tensor([1271.1880], device='cuda:0', grad_fn=), Loss: 0.0068045128136873245, KL/n: 21.986188888549805 + 0it [00:00, ?it/s]2025-05-25 23:41:37,712 - INFO - [Epoch 064 | Batch 0000] IWAE-loss 1491.5543 | mean log_px -0.0086 | KL -1077.20 + 1it [00:00, 2.75it/s] 2it [00:00, 3.63it/s] 3it [00:00, 4.06it/s] 4it [00:01, 4.26it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.50it/s] 7it [00:01, 4.38it/s] 8it [00:01, 4.48it/s] 9it [00:02, 4.55it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.61it/s] 12it [00:02, 4.64it/s] 13it [00:02, 4.65it/s] 14it [00:03, 4.64it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.64it/s] 17it [00:03, 4.50it/s] 18it [00:04, 4.53it/s] 19it [00:04, 4.57it/s] 20it [00:04, 4.59it/s] 21it [00:04, 4.62it/s] 22it [00:04, 4.63it/s] 23it [00:05, 4.49it/s] 24it [00:05, 4.56it/s] 25it [00:05, 4.60it/s] 26it [00:05, 4.61it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.65it/s] 29it [00:06, 4.67it/s] 30it [00:06, 4.50it/s] 31it [00:06, 4.57it/s] 32it [00:07, 4.61it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.60it/s] 35it [00:07, 4.62it/s] 36it [00:07, 4.62it/s] 37it [00:08, 4.65it/s] 38it [00:08, 4.66it/s] 39it [00:08, 4.67it/s] 40it [00:08, 4.68it/s] 41it [00:09, 4.69it/s] 42it [00:09, 4.68it/s] 43it [00:09, 4.69it/s] 44it [00:09, 4.68it/s] 45it [00:09, 4.67it/s] 46it [00:10, 4.68it/s] 47it [00:10, 4.52it/s] 48it [00:10, 4.58it/s] 49it [00:10, 4.62it/s] 50it [00:10, 4.64it/s]2025-05-25 23:41:48,565 - INFO - [Epoch 064 | Batch 0050] IWAE-loss 1201.7369 | mean log_px -0.0023 | KL -1074.23 + 51it [00:11, 4.66it/s] 52it [00:11, 4.65it/s] 53it [00:11, 4.67it/s] 54it [00:11, 4.52it/s] 55it [00:12, 4.58it/s] 56it [00:12, 4.55it/s] 57it [00:12, 4.61it/s] 58it [00:12, 4.62it/s] 59it [00:12, 4.64it/s] 60it [00:13, 4.66it/s] 61it [00:13, 4.67it/s] 62it [00:13, 4.67it/s] 63it [00:13, 4.68it/s] 64it [00:13, 4.68it/s] 65it [00:14, 4.70it/s] 66it [00:14, 4.69it/s] 67it [00:14, 4.70it/s] 68it [00:14, 4.70it/s] 69it [00:15, 4.70it/s] 70it [00:15, 4.67it/s] 71it [00:15, 4.52it/s] 72it [00:15, 4.59it/s] 73it [00:15, 4.59it/s] 74it [00:16, 4.62it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.64it/s] 77it [00:16, 4.51it/s] 78it [00:17, 4.58it/s] 79it [00:17, 4.61it/s] 80it [00:17, 4.63it/s] 81it [00:17, 4.66it/s] 82it [00:17, 4.67it/s] 83it [00:18, 4.68it/s] 84it [00:18, 4.68it/s] 85it [00:18, 4.68it/s] 86it [00:18, 4.48it/s] 87it [00:18, 4.52it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.61it/s] 90it [00:19, 4.53it/s] 91it [00:19, 4.58it/s] 92it [00:20, 4.62it/s] 93it [00:20, 4.50it/s] 94it [00:20, 4.56it/s] 95it [00:20, 4.61it/s] 96it [00:20, 4.63it/s] 97it [00:21, 4.65it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.68it/s] 100it [00:21, 4.67it/s]2025-05-25 23:41:59,380 - INFO - [Epoch 064 | Batch 0100] IWAE-loss 1448.6731 | mean log_px -0.0105 | KL -1068.36 + 101it [00:21, 4.67it/s] 102it [00:22, 4.67it/s] 103it [00:22, 4.66it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.68it/s] 106it [00:23, 4.67it/s] 107it [00:23, 4.66it/s] 108it [00:23, 4.66it/s] 109it [00:23, 4.68it/s] 110it [00:23, 4.68it/s] 111it [00:24, 4.50it/s] 112it [00:24, 4.56it/s] 113it [00:24, 4.58it/s] 114it [00:24, 4.61it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.65it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.45it/s] 119it [00:25, 4.53it/s] 120it [00:26, 4.54it/s] 121it [00:26, 4.59it/s] 122it [00:26, 4.59it/s] 123it [00:26, 4.63it/s] 124it [00:27, 4.49it/s] 125it [00:27, 4.57it/s] 126it [00:27, 4.60it/s] 127it [00:27, 4.59it/s] 128it [00:27, 4.59it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.57it/s] 131it [00:28, 4.59it/s] 132it [00:28, 4.60it/s] 133it [00:28, 4.47it/s] 134it [00:29, 4.52it/s] 135it [00:29, 4.56it/s] 136it [00:29, 4.46it/s] 137it [00:29, 4.54it/s] 138it [00:30, 4.43it/s] 139it [00:30, 4.49it/s] 140it [00:30, 4.53it/s] 141it [00:30, 4.56it/s] 142it [00:30, 4.58it/s] 143it [00:31, 4.60it/s] 144it [00:31, 4.60it/s] 145it [00:31, 4.61it/s] 146it [00:31, 4.61it/s] 147it [00:32, 4.62it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.61it/s] 150it [00:32, 4.61it/s]2025-05-25 23:42:10,286 - INFO - [Epoch 064 | Batch 0150] IWAE-loss 1139.3844 | mean log_px -0.0025 | KL -1069.10 + 151it [00:32, 4.47it/s] 152it [00:33, 4.51it/s] 153it [00:33, 4.54it/s] 154it [00:33, 4.57it/s] 155it [00:33, 4.57it/s] 156it [00:34, 4.55it/s] 157it [00:34, 4.53it/s] 158it [00:34, 4.55it/s] 159it [00:34, 4.44it/s] 160it [00:34, 4.48it/s] 161it [00:35, 4.50it/s] 162it [00:35, 4.52it/s] 163it [00:35, 4.55it/s] 164it [00:35, 4.57it/s] 165it [00:36, 4.58it/s] 166it [00:36, 4.58it/s] 167it [00:36, 4.54it/s] 168it [00:36, 4.54it/s] 169it [00:36, 4.42it/s] 170it [00:37, 4.43it/s] 171it [00:37, 4.48it/s] 172it [00:37, 4.51it/s] 173it [00:37, 4.55it/s] 174it [00:38, 4.54it/s] 175it [00:38, 4.55it/s] 176it [00:38, 4.55it/s] 177it [00:38, 4.58it/s] 178it [00:38, 4.55it/s] 179it [00:39, 4.57it/s] 180it [00:39, 4.57it/s] 181it [00:39, 4.57it/s] 182it [00:39, 4.58it/s] 183it [00:39, 4.57it/s] 184it [00:40, 4.56it/s] 185it [00:40, 4.56it/s] 186it [00:40, 4.57it/s] 187it [00:40, 4.58it/s] 188it [00:41, 4.45it/s] 189it [00:41, 4.49it/s] 190it [00:41, 4.52it/s] 191it [00:41, 4.53it/s] 192it [00:41, 4.54it/s] 193it [00:42, 4.51it/s] 194it [00:42, 4.53it/s] 195it [00:42, 4.42it/s] 196it [00:42, 4.48it/s] 196it [00:42, 4.57it/s] +2025-05-25 23:42:20,372 - INFO - Epoch: 64, Objective: tensor([1219.0177], device='cuda:0', grad_fn=), Loss: 0.005087015684694052, KL/n: 21.777986526489258 + 0it [00:00, ?it/s]2025-05-25 23:42:20,965 - INFO - [Epoch 065 | Batch 0000] IWAE-loss 1199.1672 | mean log_px -0.0037 | KL -1066.61 + 1it [00:00, 3.00it/s] 2it [00:00, 3.77it/s] 3it [00:00, 4.10it/s] 4it [00:00, 4.28it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.47it/s] 7it [00:01, 4.49it/s] 8it [00:01, 4.39it/s] 9it [00:02, 4.48it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.56it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.60it/s] 15it [00:03, 4.61it/s] 16it [00:03, 4.48it/s] 17it [00:03, 4.53it/s] 18it [00:04, 4.55it/s] 19it [00:04, 4.54it/s] 20it [00:04, 4.47it/s] 21it [00:04, 4.47it/s] 22it [00:04, 4.50it/s] 23it [00:05, 4.53it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.53it/s] 26it [00:05, 4.57it/s] 27it [00:06, 4.58it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.49it/s] 31it [00:06, 4.47it/s] 32it [00:07, 4.47it/s] 33it [00:07, 4.52it/s] 34it [00:07, 4.55it/s] 35it [00:07, 4.58it/s] 36it [00:08, 4.45it/s] 37it [00:08, 4.50it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.59it/s] 40it [00:08, 4.61it/s] 41it [00:09, 4.63it/s] 42it [00:09, 4.64it/s] 43it [00:09, 4.64it/s] 44it [00:09, 4.63it/s] 45it [00:10, 4.49it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.62it/s] 50it [00:11, 4.63it/s]2025-05-25 23:42:31,929 - INFO - [Epoch 065 | Batch 0050] IWAE-loss 1212.4058 | mean log_px -0.0064 | KL -1062.44 + 51it [00:11, 4.63it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.65it/s] 54it [00:11, 4.54it/s] 55it [00:12, 4.57it/s] 56it [00:12, 4.60it/s] 57it [00:12, 4.59it/s] 58it [00:12, 4.61it/s] 59it [00:13, 4.48it/s] 60it [00:13, 4.54it/s] 61it [00:13, 4.58it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.62it/s] 64it [00:14, 4.60it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.64it/s] 67it [00:14, 4.64it/s] 68it [00:14, 4.64it/s] 69it [00:15, 4.65it/s] 70it [00:15, 4.65it/s] 71it [00:15, 4.65it/s] 72it [00:15, 4.50it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.58it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.62it/s] 77it [00:16, 4.64it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.57it/s] 81it [00:17, 4.57it/s] 82it [00:18, 4.60it/s] 83it [00:18, 4.62it/s] 84it [00:18, 4.61it/s] 85it [00:18, 4.63it/s] 86it [00:18, 4.65it/s] 87it [00:19, 4.50it/s] 88it [00:19, 4.55it/s] 89it [00:19, 4.59it/s] 90it [00:19, 4.46it/s] 91it [00:20, 4.54it/s] 92it [00:20, 4.57it/s] 93it [00:20, 4.60it/s] 94it [00:20, 4.60it/s] 95it [00:20, 4.62it/s] 96it [00:21, 4.64it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.63it/s] 99it [00:21, 4.48it/s] 100it [00:21, 4.53it/s]2025-05-25 23:42:42,826 - INFO - [Epoch 065 | Batch 0100] IWAE-loss 1217.0249 | mean log_px -0.0038 | KL -1067.40 + 101it [00:22, 4.57it/s] 102it [00:22, 4.57it/s] 103it [00:22, 4.61it/s] 104it [00:22, 4.62it/s] 105it [00:23, 4.64it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.66it/s] 108it [00:23, 4.65it/s] 109it [00:23, 4.66it/s] 110it [00:24, 4.66it/s] 111it [00:24, 4.67it/s] 112it [00:24, 4.67it/s] 113it [00:24, 4.67it/s] 114it [00:24, 4.67it/s] 115it [00:25, 4.67it/s] 116it [00:25, 4.66it/s] 117it [00:25, 4.67it/s] 118it [00:25, 4.49it/s] 119it [00:26, 4.55it/s] 120it [00:26, 4.58it/s] 121it [00:26, 4.60it/s] 122it [00:26, 4.55it/s] 123it [00:26, 4.58it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.53it/s] 126it [00:27, 4.58it/s] 127it [00:27, 4.60it/s] 128it [00:28, 4.60it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.61it/s] 131it [00:28, 4.63it/s] 132it [00:28, 4.58it/s] 133it [00:29, 4.61it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.64it/s] 136it [00:29, 4.63it/s] 137it [00:30, 4.48it/s] 138it [00:30, 4.54it/s] 139it [00:30, 4.58it/s] 140it [00:30, 4.60it/s] 141it [00:30, 4.62it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.64it/s] 144it [00:31, 4.65it/s] 145it [00:31, 4.65it/s] 146it [00:31, 4.49it/s] 147it [00:32, 4.55it/s] 148it [00:32, 4.58it/s] 149it [00:32, 4.60it/s] 150it [00:32, 4.61it/s]2025-05-25 23:42:53,672 - INFO - [Epoch 065 | Batch 0150] IWAE-loss 1168.8063 | mean log_px -0.0032 | KL -1064.15 + 151it [00:33, 4.62it/s] 152it [00:33, 4.62it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.45it/s] 155it [00:33, 4.53it/s] 156it [00:34, 4.56it/s] 157it [00:34, 4.59it/s] 158it [00:34, 4.60it/s] 159it [00:34, 4.63it/s] 160it [00:35, 4.47it/s] 161it [00:35, 4.54it/s] 162it [00:35, 4.57it/s] 163it [00:35, 4.60it/s] 164it [00:35, 4.61it/s] 165it [00:36, 4.63it/s] 166it [00:36, 4.48it/s] 167it [00:36, 4.55it/s] 168it [00:36, 4.55it/s] 169it [00:36, 4.59it/s] 170it [00:37, 4.52it/s] 171it [00:37, 4.57it/s] 172it [00:37, 4.58it/s] 173it [00:37, 4.61it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.39it/s] 176it [00:38, 4.45it/s] 177it [00:38, 4.51it/s] 178it [00:38, 4.55it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.59it/s] 181it [00:39, 4.61it/s] 182it [00:39, 4.63it/s] 183it [00:40, 4.48it/s] 184it [00:40, 4.49it/s] 185it [00:40, 4.54it/s] 186it [00:40, 4.57it/s] 187it [00:40, 4.56it/s] 188it [00:41, 4.60it/s] 189it [00:41, 4.62it/s] 190it [00:41, 4.63it/s] 191it [00:41, 4.64it/s] 192it [00:42, 4.50it/s] 193it [00:42, 4.56it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.49it/s] 196it [00:42, 4.54it/s] 196it [00:42, 4.56it/s] +2025-05-25 23:43:03,665 - INFO - Epoch: 65, Objective: tensor([1230.9609], device='cuda:0', grad_fn=), Loss: 0.005760730244219303, KL/n: 21.655872344970703 + 0it [00:00, ?it/s]2025-05-25 23:43:04,072 - INFO - [Epoch 066 | Batch 0000] IWAE-loss 1246.0516 | mean log_px -0.0045 | KL -1060.09 + 1it [00:00, 2.96it/s] 2it [00:00, 3.79it/s] 3it [00:00, 3.98it/s] 4it [00:01, 4.22it/s] 5it [00:01, 4.38it/s] 6it [00:01, 4.46it/s] 7it [00:01, 3.55it/s] 8it [00:02, 3.84it/s] 9it [00:02, 4.08it/s] 10it [00:02, 4.25it/s] 11it [00:02, 4.38it/s] 12it [00:02, 4.46it/s] 13it [00:03, 4.53it/s] 14it [00:03, 4.57it/s] 15it [00:03, 4.44it/s] 16it [00:03, 4.51it/s] 17it [00:03, 4.56it/s] 18it [00:04, 4.59it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.66it/s] 22it [00:05, 4.66it/s] 23it [00:05, 4.55it/s] 24it [00:05, 4.60it/s] 25it [00:05, 4.62it/s] 26it [00:05, 4.58it/s] 27it [00:06, 4.53it/s] 28it [00:06, 4.56it/s] 29it [00:06, 4.44it/s] 30it [00:06, 4.50it/s] 31it [00:07, 4.55it/s] 32it [00:07, 4.58it/s] 33it [00:07, 4.45it/s] 34it [00:07, 4.53it/s] 35it [00:07, 4.57it/s] 36it [00:08, 4.55it/s] 37it [00:08, 4.60it/s] 38it [00:08, 4.54it/s] 39it [00:08, 4.59it/s] 40it [00:09, 4.61it/s] 41it [00:09, 4.48it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.60it/s] 45it [00:10, 4.63it/s] 46it [00:10, 4.64it/s] 47it [00:10, 4.51it/s] 48it [00:10, 4.57it/s] 49it [00:10, 4.60it/s] 50it [00:11, 4.63it/s]2025-05-25 23:43:15,157 - INFO - [Epoch 066 | Batch 0050] IWAE-loss 1207.2434 | mean log_px -0.0082 | KL -1055.60 + 51it [00:11, 4.64it/s] 52it [00:11, 4.65it/s] 53it [00:11, 4.66it/s] 54it [00:12, 4.66it/s] 55it [00:12, 4.67it/s] 56it [00:12, 4.67it/s] 57it [00:12, 4.51it/s] 58it [00:12, 4.56it/s] 59it [00:13, 4.60it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.64it/s] 63it [00:14, 4.50it/s] 64it [00:14, 4.56it/s] 65it [00:14, 4.60it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.63it/s] 68it [00:15, 4.65it/s] 69it [00:15, 4.66it/s] 70it [00:15, 4.66it/s] 71it [00:15, 4.67it/s] 72it [00:15, 4.67it/s] 73it [00:16, 4.66it/s] 74it [00:16, 4.68it/s] 75it [00:16, 4.68it/s] 76it [00:16, 4.67it/s] 77it [00:17, 4.68it/s] 78it [00:17, 4.67it/s] 79it [00:17, 4.68it/s] 80it [00:17, 4.51it/s] 81it [00:17, 4.57it/s] 82it [00:18, 4.59it/s] 83it [00:18, 4.62it/s] 84it [00:18, 4.64it/s] 85it [00:18, 4.65it/s] 86it [00:18, 4.65it/s] 87it [00:19, 4.67it/s] 88it [00:19, 4.67it/s] 89it [00:19, 4.67it/s] 90it [00:19, 4.66it/s] 91it [00:20, 4.63it/s] 92it [00:20, 4.64it/s] 93it [00:20, 4.66it/s] 94it [00:20, 4.66it/s] 95it [00:20, 4.67it/s] 96it [00:21, 4.67it/s] 97it [00:21, 4.67it/s] 98it [00:21, 4.67it/s] 99it [00:21, 4.68it/s] 100it [00:22, 4.51it/s]2025-05-25 23:43:25,955 - INFO - [Epoch 066 | Batch 0100] IWAE-loss 1485.7710 | mean log_px -0.0174 | KL -1055.98 + 101it [00:22, 4.57it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.64it/s] 105it [00:23, 4.64it/s] 106it [00:23, 4.50it/s] 107it [00:23, 4.55it/s] 108it [00:23, 4.55it/s] 109it [00:23, 4.59it/s] 110it [00:24, 4.61it/s] 111it [00:24, 4.64it/s] 112it [00:24, 4.63it/s] 113it [00:24, 4.65it/s] 114it [00:25, 4.50it/s] 115it [00:25, 4.56it/s] 116it [00:25, 4.58it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.60it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.63it/s] 121it [00:26, 4.44it/s] 122it [00:26, 4.45it/s] 123it [00:27, 4.51it/s] 124it [00:27, 4.54it/s] 125it [00:27, 4.58it/s] 126it [00:27, 4.57it/s] 127it [00:27, 4.61it/s] 128it [00:28, 4.57it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.61it/s] 131it [00:28, 4.64it/s] 132it [00:28, 4.49it/s] 133it [00:29, 4.56it/s] 134it [00:29, 4.59it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.63it/s] 137it [00:30, 4.65it/s] 138it [00:30, 4.66it/s] 139it [00:30, 4.66it/s] 140it [00:30, 4.66it/s] 141it [00:30, 4.66it/s] 142it [00:31, 4.67it/s] 143it [00:31, 4.63it/s] 144it [00:31, 4.63it/s] 145it [00:31, 4.50it/s] 146it [00:32, 4.54it/s] 147it [00:32, 4.59it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.64it/s] 150it [00:32, 4.65it/s]2025-05-25 23:43:36,829 - INFO - [Epoch 066 | Batch 0150] IWAE-loss 1216.0743 | mean log_px -0.0039 | KL -1054.95 + 151it [00:33, 4.49it/s] 152it [00:33, 4.55it/s] 153it [00:33, 4.59it/s] 154it [00:33, 4.61it/s] 155it [00:33, 4.63it/s] 156it [00:34, 4.64it/s] 157it [00:34, 4.65it/s] 158it [00:34, 4.66it/s] 159it [00:34, 4.67it/s] 160it [00:35, 4.52it/s] 161it [00:35, 4.56it/s] 162it [00:35, 4.60it/s] 163it [00:35, 4.63it/s] 164it [00:35, 4.63it/s] 165it [00:36, 4.65it/s] 166it [00:36, 4.66it/s] 167it [00:36, 4.67it/s] 168it [00:36, 4.67it/s] 169it [00:37, 4.52it/s] 170it [00:37, 4.56it/s] 171it [00:37, 4.59it/s] 172it [00:37, 4.62it/s] 173it [00:37, 4.64it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.64it/s] 176it [00:38, 4.54it/s] 177it [00:38, 4.58it/s] 178it [00:38, 4.61it/s] 179it [00:39, 4.64it/s] 180it [00:39, 4.64it/s] 181it [00:39, 4.65it/s] 182it [00:39, 4.49it/s] 183it [00:40, 4.55it/s] 184it [00:40, 4.58it/s] 185it [00:40, 4.61it/s] 186it [00:40, 4.62it/s] 187it [00:40, 4.64it/s] 188it [00:41, 4.65it/s] 189it [00:41, 4.65it/s] 190it [00:41, 4.66it/s] 191it [00:41, 4.66it/s] 192it [00:42, 4.52it/s] 193it [00:42, 4.57it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.46it/s] 196it [00:42, 4.54it/s] 196it [00:42, 4.56it/s] +2025-05-25 23:43:46,756 - INFO - Epoch: 66, Objective: tensor([1588.1846], device='cuda:0', grad_fn=), Loss: 0.013912596739828587, KL/n: 21.540197372436523 + 0it [00:00, ?it/s]2025-05-25 23:43:47,166 - INFO - [Epoch 067 | Batch 0000] IWAE-loss 1198.7195 | mean log_px -0.0020 | KL -1053.46 + 1it [00:00, 2.98it/s] 2it [00:00, 3.79it/s] 3it [00:00, 4.12it/s] 4it [00:01, 4.16it/s] 5it [00:01, 4.31it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.50it/s] 8it [00:01, 4.55it/s] 9it [00:02, 4.60it/s] 10it [00:02, 4.48it/s] 11it [00:02, 4.55it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.63it/s] 15it [00:03, 4.65it/s] 16it [00:03, 4.66it/s] 17it [00:03, 4.51it/s] 18it [00:04, 4.56it/s] 19it [00:04, 4.61it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.66it/s] 22it [00:04, 4.65it/s] 23it [00:05, 4.67it/s] 24it [00:05, 4.67it/s] 25it [00:05, 4.69it/s] 26it [00:05, 4.67it/s] 27it [00:05, 4.53it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.61it/s] 30it [00:06, 4.62it/s] 31it [00:06, 4.65it/s] 32it [00:07, 4.65it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.67it/s] 36it [00:07, 4.46it/s] 37it [00:08, 4.55it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.56it/s] 40it [00:08, 4.56it/s] 41it [00:09, 4.46it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.60it/s] 45it [00:09, 4.60it/s] 46it [00:10, 4.61it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.63it/s] 50it [00:11, 4.47it/s]2025-05-25 23:43:58,064 - INFO - [Epoch 067 | Batch 0050] IWAE-loss 1289.7285 | mean log_px -0.0091 | KL -1050.17 + 51it [00:11, 4.53it/s] 52it [00:11, 4.58it/s] 53it [00:11, 4.61it/s] 54it [00:11, 4.62it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.47it/s] 58it [00:12, 4.51it/s] 59it [00:12, 4.56it/s] 60it [00:13, 4.60it/s] 61it [00:13, 4.63it/s] 62it [00:13, 4.63it/s] 63it [00:13, 4.65it/s] 64it [00:14, 4.64it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.66it/s] 68it [00:14, 4.48it/s] 69it [00:15, 4.48it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.58it/s] 72it [00:15, 4.62it/s] 73it [00:16, 4.64it/s] 74it [00:16, 4.65it/s] 75it [00:16, 4.64it/s] 76it [00:16, 4.66it/s] 77it [00:16, 4.66it/s] 78it [00:17, 4.52it/s] 79it [00:17, 4.57it/s] 80it [00:17, 4.58it/s] 81it [00:17, 4.61it/s] 82it [00:17, 4.62it/s] 83it [00:18, 4.64it/s] 84it [00:18, 4.64it/s] 85it [00:18, 4.65it/s] 86it [00:18, 4.65it/s] 87it [00:19, 4.51it/s] 88it [00:19, 4.56it/s] 89it [00:19, 4.59it/s] 90it [00:19, 4.60it/s] 91it [00:19, 4.64it/s] 92it [00:20, 4.65it/s] 93it [00:20, 4.66it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.51it/s] 96it [00:21, 4.56it/s] 97it [00:21, 4.61it/s] 98it [00:21, 4.63it/s] 99it [00:21, 4.65it/s] 100it [00:21, 4.66it/s]2025-05-25 23:44:08,906 - INFO - [Epoch 067 | Batch 0100] IWAE-loss 1387.3746 | mean log_px -0.0188 | KL -1049.04 + 101it [00:22, 4.66it/s] 102it [00:22, 4.66it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.64it/s] 105it [00:22, 4.66it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.67it/s] 108it [00:23, 4.66it/s] 109it [00:23, 4.67it/s] 110it [00:24, 4.53it/s] 111it [00:24, 4.58it/s] 112it [00:24, 4.60it/s] 113it [00:24, 4.63it/s] 114it [00:24, 4.64it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.64it/s] 117it [00:25, 4.65it/s] 118it [00:25, 4.65it/s] 119it [00:25, 4.51it/s] 120it [00:26, 4.56it/s] 121it [00:26, 4.61it/s] 122it [00:26, 4.62it/s] 123it [00:26, 4.65it/s] 124it [00:27, 4.66it/s] 125it [00:27, 4.52it/s] 126it [00:27, 4.58it/s] 127it [00:27, 4.61it/s] 128it [00:27, 4.62it/s] 129it [00:28, 4.64it/s] 130it [00:28, 4.65it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.48it/s] 133it [00:29, 4.53it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.63it/s] 137it [00:29, 4.65it/s] 138it [00:30, 4.66it/s] 139it [00:30, 4.66it/s] 140it [00:30, 4.67it/s] 141it [00:30, 4.67it/s] 142it [00:30, 4.52it/s] 143it [00:31, 4.57it/s] 144it [00:31, 4.59it/s] 145it [00:31, 4.62it/s] 146it [00:31, 4.63it/s] 147it [00:32, 4.65it/s] 148it [00:32, 4.65it/s] 149it [00:32, 4.66it/s] 150it [00:32, 4.66it/s]2025-05-25 23:44:19,734 - INFO - [Epoch 067 | Batch 0150] IWAE-loss 1194.1609 | mean log_px -0.0024 | KL -1048.20 + 151it [00:32, 4.63it/s] 152it [00:33, 4.64it/s] 153it [00:33, 4.66it/s] 154it [00:33, 4.66it/s] 155it [00:33, 4.66it/s] 156it [00:33, 4.59it/s] 157it [00:34, 4.63it/s] 158it [00:34, 4.63it/s] 159it [00:34, 4.63it/s] 160it [00:34, 4.61it/s] 161it [00:35, 4.59it/s] 162it [00:35, 4.48it/s] 163it [00:35, 4.49it/s] 164it [00:35, 4.51it/s] 165it [00:35, 4.54it/s] 166it [00:36, 4.55it/s] 167it [00:36, 4.39it/s] 168it [00:36, 4.45it/s] 169it [00:36, 4.35it/s] 170it [00:37, 4.33it/s] 171it [00:37, 4.39it/s] 172it [00:37, 4.46it/s] 173it [00:37, 4.53it/s] 174it [00:38, 4.43it/s] 175it [00:38, 4.50it/s] 176it [00:38, 4.54it/s] 177it [00:38, 4.52it/s] 178it [00:38, 4.57it/s] 179it [00:39, 4.60it/s] 180it [00:39, 4.63it/s] 181it [00:39, 4.50it/s] 182it [00:39, 4.56it/s] 183it [00:39, 4.58it/s] 184it [00:40, 4.47it/s] 185it [00:40, 4.54it/s] 186it [00:40, 4.50it/s] 187it [00:40, 4.55it/s] 188it [00:41, 4.55it/s] 189it [00:41, 4.55it/s] 190it [00:41, 4.60it/s] 191it [00:41, 4.58it/s] 192it [00:41, 4.59it/s] 193it [00:42, 4.62it/s] 194it [00:42, 4.64it/s] 195it [00:42, 4.38it/s] 196it [00:42, 4.47it/s] 196it [00:42, 4.57it/s] +2025-05-25 23:44:29,799 - INFO - Epoch: 67, Objective: tensor([1625.6294], device='cuda:0', grad_fn=), Loss: 0.012983052060008049, KL/n: 21.431779861450195 + 0it [00:00, ?it/s]2025-05-25 23:44:30,389 - INFO - [Epoch 068 | Batch 0000] IWAE-loss 1262.3419 | mean log_px -0.0057 | KL -1050.64 + 1it [00:00, 2.98it/s] 2it [00:00, 3.71it/s] 3it [00:00, 4.06it/s] 4it [00:00, 4.26it/s] 5it [00:01, 4.34it/s] 6it [00:01, 4.42it/s] 7it [00:01, 4.32it/s] 8it [00:01, 4.38it/s] 9it [00:02, 4.40it/s] 10it [00:02, 4.44it/s] 11it [00:02, 4.51it/s] 12it [00:02, 4.52it/s] 13it [00:02, 4.56it/s] 14it [00:03, 4.47it/s] 15it [00:03, 4.32it/s] 16it [00:03, 4.40it/s] 17it [00:03, 4.46it/s] 18it [00:04, 4.48it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.56it/s] 21it [00:04, 4.43it/s] 22it [00:05, 4.49it/s] 23it [00:05, 4.52it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.56it/s] 26it [00:05, 4.58it/s] 27it [00:06, 4.59it/s] 28it [00:06, 4.44it/s] 29it [00:06, 4.51it/s] 30it [00:06, 4.55it/s] 31it [00:07, 4.51it/s] 32it [00:07, 4.54it/s] 33it [00:07, 4.58it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.62it/s] 36it [00:08, 4.47it/s] 37it [00:08, 4.52it/s] 38it [00:08, 4.54it/s] 39it [00:08, 4.54it/s] 40it [00:08, 4.51it/s] 41it [00:09, 4.53it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.40it/s] 44it [00:09, 4.46it/s] 45it [00:10, 4.51it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.53it/s] 48it [00:10, 4.54it/s] 49it [00:10, 4.51it/s] 50it [00:11, 4.47it/s]2025-05-25 23:44:41,484 - INFO - [Epoch 068 | Batch 0050] IWAE-loss 1151.6068 | mean log_px -0.0023 | KL -1047.97 + 51it [00:11, 4.52it/s] 52it [00:11, 4.55it/s] 53it [00:11, 4.58it/s] 54it [00:12, 4.59it/s] 55it [00:12, 4.62it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.46it/s] 58it [00:12, 4.52it/s] 59it [00:13, 4.49it/s] 60it [00:13, 4.51it/s] 61it [00:13, 4.54it/s] 62it [00:13, 4.53it/s] 63it [00:14, 4.58it/s] 64it [00:14, 4.42it/s] 65it [00:14, 4.46it/s] 66it [00:14, 4.49it/s] 67it [00:14, 4.54it/s] 68it [00:15, 4.51it/s] 69it [00:15, 4.54it/s] 70it [00:15, 4.51it/s] 71it [00:15, 4.40it/s] 72it [00:16, 4.48it/s] 73it [00:16, 4.53it/s] 74it [00:16, 4.56it/s] 75it [00:16, 4.57it/s] 76it [00:16, 4.55it/s] 77it [00:17, 4.58it/s] 78it [00:17, 4.60it/s] 79it [00:17, 4.62it/s] 80it [00:17, 4.62it/s] 81it [00:18, 4.62it/s] 82it [00:18, 4.60it/s] 83it [00:18, 4.58it/s] 84it [00:18, 4.44it/s] 85it [00:18, 4.50it/s] 86it [00:19, 4.50it/s] 87it [00:19, 4.54it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.59it/s] 90it [00:20, 4.59it/s] 91it [00:20, 4.57it/s] 92it [00:20, 4.40it/s] 93it [00:20, 4.44it/s] 94it [00:20, 4.51it/s] 95it [00:21, 4.54it/s] 96it [00:21, 4.53it/s] 97it [00:21, 4.56it/s] 98it [00:21, 4.44it/s] 99it [00:22, 4.47it/s] 100it [00:22, 4.51it/s]2025-05-25 23:44:52,513 - INFO - [Epoch 068 | Batch 0100] IWAE-loss 1225.7665 | mean log_px -0.0087 | KL -1041.03 + 101it [00:22, 4.57it/s] 102it [00:22, 4.59it/s] 103it [00:22, 4.55it/s] 104it [00:23, 4.58it/s] 105it [00:23, 4.61it/s] 106it [00:23, 4.60it/s] 107it [00:23, 4.56it/s] 108it [00:23, 4.59it/s] 109it [00:24, 4.57it/s] 110it [00:24, 4.55it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.50it/s] 113it [00:25, 4.40it/s] 114it [00:25, 4.48it/s] 115it [00:25, 4.54it/s] 116it [00:25, 4.55it/s] 117it [00:25, 4.54it/s] 118it [00:26, 4.55it/s] 119it [00:26, 4.59it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.47it/s] 122it [00:27, 4.51it/s] 123it [00:27, 4.55it/s] 124it [00:27, 4.42it/s] 125it [00:27, 4.50it/s] 126it [00:27, 4.49it/s] 127it [00:28, 4.55it/s] 128it [00:28, 4.55it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.54it/s] 131it [00:29, 4.52it/s] 132it [00:29, 4.41it/s] 133it [00:29, 4.46it/s] 134it [00:29, 4.48it/s] 135it [00:29, 4.44it/s] 136it [00:30, 4.50it/s] 137it [00:30, 4.55it/s] 138it [00:30, 4.57it/s] 139it [00:30, 4.46it/s] 140it [00:31, 4.46it/s] 141it [00:31, 4.51it/s] 142it [00:31, 4.55it/s] 143it [00:31, 4.56it/s] 144it [00:31, 4.60it/s] 145it [00:32, 4.62it/s] 146it [00:32, 4.46it/s] 147it [00:32, 4.45it/s] 148it [00:32, 4.49it/s] 149it [00:33, 4.47it/s] 150it [00:33, 4.52it/s]2025-05-25 23:45:03,569 - INFO - [Epoch 068 | Batch 0150] IWAE-loss 1264.9144 | mean log_px -0.0035 | KL -1042.59 + 151it [00:33, 4.52it/s] 152it [00:33, 4.52it/s] 153it [00:33, 4.54it/s] 154it [00:34, 4.58it/s] 155it [00:34, 4.45it/s] 156it [00:34, 4.41it/s] 157it [00:34, 4.43it/s] 158it [00:35, 4.45it/s] 159it [00:35, 4.51it/s] 160it [00:35, 4.45it/s] 161it [00:35, 4.49it/s] 162it [00:35, 4.51it/s] 163it [00:36, 4.56it/s] 164it [00:36, 4.53it/s] 165it [00:36, 4.57it/s] 166it [00:36, 4.38it/s] 167it [00:37, 4.42it/s] 168it [00:37, 4.45it/s] 169it [00:37, 4.49it/s] 170it [00:37, 4.54it/s] 171it [00:37, 4.56it/s] 172it [00:38, 4.57it/s] 173it [00:38, 4.59it/s] 174it [00:38, 4.61it/s] 175it [00:38, 4.47it/s] 176it [00:39, 4.54it/s] 177it [00:39, 4.58it/s] 178it [00:39, 4.58it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.60it/s] 181it [00:40, 4.61it/s] 182it [00:40, 4.60it/s] 183it [00:40, 4.62it/s] 184it [00:40, 4.46it/s] 185it [00:41, 4.51it/s] 186it [00:41, 4.53it/s] 187it [00:41, 4.56it/s] 188it [00:41, 4.56it/s] 189it [00:41, 4.56it/s] 190it [00:42, 4.58it/s] 191it [00:42, 4.45it/s] 192it [00:42, 4.50it/s] 193it [00:42, 4.54it/s] 194it [00:43, 4.57it/s] 195it [00:43, 4.48it/s] 196it [00:43, 4.50it/s] 196it [00:43, 4.50it/s] +2025-05-25 23:45:13,653 - INFO - Epoch: 68, Objective: tensor([1242.0751], device='cuda:0', grad_fn=), Loss: 0.003887968137860298, KL/n: 21.28978157043457 + 0it [00:00, ?it/s]2025-05-25 23:45:14,062 - INFO - [Epoch 069 | Batch 0000] IWAE-loss 1280.5768 | mean log_px -0.0051 | KL -1042.65 + 1it [00:00, 2.98it/s] 2it [00:00, 3.68it/s] 3it [00:00, 4.01it/s] 4it [00:01, 4.18it/s] 5it [00:01, 4.25it/s] 6it [00:01, 4.29it/s] 7it [00:01, 4.37it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.52it/s] 10it [00:02, 4.54it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.55it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.58it/s] 17it [00:03, 4.38it/s] 18it [00:04, 4.46it/s] 19it [00:04, 4.48it/s] 20it [00:04, 4.46it/s] 21it [00:04, 4.36it/s] 22it [00:05, 4.42it/s] 23it [00:05, 4.46it/s] 24it [00:05, 4.48it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.33it/s] 27it [00:06, 4.39it/s] 28it [00:06, 4.42it/s] 29it [00:06, 4.49it/s] 30it [00:06, 4.41it/s] 31it [00:07, 4.45it/s] 32it [00:07, 4.43it/s] 33it [00:07, 4.49it/s] 34it [00:07, 4.48it/s] 35it [00:07, 4.51it/s] 36it [00:08, 4.36it/s] 37it [00:08, 4.40it/s] 38it [00:08, 4.45it/s] 39it [00:09, 3.57it/s] 40it [00:09, 3.84it/s] 41it [00:09, 4.02it/s] 42it [00:09, 4.18it/s] 43it [00:09, 4.30it/s] 44it [00:10, 4.41it/s] 45it [00:10, 4.48it/s] 46it [00:10, 4.38it/s] 47it [00:10, 4.46it/s] 48it [00:10, 4.48it/s] 49it [00:11, 4.51it/s] 50it [00:11, 4.54it/s]2025-05-25 23:45:25,377 - INFO - [Epoch 069 | Batch 0050] IWAE-loss 1204.5205 | mean log_px -0.0046 | KL -1043.10 + 51it [00:11, 4.56it/s] 52it [00:11, 4.57it/s] 53it [00:12, 4.59it/s] 54it [00:12, 4.51it/s] 55it [00:12, 4.55it/s] 56it [00:12, 4.56it/s] 57it [00:12, 4.58it/s] 58it [00:13, 4.58it/s] 59it [00:13, 4.60it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.63it/s] 62it [00:14, 4.49it/s] 63it [00:14, 4.56it/s] 64it [00:14, 4.59it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.63it/s] 67it [00:15, 4.64it/s] 68it [00:15, 4.63it/s] 69it [00:15, 4.64it/s] 70it [00:15, 4.64it/s] 71it [00:15, 4.65it/s] 72it [00:16, 4.64it/s] 73it [00:16, 4.65it/s] 74it [00:16, 4.65it/s] 75it [00:16, 4.66it/s] 76it [00:17, 4.49it/s] 77it [00:17, 4.56it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.62it/s] 80it [00:17, 4.63it/s] 81it [00:18, 4.63it/s] 82it [00:18, 4.64it/s] 83it [00:18, 4.65it/s] 84it [00:18, 4.65it/s] 85it [00:19, 4.50it/s] 86it [00:19, 4.56it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.61it/s] 89it [00:19, 4.63it/s] 90it [00:20, 4.64it/s] 91it [00:20, 4.53it/s] 92it [00:20, 4.57it/s] 93it [00:20, 4.45it/s] 94it [00:21, 4.49it/s] 95it [00:21, 4.48it/s] 96it [00:21, 4.33it/s] 97it [00:21, 4.44it/s] 98it [00:21, 4.50it/s] 99it [00:22, 4.40it/s] 100it [00:22, 4.39it/s]2025-05-25 23:45:36,347 - INFO - [Epoch 069 | Batch 0100] IWAE-loss 1164.3147 | mean log_px -0.0017 | KL -1040.04 + 101it [00:22, 4.39it/s] 102it [00:22, 4.44it/s] 103it [00:23, 4.47it/s] 104it [00:23, 4.51it/s] 105it [00:23, 4.50it/s] 106it [00:23, 4.52it/s] 107it [00:23, 4.39it/s] 108it [00:24, 4.45it/s] 109it [00:24, 4.47it/s] 110it [00:24, 4.52it/s] 111it [00:24, 4.46it/s] 112it [00:25, 4.44it/s] 113it [00:25, 4.36it/s] 114it [00:25, 4.24it/s] 115it [00:25, 4.23it/s] 116it [00:26, 4.25it/s] 117it [00:26, 4.22it/s] 118it [00:26, 4.20it/s] 119it [00:26, 4.23it/s] 120it [00:27, 4.13it/s] 121it [00:27, 4.17it/s] 122it [00:27, 4.22it/s] 123it [00:27, 4.22it/s] 124it [00:27, 4.26it/s] 125it [00:28, 4.28it/s] 126it [00:28, 4.28it/s] 127it [00:28, 4.31it/s] 128it [00:28, 4.24it/s] 129it [00:29, 4.20it/s] 130it [00:29, 4.15it/s] 131it [00:29, 4.18it/s] 132it [00:29, 4.16it/s] 133it [00:30, 4.14it/s] 134it [00:30, 4.17it/s] 135it [00:30, 4.20it/s] 136it [00:30, 4.21it/s] 137it [00:31, 4.18it/s] 138it [00:31, 4.23it/s] 139it [00:31, 4.28it/s] 140it [00:31, 4.28it/s] 141it [00:31, 4.32it/s] 142it [00:32, 4.35it/s] 143it [00:32, 4.37it/s] 144it [00:32, 4.37it/s] 145it [00:32, 4.25it/s] 146it [00:33, 4.30it/s] 147it [00:33, 4.33it/s] 148it [00:33, 4.35it/s] 149it [00:33, 4.38it/s] 150it [00:34, 4.37it/s]2025-05-25 23:45:47,974 - INFO - [Epoch 069 | Batch 0150] IWAE-loss 1321.3817 | mean log_px -0.0040 | KL -1039.04 + 151it [00:34, 4.36it/s] 152it [00:34, 4.39it/s] 153it [00:34, 4.42it/s] 154it [00:34, 4.30it/s] 155it [00:35, 4.32it/s] 156it [00:35, 4.36it/s] 157it [00:35, 4.41it/s] 158it [00:35, 4.34it/s] 159it [00:36, 4.35it/s] 160it [00:36, 4.38it/s] 161it [00:36, 4.38it/s] 162it [00:36, 4.28it/s] 163it [00:37, 4.31it/s] 164it [00:37, 4.34it/s] 165it [00:37, 4.35it/s] 166it [00:37, 4.27it/s] 167it [00:37, 4.32it/s] 168it [00:38, 4.21it/s] 169it [00:38, 4.26it/s] 170it [00:38, 4.32it/s] 171it [00:38, 4.37it/s] 172it [00:39, 4.37it/s] 173it [00:39, 4.35it/s] 174it [00:39, 4.38it/s] 175it [00:39, 4.40it/s] 176it [00:40, 4.28it/s] 177it [00:40, 4.31it/s] 178it [00:40, 4.36it/s] 179it [00:40, 4.40it/s] 180it [00:40, 4.41it/s] 181it [00:41, 4.41it/s] 182it [00:41, 4.39it/s] 183it [00:41, 4.36it/s] 184it [00:41, 4.36it/s] 185it [00:42, 4.38it/s] 186it [00:42, 4.39it/s] 187it [00:42, 4.26it/s] 188it [00:42, 4.29it/s] 189it [00:43, 4.30it/s] 190it [00:43, 4.33it/s] 191it [00:43, 4.36it/s] 192it [00:43, 4.37it/s] 193it [00:43, 4.31it/s] 194it [00:44, 4.31it/s] 195it [00:44, 4.22it/s] 196it [00:44, 4.26it/s] 196it [00:44, 4.38it/s] +2025-05-25 23:45:58,500 - INFO - Epoch: 69, Objective: tensor([1152.8077], device='cuda:0', grad_fn=), Loss: 0.006191767752170563, KL/n: 21.240211486816406 + 0it [00:00, ?it/s]2025-05-25 23:45:58,926 - INFO - [Epoch 070 | Batch 0000] IWAE-loss 1134.6925 | mean log_px -0.0031 | KL -1039.89 + 1it [00:00, 2.68it/s] 2it [00:00, 3.23it/s] 3it [00:00, 3.58it/s] 4it [00:01, 3.66it/s] 5it [00:01, 3.70it/s] 6it [00:01, 3.85it/s] 7it [00:01, 3.98it/s] 8it [00:02, 4.04it/s] 9it [00:02, 4.05it/s] 10it [00:02, 4.08it/s] 11it [00:02, 3.94it/s] 12it [00:03, 3.99it/s] 13it [00:03, 4.02it/s] 14it [00:03, 3.95it/s] 15it [00:03, 4.05it/s] 16it [00:04, 4.05it/s] 17it [00:04, 4.13it/s] 18it [00:04, 4.20it/s] 19it [00:04, 4.24it/s] 20it [00:05, 4.24it/s] 21it [00:05, 4.28it/s] 22it [00:05, 4.16it/s] 23it [00:05, 4.21it/s] 24it [00:05, 4.20it/s] 25it [00:06, 4.21it/s] 26it [00:06, 4.23it/s] 27it [00:06, 4.22it/s] 28it [00:06, 4.10it/s] 29it [00:07, 4.16it/s] 30it [00:07, 4.16it/s] 31it [00:07, 4.15it/s] 32it [00:07, 4.20it/s] 33it [00:08, 4.26it/s] 34it [00:08, 4.31it/s] 35it [00:08, 4.34it/s] 36it [00:08, 4.11it/s] 37it [00:09, 4.13it/s] 38it [00:09, 4.13it/s] 39it [00:09, 4.21it/s] 40it [00:09, 4.24it/s] 41it [00:10, 4.23it/s] 42it [00:10, 4.10it/s] 43it [00:10, 4.14it/s] 44it [00:10, 4.16it/s] 45it [00:11, 4.18it/s] 46it [00:11, 4.22it/s] 47it [00:11, 4.20it/s] 48it [00:11, 4.23it/s] 49it [00:11, 4.16it/s] 50it [00:12, 4.19it/s]2025-05-25 23:46:11,016 - INFO - [Epoch 070 | Batch 0050] IWAE-loss 1186.9631 | mean log_px -0.0027 | KL -1039.01 + 51it [00:12, 4.18it/s] 52it [00:12, 4.06it/s] 53it [00:12, 4.10it/s] 54it [00:13, 4.11it/s] 55it [00:13, 4.03it/s] 56it [00:13, 4.04it/s] 57it [00:13, 4.04it/s] 58it [00:14, 4.07it/s] 59it [00:14, 3.99it/s] 60it [00:14, 3.99it/s] 61it [00:14, 4.03it/s] 62it [00:15, 4.07it/s] 63it [00:15, 4.08it/s] 64it [00:15, 3.93it/s] 65it [00:15, 4.01it/s] 66it [00:16, 4.03it/s] 67it [00:16, 4.04it/s] 68it [00:16, 4.07it/s] 69it [00:16, 4.11it/s] 70it [00:17, 4.11it/s] 71it [00:17, 4.15it/s] 72it [00:17, 4.12it/s] 73it [00:17, 4.17it/s] 74it [00:18, 4.18it/s] 75it [00:18, 4.20it/s] 76it [00:18, 4.10it/s] 77it [00:18, 4.17it/s] 78it [00:19, 4.14it/s] 79it [00:19, 4.16it/s] 80it [00:19, 4.06it/s] 81it [00:19, 4.09it/s] 82it [00:20, 4.15it/s] 83it [00:20, 4.18it/s] 84it [00:20, 4.21it/s] 85it [00:20, 4.05it/s] 86it [00:21, 4.10it/s] 87it [00:21, 4.08it/s] 88it [00:21, 4.04it/s] 89it [00:21, 3.94it/s] 90it [00:22, 3.88it/s] 91it [00:22, 3.90it/s] 92it [00:22, 3.87it/s] 93it [00:22, 3.90it/s] 94it [00:23, 3.88it/s] 95it [00:23, 3.91it/s] 96it [00:23, 3.94it/s] 97it [00:23, 4.06it/s] 98it [00:24, 4.11it/s] 99it [00:24, 4.17it/s] 100it [00:24, 4.11it/s]2025-05-25 23:46:23,339 - INFO - [Epoch 070 | Batch 0100] IWAE-loss 1322.7841 | mean log_px -0.0044 | KL -1041.32 + 101it [00:24, 4.14it/s] 102it [00:25, 3.93it/s] 103it [00:25, 3.97it/s] 104it [00:25, 4.00it/s] 105it [00:25, 3.99it/s] 106it [00:26, 4.05it/s] 107it [00:26, 4.06it/s] 108it [00:26, 4.12it/s] 109it [00:26, 4.12it/s] 110it [00:27, 4.09it/s] 111it [00:27, 4.09it/s] 112it [00:27, 4.07it/s] 113it [00:27, 4.07it/s] 114it [00:27, 4.11it/s] 115it [00:28, 4.09it/s] 116it [00:28, 4.07it/s] 117it [00:28, 4.08it/s] 118it [00:28, 4.07it/s] 119it [00:29, 4.16it/s] 120it [00:29, 4.03it/s] 121it [00:29, 4.12it/s] 122it [00:29, 4.11it/s] 123it [00:30, 4.15it/s] 124it [00:30, 4.18it/s] 125it [00:30, 4.22it/s] 126it [00:30, 4.18it/s] 127it [00:31, 4.20it/s] 128it [00:31, 4.22it/s] 129it [00:31, 4.24it/s] 130it [00:31, 4.16it/s] 131it [00:32, 4.25it/s] 132it [00:32, 4.23it/s] 133it [00:32, 4.24it/s] 134it [00:32, 4.18it/s] 135it [00:33, 4.20it/s] 136it [00:33, 4.15it/s] 137it [00:33, 4.16it/s] 138it [00:33, 4.17it/s] 139it [00:33, 4.18it/s] 140it [00:34, 3.98it/s] 141it [00:34, 4.05it/s] 142it [00:34, 4.00it/s] 143it [00:34, 4.05it/s] 144it [00:35, 4.06it/s] 145it [00:35, 4.11it/s] 146it [00:35, 4.15it/s] 147it [00:35, 4.19it/s] 148it [00:36, 4.10it/s] 149it [00:36, 4.13it/s] 150it [00:36, 4.04it/s]2025-05-25 23:46:35,503 - INFO - [Epoch 070 | Batch 0150] IWAE-loss 1312.4045 | mean log_px -0.0061 | KL -1034.94 + 151it [00:36, 4.12it/s] 152it [00:37, 4.16it/s] 153it [00:37, 4.24it/s] 154it [00:37, 4.16it/s] 155it [00:37, 4.09it/s] 156it [00:38, 4.07it/s] 157it [00:38, 4.01it/s] 158it [00:38, 4.02it/s] 159it [00:38, 4.11it/s] 160it [00:39, 4.09it/s] 161it [00:39, 4.10it/s] 162it [00:39, 4.05it/s] 163it [00:39, 4.00it/s] 164it [00:40, 4.06it/s] 165it [00:40, 4.11it/s] 166it [00:40, 4.02it/s] 167it [00:40, 4.04it/s] 168it [00:41, 4.07it/s] 169it [00:41, 4.09it/s] 170it [00:41, 4.12it/s] 171it [00:41, 4.03it/s] 172it [00:42, 4.03it/s] 173it [00:42, 4.11it/s] 174it [00:42, 4.13it/s] 175it [00:42, 4.18it/s] 176it [00:43, 4.22it/s] 177it [00:43, 4.19it/s] 178it [00:43, 4.21it/s] 179it [00:43, 4.15it/s] 180it [00:43, 4.12it/s] 181it [00:44, 4.12it/s] 182it [00:44, 4.09it/s] 183it [00:44, 4.14it/s] 184it [00:44, 4.03it/s] 185it [00:45, 4.08it/s] 186it [00:45, 4.08it/s] 187it [00:45, 3.98it/s] 188it [00:45, 3.92it/s] 189it [00:46, 4.00it/s] 190it [00:46, 3.94it/s] 191it [00:46, 4.02it/s] 192it [00:46, 3.99it/s] 193it [00:47, 4.06it/s] 194it [00:47, 3.99it/s] 195it [00:47, 3.90it/s] 196it [00:47, 4.04it/s] 196it [00:48, 4.08it/s] +2025-05-25 23:46:46,684 - INFO - Epoch: 70, Objective: tensor([1542.3411], device='cuda:0', grad_fn=), Loss: 0.008527607657015324, KL/n: 21.169261932373047 + 0it [00:00, ?it/s]2025-05-25 23:46:47,278 - INFO - [Epoch 071 | Batch 0000] IWAE-loss 1529.1766 | mean log_px -0.0078 | KL -1036.11 + 1it [00:00, 2.96it/s] 2it [00:00, 3.35it/s] 3it [00:00, 3.61it/s] 4it [00:01, 3.82it/s] 5it [00:01, 3.99it/s] 6it [00:01, 4.10it/s] 7it [00:01, 4.15it/s] 8it [00:02, 4.21it/s] 9it [00:02, 4.10it/s] 10it [00:02, 4.14it/s] 11it [00:02, 4.15it/s] 12it [00:02, 4.20it/s] 13it [00:03, 4.15it/s] 14it [00:03, 4.18it/s] 15it [00:03, 4.19it/s] 16it [00:03, 4.19it/s] 17it [00:04, 4.09it/s] 18it [00:04, 4.14it/s] 19it [00:04, 4.07it/s] 20it [00:04, 4.09it/s] 21it [00:05, 4.04it/s] 22it [00:05, 4.05it/s] 23it [00:05, 4.03it/s] 24it [00:05, 4.01it/s] 25it [00:06, 4.08it/s] 26it [00:06, 4.15it/s] 27it [00:06, 4.06it/s] 28it [00:06, 4.14it/s] 29it [00:07, 4.23it/s] 30it [00:07, 4.16it/s] 31it [00:07, 4.22it/s] 32it [00:07, 4.33it/s] 33it [00:08, 4.33it/s] 34it [00:08, 4.36it/s] 35it [00:08, 4.35it/s] 36it [00:08, 4.39it/s] 37it [00:08, 4.30it/s] 38it [00:09, 4.34it/s] 39it [00:09, 4.32it/s] 40it [00:09, 4.35it/s] 41it [00:09, 4.29it/s] 42it [00:10, 4.33it/s] 43it [00:10, 4.33it/s] 44it [00:10, 4.32it/s] 45it [00:10, 4.34it/s] 46it [00:11, 4.12it/s] 47it [00:11, 4.11it/s] 48it [00:11, 4.15it/s] 49it [00:11, 4.16it/s] 50it [00:12, 4.18it/s]2025-05-25 23:46:59,226 - INFO - [Epoch 071 | Batch 0050] IWAE-loss 1191.1381 | mean log_px -0.0072 | KL -1032.97 + 51it [00:12, 4.15it/s] 52it [00:12, 4.21it/s] 53it [00:12, 4.20it/s] 54it [00:12, 4.28it/s] 55it [00:13, 4.33it/s] 56it [00:13, 4.32it/s] 57it [00:13, 4.21it/s] 58it [00:13, 4.21it/s] 59it [00:14, 4.30it/s] 60it [00:14, 4.32it/s] 61it [00:14, 4.32it/s] 62it [00:14, 4.14it/s] 63it [00:15, 4.22it/s] 64it [00:15, 4.33it/s] 65it [00:15, 4.41it/s] 66it [00:15, 4.47it/s] 67it [00:15, 4.51it/s] 68it [00:16, 4.39it/s] 69it [00:16, 4.37it/s] 70it [00:16, 4.45it/s] 71it [00:16, 4.40it/s] 72it [00:17, 4.47it/s] 73it [00:17, 4.51it/s] 74it [00:17, 4.44it/s] 75it [00:17, 4.27it/s] 76it [00:18, 4.30it/s] 77it [00:18, 4.36it/s] 78it [00:18, 4.38it/s] 79it [00:18, 4.34it/s] 80it [00:18, 4.38it/s] 81it [00:19, 4.46it/s] 82it [00:19, 4.34it/s] 83it [00:19, 4.14it/s] 84it [00:19, 4.25it/s] 85it [00:20, 4.27it/s] 86it [00:20, 4.37it/s] 87it [00:20, 4.31it/s] 88it [00:20, 4.41it/s] 89it [00:21, 4.38it/s] 90it [00:21, 4.29it/s] 91it [00:21, 4.30it/s] 92it [00:21, 4.09it/s] 93it [00:22, 4.05it/s] 94it [00:22, 4.00it/s] 95it [00:22, 4.12it/s] 96it [00:22, 4.07it/s] 97it [00:23, 4.08it/s] 98it [00:23, 4.12it/s] 99it [00:23, 4.12it/s] 100it [00:23, 4.13it/s]2025-05-25 23:47:10,899 - INFO - [Epoch 071 | Batch 0100] IWAE-loss 1299.5299 | mean log_px -0.0067 | KL -1027.02 + 101it [00:23, 4.22it/s] 102it [00:24, 4.31it/s] 103it [00:24, 4.30it/s] 104it [00:24, 4.26it/s] 105it [00:24, 4.37it/s] 106it [00:25, 4.40it/s] 107it [00:25, 4.47it/s] 108it [00:25, 4.41it/s] 109it [00:25, 4.32it/s] 110it [00:26, 4.32it/s] 111it [00:26, 4.37it/s] 112it [00:26, 4.34it/s] 113it [00:26, 4.33it/s] 114it [00:26, 4.25it/s] 115it [00:27, 4.18it/s] 116it [00:27, 4.22it/s] 117it [00:27, 4.24it/s] 118it [00:27, 4.12it/s] 119it [00:28, 4.24it/s] 120it [00:28, 4.30it/s] 121it [00:28, 4.38it/s] 122it [00:28, 4.31it/s] 123it [00:29, 4.41it/s] 124it [00:29, 4.47it/s] 125it [00:29, 4.50it/s] 126it [00:29, 4.29it/s] 127it [00:29, 4.35it/s] 128it [00:30, 4.38it/s] 129it [00:30, 4.40it/s] 130it [00:30, 4.43it/s] 131it [00:30, 4.44it/s] 132it [00:31, 4.31it/s] 133it [00:31, 4.13it/s] 134it [00:31, 4.19it/s] 135it [00:31, 4.14it/s] 136it [00:32, 4.20it/s] 137it [00:32, 4.13it/s] 138it [00:32, 4.24it/s] 139it [00:32, 4.16it/s] 140it [00:33, 4.09it/s] 141it [00:33, 4.00it/s] 142it [00:33, 4.06it/s] 143it [00:33, 4.13it/s] 144it [00:34, 4.05it/s] 145it [00:34, 4.09it/s] 146it [00:34, 4.19it/s] 147it [00:34, 4.25it/s] 148it [00:34, 4.19it/s] 149it [00:35, 4.19it/s] 150it [00:35, 4.31it/s]2025-05-25 23:47:22,609 - INFO - [Epoch 071 | Batch 0150] IWAE-loss 1175.8381 | mean log_px -0.0057 | KL -1027.57 + 151it [00:35, 4.29it/s] 152it [00:35, 4.25it/s] 153it [00:36, 4.32it/s] 154it [00:36, 4.41it/s] 155it [00:36, 4.42it/s] 156it [00:36, 4.47it/s] 157it [00:37, 4.37it/s] 158it [00:37, 4.44it/s] 159it [00:37, 4.49it/s] 160it [00:37, 4.50it/s] 161it [00:37, 4.46it/s] 162it [00:38, 4.33it/s] 163it [00:38, 4.42it/s] 164it [00:38, 4.41it/s] 165it [00:38, 4.46it/s] 166it [00:39, 4.51it/s] 167it [00:39, 4.48it/s] 168it [00:39, 4.38it/s] 169it [00:39, 4.38it/s] 170it [00:39, 4.42it/s] 171it [00:40, 4.40it/s] 172it [00:40, 4.43it/s] 173it [00:40, 4.45it/s] 174it [00:40, 4.50it/s] 175it [00:41, 4.50it/s] 176it [00:41, 4.51it/s] 177it [00:41, 4.51it/s] 178it [00:41, 4.36it/s] 179it [00:41, 4.38it/s] 180it [00:42, 4.46it/s] 181it [00:42, 4.46it/s] 182it [00:42, 4.35it/s] 183it [00:42, 4.42it/s] 184it [00:43, 4.48it/s] 185it [00:43, 4.50it/s] 186it [00:43, 4.51it/s] 187it [00:43, 4.54it/s] 188it [00:43, 4.56it/s] 189it [00:44, 4.48it/s] 190it [00:44, 4.34it/s] 191it [00:44, 4.36it/s] 192it [00:44, 4.39it/s] 193it [00:45, 4.44it/s] 194it [00:45, 4.36it/s] 195it [00:45, 4.17it/s] 196it [00:45, 4.35it/s] 196it [00:45, 4.27it/s] +2025-05-25 23:47:32,911 - INFO - Epoch: 71, Objective: tensor([1101.7721], device='cuda:0', grad_fn=), Loss: 0.003083721501752734, KL/n: 21.038372039794922 + 0it [00:00, ?it/s]2025-05-25 23:47:33,286 - INFO - [Epoch 072 | Batch 0000] IWAE-loss 1105.3588 | mean log_px -0.0021 | KL -1030.98 + 1it [00:00, 3.31it/s] 2it [00:00, 3.95it/s] 3it [00:00, 4.15it/s] 4it [00:00, 4.36it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.40it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.53it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.57it/s] 13it [00:02, 4.48it/s] 14it [00:03, 4.44it/s] 15it [00:03, 4.34it/s] 16it [00:03, 4.33it/s] 17it [00:03, 4.34it/s] 18it [00:04, 4.42it/s] 19it [00:04, 4.50it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.39it/s] 22it [00:04, 4.50it/s] 23it [00:05, 4.56it/s] 24it [00:05, 4.61it/s] 25it [00:05, 4.64it/s] 26it [00:05, 4.65it/s] 27it [00:06, 4.66it/s] 28it [00:06, 4.67it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.68it/s] 31it [00:06, 4.69it/s] 32it [00:07, 4.69it/s] 33it [00:07, 4.53it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.62it/s] 36it [00:07, 4.65it/s] 37it [00:08, 4.68it/s] 38it [00:08, 4.52it/s] 39it [00:08, 4.57it/s] 40it [00:09, 3.54it/s] 41it [00:09, 3.81it/s] 42it [00:09, 4.04it/s] 43it [00:09, 4.23it/s] 44it [00:09, 4.22it/s] 45it [00:10, 4.38it/s] 46it [00:10, 4.47it/s] 47it [00:10, 4.51it/s] 48it [00:10, 4.56it/s] 49it [00:11, 4.61it/s] 50it [00:11, 4.64it/s]2025-05-25 23:47:44,430 - INFO - [Epoch 072 | Batch 0050] IWAE-loss 1345.4274 | mean log_px -0.0059 | KL -1030.80 + 51it [00:11, 4.50it/s] 52it [00:11, 4.58it/s] 53it [00:11, 4.63it/s] 54it [00:12, 4.65it/s] 55it [00:12, 4.67it/s] 56it [00:12, 4.69it/s] 57it [00:12, 4.53it/s] 58it [00:12, 4.60it/s] 59it [00:13, 4.64it/s] 60it [00:13, 4.65it/s] 61it [00:13, 4.51it/s] 62it [00:13, 4.59it/s] 63it [00:14, 4.63it/s] 64it [00:14, 4.65it/s] 65it [00:14, 4.51it/s] 66it [00:14, 4.58it/s] 67it [00:14, 4.62it/s] 68it [00:15, 4.65it/s] 69it [00:15, 4.67it/s] 70it [00:15, 4.68it/s] 71it [00:15, 4.70it/s] 72it [00:15, 4.70it/s] 73it [00:16, 4.71it/s] 74it [00:16, 4.54it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.64it/s] 77it [00:17, 4.66it/s] 78it [00:17, 4.68it/s] 79it [00:17, 4.70it/s] 80it [00:17, 4.71it/s] 81it [00:17, 4.72it/s] 82it [00:18, 4.55it/s] 83it [00:18, 4.62it/s] 84it [00:18, 4.65it/s] 85it [00:18, 4.68it/s] 86it [00:18, 4.69it/s] 87it [00:19, 4.71it/s] 88it [00:19, 4.54it/s] 89it [00:19, 4.62it/s] 90it [00:19, 4.64it/s] 91it [00:20, 4.66it/s] 92it [00:20, 4.68it/s] 93it [00:20, 4.70it/s] 94it [00:20, 4.71it/s] 95it [00:20, 4.72it/s] 96it [00:21, 4.72it/s] 97it [00:21, 4.57it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.64it/s] 100it [00:22, 4.67it/s]2025-05-25 23:47:55,204 - INFO - [Epoch 072 | Batch 0100] IWAE-loss 1193.0322 | mean log_px -0.0023 | KL -1026.61 + 101it [00:22, 4.69it/s] 102it [00:22, 4.69it/s] 103it [00:22, 4.70it/s] 104it [00:22, 4.70it/s] 105it [00:23, 4.71it/s] 106it [00:23, 4.54it/s] 107it [00:23, 4.61it/s] 108it [00:23, 4.64it/s] 109it [00:23, 4.67it/s] 110it [00:24, 4.68it/s] 111it [00:24, 4.53it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.63it/s] 114it [00:25, 4.66it/s] 115it [00:25, 4.68it/s] 116it [00:25, 4.69it/s] 117it [00:25, 4.71it/s] 118it [00:25, 4.55it/s] 119it [00:26, 4.62it/s] 120it [00:26, 4.65it/s] 121it [00:26, 4.67it/s] 122it [00:26, 4.70it/s] 123it [00:26, 4.71it/s] 124it [00:27, 4.71it/s] 125it [00:27, 4.53it/s] 126it [00:27, 4.59it/s] 127it [00:27, 4.47it/s] 128it [00:28, 4.35it/s] 129it [00:28, 4.43it/s] 130it [00:28, 4.46it/s] 131it [00:28, 4.49it/s] 132it [00:28, 4.50it/s] 133it [00:29, 4.54it/s] 134it [00:29, 4.54it/s] 135it [00:29, 4.55it/s] 136it [00:29, 4.43it/s] 137it [00:30, 4.50it/s] 138it [00:30, 4.52it/s] 139it [00:30, 4.54it/s] 140it [00:30, 4.53it/s] 141it [00:30, 4.52it/s] 142it [00:31, 4.52it/s] 143it [00:31, 4.53it/s] 144it [00:31, 4.30it/s] 145it [00:31, 4.36it/s] 146it [00:32, 4.43it/s] 147it [00:32, 4.44it/s] 148it [00:32, 4.46it/s] 149it [00:32, 4.48it/s] 150it [00:32, 4.46it/s]2025-05-25 23:48:06,201 - INFO - [Epoch 072 | Batch 0150] IWAE-loss 1439.5580 | mean log_px -0.0069 | KL -1025.86 + 151it [00:33, 4.46it/s] 152it [00:33, 4.29it/s] 153it [00:33, 4.38it/s] 154it [00:33, 4.44it/s] 155it [00:34, 4.49it/s] 156it [00:34, 4.52it/s] 157it [00:34, 4.55it/s] 158it [00:34, 4.42it/s] 159it [00:35, 4.48it/s] 160it [00:35, 4.50it/s] 161it [00:35, 4.50it/s] 162it [00:35, 4.53it/s] 163it [00:35, 4.54it/s] 164it [00:36, 4.43it/s] 165it [00:36, 4.47it/s] 166it [00:36, 4.51it/s] 167it [00:36, 4.54it/s] 168it [00:37, 4.55it/s] 169it [00:37, 4.56it/s] 170it [00:37, 4.42it/s] 171it [00:37, 4.46it/s] 172it [00:37, 4.49it/s] 173it [00:38, 4.53it/s] 174it [00:38, 4.53it/s] 175it [00:38, 4.56it/s] 176it [00:38, 4.36it/s] 177it [00:39, 4.38it/s] 178it [00:39, 4.43it/s] 179it [00:39, 4.45it/s] 180it [00:39, 4.43it/s] 181it [00:39, 4.36it/s] 182it [00:40, 4.41it/s] 183it [00:40, 4.27it/s] 184it [00:40, 4.36it/s] 185it [00:40, 4.44it/s] 186it [00:41, 4.48it/s] 187it [00:41, 4.38it/s] 188it [00:41, 4.43it/s] 189it [00:41, 4.47it/s] 190it [00:41, 4.49it/s] 191it [00:42, 4.51it/s] 192it [00:42, 4.52it/s] 193it [00:42, 4.41it/s] 194it [00:42, 4.46it/s] 195it [00:43, 4.35it/s] 196it [00:43, 4.42it/s] 196it [00:43, 4.52it/s] +2025-05-25 23:48:16,440 - INFO - Epoch: 72, Objective: tensor([1084.2766], device='cuda:0', grad_fn=), Loss: 0.004034184850752354, KL/n: 20.965299606323242 + 0it [00:00, ?it/s]2025-05-25 23:48:16,827 - INFO - [Epoch 073 | Batch 0000] IWAE-loss 1114.9978 | mean log_px -0.0042 | KL -1030.27 + 1it [00:00, 3.13it/s] 2it [00:00, 3.67it/s] 3it [00:00, 4.06it/s] 4it [00:01, 4.19it/s] 5it [00:01, 4.32it/s] 6it [00:01, 4.41it/s] 7it [00:01, 4.33it/s] 8it [00:01, 4.41it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.51it/s] 11it [00:02, 4.56it/s] 12it [00:02, 4.57it/s] 13it [00:02, 4.50it/s] 14it [00:03, 4.49it/s] 15it [00:03, 4.53it/s] 16it [00:03, 4.53it/s] 17it [00:03, 4.40it/s] 18it [00:04, 4.46it/s] 19it [00:04, 4.50it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.57it/s] 22it [00:04, 4.57it/s] 23it [00:05, 4.58it/s] 24it [00:05, 4.49it/s] 25it [00:05, 4.54it/s] 26it [00:05, 4.54it/s] 27it [00:06, 4.55it/s] 28it [00:06, 4.56it/s] 29it [00:06, 4.47it/s] 30it [00:06, 4.52it/s] 31it [00:06, 4.55it/s] 32it [00:07, 4.56it/s] 33it [00:07, 4.57it/s] 34it [00:07, 4.58it/s] 35it [00:07, 4.52it/s] 36it [00:08, 4.55it/s] 37it [00:08, 4.57it/s] 38it [00:08, 4.57it/s] 39it [00:08, 4.58it/s] 40it [00:08, 4.55it/s] 41it [00:09, 4.43it/s] 42it [00:09, 4.49it/s] 43it [00:09, 4.53it/s] 44it [00:09, 4.54it/s] 45it [00:10, 4.55it/s] 46it [00:10, 4.57it/s] 47it [00:10, 4.45it/s] 48it [00:10, 4.50it/s] 49it [00:10, 4.53it/s] 50it [00:11, 4.43it/s]2025-05-25 23:48:27,903 - INFO - [Epoch 073 | Batch 0050] IWAE-loss 1135.3855 | mean log_px -0.0090 | KL -1023.86 + 51it [00:11, 4.48it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.54it/s] 54it [00:12, 4.55it/s] 55it [00:12, 4.57it/s] 56it [00:12, 4.51it/s] 57it [00:12, 4.40it/s] 58it [00:12, 4.46it/s] 59it [00:13, 4.47it/s] 60it [00:13, 4.46it/s] 61it [00:13, 4.35it/s] 62it [00:13, 4.33it/s] 63it [00:14, 4.34it/s] 64it [00:14, 4.28it/s] 65it [00:14, 4.38it/s] 66it [00:14, 4.41it/s] 67it [00:14, 4.48it/s] 68it [00:15, 4.50it/s] 69it [00:15, 4.54it/s] 70it [00:15, 4.41it/s] 71it [00:15, 4.48it/s] 72it [00:16, 4.49it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.56it/s] 75it [00:16, 4.58it/s] 76it [00:16, 4.57it/s] 77it [00:17, 4.59it/s] 78it [00:17, 4.58it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.45it/s] 81it [00:18, 4.51it/s] 82it [00:18, 4.52it/s] 83it [00:18, 4.56it/s] 84it [00:18, 4.56it/s] 85it [00:18, 4.59it/s] 86it [00:19, 4.59it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.45it/s] 90it [00:20, 4.49it/s] 91it [00:20, 4.52it/s] 92it [00:20, 4.48it/s] 93it [00:20, 4.53it/s] 94it [00:20, 4.55it/s] 95it [00:21, 4.55it/s] 96it [00:21, 4.56it/s] 97it [00:21, 4.58it/s] 98it [00:21, 4.44it/s] 99it [00:22, 4.49it/s] 100it [00:22, 4.53it/s]2025-05-25 23:48:39,003 - INFO - [Epoch 073 | Batch 0100] IWAE-loss 1121.1622 | mean log_px -0.0042 | KL -1021.58 + 101it [00:22, 4.56it/s] 102it [00:22, 4.58it/s] 103it [00:22, 4.59it/s] 104it [00:23, 4.60it/s] 105it [00:23, 4.61it/s] 106it [00:23, 4.60it/s] 107it [00:23, 4.45it/s] 108it [00:24, 4.50it/s] 109it [00:24, 4.51it/s] 110it [00:24, 4.54it/s] 111it [00:24, 4.56it/s] 112it [00:24, 4.57it/s] 113it [00:25, 4.60it/s] 114it [00:25, 4.60it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.48it/s] 117it [00:26, 4.53it/s] 118it [00:26, 4.50it/s] 119it [00:26, 4.56it/s] 120it [00:26, 4.59it/s] 121it [00:26, 4.62it/s] 122it [00:27, 4.62it/s] 123it [00:27, 4.63it/s] 124it [00:27, 4.65it/s] 125it [00:27, 4.50it/s] 126it [00:27, 4.55it/s] 127it [00:28, 4.48it/s] 128it [00:28, 4.52it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.56it/s] 131it [00:29, 4.59it/s] 132it [00:29, 4.56it/s] 133it [00:29, 4.61it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.62it/s] 136it [00:30, 4.62it/s] 137it [00:30, 4.63it/s] 138it [00:30, 4.64it/s] 139it [00:30, 4.64it/s] 140it [00:31, 4.64it/s] 141it [00:31, 4.66it/s] 142it [00:31, 4.65it/s] 143it [00:31, 4.65it/s] 144it [00:31, 4.50it/s] 145it [00:32, 4.56it/s] 146it [00:32, 4.58it/s] 147it [00:32, 4.60it/s] 148it [00:32, 4.63it/s] 149it [00:32, 4.63it/s] 150it [00:33, 4.64it/s]2025-05-25 23:48:49,903 - INFO - [Epoch 073 | Batch 0150] IWAE-loss 1471.0764 | mean log_px -0.0143 | KL -1019.94 + 151it [00:33, 4.49it/s] 152it [00:33, 4.55it/s] 153it [00:33, 4.58it/s] 154it [00:34, 4.58it/s] 155it [00:34, 4.61it/s] 156it [00:34, 4.61it/s] 157it [00:34, 4.63it/s] 158it [00:34, 4.63it/s] 159it [00:35, 4.64it/s] 160it [00:35, 4.64it/s] 161it [00:35, 4.64it/s] 162it [00:35, 4.50it/s] 163it [00:36, 4.57it/s] 164it [00:36, 4.58it/s] 165it [00:36, 4.60it/s] 166it [00:36, 4.61it/s] 167it [00:36, 4.63it/s] 168it [00:37, 4.64it/s] 169it [00:37, 4.65it/s] 170it [00:37, 4.64it/s] 171it [00:37, 4.65it/s] 172it [00:37, 4.63it/s] 173it [00:38, 4.62it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.65it/s] 176it [00:38, 4.64it/s] 177it [00:39, 4.64it/s] 178it [00:39, 4.64it/s] 179it [00:39, 4.63it/s] 180it [00:39, 4.63it/s] 181it [00:39, 4.62it/s] 182it [00:40, 4.61it/s] 183it [00:40, 4.44it/s] 184it [00:40, 4.48it/s] 185it [00:40, 4.51it/s] 186it [00:41, 4.53it/s] 187it [00:41, 4.56it/s] 188it [00:41, 4.55it/s] 189it [00:41, 4.58it/s] 190it [00:41, 4.59it/s] 191it [00:42, 4.60it/s] 192it [00:42, 4.60it/s] 193it [00:42, 4.60it/s] 194it [00:42, 4.49it/s] 195it [00:43, 4.37it/s] 196it [00:43, 4.45it/s] 196it [00:43, 4.53it/s] +2025-05-25 23:48:59,872 - INFO - Epoch: 73, Objective: tensor([1196.2977], device='cuda:0', grad_fn=), Loss: 0.0025322872679680586, KL/n: 20.85674285888672 + 0it [00:00, ?it/s]2025-05-25 23:49:00,464 - INFO - [Epoch 074 | Batch 0000] IWAE-loss 1272.5872 | mean log_px -0.0103 | KL -1021.67 + 1it [00:00, 2.92it/s] 2it [00:00, 3.67it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.23it/s] 5it [00:01, 4.37it/s] 6it [00:01, 4.37it/s] 7it [00:01, 4.46it/s] 8it [00:01, 4.48it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.36it/s] 11it [00:02, 4.42it/s] 12it [00:02, 4.47it/s] 13it [00:03, 4.52it/s] 14it [00:03, 4.52it/s] 15it [00:03, 4.50it/s] 16it [00:03, 4.49it/s] 17it [00:03, 4.46it/s] 18it [00:04, 4.50it/s] 19it [00:04, 4.49it/s] 20it [00:04, 4.41it/s] 21it [00:04, 4.38it/s] 22it [00:05, 4.42it/s] 23it [00:05, 4.43it/s] 24it [00:05, 4.44it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.47it/s] 27it [00:06, 4.49it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.42it/s] 30it [00:06, 4.47it/s] 31it [00:07, 4.47it/s] 32it [00:07, 4.50it/s] 33it [00:07, 4.38it/s] 34it [00:07, 4.38it/s] 35it [00:07, 4.44it/s] 36it [00:08, 4.46it/s] 37it [00:08, 4.47it/s] 38it [00:08, 4.45it/s] 39it [00:08, 4.48it/s] 40it [00:09, 4.40it/s] 41it [00:09, 4.43it/s] 42it [00:09, 4.41it/s] 43it [00:09, 4.42it/s] 44it [00:09, 4.41it/s] 45it [00:10, 4.44it/s] 46it [00:10, 4.39it/s] 47it [00:10, 4.44it/s] 48it [00:10, 4.48it/s] 49it [00:11, 4.51it/s] 50it [00:11, 4.54it/s]2025-05-25 23:49:11,666 - INFO - [Epoch 074 | Batch 0050] IWAE-loss 1296.5245 | mean log_px -0.0073 | KL -1021.05 + 51it [00:11, 4.46it/s] 52it [00:11, 4.49it/s] 53it [00:11, 4.46it/s] 54it [00:12, 4.45it/s] 55it [00:12, 4.44it/s] 56it [00:12, 4.47it/s] 57it [00:12, 4.34it/s] 58it [00:13, 4.41it/s] 59it [00:13, 4.46it/s] 60it [00:13, 4.39it/s] 61it [00:13, 4.43it/s] 62it [00:14, 4.48it/s] 63it [00:14, 4.46it/s] 64it [00:14, 4.36it/s] 65it [00:14, 4.41it/s] 66it [00:14, 4.44it/s] 67it [00:15, 4.49it/s] 68it [00:15, 4.41it/s] 69it [00:15, 4.44it/s] 70it [00:15, 4.39it/s] 71it [00:16, 4.36it/s] 72it [00:16, 4.44it/s] 73it [00:16, 4.48it/s] 74it [00:16, 4.48it/s] 75it [00:16, 4.48it/s] 76it [00:17, 4.34it/s] 77it [00:17, 4.39it/s] 78it [00:17, 4.36it/s] 79it [00:17, 4.36it/s] 80it [00:18, 4.34it/s] 81it [00:18, 4.35it/s] 82it [00:18, 4.35it/s] 83it [00:18, 4.39it/s] 84it [00:19, 4.46it/s] 85it [00:19, 4.51it/s] 86it [00:19, 4.50it/s] 87it [00:19, 4.53it/s] 88it [00:19, 4.55it/s] 89it [00:20, 4.57it/s] 90it [00:20, 4.59it/s] 91it [00:20, 4.61it/s] 92it [00:20, 4.52it/s] 93it [00:20, 4.55it/s] 94it [00:21, 4.43it/s] 95it [00:21, 4.48it/s] 96it [00:21, 4.41it/s] 97it [00:21, 4.41it/s] 98it [00:22, 4.30it/s] 99it [00:22, 4.36it/s] 100it [00:22, 4.42it/s]2025-05-25 23:49:22,941 - INFO - [Epoch 074 | Batch 0100] IWAE-loss 1122.7998 | mean log_px -0.0063 | KL -1019.44 + 101it [00:22, 4.40it/s] 102it [00:23, 4.44it/s] 103it [00:23, 4.39it/s] 104it [00:23, 4.39it/s] 105it [00:23, 4.42it/s] 106it [00:23, 4.41it/s] 107it [00:24, 4.44it/s] 108it [00:24, 4.37it/s] 109it [00:24, 4.44it/s] 110it [00:24, 4.40it/s] 111it [00:25, 4.45it/s] 112it [00:25, 4.44it/s] 113it [00:25, 4.47it/s] 114it [00:25, 4.49it/s] 115it [00:25, 4.47it/s] 116it [00:26, 4.34it/s] 117it [00:26, 4.39it/s] 118it [00:26, 4.46it/s] 119it [00:26, 4.37it/s] 120it [00:27, 4.42it/s] 121it [00:27, 4.31it/s] 122it [00:27, 4.40it/s] 123it [00:27, 4.38it/s] 124it [00:28, 4.41it/s] 125it [00:28, 4.46it/s] 126it [00:28, 4.49it/s] 127it [00:28, 4.40it/s] 128it [00:28, 4.39it/s] 129it [00:29, 4.41it/s] 130it [00:29, 4.42it/s] 131it [00:29, 4.34it/s] 132it [00:29, 4.31it/s] 133it [00:30, 4.38it/s] 134it [00:30, 4.34it/s] 135it [00:30, 4.37it/s] 136it [00:30, 4.33it/s] 137it [00:30, 4.40it/s] 138it [00:31, 4.43it/s] 139it [00:31, 4.46it/s] 140it [00:31, 4.42it/s] 141it [00:31, 4.44it/s] 142it [00:32, 4.22it/s] 143it [00:32, 4.35it/s] 144it [00:32, 4.38it/s] 145it [00:32, 4.44it/s] 146it [00:33, 4.44it/s] 147it [00:33, 4.46it/s] 148it [00:33, 4.27it/s] 149it [00:33, 4.35it/s] 150it [00:33, 4.36it/s]2025-05-25 23:49:34,316 - INFO - [Epoch 074 | Batch 0150] IWAE-loss 1158.7916 | mean log_px -0.0036 | KL -1011.06 + 151it [00:34, 4.40it/s] 152it [00:34, 4.39it/s] 153it [00:34, 4.43it/s] 154it [00:34, 4.43it/s] 155it [00:35, 4.33it/s] 156it [00:35, 4.42it/s] 157it [00:35, 4.45it/s] 158it [00:35, 4.45it/s] 159it [00:36, 4.38it/s] 160it [00:36, 4.40it/s] 161it [00:36, 4.44it/s] 162it [00:36, 4.47it/s] 163it [00:36, 4.34it/s] 164it [00:37, 4.41it/s] 165it [00:37, 4.38it/s] 166it [00:37, 4.42it/s] 167it [00:37, 4.39it/s] 168it [00:38, 4.42it/s] 169it [00:38, 4.34it/s] 170it [00:38, 4.40it/s] 171it [00:38, 4.45it/s] 172it [00:38, 4.41it/s] 173it [00:39, 4.49it/s] 174it [00:39, 4.48it/s] 175it [00:39, 4.49it/s] 176it [00:39, 4.52it/s] 177it [00:40, 4.27it/s] 178it [00:40, 4.34it/s] 179it [00:40, 4.41it/s] 180it [00:40, 4.38it/s] 181it [00:40, 4.45it/s] 182it [00:41, 4.49it/s] 183it [00:41, 4.53it/s] 184it [00:41, 4.55it/s] 185it [00:41, 4.58it/s] 186it [00:42, 4.34it/s] 187it [00:42, 4.41it/s] 188it [00:42, 4.40it/s] 189it [00:42, 4.45it/s] 190it [00:43, 4.40it/s] 191it [00:43, 4.48it/s] 192it [00:43, 4.45it/s] 193it [00:43, 4.47it/s] 194it [00:43, 4.54it/s] 195it [00:44, 4.38it/s] 196it [00:44, 4.44it/s] 196it [00:44, 4.41it/s] +2025-05-25 23:49:44,597 - INFO - Epoch: 74, Objective: tensor([1074.4708], device='cuda:0', grad_fn=), Loss: 0.0014531121123582125, KL/n: 20.634225845336914 + 0it [00:00, ?it/s]2025-05-25 23:49:44,994 - INFO - [Epoch 075 | Batch 0000] IWAE-loss 1407.3490 | mean log_px -0.0097 | KL -1012.06 + 1it [00:00, 3.10it/s] 2it [00:00, 3.74it/s] 3it [00:00, 4.09it/s] 4it [00:01, 4.10it/s] 5it [00:01, 4.30it/s] 6it [00:01, 4.40it/s] 7it [00:01, 4.46it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.56it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.58it/s] 12it [00:02, 3.49it/s] 13it [00:03, 3.79it/s] 14it [00:03, 4.01it/s] 15it [00:03, 4.20it/s] 16it [00:03, 4.31it/s] 17it [00:04, 4.41it/s] 18it [00:04, 4.48it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.55it/s] 21it [00:04, 4.43it/s] 22it [00:05, 4.51it/s] 23it [00:05, 4.54it/s] 24it [00:05, 4.56it/s] 25it [00:05, 4.59it/s] 26it [00:06, 4.60it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.62it/s] 29it [00:06, 4.62it/s] 30it [00:06, 4.47it/s] 31it [00:07, 4.52it/s] 32it [00:07, 4.55it/s] 33it [00:07, 4.57it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.59it/s] 36it [00:08, 4.60it/s] 37it [00:08, 4.63it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.48it/s] 40it [00:09, 4.55it/s] 41it [00:09, 4.56it/s] 42it [00:09, 4.58it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.61it/s] 45it [00:10, 4.62it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.48it/s] 48it [00:10, 4.52it/s] 49it [00:11, 4.55it/s] 50it [00:11, 4.57it/s]2025-05-25 23:49:56,148 - INFO - [Epoch 075 | Batch 0050] IWAE-loss 1448.6622 | mean log_px -0.0086 | KL -1008.97 + 51it [00:11, 4.59it/s] 52it [00:11, 4.59it/s] 53it [00:11, 4.61it/s] 54it [00:12, 4.61it/s] 55it [00:12, 4.52it/s] 56it [00:12, 4.55it/s] 57it [00:12, 4.57it/s] 58it [00:13, 4.59it/s] 59it [00:13, 4.45it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.53it/s] 62it [00:13, 4.54it/s] 63it [00:14, 4.58it/s] 64it [00:14, 4.46it/s] 65it [00:14, 4.53it/s] 66it [00:14, 4.56it/s] 67it [00:14, 4.60it/s] 68it [00:15, 4.61it/s] 69it [00:15, 4.62it/s] 70it [00:15, 4.47it/s] 71it [00:15, 4.54it/s] 72it [00:16, 4.56it/s] 73it [00:16, 4.59it/s] 74it [00:16, 4.60it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.43it/s] 77it [00:17, 4.43it/s] 78it [00:17, 4.47it/s] 79it [00:17, 4.52it/s] 80it [00:17, 4.53it/s] 81it [00:18, 4.45it/s] 82it [00:18, 4.47it/s] 83it [00:18, 4.53it/s] 84it [00:18, 4.41it/s] 85it [00:18, 4.42it/s] 86it [00:19, 4.50it/s] 87it [00:19, 4.55it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.62it/s] 90it [00:20, 4.50it/s] 91it [00:20, 4.57it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.64it/s] 95it [00:21, 4.67it/s] 96it [00:21, 4.67it/s] 97it [00:21, 4.68it/s] 98it [00:21, 4.68it/s] 99it [00:21, 4.69it/s] 100it [00:22, 4.69it/s]2025-05-25 23:50:07,102 - INFO - [Epoch 075 | Batch 0100] IWAE-loss 1112.7964 | mean log_px -0.0021 | KL -1007.40 + 101it [00:22, 4.69it/s] 102it [00:22, 4.69it/s] 103it [00:22, 4.68it/s] 104it [00:23, 4.68it/s] 105it [00:23, 4.69it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.65it/s] 108it [00:23, 4.63it/s] 109it [00:24, 4.64it/s] 110it [00:24, 4.51it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.56it/s] 113it [00:25, 4.55it/s] 114it [00:25, 4.55it/s] 115it [00:25, 4.58it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.61it/s] 118it [00:26, 4.63it/s] 119it [00:26, 4.64it/s] 120it [00:26, 4.63it/s] 121it [00:26, 4.48it/s] 122it [00:27, 4.53it/s] 123it [00:27, 4.55it/s] 124it [00:27, 4.57it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.59it/s] 127it [00:28, 4.60it/s] 128it [00:28, 4.60it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.61it/s] 131it [00:28, 4.63it/s] 132it [00:29, 4.63it/s] 133it [00:29, 4.64it/s] 134it [00:29, 4.63it/s] 135it [00:29, 4.50it/s] 136it [00:30, 4.54it/s] 137it [00:30, 4.58it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.62it/s] 141it [00:31, 4.63it/s] 142it [00:31, 4.63it/s] 143it [00:31, 4.63it/s] 144it [00:31, 4.63it/s] 145it [00:31, 4.63it/s] 146it [00:32, 4.63it/s] 147it [00:32, 4.64it/s] 148it [00:32, 4.63it/s] 149it [00:32, 4.64it/s] 150it [00:33, 4.50it/s]2025-05-25 23:50:17,977 - INFO - [Epoch 075 | Batch 0150] IWAE-loss 2491.0842 | mean log_px -0.0430 | KL -1002.79 + 151it [00:33, 4.56it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.61it/s] 154it [00:33, 4.59it/s] 155it [00:34, 4.54it/s] 156it [00:34, 4.56it/s] 157it [00:34, 4.58it/s] 158it [00:34, 4.58it/s] 159it [00:35, 4.59it/s] 160it [00:35, 4.51it/s] 161it [00:35, 4.56it/s] 162it [00:35, 4.60it/s] 163it [00:35, 4.62it/s] 164it [00:36, 4.61it/s] 165it [00:36, 4.63it/s] 166it [00:36, 4.63it/s] 167it [00:36, 4.64it/s] 168it [00:36, 4.63it/s] 169it [00:37, 4.63it/s] 170it [00:37, 4.63it/s] 171it [00:37, 4.51it/s] 172it [00:37, 4.56it/s] 173it [00:38, 4.59it/s] 174it [00:38, 4.61it/s] 175it [00:38, 4.62it/s] 176it [00:38, 4.62it/s] 177it [00:38, 4.64it/s] 178it [00:39, 4.64it/s] 179it [00:39, 4.56it/s] 180it [00:39, 4.60it/s] 181it [00:39, 4.61it/s] 182it [00:40, 4.62it/s] 183it [00:40, 4.62it/s] 184it [00:40, 4.62it/s] 185it [00:40, 4.64it/s] 186it [00:40, 4.63it/s] 187it [00:41, 4.61it/s] 188it [00:41, 4.62it/s] 189it [00:41, 4.63it/s] 190it [00:41, 4.63it/s] 191it [00:41, 4.64it/s] 192it [00:42, 4.64it/s] 193it [00:42, 4.50it/s] 194it [00:42, 4.54it/s] 195it [00:42, 4.29it/s] 196it [00:43, 4.34it/s] 196it [00:43, 4.54it/s] +2025-05-25 23:50:27,950 - INFO - Epoch: 75, Objective: tensor([1224.8317], device='cuda:0', grad_fn=), Loss: 0.005707655567675829, KL/n: 20.583492279052734 + 0it [00:00, ?it/s]2025-05-25 23:50:28,354 - INFO - [Epoch 076 | Batch 0000] IWAE-loss 3191.0737 | mean log_px -0.0381 | KL -1011.61 + 1it [00:00, 2.99it/s] 2it [00:00, 3.79it/s] 3it [00:00, 4.14it/s] 4it [00:00, 4.33it/s] 5it [00:01, 4.27it/s] 6it [00:01, 4.40it/s] 7it [00:01, 4.48it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.58it/s] 10it [00:02, 4.60it/s] 11it [00:02, 4.63it/s] 12it [00:02, 4.65it/s] 13it [00:02, 4.67it/s] 14it [00:03, 4.64it/s] 15it [00:03, 4.48it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.61it/s] 18it [00:04, 4.63it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.66it/s] 21it [00:04, 4.68it/s] 22it [00:04, 4.51it/s] 23it [00:05, 4.55it/s] 24it [00:05, 4.58it/s] 25it [00:05, 4.60it/s] 26it [00:05, 4.62it/s] 27it [00:05, 4.63it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.49it/s] 31it [00:06, 4.54it/s] 32it [00:07, 4.57it/s] 33it [00:07, 4.60it/s] 34it [00:07, 4.61it/s] 35it [00:07, 4.63it/s] 36it [00:07, 4.64it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.49it/s] 40it [00:08, 4.54it/s] 41it [00:09, 4.53it/s] 42it [00:09, 4.57it/s] 43it [00:09, 4.59it/s] 44it [00:09, 4.61it/s] 45it [00:09, 4.63it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.48it/s] 48it [00:10, 4.54it/s] 49it [00:10, 4.57it/s] 50it [00:10, 4.60it/s]2025-05-25 23:50:39,239 - INFO - [Epoch 076 | Batch 0050] IWAE-loss 1105.2787 | mean log_px -0.0032 | KL -1006.82 + 51it [00:11, 4.61it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.56it/s] 54it [00:11, 4.58it/s] 55it [00:12, 4.60it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.63it/s] 58it [00:12, 4.64it/s] 59it [00:12, 4.64it/s] 60it [00:13, 4.64it/s] 61it [00:13, 4.66it/s] 62it [00:13, 4.65it/s] 63it [00:13, 4.67it/s] 64it [00:14, 4.66it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.48it/s] 67it [00:14, 4.55it/s] 68it [00:14, 4.58it/s] 69it [00:15, 4.61it/s] 70it [00:15, 4.62it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.62it/s] 73it [00:16, 4.48it/s] 74it [00:16, 4.55it/s] 75it [00:16, 4.58it/s] 76it [00:16, 4.58it/s] 77it [00:16, 4.61it/s] 78it [00:17, 4.62it/s] 79it [00:17, 4.48it/s] 80it [00:17, 4.55it/s] 81it [00:17, 4.58it/s] 82it [00:17, 4.60it/s] 83it [00:18, 4.61it/s] 84it [00:18, 4.61it/s] 85it [00:18, 4.63it/s] 86it [00:18, 4.48it/s] 87it [00:19, 4.54it/s] 88it [00:19, 4.58it/s] 89it [00:19, 4.60it/s] 90it [00:19, 4.61it/s] 91it [00:19, 4.63it/s] 92it [00:20, 4.63it/s] 93it [00:20, 4.41it/s] 94it [00:20, 4.49it/s] 95it [00:20, 4.54it/s] 96it [00:21, 4.57it/s] 97it [00:21, 4.61it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.63it/s] 100it [00:21, 4.63it/s]2025-05-25 23:50:50,143 - INFO - [Epoch 076 | Batch 0100] IWAE-loss 1797.6439 | mean log_px -0.0222 | KL -1009.94 + 101it [00:22, 4.40it/s] 102it [00:22, 4.33it/s] 103it [00:22, 4.33it/s] 104it [00:22, 4.39it/s] 105it [00:23, 4.30it/s] 106it [00:23, 4.34it/s] 107it [00:23, 4.43it/s] 108it [00:23, 4.49it/s] 109it [00:23, 4.55it/s] 110it [00:24, 4.42it/s] 111it [00:24, 4.50it/s] 112it [00:24, 4.53it/s] 113it [00:24, 4.56it/s] 114it [00:25, 4.59it/s] 115it [00:25, 4.60it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.62it/s] 118it [00:25, 4.62it/s] 119it [00:26, 4.64it/s] 120it [00:26, 4.48it/s] 121it [00:26, 4.55it/s] 122it [00:26, 4.57it/s] 123it [00:27, 4.60it/s] 124it [00:27, 4.61it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.62it/s] 127it [00:27, 4.63it/s] 128it [00:28, 4.62it/s] 129it [00:28, 4.48it/s] 130it [00:28, 4.53it/s] 131it [00:28, 4.57it/s] 132it [00:28, 4.59it/s] 133it [00:29, 4.46it/s] 134it [00:29, 4.52it/s] 135it [00:29, 4.55it/s] 136it [00:29, 4.58it/s] 137it [00:30, 4.61it/s] 138it [00:30, 4.47it/s] 139it [00:30, 4.54it/s] 140it [00:30, 4.57it/s] 141it [00:30, 4.59it/s] 142it [00:31, 4.61it/s] 143it [00:31, 4.62it/s] 144it [00:31, 4.57it/s] 145it [00:31, 4.52it/s] 146it [00:32, 4.57it/s] 147it [00:32, 4.59it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.61it/s] 150it [00:32, 4.63it/s]2025-05-25 23:51:01,157 - INFO - [Epoch 076 | Batch 0150] IWAE-loss 1153.4496 | mean log_px -0.0023 | KL -1007.40 + 151it [00:33, 4.64it/s] 152it [00:33, 4.48it/s] 153it [00:33, 4.55it/s] 154it [00:33, 4.57it/s] 155it [00:34, 4.62it/s] 156it [00:34, 4.63it/s] 157it [00:34, 4.49it/s] 158it [00:34, 4.55it/s] 159it [00:34, 4.59it/s] 160it [00:35, 4.59it/s] 161it [00:35, 4.61it/s] 162it [00:35, 4.62it/s] 163it [00:35, 4.64it/s] 164it [00:35, 4.64it/s] 165it [00:36, 4.65it/s] 166it [00:36, 4.65it/s] 167it [00:36, 4.65it/s] 168it [00:36, 4.65it/s] 169it [00:37, 4.49it/s] 170it [00:37, 4.46it/s] 171it [00:37, 4.54it/s] 172it [00:37, 4.58it/s] 173it [00:37, 4.62it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.64it/s] 176it [00:38, 4.65it/s] 177it [00:38, 4.66it/s] 178it [00:39, 4.66it/s] 179it [00:39, 4.68it/s] 180it [00:39, 4.66it/s] 181it [00:39, 4.65it/s] 182it [00:39, 4.65it/s] 183it [00:40, 4.51it/s] 184it [00:40, 4.55it/s] 185it [00:40, 4.59it/s] 186it [00:40, 4.60it/s] 187it [00:40, 4.63it/s] 188it [00:41, 4.63it/s] 189it [00:41, 4.64it/s] 190it [00:41, 4.63it/s] 191it [00:41, 4.64it/s] 192it [00:42, 4.50it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.46it/s] 196it [00:42, 4.54it/s] 196it [00:43, 4.56it/s] +2025-05-25 23:51:11,087 - INFO - Epoch: 76, Objective: tensor([1119.1392], device='cuda:0', grad_fn=), Loss: 0.006396050099283457, KL/n: 20.540983200073242 + 0it [00:00, ?it/s]2025-05-25 23:51:11,676 - INFO - [Epoch 077 | Batch 0000] IWAE-loss 1210.2894 | mean log_px -0.0075 | KL -1004.59 + 1it [00:00, 2.98it/s] 2it [00:00, 3.71it/s] 3it [00:00, 4.09it/s] 4it [00:00, 4.28it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.52it/s] 8it [00:01, 4.40it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.56it/s] 12it [00:02, 4.44it/s] 13it [00:02, 4.50it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.56it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.62it/s] 18it [00:04, 4.62it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.50it/s] 22it [00:04, 4.55it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.59it/s] 25it [00:05, 4.61it/s] 26it [00:05, 4.61it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.62it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.49it/s] 31it [00:06, 4.55it/s] 32it [00:07, 4.56it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.60it/s] 35it [00:07, 4.62it/s] 36it [00:07, 4.61it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.63it/s] 40it [00:08, 4.64it/s] 41it [00:09, 4.64it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.63it/s] 44it [00:09, 4.61it/s] 45it [00:09, 4.62it/s] 46it [00:10, 4.52it/s] 47it [00:10, 4.49it/s] 48it [00:10, 4.54it/s] 49it [00:10, 4.58it/s] 50it [00:11, 4.60it/s]2025-05-25 23:51:22,585 - INFO - [Epoch 077 | Batch 0050] IWAE-loss 1236.3286 | mean log_px -0.0053 | KL -1002.10 + 51it [00:11, 4.63it/s] 52it [00:11, 4.48it/s] 53it [00:11, 4.54it/s] 54it [00:11, 4.57it/s] 55it [00:12, 4.60it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.63it/s] 58it [00:12, 4.64it/s] 59it [00:12, 4.64it/s] 60it [00:13, 4.45it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.56it/s] 63it [00:13, 4.58it/s] 64it [00:14, 4.60it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.60it/s] 67it [00:14, 4.59it/s] 68it [00:14, 4.60it/s] 69it [00:15, 4.63it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.64it/s] 72it [00:15, 4.63it/s] 73it [00:16, 4.63it/s] 74it [00:16, 4.63it/s] 75it [00:16, 4.63it/s] 76it [00:16, 4.50it/s] 77it [00:16, 4.56it/s] 78it [00:17, 4.58it/s] 79it [00:17, 4.59it/s] 80it [00:17, 4.62it/s] 81it [00:17, 4.63it/s] 82it [00:17, 4.63it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.64it/s] 86it [00:18, 4.63it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.64it/s] 91it [00:19, 4.64it/s] 92it [00:20, 4.65it/s] 93it [00:20, 4.65it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.64it/s] 96it [00:21, 4.42it/s] 97it [00:21, 4.41it/s] 98it [00:21, 4.43it/s] 99it [00:21, 4.45it/s] 100it [00:21, 4.48it/s]2025-05-25 23:51:33,502 - INFO - [Epoch 077 | Batch 0100] IWAE-loss 1310.2383 | mean log_px -0.0126 | KL -997.80 + 101it [00:22, 4.48it/s] 102it [00:22, 4.50it/s] 103it [00:22, 4.53it/s] 104it [00:22, 4.56it/s] 105it [00:23, 4.58it/s] 106it [00:23, 4.59it/s] 107it [00:23, 4.60it/s] 108it [00:23, 4.60it/s] 109it [00:23, 4.62it/s] 110it [00:24, 4.61it/s] 111it [00:24, 4.62it/s] 112it [00:24, 4.62it/s] 113it [00:24, 4.63it/s] 114it [00:24, 4.62it/s] 115it [00:25, 4.51it/s] 116it [00:25, 4.56it/s] 117it [00:25, 4.58it/s] 118it [00:25, 4.60it/s] 119it [00:26, 4.61it/s] 120it [00:26, 4.61it/s] 121it [00:26, 4.59it/s] 122it [00:26, 4.41it/s] 123it [00:26, 4.46it/s] 124it [00:27, 4.48it/s] 125it [00:27, 4.50it/s] 126it [00:27, 4.53it/s] 127it [00:27, 4.57it/s] 128it [00:28, 4.61it/s] 129it [00:28, 4.65it/s] 130it [00:28, 4.67it/s] 131it [00:28, 4.69it/s] 132it [00:28, 4.70it/s] 133it [00:29, 4.71it/s] 134it [00:29, 4.71it/s] 135it [00:29, 4.72it/s] 136it [00:29, 4.72it/s] 137it [00:29, 4.72it/s] 138it [00:30, 4.65it/s] 139it [00:30, 4.69it/s] 140it [00:30, 4.69it/s] 141it [00:30, 4.71it/s] 142it [00:31, 4.71it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.61it/s] 145it [00:31, 4.64it/s] 146it [00:31, 4.68it/s] 147it [00:32, 4.69it/s] 148it [00:32, 4.70it/s] 149it [00:32, 4.71it/s] 150it [00:32, 4.72it/s]2025-05-25 23:51:44,301 - INFO - [Epoch 077 | Batch 0150] IWAE-loss 1114.1711 | mean log_px -0.0020 | KL -998.09 + 151it [00:32, 4.72it/s] 152it [00:33, 4.72it/s] 153it [00:33, 4.56it/s] 154it [00:33, 4.62it/s] 155it [00:33, 4.66it/s] 156it [00:34, 4.68it/s] 157it [00:34, 4.70it/s] 158it [00:34, 4.68it/s] 159it [00:34, 4.70it/s] 160it [00:34, 4.70it/s] 161it [00:35, 4.71it/s] 162it [00:35, 4.71it/s] 163it [00:35, 4.72it/s] 164it [00:35, 4.72it/s] 165it [00:35, 4.71it/s] 166it [00:36, 4.71it/s] 167it [00:36, 4.72it/s] 168it [00:36, 4.71it/s] 169it [00:36, 4.72it/s] 170it [00:37, 4.72it/s] 171it [00:37, 4.74it/s] 172it [00:37, 4.72it/s] 173it [00:37, 4.73it/s] 174it [00:37, 4.73it/s] 175it [00:38, 4.73it/s] 176it [00:38, 4.52it/s] 177it [00:38, 4.60it/s] 178it [00:38, 4.63it/s] 179it [00:38, 4.67it/s] 180it [00:39, 4.68it/s] 181it [00:39, 4.70it/s] 182it [00:39, 4.71it/s] 183it [00:39, 4.72it/s] 184it [00:39, 4.72it/s] 185it [00:40, 4.73it/s] 186it [00:40, 4.73it/s] 187it [00:40, 4.73it/s] 188it [00:40, 4.73it/s] 189it [00:41, 4.73it/s] 190it [00:41, 4.73it/s] 191it [00:41, 4.51it/s] 192it [00:41, 4.53it/s] 193it [00:41, 4.60it/s] 194it [00:42, 4.64it/s] 195it [00:42, 4.52it/s] 196it [00:42, 4.58it/s] 196it [00:42, 4.59it/s] +2025-05-25 23:51:54,069 - INFO - Epoch: 77, Objective: tensor([1058.8920], device='cuda:0', grad_fn=), Loss: 0.0013972671004012227, KL/n: 20.369314193725586 + 0it [00:00, ?it/s]2025-05-25 23:51:54,471 - INFO - [Epoch 078 | Batch 0000] IWAE-loss 1110.0542 | mean log_px -0.0045 | KL -998.70 + 1it [00:00, 2.83it/s] 2it [00:00, 3.58it/s] 3it [00:00, 4.00it/s] 4it [00:01, 4.21it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.49it/s] 8it [00:01, 4.40it/s] 9it [00:02, 4.46it/s] 10it [00:02, 3.54it/s] 11it [00:02, 3.81it/s] 12it [00:02, 3.98it/s] 13it [00:03, 4.17it/s] 14it [00:03, 4.23it/s] 15it [00:03, 4.36it/s] 16it [00:03, 4.41it/s] 17it [00:04, 4.47it/s] 18it [00:04, 4.48it/s] 19it [00:04, 4.54it/s] 20it [00:04, 4.53it/s] 21it [00:04, 4.58it/s] 22it [00:05, 4.54it/s] 23it [00:05, 4.45it/s] 24it [00:05, 4.50it/s] 25it [00:05, 4.57it/s] 26it [00:06, 4.57it/s] 27it [00:06, 4.63it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.60it/s] 31it [00:07, 4.43it/s] 32it [00:07, 4.48it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.58it/s] 35it [00:08, 4.63it/s] 36it [00:08, 4.65it/s] 37it [00:08, 4.67it/s] 38it [00:08, 4.67it/s] 39it [00:08, 4.66it/s] 40it [00:09, 4.64it/s] 41it [00:09, 4.66it/s] 42it [00:09, 4.51it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.61it/s] 45it [00:10, 4.64it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.58it/s] 49it [00:11, 4.63it/s] 50it [00:11, 4.63it/s]2025-05-25 23:52:05,622 - INFO - [Epoch 078 | Batch 0050] IWAE-loss 1141.6960 | mean log_px -0.0026 | KL -994.03 + 51it [00:11, 4.62it/s] 52it [00:11, 4.57it/s] 53it [00:11, 4.61it/s] 54it [00:12, 4.64it/s] 55it [00:12, 4.67it/s] 56it [00:12, 4.59it/s] 57it [00:12, 4.59it/s] 58it [00:13, 4.54it/s] 59it [00:13, 4.54it/s] 60it [00:13, 4.50it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.50it/s] 63it [00:14, 4.51it/s] 64it [00:14, 4.51it/s] 65it [00:14, 4.56it/s] 66it [00:14, 4.53it/s] 67it [00:14, 4.58it/s] 68it [00:15, 4.54it/s] 69it [00:15, 4.54it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.59it/s] 72it [00:16, 4.61it/s] 73it [00:16, 4.65it/s] 74it [00:16, 4.67it/s] 75it [00:16, 4.67it/s] 76it [00:16, 4.59it/s] 77it [00:17, 4.55it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.53it/s] 80it [00:17, 4.53it/s] 81it [00:18, 4.56it/s] 82it [00:18, 4.54it/s] 83it [00:18, 4.52it/s] 84it [00:18, 4.52it/s] 85it [00:18, 4.52it/s] 86it [00:19, 4.58it/s] 87it [00:19, 4.60it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.59it/s] 90it [00:20, 4.62it/s] 91it [00:20, 4.57it/s] 92it [00:20, 4.52it/s] 93it [00:20, 4.52it/s] 94it [00:20, 4.50it/s] 95it [00:21, 4.52it/s] 96it [00:21, 4.49it/s] 97it [00:21, 4.51it/s] 98it [00:21, 4.51it/s] 99it [00:22, 4.50it/s] 100it [00:22, 4.55it/s]2025-05-25 23:52:16,603 - INFO - [Epoch 078 | Batch 0100] IWAE-loss 1110.1791 | mean log_px -0.0030 | KL -994.81 + 101it [00:22, 4.38it/s] 102it [00:22, 4.46it/s] 103it [00:22, 4.52it/s] 104it [00:23, 4.50it/s] 105it [00:23, 4.50it/s] 106it [00:23, 4.49it/s] 107it [00:23, 4.48it/s] 108it [00:24, 4.52it/s] 109it [00:24, 4.55it/s] 110it [00:24, 4.36it/s] 111it [00:24, 4.48it/s] 112it [00:24, 4.46it/s] 113it [00:25, 4.49it/s] 114it [00:25, 4.50it/s] 115it [00:25, 4.54it/s] 116it [00:25, 4.39it/s] 117it [00:26, 4.51it/s] 118it [00:26, 4.57it/s] 119it [00:26, 4.60it/s] 120it [00:26, 4.57it/s] 121it [00:26, 4.56it/s] 122it [00:27, 4.52it/s] 123it [00:27, 4.58it/s] 124it [00:27, 4.55it/s] 125it [00:27, 4.57it/s] 126it [00:28, 4.52it/s] 127it [00:28, 4.52it/s] 128it [00:28, 4.50it/s] 129it [00:28, 4.47it/s] 130it [00:28, 4.49it/s] 131it [00:29, 4.52it/s] 132it [00:29, 4.56it/s] 133it [00:29, 4.54it/s] 134it [00:29, 4.53it/s] 135it [00:30, 4.41it/s] 136it [00:30, 4.36it/s] 137it [00:30, 4.45it/s] 138it [00:30, 4.44it/s] 139it [00:30, 4.47it/s] 140it [00:31, 4.46it/s] 141it [00:31, 4.46it/s] 142it [00:31, 4.45it/s] 143it [00:31, 4.49it/s] 144it [00:32, 4.48it/s] 145it [00:32, 4.46it/s] 146it [00:32, 4.45it/s] 147it [00:32, 4.45it/s] 148it [00:32, 4.44it/s] 149it [00:33, 4.44it/s] 150it [00:33, 4.45it/s]2025-05-25 23:52:27,758 - INFO - [Epoch 078 | Batch 0150] IWAE-loss 1227.6323 | mean log_px -0.0173 | KL -994.20 + 151it [00:33, 4.43it/s] 152it [00:33, 4.51it/s] 153it [00:34, 4.50it/s] 154it [00:34, 4.48it/s] 155it [00:34, 4.51it/s] 156it [00:34, 4.49it/s] 157it [00:34, 4.36it/s] 158it [00:35, 4.45it/s] 159it [00:35, 4.46it/s] 160it [00:35, 4.46it/s] 161it [00:35, 4.48it/s] 162it [00:36, 4.50it/s] 163it [00:36, 4.53it/s] 164it [00:36, 4.51it/s] 165it [00:36, 4.50it/s] 166it [00:36, 4.51it/s] 167it [00:37, 4.39it/s] 168it [00:37, 4.42it/s] 169it [00:37, 4.47it/s] 170it [00:37, 4.50it/s] 171it [00:38, 4.55it/s] 172it [00:38, 4.57it/s] 173it [00:38, 4.55it/s] 174it [00:38, 4.53it/s] 175it [00:38, 4.50it/s] 176it [00:39, 4.51it/s] 177it [00:39, 4.55it/s] 178it [00:39, 4.59it/s] 179it [00:39, 4.58it/s] 180it [00:40, 4.58it/s] 181it [00:40, 4.54it/s] 182it [00:40, 4.36it/s] 183it [00:40, 4.43it/s] 184it [00:40, 4.49it/s] 185it [00:41, 4.49it/s] 186it [00:41, 4.52it/s] 187it [00:41, 4.58it/s] 188it [00:41, 4.53it/s] 189it [00:42, 4.55it/s] 190it [00:42, 4.55it/s] 191it [00:42, 4.57it/s] 192it [00:42, 4.56it/s] 193it [00:42, 4.57it/s] 194it [00:43, 4.57it/s] 195it [00:43, 4.48it/s] 196it [00:43, 4.49it/s] 196it [00:43, 4.49it/s] +2025-05-25 23:52:37,874 - INFO - Epoch: 78, Objective: tensor([2114.0513], device='cuda:0', grad_fn=), Loss: 0.018417079001665115, KL/n: 20.35153579711914 + 0it [00:00, ?it/s]2025-05-25 23:52:38,271 - INFO - [Epoch 079 | Batch 0000] IWAE-loss 1181.8622 | mean log_px -0.0096 | KL -996.42 + 1it [00:00, 2.86it/s] 2it [00:00, 3.64it/s] 3it [00:00, 4.01it/s] 4it [00:01, 4.14it/s] 5it [00:01, 4.20it/s] 6it [00:01, 4.29it/s] 7it [00:01, 4.21it/s] 8it [00:01, 4.34it/s] 9it [00:02, 4.41it/s] 10it [00:02, 4.47it/s] 11it [00:02, 4.49it/s] 12it [00:02, 4.52it/s] 13it [00:03, 4.48it/s] 14it [00:03, 4.48it/s] 15it [00:03, 4.44it/s] 16it [00:03, 4.45it/s] 17it [00:03, 4.47it/s] 18it [00:04, 4.48it/s] 19it [00:04, 4.48it/s] 20it [00:04, 4.30it/s] 21it [00:04, 4.38it/s] 22it [00:05, 4.43it/s] 23it [00:05, 4.38it/s] 24it [00:05, 4.43it/s] 25it [00:05, 4.41it/s] 26it [00:05, 4.45it/s] 27it [00:06, 4.44it/s] 28it [00:06, 4.42it/s] 29it [00:06, 4.31it/s] 30it [00:06, 4.39it/s] 31it [00:07, 4.39it/s] 32it [00:07, 4.39it/s] 33it [00:07, 4.42it/s] 34it [00:07, 4.46it/s] 35it [00:08, 4.46it/s] 36it [00:08, 4.48it/s] 37it [00:08, 4.38it/s] 38it [00:08, 4.46it/s] 39it [00:08, 4.41it/s] 40it [00:09, 4.48it/s] 41it [00:09, 4.43it/s] 42it [00:09, 4.45it/s] 43it [00:09, 4.47it/s] 44it [00:10, 4.48it/s] 45it [00:10, 4.32it/s] 46it [00:10, 4.39it/s] 47it [00:10, 4.36it/s] 48it [00:10, 4.38it/s] 49it [00:11, 4.34it/s] 50it [00:11, 4.36it/s]2025-05-25 23:52:49,616 - INFO - [Epoch 079 | Batch 0050] IWAE-loss 1083.8743 | mean log_px -0.0050 | KL -990.57 + 51it [00:11, 4.33it/s] 52it [00:11, 4.40it/s] 53it [00:12, 4.35it/s] 54it [00:12, 4.41it/s] 55it [00:12, 4.43it/s] 56it [00:12, 4.42it/s] 57it [00:13, 4.44it/s] 58it [00:13, 4.47it/s] 59it [00:13, 4.52it/s] 60it [00:13, 4.53it/s] 61it [00:13, 4.57it/s] 62it [00:14, 4.54it/s] 63it [00:14, 4.47it/s] 64it [00:14, 4.49it/s] 65it [00:14, 4.49it/s] 66it [00:15, 4.47it/s] 67it [00:15, 4.47it/s] 68it [00:15, 4.46it/s] 69it [00:15, 4.28it/s] 70it [00:15, 4.26it/s] 71it [00:16, 4.25it/s] 72it [00:16, 4.32it/s] 73it [00:16, 4.35it/s] 74it [00:16, 4.40it/s] 75it [00:17, 4.38it/s] 76it [00:17, 4.47it/s] 77it [00:17, 4.37it/s] 78it [00:17, 4.33it/s] 79it [00:18, 4.34it/s] 80it [00:18, 4.44it/s] 81it [00:18, 4.38it/s] 82it [00:18, 4.27it/s] 83it [00:18, 4.31it/s] 84it [00:19, 4.36it/s] 85it [00:19, 4.35it/s] 86it [00:19, 4.38it/s] 87it [00:19, 4.36it/s] 88it [00:20, 4.41it/s] 89it [00:20, 4.29it/s] 90it [00:20, 4.37it/s] 91it [00:20, 4.37it/s] 92it [00:20, 4.40it/s] 93it [00:21, 4.40it/s] 94it [00:21, 4.44it/s] 95it [00:21, 4.43it/s] 96it [00:21, 4.32it/s] 97it [00:22, 4.40it/s] 98it [00:22, 4.39it/s] 99it [00:22, 4.41it/s] 100it [00:22, 4.47it/s]2025-05-25 23:53:00,959 - INFO - [Epoch 079 | Batch 0100] IWAE-loss 1205.5616 | mean log_px -0.0082 | KL -991.58 + 101it [00:23, 4.47it/s] 102it [00:23, 4.42it/s] 103it [00:23, 4.40it/s] 104it [00:23, 4.29it/s] 105it [00:23, 4.32it/s] 106it [00:24, 4.36it/s] 107it [00:24, 4.38it/s] 108it [00:24, 4.41it/s] 109it [00:24, 4.43it/s] 110it [00:25, 4.47it/s] 111it [00:25, 4.33it/s] 112it [00:25, 4.41it/s] 113it [00:25, 4.45it/s] 114it [00:25, 4.50it/s] 115it [00:26, 4.46it/s] 116it [00:26, 4.53it/s] 117it [00:26, 4.36it/s] 118it [00:26, 4.38it/s] 119it [00:27, 4.38it/s] 120it [00:27, 4.41it/s] 121it [00:27, 4.45it/s] 122it [00:27, 4.44it/s] 123it [00:28, 4.29it/s] 124it [00:28, 4.37it/s] 125it [00:28, 4.43it/s] 126it [00:28, 4.38it/s] 127it [00:28, 4.47it/s] 128it [00:29, 4.49it/s] 129it [00:29, 4.45it/s] 130it [00:29, 4.50it/s] 131it [00:29, 4.47it/s] 132it [00:30, 4.49it/s] 133it [00:30, 4.46it/s] 134it [00:30, 4.48it/s] 135it [00:30, 4.40it/s] 136it [00:30, 4.46it/s] 137it [00:31, 4.40it/s] 138it [00:31, 4.40it/s] 139it [00:31, 4.35it/s] 140it [00:31, 4.39it/s] 141it [00:32, 4.38it/s] 142it [00:32, 4.43it/s] 143it [00:32, 4.36it/s] 144it [00:32, 4.41it/s] 145it [00:32, 4.44it/s] 146it [00:33, 4.49it/s] 147it [00:33, 4.47it/s] 148it [00:33, 4.45it/s] 149it [00:33, 4.43it/s] 150it [00:34, 4.42it/s]2025-05-25 23:53:12,280 - INFO - [Epoch 079 | Batch 0150] IWAE-loss 1199.3240 | mean log_px -0.0036 | KL -990.65 + 151it [00:34, 4.43it/s] 152it [00:34, 4.44it/s] 153it [00:34, 4.48it/s] 154it [00:35, 4.40it/s] 155it [00:35, 4.45it/s] 156it [00:35, 4.49it/s] 157it [00:35, 4.53it/s] 158it [00:35, 4.56it/s] 159it [00:36, 4.58it/s] 160it [00:36, 4.58it/s] 161it [00:36, 4.59it/s] 162it [00:36, 4.58it/s] 163it [00:36, 4.56it/s] 164it [00:37, 4.51it/s] 165it [00:37, 4.54it/s] 166it [00:37, 4.56it/s] 167it [00:37, 4.57it/s] 168it [00:38, 4.56it/s] 169it [00:38, 4.54it/s] 170it [00:38, 4.53it/s] 171it [00:38, 4.49it/s] 172it [00:38, 4.48it/s] 173it [00:39, 4.52it/s] 174it [00:39, 4.44it/s] 175it [00:39, 4.49it/s] 176it [00:39, 4.49it/s] 177it [00:40, 4.52it/s] 178it [00:40, 4.42it/s] 179it [00:40, 4.48it/s] 180it [00:40, 4.48it/s] 181it [00:40, 4.44it/s] 182it [00:41, 4.47it/s] 183it [00:41, 4.52it/s] 184it [00:41, 4.48it/s] 185it [00:41, 4.53it/s] 186it [00:42, 4.43it/s] 187it [00:42, 4.45it/s] 188it [00:42, 4.44it/s] 189it [00:42, 4.49it/s] 190it [00:42, 4.42it/s] 191it [00:43, 4.35it/s] 192it [00:43, 4.34it/s] 193it [00:43, 4.43it/s] 194it [00:43, 4.39it/s] 195it [00:44, 4.34it/s] 196it [00:44, 4.39it/s] 196it [00:44, 4.41it/s] +2025-05-25 23:53:22,450 - INFO - Epoch: 79, Objective: tensor([1057.2749], device='cuda:0', grad_fn=), Loss: 0.0020423263777047396, KL/n: 20.246395111083984 + 0it [00:00, ?it/s]2025-05-25 23:53:23,035 - INFO - [Epoch 080 | Batch 0000] IWAE-loss 1272.5481 | mean log_px -0.0040 | KL -991.26 + 1it [00:00, 2.94it/s] 2it [00:00, 3.69it/s] 3it [00:00, 4.08it/s] 4it [00:01, 4.17it/s] 5it [00:01, 4.28it/s] 6it [00:01, 4.33it/s] 7it [00:01, 4.35it/s] 8it [00:01, 4.35it/s] 9it [00:02, 4.35it/s] 10it [00:02, 4.38it/s] 11it [00:02, 4.38it/s] 12it [00:02, 4.45it/s] 13it [00:03, 4.41it/s] 14it [00:03, 4.45it/s] 15it [00:03, 4.51it/s] 16it [00:03, 4.55it/s] 17it [00:03, 4.49it/s] 18it [00:04, 4.47it/s] 19it [00:04, 4.29it/s] 20it [00:04, 4.32it/s] 21it [00:04, 4.36it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.38it/s] 24it [00:05, 4.35it/s] 25it [00:05, 4.38it/s] 26it [00:05, 4.39it/s] 27it [00:06, 4.44it/s] 28it [00:06, 4.36it/s] 29it [00:06, 4.37it/s] 30it [00:06, 4.38it/s] 31it [00:07, 4.37it/s] 32it [00:07, 4.40it/s] 33it [00:07, 4.45it/s] 34it [00:07, 4.43it/s] 35it [00:08, 4.42it/s] 36it [00:08, 4.49it/s] 37it [00:08, 4.53it/s] 38it [00:08, 4.49it/s] 39it [00:08, 4.48it/s] 40it [00:09, 4.47it/s] 41it [00:09, 4.47it/s] 42it [00:09, 4.50it/s] 43it [00:09, 4.52it/s] 44it [00:10, 4.49it/s] 45it [00:10, 4.47it/s] 46it [00:10, 4.48it/s] 47it [00:10, 4.48it/s] 48it [00:10, 4.52it/s] 49it [00:11, 4.48it/s] 50it [00:11, 4.51it/s]2025-05-25 23:53:34,280 - INFO - [Epoch 080 | Batch 0050] IWAE-loss 1194.4015 | mean log_px -0.0039 | KL -991.29 + 51it [00:11, 4.52it/s] 52it [00:11, 4.50it/s] 53it [00:12, 4.52it/s] 54it [00:12, 4.53it/s] 55it [00:12, 4.47it/s] 56it [00:12, 4.47it/s] 57it [00:12, 4.48it/s] 58it [00:13, 4.50it/s] 59it [00:13, 4.48it/s] 60it [00:13, 4.45it/s] 61it [00:13, 4.45it/s] 62it [00:14, 4.46it/s] 63it [00:14, 4.50it/s] 64it [00:14, 4.47it/s] 65it [00:14, 4.44it/s] 66it [00:14, 4.46it/s] 67it [00:15, 4.32it/s] 68it [00:15, 4.36it/s] 69it [00:15, 4.42it/s] 70it [00:15, 4.43it/s] 71it [00:16, 4.45it/s] 72it [00:16, 4.50it/s] 73it [00:16, 4.52it/s] 74it [00:16, 4.53it/s] 75it [00:16, 4.48it/s] 76it [00:17, 4.47it/s] 77it [00:17, 4.48it/s] 78it [00:17, 4.51it/s] 79it [00:17, 4.50it/s] 80it [00:18, 4.50it/s] 81it [00:18, 4.46it/s] 82it [00:18, 4.45it/s] 83it [00:18, 4.44it/s] 84it [00:18, 4.44it/s] 85it [00:19, 4.29it/s] 86it [00:19, 4.34it/s] 87it [00:19, 4.40it/s] 88it [00:19, 4.41it/s] 89it [00:20, 4.42it/s] 90it [00:20, 4.41it/s] 91it [00:20, 4.39it/s] 92it [00:20, 4.41it/s] 93it [00:21, 4.45it/s] 94it [00:21, 4.43it/s] 95it [00:21, 4.45it/s] 96it [00:21, 4.49it/s] 97it [00:21, 4.50it/s] 98it [00:22, 4.40it/s] 99it [00:22, 4.51it/s] 100it [00:22, 4.56it/s]2025-05-25 23:53:45,508 - INFO - [Epoch 080 | Batch 0100] IWAE-loss 1640.9240 | mean log_px -0.0125 | KL -990.32 + 101it [00:22, 4.51it/s] 102it [00:23, 4.55it/s] 103it [00:23, 4.48it/s] 104it [00:23, 4.49it/s] 105it [00:23, 4.49it/s] 106it [00:23, 4.41it/s] 107it [00:24, 4.42it/s] 108it [00:24, 4.41it/s] 109it [00:24, 4.42it/s] 110it [00:24, 4.45it/s] 111it [00:25, 4.48it/s] 112it [00:25, 4.51it/s] 113it [00:25, 4.52it/s] 114it [00:25, 4.53it/s] 115it [00:25, 4.55it/s] 116it [00:26, 4.53it/s] 117it [00:26, 4.47it/s] 118it [00:26, 4.53it/s] 119it [00:26, 4.37it/s] 120it [00:27, 4.39it/s] 121it [00:27, 4.45it/s] 122it [00:27, 4.50it/s] 123it [00:27, 4.49it/s] 124it [00:27, 4.47it/s] 125it [00:28, 4.43it/s] 126it [00:28, 4.44it/s] 127it [00:28, 4.40it/s] 128it [00:28, 4.42it/s] 129it [00:29, 4.40it/s] 130it [00:29, 4.41it/s] 131it [00:29, 4.48it/s] 132it [00:29, 4.51it/s] 133it [00:29, 4.48it/s] 134it [00:30, 4.50it/s] 135it [00:30, 4.53it/s] 136it [00:30, 4.51it/s] 137it [00:30, 4.50it/s] 138it [00:31, 4.48it/s] 139it [00:31, 4.49it/s] 140it [00:31, 4.51it/s] 141it [00:31, 4.48it/s] 142it [00:31, 4.45it/s] 143it [00:32, 4.42it/s] 144it [00:32, 4.41it/s] 145it [00:32, 4.47it/s] 146it [00:32, 4.47it/s] 147it [00:33, 4.51it/s] 148it [00:33, 4.50it/s] 149it [00:33, 4.52it/s] 150it [00:33, 4.49it/s]2025-05-25 23:53:56,689 - INFO - [Epoch 080 | Batch 0150] IWAE-loss 1795.7816 | mean log_px -0.0194 | KL -987.38 + 151it [00:34, 4.36it/s] 152it [00:34, 4.43it/s] 153it [00:34, 4.48it/s] 154it [00:34, 4.48it/s] 155it [00:34, 4.31it/s] 156it [00:35, 4.36it/s] 157it [00:35, 4.42it/s] 158it [00:35, 4.40it/s] 159it [00:35, 4.31it/s] 160it [00:36, 4.37it/s] 161it [00:36, 4.44it/s] 162it [00:36, 4.44it/s] 163it [00:36, 4.47it/s] 164it [00:36, 4.49it/s] 165it [00:37, 4.43it/s] 166it [00:37, 4.31it/s] 167it [00:37, 4.36it/s] 168it [00:37, 4.41it/s] 169it [00:38, 4.45it/s] 170it [00:38, 4.43it/s] 171it [00:38, 4.39it/s] 172it [00:38, 4.40it/s] 173it [00:39, 4.36it/s] 174it [00:39, 4.39it/s] 175it [00:39, 4.42it/s] 176it [00:39, 4.45it/s] 177it [00:39, 4.34it/s] 178it [00:40, 4.34it/s] 179it [00:40, 4.38it/s] 180it [00:40, 4.44it/s] 181it [00:40, 4.46it/s] 182it [00:41, 4.52it/s] 183it [00:41, 4.49it/s] 184it [00:41, 4.49it/s] 185it [00:41, 4.52it/s] 186it [00:41, 4.57it/s] 187it [00:42, 4.36it/s] 188it [00:42, 4.44it/s] 189it [00:42, 4.46it/s] 190it [00:42, 4.47it/s] 191it [00:43, 4.46it/s] 192it [00:43, 4.46it/s] 193it [00:43, 4.49it/s] 194it [00:43, 4.38it/s] 195it [00:43, 4.35it/s] 196it [00:44, 4.45it/s] 196it [00:44, 4.43it/s] +2025-05-25 23:54:07,010 - INFO - Epoch: 80, Objective: tensor([1140.7397], device='cuda:0', grad_fn=), Loss: 0.0032359547913074493, KL/n: 20.226318359375 + 0it [00:00, ?it/s]2025-05-25 23:54:07,420 - INFO - [Epoch 081 | Batch 0000] IWAE-loss 1103.5593 | mean log_px -0.0022 | KL -990.32 + 1it [00:00, 2.97it/s] 2it [00:00, 3.73it/s] 3it [00:00, 4.12it/s] 4it [00:01, 4.19it/s] 5it [00:01, 4.38it/s] 6it [00:01, 3.45it/s] 7it [00:01, 3.78it/s] 8it [00:02, 4.02it/s] 9it [00:02, 4.22it/s] 10it [00:02, 4.34it/s] 11it [00:02, 4.45it/s] 12it [00:02, 4.37it/s] 13it [00:03, 4.48it/s] 14it [00:03, 4.55it/s] 15it [00:03, 4.59it/s] 16it [00:03, 4.62it/s] 17it [00:03, 4.65it/s] 18it [00:04, 4.49it/s] 19it [00:04, 4.55it/s] 20it [00:04, 4.57it/s] 21it [00:04, 4.58it/s] 22it [00:05, 4.46it/s] 23it [00:05, 4.52it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.57it/s] 26it [00:05, 4.59it/s] 27it [00:06, 4.61it/s] 28it [00:06, 4.62it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.63it/s] 31it [00:07, 4.62it/s] 32it [00:07, 4.63it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.63it/s] 35it [00:07, 4.50it/s] 36it [00:08, 4.54it/s] 37it [00:08, 4.57it/s] 38it [00:08, 4.60it/s] 39it [00:08, 4.62it/s] 40it [00:09, 4.62it/s] 41it [00:09, 4.63it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.62it/s] 44it [00:09, 4.49it/s] 45it [00:10, 4.55it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.59it/s] 49it [00:10, 4.61it/s] 50it [00:11, 4.61it/s]2025-05-25 23:54:18,495 - INFO - [Epoch 081 | Batch 0050] IWAE-loss 1255.6204 | mean log_px -0.0048 | KL -987.30 + 51it [00:11, 4.62it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.63it/s] 54it [00:12, 4.63it/s] 55it [00:12, 4.63it/s] 56it [00:12, 4.60it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.62it/s] 59it [00:13, 4.63it/s] 60it [00:13, 4.49it/s] 61it [00:13, 4.55it/s] 62it [00:13, 4.58it/s] 63it [00:14, 4.60it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.59it/s] 66it [00:14, 4.46it/s] 67it [00:14, 4.53it/s] 68it [00:15, 4.55it/s] 69it [00:15, 4.59it/s] 70it [00:15, 4.60it/s] 71it [00:15, 4.61it/s] 72it [00:16, 4.52it/s] 73it [00:16, 4.57it/s] 74it [00:16, 4.58it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.61it/s] 77it [00:17, 4.61it/s] 78it [00:17, 4.63it/s] 79it [00:17, 4.63it/s] 80it [00:17, 4.63it/s] 81it [00:17, 4.49it/s] 82it [00:18, 4.55it/s] 83it [00:18, 4.58it/s] 84it [00:18, 4.57it/s] 85it [00:18, 4.60it/s] 86it [00:19, 4.61it/s] 87it [00:19, 4.62it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.48it/s] 91it [00:20, 4.51it/s] 92it [00:20, 4.55it/s] 93it [00:20, 4.57it/s] 94it [00:20, 4.59it/s] 95it [00:21, 4.60it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.47it/s] 99it [00:21, 4.53it/s] 100it [00:22, 4.55it/s]2025-05-25 23:54:29,415 - INFO - [Epoch 081 | Batch 0100] IWAE-loss 1271.0948 | mean log_px -0.0054 | KL -990.43 + 101it [00:22, 4.58it/s] 102it [00:22, 4.55it/s] 103it [00:22, 4.50it/s] 104it [00:22, 4.53it/s] 105it [00:23, 4.54it/s] 106it [00:23, 4.42it/s] 107it [00:23, 4.48it/s] 108it [00:23, 4.51it/s] 109it [00:24, 4.54it/s] 110it [00:24, 4.57it/s] 111it [00:24, 4.58it/s] 112it [00:24, 4.58it/s] 113it [00:24, 4.59it/s] 114it [00:25, 4.61it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.63it/s] 117it [00:25, 4.50it/s] 118it [00:26, 4.55it/s] 119it [00:26, 4.57it/s] 120it [00:26, 4.58it/s] 121it [00:26, 4.60it/s] 122it [00:26, 4.62it/s] 123it [00:27, 4.62it/s] 124it [00:27, 4.61it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.61it/s] 127it [00:28, 4.52it/s] 128it [00:28, 4.57it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.59it/s] 131it [00:28, 4.61it/s] 132it [00:29, 4.61it/s] 133it [00:29, 4.63it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.61it/s] 136it [00:30, 4.46it/s] 137it [00:30, 4.53it/s] 138it [00:30, 4.55it/s] 139it [00:30, 4.58it/s] 140it [00:30, 4.59it/s] 141it [00:31, 4.61it/s] 142it [00:31, 4.52it/s] 143it [00:31, 4.57it/s] 144it [00:31, 4.58it/s] 145it [00:31, 4.61it/s] 146it [00:32, 4.60it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.63it/s] 149it [00:32, 4.64it/s] 150it [00:33, 4.64it/s]2025-05-25 23:54:40,335 - INFO - [Epoch 081 | Batch 0150] IWAE-loss 1643.7526 | mean log_px -0.0269 | KL -987.94 + 151it [00:33, 4.63it/s] 152it [00:33, 4.50it/s] 153it [00:33, 4.56it/s] 154it [00:33, 4.57it/s] 155it [00:34, 4.60it/s] 156it [00:34, 4.60it/s] 157it [00:34, 4.61it/s] 158it [00:34, 4.60it/s] 159it [00:34, 4.60it/s] 160it [00:35, 4.62it/s] 161it [00:35, 4.60it/s] 162it [00:35, 4.61it/s] 163it [00:35, 4.48it/s] 164it [00:36, 4.49it/s] 165it [00:36, 4.54it/s] 166it [00:36, 4.56it/s] 167it [00:36, 4.59it/s] 168it [00:36, 4.60it/s] 169it [00:37, 4.60it/s] 170it [00:37, 4.58it/s] 171it [00:37, 4.55it/s] 172it [00:37, 4.42it/s] 173it [00:38, 4.49it/s] 174it [00:38, 4.52it/s] 175it [00:38, 4.56it/s] 176it [00:38, 4.58it/s] 177it [00:38, 4.59it/s] 178it [00:39, 4.60it/s] 179it [00:39, 4.62it/s] 180it [00:39, 4.63it/s] 181it [00:39, 4.63it/s] 182it [00:40, 4.62it/s] 183it [00:40, 4.48it/s] 184it [00:40, 4.53it/s] 185it [00:40, 4.57it/s] 186it [00:40, 4.59it/s] 187it [00:41, 4.61it/s] 188it [00:41, 4.59it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.46it/s] 191it [00:42, 4.52it/s] 192it [00:42, 4.55it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.42it/s] 196it [00:43, 4.42it/s] 196it [00:43, 4.54it/s] +2025-05-25 23:54:50,363 - INFO - Epoch: 81, Objective: tensor([1722.9547], device='cuda:0', grad_fn=), Loss: 0.013793299905955791, KL/n: 20.196060180664062 + 0it [00:00, ?it/s]2025-05-25 23:54:50,784 - INFO - [Epoch 082 | Batch 0000] IWAE-loss 1131.7792 | mean log_px -0.0034 | KL -989.71 + 1it [00:00, 2.71it/s] 2it [00:00, 3.55it/s] 3it [00:00, 3.98it/s] 4it [00:01, 4.20it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.49it/s] 8it [00:01, 4.40it/s] 9it [00:02, 4.33it/s] 10it [00:02, 4.41it/s] 11it [00:02, 4.32it/s] 12it [00:02, 4.42it/s] 13it [00:03, 4.49it/s] 14it [00:03, 4.55it/s] 15it [00:03, 4.59it/s] 16it [00:03, 4.61it/s] 17it [00:03, 4.58it/s] 18it [00:04, 4.60it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.65it/s] 22it [00:04, 4.66it/s] 23it [00:05, 4.66it/s] 24it [00:05, 4.66it/s] 25it [00:05, 4.64it/s] 26it [00:05, 4.64it/s] 27it [00:06, 4.66it/s] 28it [00:06, 4.66it/s] 29it [00:06, 4.67it/s] 30it [00:06, 4.66it/s] 31it [00:06, 4.66it/s] 32it [00:07, 4.65it/s] 33it [00:07, 4.51it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.59it/s] 36it [00:07, 4.61it/s] 37it [00:08, 4.63it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.64it/s] 40it [00:08, 4.65it/s] 41it [00:09, 4.50it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.60it/s] 45it [00:09, 4.62it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.66it/s] 48it [00:10, 4.49it/s] 49it [00:10, 4.48it/s] 50it [00:11, 4.46it/s]2025-05-25 23:55:01,739 - INFO - [Epoch 082 | Batch 0050] IWAE-loss 1399.6855 | mean log_px -0.0098 | KL -989.36 + 51it [00:11, 4.46it/s] 52it [00:11, 4.53it/s] 53it [00:11, 4.57it/s] 54it [00:11, 4.53it/s] 55it [00:12, 4.55it/s] 56it [00:12, 4.55it/s] 57it [00:12, 4.45it/s] 58it [00:12, 4.53it/s] 59it [00:13, 4.58it/s] 60it [00:13, 4.60it/s] 61it [00:13, 4.63it/s] 62it [00:13, 4.64it/s] 63it [00:13, 4.50it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.59it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.63it/s] 68it [00:15, 4.61it/s] 69it [00:15, 4.62it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.65it/s] 72it [00:15, 4.65it/s] 73it [00:16, 4.67it/s] 74it [00:16, 4.66it/s] 75it [00:16, 4.52it/s] 76it [00:16, 4.56it/s] 77it [00:16, 4.60it/s] 78it [00:17, 4.61it/s] 79it [00:17, 4.63it/s] 80it [00:17, 4.65it/s] 81it [00:17, 4.66it/s] 82it [00:18, 4.66it/s] 83it [00:18, 4.66it/s] 84it [00:18, 4.65it/s] 85it [00:18, 4.67it/s] 86it [00:18, 4.65it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.61it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.65it/s] 91it [00:19, 4.66it/s] 92it [00:20, 4.64it/s] 93it [00:20, 4.66it/s] 94it [00:20, 4.51it/s] 95it [00:20, 4.54it/s] 96it [00:21, 4.57it/s] 97it [00:21, 4.61it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.64it/s] 100it [00:21, 4.64it/s]2025-05-25 23:55:12,577 - INFO - [Epoch 082 | Batch 0100] IWAE-loss 1105.8473 | mean log_px -0.0035 | KL -983.66 + 101it [00:22, 4.51it/s] 102it [00:22, 4.55it/s] 103it [00:22, 4.59it/s] 104it [00:22, 4.61it/s] 105it [00:23, 4.63it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.66it/s] 108it [00:23, 4.50it/s] 109it [00:23, 4.56it/s] 110it [00:24, 4.59it/s] 111it [00:24, 4.61it/s] 112it [00:24, 4.50it/s] 113it [00:24, 4.45it/s] 114it [00:25, 4.49it/s] 115it [00:25, 4.55it/s] 116it [00:25, 4.58it/s] 117it [00:25, 4.62it/s] 118it [00:25, 4.63it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.50it/s] 121it [00:26, 4.54it/s] 122it [00:26, 4.57it/s] 123it [00:26, 4.62it/s] 124it [00:27, 4.63it/s] 125it [00:27, 4.65it/s] 126it [00:27, 4.65it/s] 127it [00:27, 4.65it/s] 128it [00:28, 4.60it/s] 129it [00:28, 4.63it/s] 130it [00:28, 4.54it/s] 131it [00:28, 4.56it/s] 132it [00:28, 4.62it/s] 133it [00:29, 4.66it/s] 134it [00:29, 4.68it/s] 135it [00:29, 4.69it/s] 136it [00:29, 4.53it/s] 137it [00:29, 4.61it/s] 138it [00:30, 4.63it/s] 139it [00:30, 4.66it/s] 140it [00:30, 4.68it/s] 141it [00:30, 4.70it/s] 142it [00:31, 4.71it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.62it/s] 145it [00:31, 4.65it/s] 146it [00:31, 4.67it/s] 147it [00:32, 4.68it/s] 148it [00:32, 4.66it/s] 149it [00:32, 4.68it/s] 150it [00:32, 4.69it/s]2025-05-25 23:55:23,424 - INFO - [Epoch 082 | Batch 0150] IWAE-loss 1394.0895 | mean log_px -0.0172 | KL -984.26 + 151it [00:32, 4.70it/s] 152it [00:33, 4.71it/s] 153it [00:33, 4.72it/s] 154it [00:33, 4.72it/s] 155it [00:33, 4.56it/s] 156it [00:34, 4.63it/s] 157it [00:34, 4.67it/s] 158it [00:34, 4.67it/s] 159it [00:34, 4.69it/s] 160it [00:34, 4.71it/s] 161it [00:35, 4.72it/s] 162it [00:35, 4.72it/s] 163it [00:35, 4.73it/s] 164it [00:35, 4.72it/s] 165it [00:35, 4.73it/s] 166it [00:36, 4.56it/s] 167it [00:36, 4.62it/s] 168it [00:36, 4.66it/s] 169it [00:36, 4.69it/s] 170it [00:37, 4.69it/s] 171it [00:37, 4.57it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.67it/s] 174it [00:37, 4.68it/s] 175it [00:38, 4.70it/s] 176it [00:38, 4.54it/s] 177it [00:38, 4.62it/s] 178it [00:38, 4.64it/s] 179it [00:38, 4.67it/s] 180it [00:39, 4.69it/s] 181it [00:39, 4.71it/s] 182it [00:39, 4.71it/s] 183it [00:39, 4.72it/s] 184it [00:40, 4.73it/s] 185it [00:40, 4.56it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.67it/s] 188it [00:40, 4.69it/s] 189it [00:41, 4.69it/s] 190it [00:41, 4.70it/s] 191it [00:41, 4.70it/s] 192it [00:41, 4.71it/s] 193it [00:41, 4.52it/s] 194it [00:42, 4.45it/s] 195it [00:42, 4.21it/s] 196it [00:42, 4.20it/s] 196it [00:42, 4.58it/s] +2025-05-25 23:55:33,312 - INFO - Epoch: 82, Objective: tensor([1214.3734], device='cuda:0', grad_fn=), Loss: 0.005592620465904474, KL/n: 20.130046844482422 + 0it [00:00, ?it/s]2025-05-25 23:55:33,902 - INFO - [Epoch 083 | Batch 0000] IWAE-loss 1186.2911 | mean log_px -0.0061 | KL -989.00 + 1it [00:00, 2.92it/s] 2it [00:00, 3.71it/s] 3it [00:00, 3.89it/s] 4it [00:01, 4.15it/s] 5it [00:01, 4.28it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.51it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.58it/s] 14it [00:03, 4.56it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.58it/s] 18it [00:04, 4.58it/s] 19it [00:04, 4.53it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.54it/s] 22it [00:04, 4.54it/s] 23it [00:05, 4.55it/s] 24it [00:05, 4.56it/s] 25it [00:05, 4.56it/s] 26it [00:05, 4.54it/s] 27it [00:06, 4.57it/s] 28it [00:06, 4.54it/s] 29it [00:06, 4.56it/s] 30it [00:06, 4.52it/s] 31it [00:06, 4.53it/s] 32it [00:07, 4.56it/s] 33it [00:07, 4.44it/s] 34it [00:07, 4.51it/s] 35it [00:07, 4.54it/s] 36it [00:08, 4.57it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.60it/s] 39it [00:08, 4.61it/s] 40it [00:08, 4.47it/s] 41it [00:09, 4.53it/s] 42it [00:09, 4.56it/s] 43it [00:09, 4.59it/s] 44it [00:09, 4.60it/s] 45it [00:10, 4.61it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.40it/s] 48it [00:10, 4.33it/s] 49it [00:10, 4.43it/s] 50it [00:11, 4.49it/s]2025-05-25 23:55:44,928 - INFO - [Epoch 083 | Batch 0050] IWAE-loss 1646.4308 | mean log_px -0.0101 | KL -982.95 + 51it [00:11, 4.54it/s] 52it [00:11, 4.56it/s] 53it [00:11, 4.57it/s] 54it [00:12, 4.59it/s] 55it [00:12, 4.45it/s] 56it [00:12, 4.51it/s] 57it [00:12, 4.54it/s] 58it [00:12, 4.56it/s] 59it [00:13, 4.55it/s] 60it [00:13, 4.57it/s] 61it [00:13, 4.59it/s] 62it [00:13, 4.45it/s] 63it [00:14, 4.52it/s] 64it [00:14, 4.55it/s] 65it [00:14, 4.57it/s] 66it [00:14, 4.44it/s] 67it [00:14, 4.49it/s] 68it [00:15, 4.52it/s] 69it [00:15, 4.55it/s] 70it [00:15, 4.49it/s] 71it [00:15, 4.51it/s] 72it [00:15, 4.54it/s] 73it [00:16, 4.42it/s] 74it [00:16, 4.48it/s] 75it [00:16, 4.53it/s] 76it [00:16, 4.54it/s] 77it [00:17, 4.43it/s] 78it [00:17, 4.49it/s] 79it [00:17, 4.52it/s] 80it [00:17, 4.55it/s] 81it [00:17, 4.58it/s] 82it [00:18, 4.58it/s] 83it [00:18, 4.44it/s] 84it [00:18, 4.50it/s] 85it [00:18, 4.53it/s] 86it [00:19, 4.53it/s] 87it [00:19, 4.52it/s] 88it [00:19, 4.53it/s] 89it [00:19, 4.57it/s] 90it [00:19, 4.43it/s] 91it [00:20, 4.50it/s] 92it [00:20, 4.53it/s] 93it [00:20, 4.56it/s] 94it [00:20, 4.57it/s] 95it [00:21, 4.59it/s] 96it [00:21, 4.59it/s] 97it [00:21, 4.45it/s] 98it [00:21, 4.52it/s] 99it [00:21, 4.55it/s] 100it [00:22, 4.57it/s]2025-05-25 23:55:55,968 - INFO - [Epoch 083 | Batch 0100] IWAE-loss 1244.4196 | mean log_px -0.0098 | KL -981.24 + 101it [00:22, 4.59it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.61it/s] 104it [00:23, 4.43it/s] 105it [00:23, 4.49it/s] 106it [00:23, 4.52it/s] 107it [00:23, 4.56it/s] 108it [00:23, 4.54it/s] 109it [00:24, 4.56it/s] 110it [00:24, 4.57it/s] 111it [00:24, 4.43it/s] 112it [00:24, 4.49it/s] 113it [00:25, 4.38it/s] 114it [00:25, 4.45it/s] 115it [00:25, 4.50it/s] 116it [00:25, 4.52it/s] 117it [00:25, 4.46it/s] 118it [00:26, 4.50it/s] 119it [00:26, 4.53it/s] 120it [00:26, 4.55it/s] 121it [00:26, 4.45it/s] 122it [00:27, 4.51it/s] 123it [00:27, 4.53it/s] 124it [00:27, 4.54it/s] 125it [00:27, 4.57it/s] 126it [00:27, 4.58it/s] 127it [00:28, 4.58it/s] 128it [00:28, 4.44it/s] 129it [00:28, 4.51it/s] 130it [00:28, 4.54it/s] 131it [00:29, 4.56it/s] 132it [00:29, 4.43it/s] 133it [00:29, 4.48it/s] 134it [00:29, 4.51it/s] 135it [00:29, 4.52it/s] 136it [00:30, 4.55it/s] 137it [00:30, 4.50it/s] 138it [00:30, 4.51it/s] 139it [00:30, 4.40it/s] 140it [00:31, 4.49it/s] 141it [00:31, 4.54it/s] 142it [00:31, 4.54it/s] 143it [00:31, 4.59it/s] 144it [00:31, 4.60it/s] 145it [00:32, 4.47it/s] 146it [00:32, 4.52it/s] 147it [00:32, 4.56it/s] 148it [00:32, 4.57it/s] 149it [00:33, 4.59it/s] 150it [00:33, 4.61it/s]2025-05-25 23:56:07,022 - INFO - [Epoch 083 | Batch 0150] IWAE-loss 1072.7214 | mean log_px -0.0020 | KL -980.33 + 151it [00:33, 4.54it/s] 152it [00:33, 4.58it/s] 153it [00:33, 4.46it/s] 154it [00:34, 4.52it/s] 155it [00:34, 4.42it/s] 156it [00:34, 4.46it/s] 157it [00:34, 4.51it/s] 158it [00:35, 4.55it/s] 159it [00:35, 4.58it/s] 160it [00:35, 4.60it/s] 161it [00:35, 4.47it/s] 162it [00:35, 4.53it/s] 163it [00:36, 4.57it/s] 164it [00:36, 4.59it/s] 165it [00:36, 4.61it/s] 166it [00:36, 4.62it/s] 167it [00:36, 4.64it/s] 168it [00:37, 4.49it/s] 169it [00:37, 4.55it/s] 170it [00:37, 4.58it/s] 171it [00:37, 4.60it/s] 172it [00:38, 4.60it/s] 173it [00:38, 4.62it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.48it/s] 176it [00:38, 4.52it/s] 177it [00:39, 4.55it/s] 178it [00:39, 4.57it/s] 179it [00:39, 4.60it/s] 180it [00:39, 4.61it/s] 181it [00:40, 4.47it/s] 182it [00:40, 4.54it/s] 183it [00:40, 4.57it/s] 184it [00:40, 4.59it/s] 185it [00:40, 4.60it/s] 186it [00:41, 4.61it/s] 187it [00:41, 4.62it/s] 188it [00:41, 4.48it/s] 189it [00:41, 4.53it/s] 190it [00:42, 4.55it/s] 191it [00:42, 4.58it/s] 192it [00:42, 4.60it/s] 193it [00:42, 4.62it/s] 194it [00:42, 4.62it/s] 195it [00:43, 4.25it/s] 196it [00:43, 4.23it/s] 196it [00:43, 4.51it/s] +2025-05-25 23:56:17,114 - INFO - Epoch: 83, Objective: tensor([1636.0144], device='cuda:0', grad_fn=), Loss: 0.006700733210891485, KL/n: 19.999908447265625 + 0it [00:00, ?it/s]2025-05-25 23:56:17,488 - INFO - [Epoch 084 | Batch 0000] IWAE-loss 1054.2181 | mean log_px -0.0055 | KL -978.12 + 1it [00:00, 3.31it/s] 2it [00:00, 4.00it/s] 3it [00:00, 4.27it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.49it/s] 6it [00:01, 4.37it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.51it/s] 9it [00:02, 4.55it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.56it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.59it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.45it/s] 17it [00:03, 4.52it/s] 18it [00:04, 4.54it/s] 19it [00:04, 4.57it/s] 20it [00:04, 4.58it/s] 21it [00:04, 4.59it/s] 22it [00:04, 4.59it/s] 23it [00:05, 4.60it/s] 24it [00:05, 4.61it/s] 25it [00:05, 4.46it/s] 26it [00:05, 4.51it/s] 27it [00:05, 4.55it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.59it/s] 30it [00:06, 4.60it/s] 31it [00:06, 4.61it/s] 32it [00:07, 4.61it/s] 33it [00:07, 4.61it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.46it/s] 36it [00:07, 4.51it/s] 37it [00:08, 4.54it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.58it/s] 40it [00:08, 4.59it/s] 41it [00:09, 4.60it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.47it/s] 44it [00:09, 4.50it/s] 45it [00:09, 4.54it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.56it/s] 48it [00:10, 4.56it/s] 49it [00:10, 4.58it/s] 50it [00:11, 4.60it/s]2025-05-25 23:56:28,436 - INFO - [Epoch 084 | Batch 0050] IWAE-loss 1040.5332 | mean log_px -0.0009 | KL -971.92 + 51it [00:11, 4.60it/s] 52it [00:11, 3.55it/s] 53it [00:11, 3.83it/s] 54it [00:12, 4.03it/s] 55it [00:12, 4.20it/s] 56it [00:12, 4.31it/s] 57it [00:12, 4.40it/s] 58it [00:12, 4.47it/s] 59it [00:13, 4.52it/s] 60it [00:13, 4.40it/s] 61it [00:13, 4.47it/s] 62it [00:13, 4.48it/s] 63it [00:14, 4.52it/s] 64it [00:14, 4.55it/s] 65it [00:14, 4.56it/s] 66it [00:14, 4.43it/s] 67it [00:14, 4.49it/s] 68it [00:15, 4.52it/s] 69it [00:15, 4.54it/s] 70it [00:15, 4.56it/s] 71it [00:15, 4.52it/s] 72it [00:16, 4.52it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.55it/s] 75it [00:16, 4.54it/s] 76it [00:16, 4.55it/s] 77it [00:17, 4.55it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.44it/s] 81it [00:18, 4.36it/s] 82it [00:18, 4.37it/s] 83it [00:18, 4.43it/s] 84it [00:18, 4.48it/s] 85it [00:18, 4.53it/s] 86it [00:19, 4.55it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.44it/s] 89it [00:19, 4.48it/s] 90it [00:20, 4.52it/s] 91it [00:20, 4.56it/s] 92it [00:20, 4.57it/s] 93it [00:20, 4.57it/s] 94it [00:20, 4.58it/s] 95it [00:21, 4.59it/s] 96it [00:21, 4.60it/s] 97it [00:21, 4.61it/s] 98it [00:21, 4.47it/s] 99it [00:22, 4.53it/s] 100it [00:22, 4.56it/s]2025-05-25 23:56:39,666 - INFO - [Epoch 084 | Batch 0100] IWAE-loss 1327.8715 | mean log_px -0.0200 | KL -971.95 + 101it [00:22, 4.59it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.60it/s] 104it [00:23, 4.61it/s] 105it [00:23, 4.62it/s] 106it [00:23, 4.63it/s] 107it [00:23, 4.49it/s] 108it [00:24, 4.53it/s] 109it [00:24, 4.56it/s] 110it [00:24, 4.57it/s] 111it [00:24, 4.60it/s] 112it [00:24, 4.61it/s] 113it [00:25, 4.59it/s] 114it [00:25, 4.60it/s] 115it [00:25, 4.47it/s] 116it [00:25, 4.52it/s] 117it [00:25, 4.56it/s] 118it [00:26, 4.57it/s] 119it [00:26, 4.45it/s] 120it [00:26, 4.51it/s] 121it [00:26, 4.55it/s] 122it [00:27, 4.57it/s] 123it [00:27, 4.60it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.61it/s] 127it [00:28, 4.61it/s] 128it [00:28, 4.61it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.62it/s] 131it [00:29, 4.62it/s] 132it [00:29, 4.62it/s] 133it [00:29, 4.48it/s] 134it [00:29, 4.54it/s] 135it [00:29, 4.57it/s] 136it [00:30, 4.58it/s] 137it [00:30, 4.59it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.62it/s] 141it [00:31, 4.64it/s] 142it [00:31, 4.49it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.57it/s] 145it [00:32, 4.59it/s] 146it [00:32, 4.58it/s] 147it [00:32, 4.60it/s] 148it [00:32, 4.52it/s] 149it [00:32, 4.44it/s] 150it [00:33, 4.34it/s]2025-05-25 23:56:50,637 - INFO - [Epoch 084 | Batch 0150] IWAE-loss 1146.8926 | mean log_px -0.0061 | KL -970.53 + 151it [00:33, 4.43it/s] 152it [00:33, 4.48it/s] 153it [00:33, 4.52it/s] 154it [00:34, 4.56it/s] 155it [00:34, 4.59it/s] 156it [00:34, 4.60it/s] 157it [00:34, 4.55it/s] 158it [00:34, 4.58it/s] 159it [00:35, 4.61it/s] 160it [00:35, 4.63it/s] 161it [00:35, 4.60it/s] 162it [00:35, 4.62it/s] 163it [00:36, 4.59it/s] 164it [00:36, 4.49it/s] 165it [00:36, 4.42it/s] 166it [00:36, 4.49it/s] 167it [00:36, 4.53it/s] 168it [00:37, 4.52it/s] 169it [00:37, 4.51it/s] 170it [00:37, 4.46it/s] 171it [00:37, 4.52it/s] 172it [00:38, 4.57it/s] 173it [00:38, 4.58it/s] 174it [00:38, 4.44it/s] 175it [00:38, 4.52it/s] 176it [00:38, 4.55it/s] 177it [00:39, 4.59it/s] 178it [00:39, 4.59it/s] 179it [00:39, 4.62it/s] 180it [00:39, 4.44it/s] 181it [00:40, 4.52it/s] 182it [00:40, 4.53it/s] 183it [00:40, 4.48it/s] 184it [00:40, 4.53it/s] 185it [00:40, 4.57it/s] 186it [00:41, 4.57it/s] 187it [00:41, 4.41it/s] 188it [00:41, 4.48it/s] 189it [00:41, 4.53it/s] 190it [00:42, 4.48it/s] 191it [00:42, 4.53it/s] 192it [00:42, 4.56it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.58it/s] 195it [00:43, 4.35it/s] 196it [00:43, 4.33it/s] 196it [00:43, 4.51it/s] +2025-05-25 23:57:00,722 - INFO - Epoch: 84, Objective: tensor([1178.6591], device='cuda:0', grad_fn=), Loss: 0.002942966530099511, KL/n: 19.77838897705078 + 0it [00:00, ?it/s]2025-05-25 23:57:01,147 - INFO - [Epoch 085 | Batch 0000] IWAE-loss 1131.1300 | mean log_px -0.0023 | KL -968.19 + 1it [00:00, 2.83it/s] 2it [00:00, 3.62it/s] 3it [00:00, 3.85it/s] 4it [00:01, 3.92it/s] 5it [00:01, 4.08it/s] 6it [00:01, 4.25it/s] 7it [00:01, 4.09it/s] 8it [00:02, 4.15it/s] 9it [00:02, 4.27it/s] 10it [00:02, 4.23it/s] 11it [00:02, 4.21it/s] 12it [00:02, 4.15it/s] 13it [00:03, 4.18it/s] 14it [00:03, 4.06it/s] 15it [00:03, 4.12it/s] 16it [00:03, 4.26it/s] 17it [00:04, 4.32it/s] 18it [00:04, 4.37it/s] 19it [00:04, 4.45it/s] 20it [00:04, 4.32it/s] 21it [00:05, 4.41it/s] 22it [00:05, 4.46it/s] 23it [00:05, 4.47it/s] 24it [00:05, 4.51it/s] 25it [00:05, 4.47it/s] 26it [00:06, 4.37it/s] 27it [00:06, 4.35it/s] 28it [00:06, 4.45it/s] 29it [00:06, 4.35it/s] 30it [00:07, 4.41it/s] 31it [00:07, 4.45it/s] 32it [00:07, 4.51it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.56it/s] 35it [00:08, 4.53it/s] 36it [00:08, 4.42it/s] 37it [00:08, 4.50it/s] 38it [00:08, 4.41it/s] 39it [00:09, 4.42it/s] 40it [00:09, 4.36it/s] 41it [00:09, 4.39it/s] 42it [00:09, 4.40it/s] 43it [00:09, 4.47it/s] 44it [00:10, 4.33it/s] 45it [00:10, 4.28it/s] 46it [00:10, 4.40it/s] 47it [00:10, 4.37it/s] 48it [00:11, 4.26it/s] 49it [00:11, 4.16it/s] 50it [00:11, 4.30it/s]2025-05-25 23:57:12,634 - INFO - [Epoch 085 | Batch 0050] IWAE-loss 1197.8279 | mean log_px -0.0056 | KL -967.47 + 51it [00:11, 4.39it/s] 52it [00:12, 4.32it/s] 53it [00:12, 4.27it/s] 54it [00:12, 4.35it/s] 55it [00:12, 4.28it/s] 56it [00:13, 4.26it/s] 57it [00:13, 4.30it/s] 58it [00:13, 4.24it/s] 59it [00:13, 4.26it/s] 60it [00:13, 4.10it/s] 61it [00:14, 4.25it/s] 62it [00:14, 4.35it/s] 63it [00:14, 4.27it/s] 64it [00:14, 4.18it/s] 65it [00:15, 4.24it/s] 66it [00:15, 4.33it/s] 67it [00:15, 4.42it/s] 68it [00:15, 4.49it/s] 69it [00:16, 4.51it/s] 70it [00:16, 4.54it/s] 71it [00:16, 4.41it/s] 72it [00:16, 4.30it/s] 73it [00:16, 4.13it/s] 74it [00:17, 4.28it/s] 75it [00:17, 4.30it/s] 76it [00:17, 4.27it/s] 77it [00:17, 4.24it/s] 78it [00:18, 4.28it/s] 79it [00:18, 4.14it/s] 80it [00:18, 4.16it/s] 81it [00:18, 4.21it/s] 82it [00:19, 4.25it/s] 83it [00:19, 4.23it/s] 84it [00:19, 4.23it/s] 85it [00:19, 4.33it/s] 86it [00:20, 4.28it/s] 87it [00:20, 4.28it/s] 88it [00:20, 4.37it/s] 89it [00:20, 4.31it/s] 90it [00:20, 4.29it/s] 91it [00:21, 4.34it/s] 92it [00:21, 4.28it/s] 93it [00:21, 4.32it/s] 94it [00:21, 4.27it/s] 95it [00:22, 4.31it/s] 96it [00:22, 4.41it/s] 97it [00:22, 4.49it/s] 98it [00:22, 4.48it/s] 99it [00:22, 4.50it/s] 100it [00:23, 4.51it/s]2025-05-25 23:57:24,210 - INFO - [Epoch 085 | Batch 0100] IWAE-loss 1239.2491 | mean log_px -0.0051 | KL -968.42 + 101it [00:23, 4.40it/s] 102it [00:23, 4.47it/s] 103it [00:23, 4.51it/s] 104it [00:24, 4.49it/s] 105it [00:24, 4.53it/s] 106it [00:24, 4.54it/s] 107it [00:24, 4.58it/s] 108it [00:24, 4.39it/s] 109it [00:25, 4.44it/s] 110it [00:25, 4.41it/s] 111it [00:25, 4.49it/s] 112it [00:25, 4.54it/s] 113it [00:26, 4.58it/s] 114it [00:26, 4.58it/s] 115it [00:26, 4.59it/s] 116it [00:26, 4.56it/s] 117it [00:26, 4.44it/s] 118it [00:27, 4.51it/s] 119it [00:27, 4.48it/s] 120it [00:27, 4.53it/s] 121it [00:27, 4.55it/s] 122it [00:28, 4.53it/s] 123it [00:28, 4.51it/s] 124it [00:28, 4.56it/s] 125it [00:28, 4.59it/s] 126it [00:28, 4.43it/s] 127it [00:29, 4.51it/s] 128it [00:29, 4.55it/s] 129it [00:29, 4.41it/s] 130it [00:29, 4.46it/s] 131it [00:30, 4.36it/s] 132it [00:30, 4.43it/s] 133it [00:30, 4.46it/s] 134it [00:30, 4.51it/s] 135it [00:30, 4.44it/s] 136it [00:31, 4.50it/s] 137it [00:31, 4.52it/s] 138it [00:31, 4.56it/s] 139it [00:31, 4.57it/s] 140it [00:32, 4.52it/s] 141it [00:32, 4.57it/s] 142it [00:32, 4.59it/s] 143it [00:32, 4.61it/s] 144it [00:32, 4.46it/s] 145it [00:33, 4.48it/s] 146it [00:33, 4.52it/s] 147it [00:33, 4.53it/s] 148it [00:33, 4.33it/s] 149it [00:34, 4.31it/s] 150it [00:34, 4.26it/s]2025-05-25 23:57:35,368 - INFO - [Epoch 085 | Batch 0150] IWAE-loss 1040.0924 | mean log_px -0.0081 | KL -968.21 + 151it [00:34, 4.36it/s] 152it [00:34, 4.23it/s] 153it [00:35, 4.18it/s] 154it [00:35, 4.17it/s] 155it [00:35, 4.25it/s] 156it [00:35, 4.20it/s] 157it [00:35, 4.31it/s] 158it [00:36, 4.40it/s] 159it [00:36, 4.47it/s] 160it [00:36, 4.48it/s] 161it [00:36, 4.53it/s] 162it [00:37, 4.48it/s] 163it [00:37, 4.34it/s] 164it [00:37, 4.41it/s] 165it [00:37, 4.49it/s] 166it [00:37, 4.53it/s] 167it [00:38, 4.57it/s] 168it [00:38, 4.58it/s] 169it [00:38, 4.61it/s] 170it [00:38, 4.41it/s] 171it [00:39, 4.51it/s] 172it [00:39, 4.56it/s] 173it [00:39, 4.52it/s] 174it [00:39, 4.57it/s] 175it [00:39, 4.61it/s] 176it [00:40, 4.62it/s] 177it [00:40, 4.50it/s] 178it [00:40, 4.57it/s] 179it [00:40, 4.61it/s] 180it [00:41, 4.57it/s] 181it [00:41, 4.53it/s] 182it [00:41, 4.51it/s] 183it [00:41, 4.52it/s] 184it [00:41, 4.37it/s] 185it [00:42, 4.46it/s] 186it [00:42, 4.53it/s] 187it [00:42, 4.59it/s] 188it [00:42, 4.60it/s] 189it [00:43, 4.64it/s] 190it [00:43, 4.65it/s] 191it [00:43, 4.68it/s] 192it [00:43, 4.68it/s] 193it [00:43, 4.69it/s] 194it [00:44, 4.70it/s] 195it [00:44, 4.45it/s] 196it [00:44, 4.54it/s] 196it [00:44, 4.39it/s] +2025-05-25 23:57:45,493 - INFO - Epoch: 85, Objective: tensor([1487.8380], device='cuda:0', grad_fn=), Loss: 0.007994958199560642, KL/n: 19.7778263092041 + 0it [00:00, ?it/s]2025-05-25 23:57:46,075 - INFO - [Epoch 086 | Batch 0000] IWAE-loss 1127.4233 | mean log_px -0.0047 | KL -967.19 + 1it [00:00, 2.81it/s] 2it [00:00, 3.65it/s] 3it [00:00, 4.07it/s] 4it [00:00, 4.29it/s] 5it [00:01, 4.42it/s] 6it [00:01, 4.49it/s] 7it [00:01, 4.56it/s] 8it [00:01, 4.60it/s] 9it [00:02, 4.48it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.60it/s] 12it [00:02, 4.63it/s] 13it [00:02, 4.66it/s] 14it [00:03, 4.67it/s] 15it [00:03, 4.68it/s] 16it [00:03, 4.52it/s] 17it [00:03, 4.59it/s] 18it [00:04, 4.62it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.66it/s] 21it [00:04, 4.67it/s] 22it [00:04, 4.68it/s] 23it [00:05, 4.69it/s] 24it [00:05, 4.69it/s] 25it [00:05, 4.57it/s] 26it [00:05, 4.62it/s] 27it [00:05, 4.59it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.50it/s] 31it [00:06, 4.55it/s] 32it [00:07, 4.61it/s] 33it [00:07, 4.64it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.67it/s] 36it [00:07, 4.52it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.63it/s] 40it [00:08, 4.61it/s] 41it [00:09, 4.62it/s] 42it [00:09, 4.49it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.60it/s] 45it [00:09, 4.63it/s] 46it [00:10, 4.65it/s] 47it [00:10, 4.67it/s] 48it [00:10, 4.66it/s] 49it [00:10, 4.68it/s] 50it [00:10, 4.68it/s]2025-05-25 23:57:56,903 - INFO - [Epoch 086 | Batch 0050] IWAE-loss 1551.1642 | mean log_px -0.0101 | KL -964.08 + 51it [00:11, 4.52it/s] 52it [00:11, 4.57it/s] 53it [00:11, 4.62it/s] 54it [00:11, 4.48it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.60it/s] 57it [00:12, 4.63it/s] 58it [00:12, 4.64it/s] 59it [00:12, 4.66it/s] 60it [00:13, 4.67it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.59it/s] 63it [00:13, 4.62it/s] 64it [00:13, 4.65it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.51it/s] 68it [00:14, 4.52it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.60it/s] 71it [00:15, 4.63it/s] 72it [00:15, 4.65it/s] 73it [00:15, 4.67it/s] 74it [00:16, 4.66it/s] 75it [00:16, 4.67it/s] 76it [00:16, 4.52it/s] 77it [00:16, 4.58it/s] 78it [00:17, 4.62it/s] 79it [00:17, 4.64it/s] 80it [00:17, 4.59it/s] 81it [00:17, 4.64it/s] 82it [00:17, 4.65it/s] 83it [00:18, 4.51it/s] 84it [00:18, 4.57it/s] 85it [00:18, 4.61it/s] 86it [00:18, 4.64it/s] 87it [00:18, 4.62it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.66it/s] 90it [00:19, 4.67it/s] 91it [00:19, 4.54it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.66it/s] 96it [00:20, 4.67it/s] 97it [00:21, 4.69it/s] 98it [00:21, 4.53it/s] 99it [00:21, 4.59it/s] 100it [00:21, 4.62it/s]2025-05-25 23:58:07,757 - INFO - [Epoch 086 | Batch 0100] IWAE-loss 1123.9008 | mean log_px -0.0059 | KL -964.63 + 101it [00:22, 4.64it/s] 102it [00:22, 4.66it/s] 103it [00:22, 4.66it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.56it/s] 106it [00:23, 4.60it/s] 107it [00:23, 4.65it/s] 108it [00:23, 4.65it/s] 109it [00:23, 4.62it/s] 110it [00:23, 4.38it/s] 111it [00:24, 4.31it/s] 112it [00:24, 4.25it/s] 113it [00:24, 4.21it/s] 114it [00:24, 4.27it/s] 115it [00:25, 4.31it/s] 116it [00:25, 4.27it/s] 117it [00:25, 4.41it/s] 118it [00:25, 4.49it/s] 119it [00:26, 4.55it/s] 120it [00:26, 4.59it/s] 121it [00:26, 4.62it/s] 122it [00:26, 4.47it/s] 123it [00:26, 4.55it/s] 124it [00:27, 4.56it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.62it/s] 127it [00:27, 4.64it/s] 128it [00:27, 4.66it/s] 129it [00:28, 4.67it/s] 130it [00:28, 4.68it/s] 131it [00:28, 4.52it/s] 132it [00:28, 4.53it/s] 133it [00:29, 4.59it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.64it/s] 136it [00:29, 4.65it/s] 137it [00:29, 4.66it/s] 138it [00:30, 4.55it/s] 139it [00:30, 4.61it/s] 140it [00:30, 4.62it/s] 141it [00:30, 4.65it/s] 142it [00:31, 4.66it/s] 143it [00:31, 4.67it/s] 144it [00:31, 4.67it/s] 145it [00:31, 4.68it/s] 146it [00:31, 4.68it/s] 147it [00:32, 4.69it/s] 148it [00:32, 4.69it/s] 149it [00:32, 4.69it/s] 150it [00:32, 4.69it/s]2025-05-25 23:58:18,695 - INFO - [Epoch 086 | Batch 0150] IWAE-loss 1505.1322 | mean log_px -0.0137 | KL -965.18 + 151it [00:32, 4.69it/s] 152it [00:33, 4.69it/s] 153it [00:33, 4.53it/s] 154it [00:33, 4.59it/s] 155it [00:33, 4.62it/s] 156it [00:34, 4.64it/s] 157it [00:34, 4.66it/s] 158it [00:34, 4.66it/s] 159it [00:34, 4.68it/s] 160it [00:34, 4.68it/s] 161it [00:35, 4.69it/s] 162it [00:35, 4.52it/s] 163it [00:35, 4.59it/s] 164it [00:35, 4.62it/s] 165it [00:35, 4.65it/s] 166it [00:36, 4.66it/s] 167it [00:36, 4.67it/s] 168it [00:36, 4.51it/s] 169it [00:36, 4.58it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.64it/s] 172it [00:37, 4.66it/s] 173it [00:37, 4.67it/s] 174it [00:37, 4.68it/s] 175it [00:38, 4.69it/s] 176it [00:38, 4.69it/s] 177it [00:38, 4.54it/s] 178it [00:38, 4.60it/s] 179it [00:39, 4.63it/s] 180it [00:39, 4.64it/s] 181it [00:39, 4.66it/s] 182it [00:39, 4.67it/s] 183it [00:39, 4.68it/s] 184it [00:40, 4.68it/s] 185it [00:40, 4.64it/s] 186it [00:40, 4.49it/s] 187it [00:40, 4.57it/s] 188it [00:40, 4.60it/s] 189it [00:41, 4.63it/s] 190it [00:41, 4.64it/s] 191it [00:41, 4.67it/s] 192it [00:41, 4.51it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.61it/s] 195it [00:42, 4.49it/s] 196it [00:42, 4.51it/s] 196it [00:42, 4.58it/s] +2025-05-25 23:58:28,590 - INFO - Epoch: 86, Objective: tensor([1302.8038], device='cuda:0', grad_fn=), Loss: 0.0075148637406528, KL/n: 19.660505294799805 + 0it [00:00, ?it/s]2025-05-25 23:58:29,005 - INFO - [Epoch 087 | Batch 0000] IWAE-loss 1044.9692 | mean log_px -0.0016 | KL -964.23 + 1it [00:00, 2.89it/s] 2it [00:00, 3.53it/s] 3it [00:00, 3.82it/s] 4it [00:01, 4.05it/s] 5it [00:01, 4.21it/s] 6it [00:01, 4.34it/s] 7it [00:01, 4.44it/s] 8it [00:01, 4.50it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.58it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.62it/s] 15it [00:03, 4.61it/s] 16it [00:03, 4.62it/s] 17it [00:03, 4.63it/s] 18it [00:04, 4.62it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.64it/s] 22it [00:04, 4.63it/s] 23it [00:05, 4.64it/s] 24it [00:05, 4.63it/s] 25it [00:05, 4.64it/s] 26it [00:05, 3.67it/s] 27it [00:06, 3.90it/s] 28it [00:06, 4.09it/s] 29it [00:06, 4.24it/s] 30it [00:06, 4.35it/s] 31it [00:07, 4.43it/s] 32it [00:07, 4.49it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.58it/s] 36it [00:08, 4.60it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.58it/s] 40it [00:09, 4.59it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.57it/s] 43it [00:09, 4.59it/s] 44it [00:09, 4.61it/s] 45it [00:10, 4.62it/s] 46it [00:10, 4.62it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.62it/s] 50it [00:11, 4.62it/s]2025-05-25 23:58:40,074 - INFO - [Epoch 087 | Batch 0050] IWAE-loss 1112.0288 | mean log_px -0.0045 | KL -961.18 + 51it [00:11, 4.63it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.64it/s] 54it [00:12, 4.64it/s] 55it [00:12, 4.58it/s] 56it [00:12, 4.52it/s] 57it [00:12, 4.53it/s] 58it [00:12, 4.53it/s] 59it [00:13, 4.52it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.49it/s] 62it [00:13, 4.53it/s] 63it [00:14, 4.57it/s] 64it [00:14, 4.59it/s] 65it [00:14, 4.61it/s] 66it [00:14, 4.62it/s] 67it [00:14, 4.63it/s] 68it [00:15, 4.62it/s] 69it [00:15, 4.63it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.60it/s] 72it [00:15, 4.61it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.62it/s] 77it [00:17, 4.56it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.61it/s] 80it [00:17, 4.62it/s] 81it [00:17, 4.62it/s] 82it [00:18, 4.62it/s] 83it [00:18, 4.65it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.62it/s] 86it [00:19, 4.62it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.55it/s] 89it [00:19, 4.58it/s] 90it [00:19, 4.60it/s] 91it [00:20, 4.60it/s] 92it [00:20, 4.59it/s] 93it [00:20, 4.60it/s] 94it [00:20, 4.61it/s] 95it [00:20, 4.63it/s] 96it [00:21, 4.63it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.63it/s] 100it [00:22, 4.62it/s]2025-05-25 23:58:50,946 - INFO - [Epoch 087 | Batch 0100] IWAE-loss 1093.4396 | mean log_px -0.0022 | KL -958.57 + 101it [00:22, 4.62it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.64it/s] 104it [00:22, 4.62it/s] 105it [00:23, 4.63it/s] 106it [00:23, 4.61it/s] 107it [00:23, 4.47it/s] 108it [00:23, 4.50it/s] 109it [00:24, 4.38it/s] 110it [00:24, 4.40it/s] 111it [00:24, 4.48it/s] 112it [00:24, 4.48it/s] 113it [00:24, 4.49it/s] 114it [00:25, 4.55it/s] 115it [00:25, 4.43it/s] 116it [00:25, 4.44it/s] 117it [00:25, 4.50it/s] 118it [00:26, 4.47it/s] 119it [00:26, 4.53it/s] 120it [00:26, 4.56it/s] 121it [00:26, 4.44it/s] 122it [00:26, 4.44it/s] 123it [00:27, 4.52it/s] 124it [00:27, 4.56it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.62it/s] 127it [00:28, 4.49it/s] 128it [00:28, 4.55it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.62it/s] 131it [00:28, 4.48it/s] 132it [00:29, 4.54it/s] 133it [00:29, 4.58it/s] 134it [00:29, 4.59it/s] 135it [00:29, 4.62it/s] 136it [00:30, 4.63it/s] 137it [00:30, 4.49it/s] 138it [00:30, 4.56it/s] 139it [00:30, 4.59it/s] 140it [00:30, 4.62it/s] 141it [00:31, 4.64it/s] 142it [00:31, 4.65it/s] 143it [00:31, 4.51it/s] 144it [00:31, 4.52it/s] 145it [00:31, 4.57it/s] 146it [00:32, 4.58it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.62it/s] 149it [00:32, 4.48it/s] 150it [00:33, 4.52it/s]2025-05-25 23:59:01,961 - INFO - [Epoch 087 | Batch 0150] IWAE-loss 1118.8979 | mean log_px -0.0022 | KL -959.16 + 151it [00:33, 4.58it/s] 152it [00:33, 4.60it/s] 153it [00:33, 4.57it/s] 154it [00:33, 4.60it/s] 155it [00:34, 4.47it/s] 156it [00:34, 4.53it/s] 157it [00:34, 4.57it/s] 158it [00:34, 4.53it/s] 159it [00:35, 4.57it/s] 160it [00:35, 4.58it/s] 161it [00:35, 4.61it/s] 162it [00:35, 4.48it/s] 163it [00:35, 4.53it/s] 164it [00:36, 4.55it/s] 165it [00:36, 4.59it/s] 166it [00:36, 4.60it/s] 167it [00:36, 4.61it/s] 168it [00:37, 4.61it/s] 169it [00:37, 4.47it/s] 170it [00:37, 4.52it/s] 171it [00:37, 4.56it/s] 172it [00:37, 4.58it/s] 173it [00:38, 4.60it/s] 174it [00:38, 4.61it/s] 175it [00:38, 4.62it/s] 176it [00:38, 4.48it/s] 177it [00:39, 4.53it/s] 178it [00:39, 4.57it/s] 179it [00:39, 4.58it/s] 180it [00:39, 4.60it/s] 181it [00:39, 4.61it/s] 182it [00:40, 4.62it/s] 183it [00:40, 4.48it/s] 184it [00:40, 4.54it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.59it/s] 187it [00:41, 4.61it/s] 188it [00:41, 4.61it/s] 189it [00:41, 4.62it/s] 190it [00:41, 4.62it/s] 191it [00:42, 4.64it/s] 192it [00:42, 4.63it/s] 193it [00:42, 4.50it/s] 194it [00:42, 4.54it/s] 195it [00:42, 4.25it/s] 196it [00:43, 4.17it/s] 196it [00:43, 4.53it/s] +2025-05-25 23:59:12,035 - INFO - Epoch: 87, Objective: tensor([1106.9209], device='cuda:0', grad_fn=), Loss: 0.006249045487493277, KL/n: 19.581295013427734 + 0it [00:00, ?it/s]2025-05-25 23:59:12,450 - INFO - [Epoch 088 | Batch 0000] IWAE-loss 1091.5936 | mean log_px -0.0041 | KL -957.80 + 1it [00:00, 3.03it/s] 2it [00:00, 3.82it/s] 3it [00:00, 4.18it/s] 4it [00:00, 4.33it/s] 5it [00:01, 4.45it/s] 6it [00:01, 4.35it/s] 7it [00:01, 4.45it/s] 8it [00:01, 4.51it/s] 9it [00:02, 4.56it/s] 10it [00:02, 4.59it/s] 11it [00:02, 4.61it/s] 12it [00:02, 4.62it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.63it/s] 15it [00:03, 4.49it/s] 16it [00:03, 4.54it/s] 17it [00:03, 4.58it/s] 18it [00:04, 4.60it/s] 19it [00:04, 4.61it/s] 20it [00:04, 4.62it/s] 21it [00:04, 4.49it/s] 22it [00:04, 4.40it/s] 23it [00:05, 4.46it/s] 24it [00:05, 4.52it/s] 25it [00:05, 4.40it/s] 26it [00:05, 4.48it/s] 27it [00:06, 4.53it/s] 28it [00:06, 4.56it/s] 29it [00:06, 4.56it/s] 30it [00:06, 4.58it/s] 31it [00:06, 4.59it/s] 32it [00:07, 4.60it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.44it/s] 35it [00:07, 4.50it/s] 36it [00:08, 4.55it/s] 37it [00:08, 4.57it/s] 38it [00:08, 4.59it/s] 39it [00:08, 4.61it/s] 40it [00:08, 4.61it/s] 41it [00:09, 4.48it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.55it/s] 44it [00:09, 4.57it/s] 45it [00:09, 4.58it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.62it/s] 48it [00:10, 4.61it/s] 49it [00:10, 4.61it/s] 50it [00:11, 4.43it/s]2025-05-25 23:59:23,431 - INFO - [Epoch 088 | Batch 0050] IWAE-loss 1129.9476 | mean log_px -0.0060 | KL -957.38 + 51it [00:11, 4.48it/s] 52it [00:11, 4.52it/s] 53it [00:11, 4.56it/s] 54it [00:11, 4.58it/s] 55it [00:12, 4.59it/s] 56it [00:12, 4.59it/s] 57it [00:12, 4.60it/s] 58it [00:12, 4.61it/s] 59it [00:13, 4.47it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.56it/s] 62it [00:13, 4.56it/s] 63it [00:13, 4.59it/s] 64it [00:14, 4.60it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.62it/s] 67it [00:14, 4.59it/s] 68it [00:15, 4.46it/s] 69it [00:15, 4.52it/s] 70it [00:15, 4.55it/s] 71it [00:15, 4.56it/s] 72it [00:15, 4.58it/s] 73it [00:16, 4.57it/s] 74it [00:16, 4.44it/s] 75it [00:16, 4.51it/s] 76it [00:16, 4.55it/s] 77it [00:17, 4.57it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.60it/s] 81it [00:17, 4.47it/s] 82it [00:18, 4.53it/s] 83it [00:18, 4.56it/s] 84it [00:18, 4.58it/s] 85it [00:18, 4.60it/s] 86it [00:18, 4.59it/s] 87it [00:19, 4.60it/s] 88it [00:19, 4.47it/s] 89it [00:19, 4.53it/s] 90it [00:19, 4.56it/s] 91it [00:20, 4.57it/s] 92it [00:20, 4.58it/s] 93it [00:20, 4.59it/s] 94it [00:20, 4.60it/s] 95it [00:20, 4.47it/s] 96it [00:21, 4.51it/s] 97it [00:21, 4.56it/s] 98it [00:21, 4.57it/s] 99it [00:21, 4.59it/s] 100it [00:22, 4.60it/s]2025-05-25 23:59:34,384 - INFO - [Epoch 088 | Batch 0100] IWAE-loss 1050.3236 | mean log_px -0.0014 | KL -958.19 + 101it [00:22, 4.45it/s] 102it [00:22, 4.49it/s] 103it [00:22, 4.53it/s] 104it [00:22, 4.56it/s] 105it [00:23, 4.58it/s] 106it [00:23, 4.58it/s] 107it [00:23, 4.60it/s] 108it [00:23, 4.60it/s] 109it [00:24, 4.62it/s] 110it [00:24, 4.48it/s] 111it [00:24, 4.53it/s] 112it [00:24, 4.56it/s] 113it [00:24, 4.59it/s] 114it [00:25, 4.59it/s] 115it [00:25, 4.46it/s] 116it [00:25, 4.52it/s] 117it [00:25, 4.56it/s] 118it [00:26, 4.55it/s] 119it [00:26, 4.59it/s] 120it [00:26, 4.47it/s] 121it [00:26, 4.52it/s] 122it [00:26, 4.55it/s] 123it [00:27, 4.48it/s] 124it [00:27, 4.53it/s] 125it [00:27, 4.57it/s] 126it [00:27, 4.58it/s] 127it [00:27, 4.58it/s] 128it [00:28, 4.46it/s] 129it [00:28, 4.52it/s] 130it [00:28, 4.55it/s] 131it [00:28, 4.57it/s] 132it [00:29, 4.59it/s] 133it [00:29, 4.60it/s] 134it [00:29, 4.51it/s] 135it [00:29, 4.53it/s] 136it [00:29, 4.54it/s] 137it [00:30, 4.57it/s] 138it [00:30, 4.58it/s] 139it [00:30, 4.45it/s] 140it [00:30, 4.50it/s] 141it [00:31, 4.53it/s] 142it [00:31, 4.56it/s] 143it [00:31, 4.57it/s] 144it [00:31, 4.42it/s] 145it [00:31, 4.49it/s] 146it [00:32, 4.54it/s] 147it [00:32, 4.55it/s] 148it [00:32, 4.43it/s] 149it [00:32, 4.48it/s] 150it [00:33, 4.52it/s]2025-05-25 23:59:45,426 - INFO - [Epoch 088 | Batch 0150] IWAE-loss 1027.6443 | mean log_px -0.0013 | KL -960.73 + 151it [00:33, 4.48it/s] 152it [00:33, 4.53it/s] 153it [00:33, 4.53it/s] 154it [00:33, 4.56it/s] 155it [00:34, 4.55it/s] 156it [00:34, 4.58it/s] 157it [00:34, 4.41it/s] 158it [00:34, 4.45it/s] 159it [00:35, 4.50it/s] 160it [00:35, 4.53it/s] 161it [00:35, 4.55it/s] 162it [00:35, 4.57it/s] 163it [00:35, 4.61it/s] 164it [00:36, 4.51it/s] 165it [00:36, 4.56it/s] 166it [00:36, 4.55it/s] 167it [00:36, 4.58it/s] 168it [00:37, 4.59it/s] 169it [00:37, 4.60it/s] 170it [00:37, 4.60it/s] 171it [00:37, 4.60it/s] 172it [00:37, 4.60it/s] 173it [00:38, 4.62it/s] 174it [00:38, 4.62it/s] 175it [00:38, 4.62it/s] 176it [00:38, 4.61it/s] 177it [00:39, 4.48it/s] 178it [00:39, 4.51it/s] 179it [00:39, 4.54it/s] 180it [00:39, 4.56it/s] 181it [00:39, 4.60it/s] 182it [00:40, 4.60it/s] 183it [00:40, 4.61it/s] 184it [00:40, 4.61it/s] 185it [00:40, 4.62it/s] 186it [00:40, 4.48it/s] 187it [00:41, 4.53it/s] 188it [00:41, 4.54it/s] 189it [00:41, 4.56it/s] 190it [00:41, 4.57it/s] 191it [00:42, 4.59it/s] 192it [00:42, 4.59it/s] 193it [00:42, 4.61it/s] 194it [00:42, 4.60it/s] 195it [00:42, 4.22it/s] 196it [00:43, 4.30it/s] 196it [00:43, 4.53it/s] +2025-05-25 23:59:55,469 - INFO - Epoch: 88, Objective: tensor([1130.0813], device='cuda:0', grad_fn=), Loss: 0.0030066303443163633, KL/n: 19.562442779541016 + 0it [00:00, ?it/s]2025-05-25 23:59:56,052 - INFO - [Epoch 089 | Batch 0000] IWAE-loss 1094.9982 | mean log_px -0.0019 | KL -957.34 + 1it [00:00, 3.04it/s] 2it [00:00, 3.78it/s] 3it [00:00, 4.09it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.32it/s] 6it [00:01, 4.17it/s] 7it [00:01, 4.29it/s] 8it [00:01, 4.39it/s] 9it [00:02, 4.44it/s] 10it [00:02, 4.50it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.49it/s] 13it [00:03, 4.36it/s] 14it [00:03, 4.44it/s] 15it [00:03, 4.36it/s] 16it [00:03, 4.43it/s] 17it [00:03, 4.49it/s] 18it [00:04, 4.54it/s] 19it [00:04, 4.42it/s] 20it [00:04, 4.21it/s] 21it [00:04, 4.20it/s] 22it [00:05, 4.19it/s] 23it [00:05, 4.32it/s] 24it [00:05, 4.42it/s] 25it [00:05, 4.50it/s] 26it [00:06, 4.26it/s] 27it [00:06, 4.32it/s] 28it [00:06, 4.25it/s] 29it [00:06, 4.30it/s] 30it [00:06, 4.37it/s] 31it [00:07, 4.39it/s] 32it [00:07, 4.46it/s] 33it [00:07, 4.38it/s] 34it [00:07, 4.46it/s] 35it [00:08, 4.51it/s] 36it [00:08, 4.55it/s] 37it [00:08, 4.43it/s] 38it [00:08, 4.46it/s] 39it [00:08, 4.50it/s] 40it [00:09, 4.36it/s] 41it [00:09, 4.31it/s] 42it [00:09, 4.27it/s] 43it [00:09, 4.22it/s] 44it [00:10, 4.33it/s] 45it [00:10, 4.43it/s] 46it [00:10, 4.49it/s] 47it [00:10, 4.38it/s] 48it [00:11, 4.20it/s] 49it [00:11, 4.18it/s] 50it [00:11, 4.17it/s]2025-05-26 00:00:07,481 - INFO - [Epoch 089 | Batch 0050] IWAE-loss 1109.4702 | mean log_px -0.0021 | KL -958.17 + 51it [00:11, 4.27it/s] 52it [00:12, 4.12it/s] 53it [00:12, 4.15it/s] 54it [00:12, 4.15it/s] 55it [00:12, 4.15it/s] 56it [00:12, 4.23it/s] 57it [00:13, 4.20it/s] 58it [00:13, 4.18it/s] 59it [00:13, 4.30it/s] 60it [00:13, 4.20it/s] 61it [00:14, 4.18it/s] 62it [00:14, 4.28it/s] 63it [00:14, 4.39it/s] 64it [00:14, 4.32it/s] 65it [00:15, 4.41it/s] 66it [00:15, 4.48it/s] 67it [00:15, 4.53it/s] 68it [00:15, 4.56it/s] 69it [00:15, 4.59it/s] 70it [00:16, 4.40it/s] 71it [00:16, 4.32it/s] 72it [00:16, 4.26it/s] 73it [00:16, 4.36it/s] 74it [00:17, 4.29it/s] 75it [00:17, 4.40it/s] 76it [00:17, 4.47it/s] 77it [00:17, 4.44it/s] 78it [00:17, 4.51it/s] 79it [00:18, 4.49it/s] 80it [00:18, 4.36it/s] 81it [00:18, 4.46it/s] 82it [00:18, 4.51it/s] 83it [00:19, 4.55it/s] 84it [00:19, 4.58it/s] 85it [00:19, 4.54it/s] 86it [00:19, 4.53it/s] 87it [00:20, 4.29it/s] 88it [00:20, 4.39it/s] 89it [00:20, 4.46it/s] 90it [00:20, 4.48it/s] 91it [00:20, 4.54it/s] 92it [00:21, 4.57it/s] 93it [00:21, 4.44it/s] 94it [00:21, 4.51it/s] 95it [00:21, 4.51it/s] 96it [00:22, 4.41it/s] 97it [00:22, 4.48it/s] 98it [00:22, 4.51it/s] 99it [00:22, 4.26it/s] 100it [00:22, 4.36it/s]2025-05-26 00:00:18,863 - INFO - [Epoch 089 | Batch 0100] IWAE-loss 1056.6552 | mean log_px -0.0079 | KL -953.52 + 101it [00:23, 4.44it/s] 102it [00:23, 4.34it/s] 103it [00:23, 4.42it/s] 104it [00:23, 4.48it/s] 105it [00:24, 4.37it/s] 106it [00:24, 4.41it/s] 107it [00:24, 4.31it/s] 108it [00:24, 4.39it/s] 109it [00:24, 4.43it/s] 110it [00:25, 4.32it/s] 111it [00:25, 4.27it/s] 112it [00:25, 4.38it/s] 113it [00:25, 4.45it/s] 114it [00:26, 4.42it/s] 115it [00:26, 4.34it/s] 116it [00:26, 4.40it/s] 117it [00:26, 4.33it/s] 118it [00:27, 4.27it/s] 119it [00:27, 4.36it/s] 120it [00:27, 4.29it/s] 121it [00:27, 4.23it/s] 122it [00:27, 4.34it/s] 123it [00:28, 4.29it/s] 124it [00:28, 4.25it/s] 125it [00:28, 4.20it/s] 126it [00:28, 4.19it/s] 127it [00:29, 4.23it/s] 128it [00:29, 4.18it/s] 129it [00:29, 4.16it/s] 130it [00:29, 4.15it/s] 131it [00:30, 4.15it/s] 132it [00:30, 4.13it/s] 133it [00:30, 4.13it/s] 134it [00:30, 4.14it/s] 135it [00:31, 4.01it/s] 136it [00:31, 4.04it/s] 137it [00:31, 4.20it/s] 138it [00:31, 4.17it/s] 139it [00:32, 4.16it/s] 140it [00:32, 4.28it/s] 141it [00:32, 4.21it/s] 142it [00:32, 4.34it/s] 143it [00:32, 4.43it/s] 144it [00:33, 4.32it/s] 145it [00:33, 4.41it/s] 146it [00:33, 4.32it/s] 147it [00:33, 4.27it/s] 148it [00:34, 4.25it/s] 149it [00:34, 4.35it/s] 150it [00:34, 4.43it/s]2025-05-26 00:00:30,524 - INFO - [Epoch 089 | Batch 0150] IWAE-loss 1259.3633 | mean log_px -0.0045 | KL -950.79 + 151it [00:34, 4.47it/s] 152it [00:35, 4.51it/s] 153it [00:35, 4.40it/s] 154it [00:35, 4.48it/s] 155it [00:35, 4.50it/s] 156it [00:35, 4.47it/s] 157it [00:36, 4.52it/s] 158it [00:36, 4.55it/s] 159it [00:36, 4.57it/s] 160it [00:36, 4.45it/s] 161it [00:37, 4.52it/s] 162it [00:37, 4.56it/s] 163it [00:37, 4.59it/s] 164it [00:37, 4.60it/s] 165it [00:37, 4.62it/s] 166it [00:38, 4.46it/s] 167it [00:38, 4.52it/s] 168it [00:38, 4.53it/s] 169it [00:38, 4.49it/s] 170it [00:38, 4.52it/s] 171it [00:39, 4.55it/s] 172it [00:39, 4.57it/s] 173it [00:39, 4.44it/s] 174it [00:39, 4.52it/s] 175it [00:40, 4.54it/s] 176it [00:40, 4.57it/s] 177it [00:40, 4.59it/s] 178it [00:40, 4.56it/s] 179it [00:40, 4.41it/s] 180it [00:41, 4.31it/s] 181it [00:41, 4.28it/s] 182it [00:41, 4.36it/s] 183it [00:41, 4.44it/s] 184it [00:42, 4.31it/s] 185it [00:42, 4.32it/s] 186it [00:42, 4.41it/s] 187it [00:42, 4.24it/s] 188it [00:43, 4.35it/s] 189it [00:43, 4.29it/s] 190it [00:43, 4.24it/s] 191it [00:43, 4.29it/s] 192it [00:44, 4.38it/s] 193it [00:44, 4.47it/s] 194it [00:44, 4.38it/s] 195it [00:44, 4.32it/s] 196it [00:44, 4.41it/s] 196it [00:44, 4.36it/s] +2025-05-26 00:00:40,780 - INFO - Epoch: 89, Objective: tensor([1205.1879], device='cuda:0', grad_fn=), Loss: 0.005796458572149277, KL/n: 19.43310546875 + 0it [00:00, ?it/s]2025-05-26 00:00:41,143 - INFO - [Epoch 090 | Batch 0000] IWAE-loss 1041.4233 | mean log_px -0.0023 | KL -952.96 + 1it [00:00, 3.47it/s] 2it [00:00, 3.73it/s] 3it [00:00, 4.11it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.25it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.46it/s] 8it [00:01, 4.50it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.54it/s] 11it [00:02, 3.59it/s] 12it [00:02, 3.86it/s] 13it [00:03, 4.07it/s] 14it [00:03, 4.22it/s] 15it [00:03, 4.35it/s] 16it [00:03, 4.44it/s] 17it [00:03, 4.51it/s] 18it [00:04, 4.40it/s] 19it [00:04, 4.46it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.56it/s] 22it [00:05, 4.59it/s] 23it [00:05, 4.62it/s] 24it [00:05, 4.48it/s] 25it [00:05, 4.52it/s] 26it [00:05, 4.46it/s] 27it [00:06, 4.52it/s] 28it [00:06, 4.55it/s] 29it [00:06, 4.58it/s] 30it [00:06, 4.60it/s] 31it [00:07, 4.46it/s] 32it [00:07, 4.52it/s] 33it [00:07, 4.56it/s] 34it [00:07, 4.58it/s] 35it [00:07, 4.61it/s] 36it [00:08, 4.62it/s] 37it [00:08, 4.47it/s] 38it [00:08, 4.52it/s] 39it [00:08, 4.57it/s] 40it [00:09, 4.59it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.63it/s] 44it [00:09, 4.63it/s] 45it [00:10, 4.65it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.56it/s] 48it [00:10, 4.59it/s] 49it [00:11, 4.61it/s] 50it [00:11, 4.62it/s]2025-05-26 00:00:52,303 - INFO - [Epoch 090 | Batch 0050] IWAE-loss 1354.5846 | mean log_px -0.0103 | KL -952.79 + 51it [00:11, 4.61it/s] 52it [00:11, 4.62it/s] 53it [00:11, 4.64it/s] 54it [00:12, 4.65it/s] 55it [00:12, 4.51it/s] 56it [00:12, 4.55it/s] 57it [00:12, 4.59it/s] 58it [00:12, 4.60it/s] 59it [00:13, 4.61it/s] 60it [00:13, 4.58it/s] 61it [00:13, 4.60it/s] 62it [00:13, 4.61it/s] 63it [00:14, 4.63it/s] 64it [00:14, 4.49it/s] 65it [00:14, 4.53it/s] 66it [00:14, 4.56it/s] 67it [00:14, 4.55it/s] 68it [00:15, 4.58it/s] 69it [00:15, 4.45it/s] 70it [00:15, 4.51it/s] 71it [00:15, 4.56it/s] 72it [00:16, 4.57it/s] 73it [00:16, 4.60it/s] 74it [00:16, 4.60it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.45it/s] 77it [00:17, 4.53it/s] 78it [00:17, 4.56it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.60it/s] 81it [00:18, 4.61it/s] 82it [00:18, 4.62it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.45it/s] 86it [00:19, 4.51it/s] 87it [00:19, 4.55it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.61it/s] 90it [00:19, 4.62it/s] 91it [00:20, 4.63it/s] 92it [00:20, 4.48it/s] 93it [00:20, 4.54it/s] 94it [00:20, 4.58it/s] 95it [00:21, 4.60it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.63it/s] 98it [00:21, 4.63it/s] 99it [00:21, 4.64it/s] 100it [00:22, 4.65it/s]2025-05-26 00:01:03,220 - INFO - [Epoch 090 | Batch 0100] IWAE-loss 1023.6895 | mean log_px -0.0019 | KL -951.39 + 101it [00:22, 4.50it/s] 102it [00:22, 4.54it/s] 103it [00:22, 4.58it/s] 104it [00:23, 4.60it/s] 105it [00:23, 4.61it/s] 106it [00:23, 4.43it/s] 107it [00:23, 4.51it/s] 108it [00:23, 4.41it/s] 109it [00:24, 4.49it/s] 110it [00:24, 4.52it/s] 111it [00:24, 4.52it/s] 112it [00:24, 4.55it/s] 113it [00:25, 4.58it/s] 114it [00:25, 4.60it/s] 115it [00:25, 4.46it/s] 116it [00:25, 4.53it/s] 117it [00:25, 4.57it/s] 118it [00:26, 4.60it/s] 119it [00:26, 4.60it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.63it/s] 122it [00:26, 4.63it/s] 123it [00:27, 4.63it/s] 124it [00:27, 4.48it/s] 125it [00:27, 4.52it/s] 126it [00:27, 4.56it/s] 127it [00:28, 4.58it/s] 128it [00:28, 4.60it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.62it/s] 131it [00:28, 4.53it/s] 132it [00:29, 4.57it/s] 133it [00:29, 4.59it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.61it/s] 136it [00:30, 4.62it/s] 137it [00:30, 4.49it/s] 138it [00:30, 4.54it/s] 139it [00:30, 4.58it/s] 140it [00:30, 4.60it/s] 141it [00:31, 4.62it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.61it/s] 144it [00:31, 4.62it/s] 145it [00:32, 4.64it/s] 146it [00:32, 4.48it/s] 147it [00:32, 4.55it/s] 148it [00:32, 4.58it/s] 149it [00:32, 4.61it/s] 150it [00:33, 4.62it/s]2025-05-26 00:01:14,171 - INFO - [Epoch 090 | Batch 0150] IWAE-loss 1153.8442 | mean log_px -0.0029 | KL -949.34 + 151it [00:33, 4.63it/s] 152it [00:33, 4.63it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.65it/s] 155it [00:34, 4.50it/s] 156it [00:34, 4.56it/s] 157it [00:34, 4.59it/s] 158it [00:34, 4.62it/s] 159it [00:35, 4.63it/s] 160it [00:35, 4.64it/s] 161it [00:35, 4.48it/s] 162it [00:35, 4.54it/s] 163it [00:35, 4.56it/s] 164it [00:36, 4.55it/s] 165it [00:36, 4.44it/s] 166it [00:36, 4.51it/s] 167it [00:36, 4.57it/s] 168it [00:37, 4.58it/s] 169it [00:37, 4.40it/s] 170it [00:37, 4.47it/s] 171it [00:37, 4.52it/s] 172it [00:37, 4.55it/s] 173it [00:38, 4.57it/s] 174it [00:38, 4.45it/s] 175it [00:38, 4.52it/s] 176it [00:38, 4.55it/s] 177it [00:39, 4.57it/s] 178it [00:39, 4.59it/s] 179it [00:39, 4.61it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.62it/s] 182it [00:40, 4.63it/s] 183it [00:40, 4.50it/s] 184it [00:40, 4.54it/s] 185it [00:40, 4.57it/s] 186it [00:40, 4.59it/s] 187it [00:41, 4.61it/s] 188it [00:41, 4.59it/s] 189it [00:41, 4.62it/s] 190it [00:41, 4.61it/s] 191it [00:42, 4.63it/s] 192it [00:42, 4.48it/s] 193it [00:42, 4.54it/s] 194it [00:42, 4.58it/s] 195it [00:43, 4.28it/s] 196it [00:43, 4.20it/s] 196it [00:43, 4.52it/s] +2025-05-26 00:01:24,256 - INFO - Epoch: 90, Objective: tensor([1778.1040], device='cuda:0', grad_fn=), Loss: 0.016707276925444603, KL/n: 19.43993377685547 + 0it [00:00, ?it/s]2025-05-26 00:01:24,638 - INFO - [Epoch 091 | Batch 0000] IWAE-loss 1187.3732 | mean log_px -0.0049 | KL -951.82 + 1it [00:00, 3.21it/s] 2it [00:00, 3.86it/s] 3it [00:00, 4.20it/s] 4it [00:00, 4.36it/s] 5it [00:01, 4.48it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.58it/s] 8it [00:01, 4.60it/s] 9it [00:02, 4.39it/s] 10it [00:02, 4.47it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.40it/s] 13it [00:02, 4.47it/s] 14it [00:03, 4.36it/s] 15it [00:03, 4.45it/s] 16it [00:03, 4.50it/s] 17it [00:03, 4.56it/s] 18it [00:04, 4.54it/s] 19it [00:04, 4.58it/s] 20it [00:04, 4.57it/s] 21it [00:04, 4.46it/s] 22it [00:04, 4.53it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.59it/s] 25it [00:05, 4.62it/s] 26it [00:05, 4.63it/s] 27it [00:06, 4.49it/s] 28it [00:06, 4.55it/s] 29it [00:06, 4.59it/s] 30it [00:06, 4.61it/s] 31it [00:06, 4.63it/s] 32it [00:07, 4.60it/s] 33it [00:07, 4.61it/s] 34it [00:07, 4.60it/s] 35it [00:07, 4.62it/s] 36it [00:08, 4.47it/s] 37it [00:08, 4.53it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.57it/s] 40it [00:08, 4.58it/s] 41it [00:09, 4.60it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.61it/s] 44it [00:09, 4.63it/s] 45it [00:09, 4.48it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.61it/s] 49it [00:10, 4.63it/s] 50it [00:11, 4.63it/s]2025-05-26 00:01:35,591 - INFO - [Epoch 091 | Batch 0050] IWAE-loss 1333.3361 | mean log_px -0.0116 | KL -948.98 + 51it [00:11, 4.64it/s] 52it [00:11, 4.65it/s] 53it [00:11, 4.66it/s] 54it [00:11, 4.66it/s] 55it [00:12, 4.67it/s] 56it [00:12, 4.66it/s] 57it [00:12, 4.50it/s] 58it [00:12, 4.55it/s] 59it [00:13, 4.58it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.63it/s] 62it [00:13, 4.64it/s] 63it [00:13, 4.65it/s] 64it [00:14, 4.48it/s] 65it [00:14, 4.56it/s] 66it [00:14, 4.57it/s] 67it [00:14, 4.61it/s] 68it [00:14, 4.53it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.54it/s] 72it [00:15, 4.56it/s] 73it [00:16, 4.44it/s] 74it [00:16, 4.48it/s] 75it [00:16, 4.53it/s] 76it [00:16, 4.55it/s] 77it [00:16, 4.59it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.61it/s] 80it [00:17, 4.60it/s] 81it [00:17, 4.61it/s] 82it [00:18, 4.46it/s] 83it [00:18, 4.50it/s] 84it [00:18, 4.54it/s] 85it [00:18, 4.57it/s] 86it [00:18, 4.58it/s] 87it [00:19, 4.61it/s] 88it [00:19, 4.62it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.62it/s] 91it [00:20, 4.48it/s] 92it [00:20, 4.53it/s] 93it [00:20, 4.56it/s] 94it [00:20, 4.59it/s] 95it [00:20, 4.60it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.61it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.63it/s] 100it [00:21, 4.45it/s]2025-05-26 00:01:46,539 - INFO - [Epoch 091 | Batch 0100] IWAE-loss 1001.7884 | mean log_px -0.0025 | KL -947.29 + 101it [00:22, 4.49it/s] 102it [00:22, 4.49it/s] 103it [00:22, 4.50it/s] 104it [00:22, 4.53it/s] 105it [00:23, 4.56it/s] 106it [00:23, 4.57it/s] 107it [00:23, 4.57it/s] 108it [00:23, 4.60it/s] 109it [00:23, 4.47it/s] 110it [00:24, 4.53it/s] 111it [00:24, 4.58it/s] 112it [00:24, 4.60it/s] 113it [00:24, 4.63it/s] 114it [00:25, 4.60it/s] 115it [00:25, 4.55it/s] 116it [00:25, 4.59it/s] 117it [00:25, 4.62it/s] 118it [00:25, 4.64it/s] 119it [00:26, 4.66it/s] 120it [00:26, 4.64it/s] 121it [00:26, 4.50it/s] 122it [00:26, 4.51it/s] 123it [00:27, 4.54it/s] 124it [00:27, 4.57it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.62it/s] 127it [00:27, 4.65it/s] 128it [00:28, 4.48it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.58it/s] 131it [00:28, 4.58it/s] 132it [00:28, 4.59it/s] 133it [00:29, 4.60it/s] 134it [00:29, 4.59it/s] 135it [00:29, 4.62it/s] 136it [00:29, 4.63it/s] 137it [00:30, 4.49it/s] 138it [00:30, 4.55it/s] 139it [00:30, 4.60it/s] 140it [00:30, 4.62it/s] 141it [00:30, 4.63it/s] 142it [00:31, 4.63it/s] 143it [00:31, 4.65it/s] 144it [00:31, 4.65it/s] 145it [00:31, 4.66it/s] 146it [00:32, 4.51it/s] 147it [00:32, 4.54it/s] 148it [00:32, 4.57it/s] 149it [00:32, 4.60it/s] 150it [00:32, 4.45it/s]2025-05-26 00:01:57,468 - INFO - [Epoch 091 | Batch 0150] IWAE-loss 1206.0220 | mean log_px -0.0106 | KL -951.12 + 151it [00:33, 4.51it/s] 152it [00:33, 4.53it/s] 153it [00:33, 4.58it/s] 154it [00:33, 4.56it/s] 155it [00:34, 4.46it/s] 156it [00:34, 4.52it/s] 157it [00:34, 4.57it/s] 158it [00:34, 4.60it/s] 159it [00:34, 4.61it/s] 160it [00:35, 4.62it/s] 161it [00:35, 4.64it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.49it/s] 164it [00:35, 4.55it/s] 165it [00:36, 4.60it/s] 166it [00:36, 4.62it/s] 167it [00:36, 4.64it/s] 168it [00:36, 4.64it/s] 169it [00:37, 4.62it/s] 170it [00:37, 4.63it/s] 171it [00:37, 4.65it/s] 172it [00:37, 4.67it/s] 173it [00:37, 4.67it/s] 174it [00:38, 4.50it/s] 175it [00:38, 4.54it/s] 176it [00:38, 4.56it/s] 177it [00:38, 4.59it/s] 178it [00:39, 4.61it/s] 179it [00:39, 4.62it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.63it/s] 182it [00:39, 4.63it/s] 183it [00:40, 4.49it/s] 184it [00:40, 4.53it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.61it/s] 187it [00:40, 4.63it/s] 188it [00:41, 4.63it/s] 189it [00:41, 4.49it/s] 190it [00:41, 4.54it/s] 191it [00:41, 4.58it/s] 192it [00:42, 4.60it/s] 193it [00:42, 4.63it/s] 194it [00:42, 4.64it/s] 195it [00:42, 4.22it/s] 196it [00:42, 4.35it/s] 196it [00:43, 4.55it/s] +2025-05-26 00:02:07,450 - INFO - Epoch: 91, Objective: tensor([1234.4763], device='cuda:0', grad_fn=), Loss: 0.004630007315427065, KL/n: 19.411489486694336 + 0it [00:00, ?it/s]2025-05-26 00:02:08,038 - INFO - [Epoch 092 | Batch 0000] IWAE-loss 1096.1681 | mean log_px -0.0068 | KL -950.23 + 1it [00:00, 2.93it/s] 2it [00:00, 3.72it/s] 3it [00:00, 4.07it/s] 4it [00:00, 4.25it/s] 5it [00:01, 4.27it/s] 6it [00:01, 4.28it/s] 7it [00:01, 4.37it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.52it/s] 10it [00:02, 4.55it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.63it/s] 15it [00:03, 4.47it/s] 16it [00:03, 4.37it/s] 17it [00:03, 4.30it/s] 18it [00:04, 4.22it/s] 19it [00:04, 4.22it/s] 20it [00:04, 4.06it/s] 21it [00:04, 4.20it/s] 22it [00:05, 4.32it/s] 23it [00:05, 4.41it/s] 24it [00:05, 4.47it/s] 25it [00:05, 4.45it/s] 26it [00:06, 4.32it/s] 27it [00:06, 4.17it/s] 28it [00:06, 4.15it/s] 29it [00:06, 4.27it/s] 30it [00:06, 4.36it/s] 31it [00:07, 4.46it/s] 32it [00:07, 4.51it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.57it/s] 35it [00:08, 4.59it/s] 36it [00:08, 4.61it/s] 37it [00:08, 4.51it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.42it/s] 40it [00:09, 4.47it/s] 41it [00:09, 4.52it/s] 42it [00:09, 4.28it/s] 43it [00:09, 4.38it/s] 44it [00:10, 4.45it/s] 45it [00:10, 4.35it/s] 46it [00:10, 4.29it/s] 47it [00:10, 4.39it/s] 48it [00:10, 4.46it/s] 49it [00:11, 4.36it/s] 50it [00:11, 4.43it/s]2025-05-26 00:02:19,359 - INFO - [Epoch 092 | Batch 0050] IWAE-loss 1275.9679 | mean log_px -0.0117 | KL -948.22 + 51it [00:11, 4.35it/s] 52it [00:11, 4.42it/s] 53it [00:12, 4.41it/s] 54it [00:12, 4.47it/s] 55it [00:12, 4.44it/s] 56it [00:12, 4.44it/s] 57it [00:12, 4.48it/s] 58it [00:13, 4.40it/s] 59it [00:13, 4.18it/s] 60it [00:13, 4.19it/s] 61it [00:13, 4.31it/s] 62it [00:14, 4.41it/s] 63it [00:14, 4.30it/s] 64it [00:14, 4.24it/s] 65it [00:14, 4.25it/s] 66it [00:15, 4.12it/s] 67it [00:15, 4.19it/s] 68it [00:15, 4.18it/s] 69it [00:15, 4.15it/s] 70it [00:16, 4.26it/s] 71it [00:16, 4.23it/s] 72it [00:16, 4.17it/s] 73it [00:16, 4.19it/s] 74it [00:17, 4.22it/s] 75it [00:17, 4.21it/s] 76it [00:17, 4.20it/s] 77it [00:17, 4.29it/s] 78it [00:17, 4.23it/s] 79it [00:18, 4.25it/s] 80it [00:18, 4.21it/s] 81it [00:18, 4.23it/s] 82it [00:18, 4.33it/s] 83it [00:19, 4.26it/s] 84it [00:19, 4.38it/s] 85it [00:19, 4.17it/s] 86it [00:19, 4.30it/s] 87it [00:20, 4.42it/s] 88it [00:20, 4.51it/s] 89it [00:20, 4.55it/s] 90it [00:20, 4.41it/s] 91it [00:20, 4.39it/s] 92it [00:21, 4.45it/s] 93it [00:21, 4.49it/s] 94it [00:21, 4.27it/s] 95it [00:21, 4.12it/s] 96it [00:22, 4.29it/s] 97it [00:22, 4.24it/s] 98it [00:22, 4.36it/s] 99it [00:22, 4.37it/s] 100it [00:23, 4.47it/s]2025-05-26 00:02:30,947 - INFO - [Epoch 092 | Batch 0100] IWAE-loss 1220.1927 | mean log_px -0.0129 | KL -944.11 + 101it [00:23, 4.53it/s] 102it [00:23, 4.58it/s] 103it [00:23, 4.45it/s] 104it [00:23, 4.51it/s] 105it [00:24, 4.27it/s] 106it [00:24, 4.38it/s] 107it [00:24, 4.32it/s] 108it [00:24, 4.35it/s] 109it [00:25, 4.31it/s] 110it [00:25, 4.41it/s] 111it [00:25, 4.50it/s] 112it [00:25, 4.55it/s] 113it [00:25, 4.60it/s] 114it [00:26, 4.62it/s] 115it [00:26, 4.65it/s] 116it [00:26, 4.66it/s] 117it [00:26, 4.69it/s] 118it [00:27, 4.38it/s] 119it [00:27, 4.39it/s] 120it [00:27, 4.48it/s] 121it [00:27, 4.55it/s] 122it [00:27, 4.53it/s] 123it [00:28, 4.49it/s] 124it [00:28, 4.47it/s] 125it [00:28, 4.38it/s] 126it [00:28, 4.34it/s] 127it [00:29, 4.28it/s] 128it [00:29, 4.20it/s] 129it [00:29, 4.34it/s] 130it [00:29, 4.44it/s] 131it [00:29, 4.52it/s] 132it [00:30, 4.44it/s] 133it [00:30, 4.54it/s] 134it [00:30, 4.40it/s] 135it [00:30, 4.34it/s] 136it [00:31, 4.28it/s] 137it [00:31, 4.39it/s] 138it [00:31, 4.44it/s] 139it [00:31, 4.23it/s] 140it [00:32, 4.21it/s] 141it [00:32, 4.26it/s] 142it [00:32, 4.28it/s] 143it [00:32, 4.11it/s] 144it [00:33, 4.25it/s] 145it [00:33, 4.37it/s] 146it [00:33, 4.43it/s] 147it [00:33, 4.35it/s] 148it [00:33, 4.30it/s] 149it [00:34, 4.26it/s] 150it [00:34, 4.39it/s]2025-05-26 00:02:42,306 - INFO - [Epoch 092 | Batch 0150] IWAE-loss 1267.1647 | mean log_px -0.0153 | KL -942.56 + 151it [00:34, 4.47it/s] 152it [00:34, 4.31it/s] 153it [00:35, 4.29it/s] 154it [00:35, 4.39it/s] 155it [00:35, 4.42it/s] 156it [00:35, 4.35it/s] 157it [00:35, 4.42it/s] 158it [00:36, 4.50it/s] 159it [00:36, 4.56it/s] 160it [00:36, 4.40it/s] 161it [00:36, 4.35it/s] 162it [00:37, 4.26it/s] 163it [00:37, 4.15it/s] 164it [00:37, 4.16it/s] 165it [00:37, 4.29it/s] 166it [00:38, 4.40it/s] 167it [00:38, 4.27it/s] 168it [00:38, 4.38it/s] 169it [00:38, 4.44it/s] 170it [00:38, 4.39it/s] 171it [00:39, 4.47it/s] 172it [00:39, 4.54it/s] 173it [00:39, 4.41it/s] 174it [00:39, 4.35it/s] 175it [00:40, 4.44it/s] 176it [00:40, 4.38it/s] 177it [00:40, 4.42it/s] 178it [00:40, 4.50it/s] 179it [00:40, 4.55it/s] 180it [00:41, 4.59it/s] 181it [00:41, 4.47it/s] 182it [00:41, 4.54it/s] 183it [00:41, 4.41it/s] 184it [00:42, 4.47it/s] 185it [00:42, 4.55it/s] 186it [00:42, 4.43it/s] 187it [00:42, 4.33it/s] 188it [00:43, 4.28it/s] 189it [00:43, 4.39it/s] 190it [00:43, 4.48it/s] 191it [00:43, 4.37it/s] 192it [00:43, 4.45it/s] 193it [00:44, 4.35it/s] 194it [00:44, 4.43it/s] 195it [00:44, 4.17it/s] 196it [00:44, 4.33it/s] 196it [00:44, 4.36it/s] +2025-05-26 00:02:52,701 - INFO - Epoch: 92, Objective: tensor([1376.6708], device='cuda:0', grad_fn=), Loss: 0.012566782534122467, KL/n: 19.321582794189453 + 0it [00:00, ?it/s]2025-05-26 00:02:53,143 - INFO - [Epoch 093 | Batch 0000] IWAE-loss 999.4476 | mean log_px -0.0021 | KL -946.94 + 1it [00:00, 2.71it/s] 2it [00:00, 3.37it/s] 3it [00:00, 3.87it/s] 4it [00:01, 4.16it/s] 5it [00:01, 4.32it/s] 6it [00:01, 4.41it/s] 7it [00:01, 4.38it/s] 8it [00:01, 4.18it/s] 9it [00:02, 4.34it/s] 10it [00:02, 3.43it/s] 11it [00:02, 3.74it/s] 12it [00:03, 3.91it/s] 13it [00:03, 4.12it/s] 14it [00:03, 4.26it/s] 15it [00:03, 4.39it/s] 16it [00:03, 4.35it/s] 17it [00:04, 4.45it/s] 18it [00:04, 4.51it/s] 19it [00:04, 4.54it/s] 20it [00:04, 4.42it/s] 21it [00:05, 4.39it/s] 22it [00:05, 4.26it/s] 23it [00:05, 4.25it/s] 24it [00:05, 4.28it/s] 25it [00:05, 4.25it/s] 26it [00:06, 4.30it/s] 27it [00:06, 4.41it/s] 28it [00:06, 4.45it/s] 29it [00:06, 4.25it/s] 30it [00:07, 4.37it/s] 31it [00:07, 4.45it/s] 32it [00:07, 4.50it/s] 33it [00:07, 4.47it/s] 34it [00:08, 4.48it/s] 35it [00:08, 4.36it/s] 36it [00:08, 4.38it/s] 37it [00:08, 4.34it/s] 38it [00:08, 4.38it/s] 39it [00:09, 4.39it/s] 40it [00:09, 4.41it/s] 41it [00:09, 4.25it/s] 42it [00:09, 4.32it/s] 43it [00:10, 4.35it/s] 44it [00:10, 4.38it/s] 45it [00:10, 4.46it/s] 46it [00:10, 4.40it/s] 47it [00:10, 4.42it/s] 48it [00:11, 4.41it/s] 49it [00:11, 4.45it/s] 50it [00:11, 4.35it/s]2025-05-26 00:03:04,688 - INFO - [Epoch 093 | Batch 0050] IWAE-loss 1235.3208 | mean log_px -0.0091 | KL -945.62 + 51it [00:11, 4.35it/s] 52it [00:12, 4.41it/s] 53it [00:12, 4.45it/s] 54it [00:12, 4.46it/s] 55it [00:12, 4.46it/s] 56it [00:13, 4.36it/s] 57it [00:13, 4.44it/s] 58it [00:13, 4.48it/s] 59it [00:13, 4.46it/s] 60it [00:13, 4.50it/s] 61it [00:14, 4.51it/s] 62it [00:14, 4.31it/s] 63it [00:14, 4.31it/s] 64it [00:14, 4.37it/s] 65it [00:15, 4.38it/s] 66it [00:15, 4.42it/s] 67it [00:15, 4.34it/s] 68it [00:15, 4.33it/s] 69it [00:15, 4.41it/s] 70it [00:16, 4.47it/s] 71it [00:16, 4.30it/s] 72it [00:16, 4.27it/s] 73it [00:16, 4.33it/s] 74it [00:17, 4.35it/s] 75it [00:17, 4.40it/s] 76it [00:17, 4.43it/s] 77it [00:17, 4.22it/s] 78it [00:18, 4.26it/s] 79it [00:18, 4.26it/s] 80it [00:18, 4.29it/s] 81it [00:18, 4.28it/s] 82it [00:19, 4.29it/s] 83it [00:19, 4.27it/s] 84it [00:19, 4.11it/s] 85it [00:19, 4.26it/s] 86it [00:19, 4.28it/s] 87it [00:20, 4.26it/s] 88it [00:20, 4.22it/s] 89it [00:20, 4.34it/s] 90it [00:20, 4.29it/s] 91it [00:21, 4.27it/s] 92it [00:21, 4.30it/s] 93it [00:21, 4.36it/s] 94it [00:21, 4.41it/s] 95it [00:22, 4.49it/s] 96it [00:22, 4.46it/s] 97it [00:22, 4.37it/s] 98it [00:22, 4.45it/s] 99it [00:22, 4.39it/s] 100it [00:23, 4.41it/s]2025-05-26 00:03:16,155 - INFO - [Epoch 093 | Batch 0100] IWAE-loss 1168.9042 | mean log_px -0.0071 | KL -945.60 + 101it [00:23, 4.45it/s] 102it [00:23, 4.47it/s] 103it [00:23, 4.53it/s] 104it [00:24, 4.56it/s] 105it [00:24, 4.54it/s] 106it [00:24, 4.52it/s] 107it [00:24, 4.55it/s] 108it [00:24, 4.58it/s] 109it [00:25, 4.61it/s] 110it [00:25, 4.43it/s] 111it [00:25, 4.21it/s] 112it [00:25, 4.14it/s] 113it [00:26, 4.17it/s] 114it [00:26, 4.18it/s] 115it [00:26, 4.21it/s] 116it [00:26, 4.26it/s] 117it [00:27, 4.25it/s] 118it [00:27, 4.28it/s] 119it [00:27, 4.22it/s] 120it [00:27, 4.33it/s] 121it [00:27, 4.30it/s] 122it [00:28, 4.27it/s] 123it [00:28, 4.28it/s] 124it [00:28, 4.37it/s] 125it [00:28, 4.32it/s] 126it [00:29, 4.33it/s] 127it [00:29, 4.31it/s] 128it [00:29, 4.18it/s] 129it [00:29, 4.29it/s] 130it [00:30, 4.37it/s] 131it [00:30, 4.30it/s] 132it [00:30, 4.37it/s] 133it [00:30, 4.34it/s] 134it [00:31, 4.08it/s] 135it [00:31, 4.12it/s] 136it [00:31, 4.20it/s] 137it [00:31, 4.27it/s] 138it [00:31, 4.35it/s] 139it [00:32, 4.41it/s] 140it [00:32, 4.39it/s] 141it [00:32, 4.31it/s] 142it [00:32, 4.30it/s] 143it [00:33, 4.24it/s] 144it [00:33, 4.20it/s] 145it [00:33, 4.34it/s] 146it [00:33, 4.42it/s] 147it [00:34, 4.49it/s] 148it [00:34, 4.53it/s] 149it [00:34, 4.57it/s] 150it [00:34, 4.59it/s]2025-05-26 00:03:27,644 - INFO - [Epoch 093 | Batch 0150] IWAE-loss 1105.6846 | mean log_px -0.0088 | KL -947.32 + 151it [00:34, 4.59it/s] 152it [00:35, 4.61it/s] 153it [00:35, 4.61it/s] 154it [00:35, 4.41it/s] 155it [00:35, 4.42it/s] 156it [00:35, 4.49it/s] 157it [00:36, 4.50it/s] 158it [00:36, 4.22it/s] 159it [00:36, 4.21it/s] 160it [00:36, 4.28it/s] 161it [00:37, 4.39it/s] 162it [00:37, 4.47it/s] 163it [00:37, 4.47it/s] 164it [00:37, 4.38it/s] 165it [00:38, 4.32it/s] 166it [00:38, 4.40it/s] 167it [00:38, 4.18it/s] 168it [00:38, 4.33it/s] 169it [00:38, 4.41it/s] 170it [00:39, 4.48it/s] 171it [00:39, 4.36it/s] 172it [00:39, 4.40it/s] 173it [00:39, 4.34it/s] 174it [00:40, 4.43it/s] 175it [00:40, 4.36it/s] 176it [00:40, 4.43it/s] 177it [00:40, 4.41it/s] 178it [00:41, 4.32it/s] 179it [00:41, 4.40it/s] 180it [00:41, 4.30it/s] 181it [00:41, 4.38it/s] 182it [00:41, 4.45it/s] 183it [00:42, 4.52it/s] 184it [00:42, 4.55it/s] 185it [00:42, 4.59it/s] 186it [00:42, 4.59it/s] 187it [00:43, 4.61it/s] 188it [00:43, 4.62it/s] 189it [00:43, 4.63it/s] 190it [00:43, 4.62it/s] 191it [00:43, 4.63it/s] 192it [00:44, 4.63it/s] 193it [00:44, 4.43it/s] 194it [00:44, 4.35it/s] 195it [00:44, 4.35it/s] 196it [00:45, 4.46it/s] 196it [00:45, 4.35it/s] +2025-05-26 00:03:37,942 - INFO - Epoch: 93, Objective: tensor([1070.6356], device='cuda:0', grad_fn=), Loss: 0.00409930944442749, KL/n: 19.31393051147461 + 0it [00:00, ?it/s]2025-05-26 00:03:38,355 - INFO - [Epoch 094 | Batch 0000] IWAE-loss 1022.8226 | mean log_px -0.0018 | KL -944.74 + 1it [00:00, 2.93it/s] 2it [00:00, 3.74it/s] 3it [00:00, 3.94it/s] 4it [00:01, 3.99it/s] 5it [00:01, 3.94it/s] 6it [00:01, 4.00it/s] 7it [00:01, 4.14it/s] 8it [00:02, 4.14it/s] 9it [00:02, 4.16it/s] 10it [00:02, 4.13it/s] 11it [00:02, 4.17it/s] 12it [00:02, 4.22it/s] 13it [00:03, 4.36it/s] 14it [00:03, 4.27it/s] 15it [00:03, 4.23it/s] 16it [00:03, 4.33it/s] 17it [00:04, 4.43it/s] 18it [00:04, 4.35it/s] 19it [00:04, 4.45it/s] 20it [00:04, 4.49it/s] 21it [00:05, 4.36it/s] 22it [00:05, 4.44it/s] 23it [00:05, 4.49it/s] 24it [00:05, 4.35it/s] 25it [00:05, 4.44it/s] 26it [00:06, 4.49it/s] 27it [00:06, 4.39it/s] 28it [00:06, 4.32it/s] 29it [00:06, 4.26it/s] 30it [00:07, 4.23it/s] 31it [00:07, 4.31it/s] 32it [00:07, 4.41it/s] 33it [00:07, 4.49it/s] 34it [00:07, 4.35it/s] 35it [00:08, 4.30it/s] 36it [00:08, 4.24it/s] 37it [00:08, 4.34it/s] 38it [00:08, 4.43it/s] 39it [00:09, 4.34it/s] 40it [00:09, 4.41it/s] 41it [00:09, 4.33it/s] 42it [00:09, 4.41it/s] 43it [00:10, 4.48it/s] 44it [00:10, 4.40it/s] 45it [00:10, 4.46it/s] 46it [00:10, 4.35it/s] 47it [00:10, 4.28it/s] 48it [00:11, 4.24it/s] 49it [00:11, 4.33it/s] 50it [00:11, 4.42it/s]2025-05-26 00:03:49,868 - INFO - [Epoch 094 | Batch 0050] IWAE-loss 1190.5052 | mean log_px -0.0090 | KL -945.57 + 51it [00:11, 4.47it/s] 52it [00:12, 4.51it/s] 53it [00:12, 4.27it/s] 54it [00:12, 4.22it/s] 55it [00:12, 4.33it/s] 56it [00:13, 4.42it/s] 57it [00:13, 4.44it/s] 58it [00:13, 4.48it/s] 59it [00:13, 4.44it/s] 60it [00:13, 4.35it/s] 61it [00:14, 4.43it/s] 62it [00:14, 4.47it/s] 63it [00:14, 4.51it/s] 64it [00:14, 4.56it/s] 65it [00:15, 4.45it/s] 66it [00:15, 4.52it/s] 67it [00:15, 4.56it/s] 68it [00:15, 4.41it/s] 69it [00:15, 4.47it/s] 70it [00:16, 4.51it/s] 71it [00:16, 4.39it/s] 72it [00:16, 4.17it/s] 73it [00:16, 4.26it/s] 74it [00:17, 4.28it/s] 75it [00:17, 4.38it/s] 76it [00:17, 4.44it/s] 77it [00:17, 4.48it/s] 78it [00:17, 4.51it/s] 79it [00:18, 4.22it/s] 80it [00:18, 4.33it/s] 81it [00:18, 4.41it/s] 82it [00:18, 4.25it/s] 83it [00:19, 4.23it/s] 84it [00:19, 4.33it/s] 85it [00:19, 4.42it/s] 86it [00:19, 4.48it/s] 87it [00:20, 4.53it/s] 88it [00:20, 4.56it/s] 89it [00:20, 4.59it/s] 90it [00:20, 4.60it/s] 91it [00:20, 4.61it/s] 92it [00:21, 4.43it/s] 93it [00:21, 4.37it/s] 94it [00:21, 4.27it/s] 95it [00:21, 4.27it/s] 96it [00:22, 4.24it/s] 97it [00:22, 4.22it/s] 98it [00:22, 4.20it/s] 99it [00:22, 4.18it/s] 100it [00:23, 4.17it/s]2025-05-26 00:04:01,290 - INFO - [Epoch 094 | Batch 0100] IWAE-loss 1009.5639 | mean log_px -0.0037 | KL -944.66 + 101it [00:23, 4.31it/s] 102it [00:23, 4.23it/s] 103it [00:23, 4.34it/s] 104it [00:23, 4.19it/s] 105it [00:24, 4.31it/s] 106it [00:24, 4.25it/s] 107it [00:24, 4.20it/s] 108it [00:24, 4.18it/s] 109it [00:25, 4.29it/s] 110it [00:25, 4.39it/s] 111it [00:25, 4.26it/s] 112it [00:25, 4.34it/s] 113it [00:26, 4.25it/s] 114it [00:26, 4.20it/s] 115it [00:26, 4.17it/s] 116it [00:26, 4.28it/s] 117it [00:27, 4.38it/s] 118it [00:27, 4.29it/s] 119it [00:27, 4.25it/s] 120it [00:27, 4.19it/s] 121it [00:27, 4.18it/s] 122it [00:28, 4.29it/s] 123it [00:28, 4.38it/s] 124it [00:28, 4.25it/s] 125it [00:28, 4.20it/s] 126it [00:29, 4.27it/s] 127it [00:29, 4.19it/s] 128it [00:29, 4.28it/s] 129it [00:29, 4.33it/s] 130it [00:30, 4.41it/s] 131it [00:30, 4.48it/s] 132it [00:30, 4.24it/s] 133it [00:30, 4.34it/s] 134it [00:30, 4.42it/s] 135it [00:31, 4.32it/s] 136it [00:31, 4.39it/s] 137it [00:31, 4.47it/s] 138it [00:31, 4.36it/s] 139it [00:32, 4.41it/s] 140it [00:32, 4.35it/s] 141it [00:32, 4.44it/s] 142it [00:32, 4.31it/s] 143it [00:33, 4.24it/s] 144it [00:33, 4.33it/s] 145it [00:33, 4.42it/s] 146it [00:33, 4.46it/s] 147it [00:33, 4.52it/s] 148it [00:34, 4.55it/s] 149it [00:34, 4.57it/s] 150it [00:34, 4.58it/s]2025-05-26 00:04:12,804 - INFO - [Epoch 094 | Batch 0150] IWAE-loss 1335.1519 | mean log_px -0.0069 | KL -943.56 + 151it [00:34, 4.61it/s] 152it [00:35, 4.62it/s] 153it [00:35, 4.63it/s] 154it [00:35, 4.63it/s] 155it [00:35, 4.63it/s] 156it [00:35, 4.64it/s] 157it [00:36, 4.64it/s] 158it [00:36, 4.60it/s] 159it [00:36, 4.61it/s] 160it [00:36, 4.62it/s] 161it [00:36, 4.47it/s] 162it [00:37, 4.34it/s] 163it [00:37, 4.41it/s] 164it [00:37, 4.30it/s] 165it [00:37, 4.33it/s] 166it [00:38, 4.41it/s] 167it [00:38, 4.49it/s] 168it [00:38, 4.53it/s] 169it [00:38, 4.40it/s] 170it [00:39, 4.31it/s] 171it [00:39, 4.25it/s] 172it [00:39, 4.35it/s] 173it [00:39, 4.33it/s] 174it [00:39, 4.43it/s] 175it [00:40, 4.33it/s] 176it [00:40, 4.24it/s] 177it [00:40, 4.24it/s] 178it [00:40, 4.34it/s] 179it [00:41, 4.26it/s] 180it [00:41, 4.22it/s] 181it [00:41, 4.29it/s] 182it [00:41, 4.21it/s] 183it [00:42, 4.36it/s] 184it [00:42, 4.28it/s] 185it [00:42, 4.35it/s] 186it [00:42, 4.28it/s] 187it [00:42, 4.37it/s] 188it [00:43, 4.45it/s] 189it [00:43, 4.50it/s] 190it [00:43, 4.53it/s] 191it [00:43, 4.39it/s] 192it [00:44, 4.46it/s] 193it [00:44, 4.50it/s] 194it [00:44, 4.38it/s] 195it [00:44, 4.18it/s] 196it [00:45, 4.30it/s] 196it [00:45, 4.35it/s] +2025-05-26 00:04:23,169 - INFO - Epoch: 94, Objective: tensor([1227.7629], device='cuda:0', grad_fn=), Loss: 0.007183433044701815, KL/n: 19.307418823242188 + 0it [00:00, ?it/s]2025-05-26 00:04:23,758 - INFO - [Epoch 095 | Batch 0000] IWAE-loss 1115.9677 | mean log_px -0.0096 | KL -943.85 + 1it [00:00, 2.74it/s] 2it [00:00, 3.61it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.24it/s] 5it [00:01, 4.20it/s] 6it [00:01, 4.32it/s] 7it [00:01, 4.27it/s] 8it [00:01, 4.39it/s] 9it [00:02, 4.46it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.41it/s] 12it [00:02, 4.30it/s] 13it [00:03, 4.03it/s] 14it [00:03, 4.08it/s] 15it [00:03, 4.11it/s] 16it [00:03, 4.09it/s] 17it [00:04, 4.01it/s] 18it [00:04, 4.17it/s] 19it [00:04, 4.26it/s] 20it [00:04, 4.31it/s] 21it [00:04, 4.40it/s] 22it [00:05, 4.46it/s] 23it [00:05, 4.51it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.59it/s] 26it [00:06, 4.45it/s] 27it [00:06, 4.54it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.62it/s] 30it [00:06, 4.64it/s] 31it [00:07, 4.66it/s] 32it [00:07, 4.35it/s] 33it [00:07, 4.31it/s] 34it [00:07, 4.37it/s] 35it [00:08, 4.31it/s] 36it [00:08, 4.40it/s] 37it [00:08, 4.49it/s] 38it [00:08, 4.38it/s] 39it [00:09, 4.46it/s] 40it [00:09, 4.53it/s] 41it [00:09, 4.58it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.46it/s] 44it [00:10, 4.36it/s] 45it [00:10, 4.30it/s] 46it [00:10, 4.28it/s] 47it [00:10, 4.24it/s] 48it [00:11, 4.35it/s] 49it [00:11, 4.28it/s] 50it [00:11, 4.23it/s]2025-05-26 00:04:35,183 - INFO - [Epoch 095 | Batch 0050] IWAE-loss 1069.6550 | mean log_px -0.0162 | KL -945.07 + 51it [00:11, 4.37it/s] 52it [00:11, 4.46it/s] 53it [00:12, 4.42it/s] 54it [00:12, 4.34it/s] 55it [00:12, 4.29it/s] 56it [00:12, 4.38it/s] 57it [00:13, 4.30it/s] 58it [00:13, 4.41it/s] 59it [00:13, 4.49it/s] 60it [00:13, 4.40it/s] 61it [00:14, 4.34it/s] 62it [00:14, 4.43it/s] 63it [00:14, 4.36it/s] 64it [00:14, 4.28it/s] 65it [00:14, 4.26it/s] 66it [00:15, 4.36it/s] 67it [00:15, 4.46it/s] 68it [00:15, 4.53it/s] 69it [00:15, 4.44it/s] 70it [00:16, 4.49it/s] 71it [00:16, 4.40it/s] 72it [00:16, 4.46it/s] 73it [00:16, 4.38it/s] 74it [00:17, 4.31it/s] 75it [00:17, 4.14it/s] 76it [00:17, 4.16it/s] 77it [00:17, 4.17it/s] 78it [00:17, 4.32it/s] 79it [00:18, 4.26it/s] 80it [00:18, 4.36it/s] 81it [00:18, 4.29it/s] 82it [00:18, 4.39it/s] 83it [00:19, 4.28it/s] 84it [00:19, 4.23it/s] 85it [00:19, 4.34it/s] 86it [00:19, 4.41it/s] 87it [00:20, 4.49it/s] 88it [00:20, 4.52it/s] 89it [00:20, 4.55it/s] 90it [00:20, 4.43it/s] 91it [00:20, 4.33it/s] 92it [00:21, 4.24it/s] 93it [00:21, 4.35it/s] 94it [00:21, 4.44it/s] 95it [00:21, 4.49it/s] 96it [00:22, 4.36it/s] 97it [00:22, 4.44it/s] 98it [00:22, 4.33it/s] 99it [00:22, 4.41it/s] 100it [00:22, 4.47it/s]2025-05-26 00:04:46,599 - INFO - [Epoch 095 | Batch 0100] IWAE-loss 1063.1974 | mean log_px -0.0022 | KL -944.21 + 101it [00:23, 4.53it/s] 102it [00:23, 4.56it/s] 103it [00:23, 4.42it/s] 104it [00:23, 4.32it/s] 105it [00:24, 4.40it/s] 106it [00:24, 4.47it/s] 107it [00:24, 4.52it/s] 108it [00:24, 4.56it/s] 109it [00:24, 4.42it/s] 110it [00:25, 4.46it/s] 111it [00:25, 4.51it/s] 112it [00:25, 4.38it/s] 113it [00:25, 4.43it/s] 114it [00:26, 4.35it/s] 115it [00:26, 4.36it/s] 116it [00:26, 4.44it/s] 117it [00:26, 4.50it/s] 118it [00:26, 4.53it/s] 119it [00:27, 4.53it/s] 120it [00:27, 4.40it/s] 121it [00:27, 4.45it/s] 122it [00:27, 4.51it/s] 123it [00:28, 4.54it/s] 124it [00:28, 4.38it/s] 125it [00:28, 4.23it/s] 126it [00:28, 4.35it/s] 127it [00:29, 4.39it/s] 128it [00:29, 4.45it/s] 129it [00:29, 4.35it/s] 130it [00:29, 4.40it/s] 131it [00:29, 4.31it/s] 132it [00:30, 4.24it/s] 133it [00:30, 4.14it/s] 134it [00:30, 4.27it/s] 135it [00:30, 4.37it/s] 136it [00:31, 4.44it/s] 137it [00:31, 4.49it/s] 138it [00:31, 4.53it/s] 139it [00:31, 4.43it/s] 140it [00:32, 4.46it/s] 141it [00:32, 4.51it/s] 142it [00:32, 4.55it/s] 143it [00:32, 4.57it/s] 144it [00:32, 4.58it/s] 145it [00:33, 4.60it/s] 146it [00:33, 4.60it/s] 147it [00:33, 4.61it/s] 148it [00:33, 4.53it/s] 149it [00:33, 4.58it/s] 150it [00:34, 4.59it/s]2025-05-26 00:04:57,838 - INFO - [Epoch 095 | Batch 0150] IWAE-loss 1082.0015 | mean log_px -0.0033 | KL -939.44 + 151it [00:34, 4.50it/s] 152it [00:34, 4.49it/s] 153it [00:34, 4.37it/s] 154it [00:35, 4.43it/s] 155it [00:35, 4.36it/s] 156it [00:35, 4.29it/s] 157it [00:35, 4.25it/s] 158it [00:36, 4.20it/s] 159it [00:36, 4.32it/s] 160it [00:36, 4.40it/s] 161it [00:36, 4.47it/s] 162it [00:36, 4.52it/s] 163it [00:37, 4.42it/s] 164it [00:37, 4.48it/s] 165it [00:37, 4.53it/s] 166it [00:37, 4.56it/s] 167it [00:38, 4.41it/s] 168it [00:38, 4.34it/s] 169it [00:38, 4.18it/s] 170it [00:38, 4.26it/s] 171it [00:39, 4.33it/s] 172it [00:39, 4.40it/s] 173it [00:39, 4.39it/s] 174it [00:39, 4.45it/s] 175it [00:39, 4.31it/s] 176it [00:40, 4.38it/s] 177it [00:40, 4.47it/s] 178it [00:40, 4.21it/s] 179it [00:40, 4.20it/s] 180it [00:41, 4.32it/s] 181it [00:41, 4.44it/s] 182it [00:41, 4.51it/s] 183it [00:41, 4.37it/s] 184it [00:41, 4.48it/s] 185it [00:42, 4.55it/s] 186it [00:42, 4.58it/s] 187it [00:42, 4.61it/s] 188it [00:42, 4.63it/s] 189it [00:43, 4.66it/s] 190it [00:43, 4.66it/s] 191it [00:43, 4.67it/s] 192it [00:43, 4.50it/s] 193it [00:43, 4.56it/s] 194it [00:44, 4.59it/s] 195it [00:44, 4.50it/s] 196it [00:44, 4.56it/s] 196it [00:44, 4.39it/s] +2025-05-26 00:05:08,125 - INFO - Epoch: 95, Objective: tensor([1025.7579], device='cuda:0', grad_fn=), Loss: 0.00621769716963172, KL/n: 19.164661407470703 + 0it [00:00, ?it/s]2025-05-26 00:05:08,542 - INFO - [Epoch 096 | Batch 0000] IWAE-loss 970.0466 | mean log_px -0.0005 | KL -939.20 + 1it [00:00, 2.94it/s] 2it [00:00, 3.74it/s] 3it [00:00, 4.14it/s] 4it [00:00, 4.34it/s] 5it [00:01, 4.46it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.58it/s] 8it [00:02, 3.59it/s] 9it [00:02, 3.88it/s] 10it [00:02, 4.10it/s] 11it [00:02, 4.27it/s] 12it [00:02, 4.39it/s] 13it [00:03, 4.49it/s] 14it [00:03, 4.55it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.62it/s] 17it [00:03, 4.65it/s] 18it [00:04, 4.66it/s] 19it [00:04, 4.67it/s] 20it [00:04, 4.66it/s] 21it [00:04, 4.68it/s] 22it [00:05, 4.69it/s] 23it [00:05, 4.70it/s] 24it [00:05, 4.70it/s] 25it [00:05, 4.71it/s] 26it [00:05, 4.70it/s] 27it [00:06, 4.71it/s] 28it [00:06, 4.70it/s] 29it [00:06, 4.56it/s] 30it [00:06, 4.62it/s] 31it [00:06, 4.64it/s] 32it [00:07, 4.66it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.68it/s] 35it [00:07, 4.70it/s] 36it [00:08, 4.69it/s] 37it [00:08, 4.70it/s] 38it [00:08, 4.70it/s] 39it [00:08, 4.68it/s] 40it [00:08, 4.67it/s] 41it [00:09, 4.68it/s] 42it [00:09, 4.69it/s] 43it [00:09, 4.70it/s] 44it [00:09, 4.69it/s] 45it [00:09, 4.70it/s] 46it [00:10, 4.70it/s] 47it [00:10, 4.71it/s] 48it [00:10, 4.67it/s] 49it [00:10, 4.68it/s] 50it [00:10, 4.69it/s]2025-05-26 00:05:19,404 - INFO - [Epoch 096 | Batch 0050] IWAE-loss 988.4781 | mean log_px -0.0008 | KL -937.70 + 51it [00:11, 4.69it/s] 52it [00:11, 4.69it/s] 53it [00:11, 4.70it/s] 54it [00:11, 4.70it/s] 55it [00:12, 4.71it/s] 56it [00:12, 4.70it/s] 57it [00:12, 4.71it/s] 58it [00:12, 4.70it/s] 59it [00:12, 4.71it/s] 60it [00:13, 4.71it/s] 61it [00:13, 4.71it/s] 62it [00:13, 4.71it/s] 63it [00:13, 4.71it/s] 64it [00:13, 4.71it/s] 65it [00:14, 4.71it/s] 66it [00:14, 4.71it/s] 67it [00:14, 4.71it/s] 68it [00:14, 4.71it/s] 69it [00:15, 4.71it/s] 70it [00:15, 4.71it/s] 71it [00:15, 4.71it/s] 72it [00:15, 4.70it/s] 73it [00:15, 4.71it/s] 74it [00:16, 4.70it/s] 75it [00:16, 4.70it/s] 76it [00:16, 4.55it/s] 77it [00:16, 4.60it/s] 78it [00:16, 4.63it/s] 79it [00:17, 4.66it/s] 80it [00:17, 4.67it/s] 81it [00:17, 4.68it/s] 82it [00:17, 4.69it/s] 83it [00:18, 4.70it/s] 84it [00:18, 4.70it/s] 85it [00:18, 4.70it/s] 86it [00:18, 4.69it/s] 87it [00:18, 4.69it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.65it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.53it/s] 92it [00:19, 4.56it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.67it/s] 96it [00:20, 4.64it/s] 97it [00:21, 4.56it/s] 98it [00:21, 4.58it/s] 99it [00:21, 4.60it/s] 100it [00:21, 4.47it/s]2025-05-26 00:05:30,143 - INFO - [Epoch 096 | Batch 0100] IWAE-loss 1141.4642 | mean log_px -0.0031 | KL -935.62 + 101it [00:21, 4.52it/s] 102it [00:22, 4.54it/s] 103it [00:22, 4.58it/s] 104it [00:22, 4.61it/s] 105it [00:22, 4.64it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.67it/s] 108it [00:23, 4.53it/s] 109it [00:23, 4.59it/s] 110it [00:23, 4.61it/s] 111it [00:24, 4.64it/s] 112it [00:24, 4.65it/s] 113it [00:24, 4.66it/s] 114it [00:24, 4.67it/s] 115it [00:24, 4.69it/s] 116it [00:25, 4.49it/s] 117it [00:25, 4.50it/s] 118it [00:25, 4.56it/s] 119it [00:25, 4.60it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.63it/s] 122it [00:26, 4.53it/s] 123it [00:26, 4.57it/s] 124it [00:26, 4.56it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.62it/s] 128it [00:27, 4.63it/s] 129it [00:28, 4.50it/s] 130it [00:28, 4.55it/s] 131it [00:28, 4.58it/s] 132it [00:28, 4.60it/s] 133it [00:28, 4.62it/s] 134it [00:29, 4.63it/s] 135it [00:29, 4.64it/s] 136it [00:29, 4.56it/s] 137it [00:29, 4.60it/s] 138it [00:29, 4.62it/s] 139it [00:30, 4.63it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.64it/s] 142it [00:30, 4.65it/s] 143it [00:31, 4.65it/s] 144it [00:31, 4.65it/s] 145it [00:31, 4.59it/s] 146it [00:31, 4.63it/s] 147it [00:31, 4.63it/s] 148it [00:32, 4.64it/s] 149it [00:32, 4.62it/s] 150it [00:32, 4.63it/s]2025-05-26 00:05:40,984 - INFO - [Epoch 096 | Batch 0150] IWAE-loss 1193.1945 | mean log_px -0.0053 | KL -933.20 + 151it [00:32, 4.64it/s] 152it [00:32, 4.63it/s] 153it [00:33, 4.63it/s] 154it [00:33, 4.64it/s] 155it [00:33, 4.50it/s] 156it [00:33, 4.56it/s] 157it [00:34, 4.59it/s] 158it [00:34, 4.61it/s] 159it [00:34, 4.63it/s] 160it [00:34, 4.50it/s] 161it [00:34, 4.55it/s] 162it [00:35, 4.58it/s] 163it [00:35, 4.61it/s] 164it [00:35, 4.62it/s] 165it [00:35, 4.65it/s] 166it [00:36, 4.65it/s] 167it [00:36, 4.66it/s] 168it [00:36, 4.65it/s] 169it [00:36, 4.65it/s] 170it [00:36, 4.63it/s] 171it [00:37, 4.50it/s] 172it [00:37, 4.54it/s] 173it [00:37, 4.59it/s] 174it [00:37, 4.59it/s] 175it [00:38, 4.62it/s] 176it [00:38, 4.63it/s] 177it [00:38, 4.64it/s] 178it [00:38, 4.65it/s] 179it [00:38, 4.65it/s] 180it [00:39, 4.51it/s] 181it [00:39, 4.56it/s] 182it [00:39, 4.58it/s] 183it [00:39, 4.61it/s] 184it [00:39, 4.62it/s] 185it [00:40, 4.63it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.65it/s] 188it [00:40, 4.65it/s] 189it [00:41, 4.65it/s] 190it [00:41, 4.65it/s] 191it [00:41, 4.65it/s] 192it [00:41, 4.65it/s] 193it [00:41, 4.65it/s] 194it [00:42, 4.64it/s] 195it [00:42, 4.30it/s] 196it [00:42, 4.26it/s] 196it [00:42, 4.59it/s] +2025-05-26 00:05:50,958 - INFO - Epoch: 96, Objective: tensor([1514.7576], device='cuda:0', grad_fn=), Loss: 0.014402041211724281, KL/n: 19.02967071533203 + 0it [00:00, ?it/s]2025-05-26 00:05:51,353 - INFO - [Epoch 097 | Batch 0000] IWAE-loss 1021.1172 | mean log_px -0.0019 | KL -929.78 + 1it [00:00, 2.88it/s] 2it [00:00, 3.62it/s] 3it [00:00, 3.85it/s] 4it [00:01, 3.97it/s] 5it [00:01, 4.19it/s] 6it [00:01, 4.15it/s] 7it [00:01, 4.32it/s] 8it [00:01, 4.32it/s] 9it [00:02, 4.38it/s] 10it [00:02, 4.31it/s] 11it [00:02, 4.42it/s] 12it [00:02, 4.49it/s] 13it [00:03, 4.43it/s] 14it [00:03, 4.36it/s] 15it [00:03, 4.44it/s] 16it [00:03, 4.41it/s] 17it [00:04, 4.33it/s] 18it [00:04, 4.27it/s] 19it [00:04, 4.25it/s] 20it [00:04, 4.30it/s] 21it [00:04, 4.28it/s] 22it [00:05, 4.29it/s] 23it [00:05, 4.32it/s] 24it [00:05, 4.22it/s] 25it [00:05, 4.34it/s] 26it [00:06, 4.36it/s] 27it [00:06, 4.37it/s] 28it [00:06, 4.34it/s] 29it [00:06, 4.36it/s] 30it [00:07, 4.30it/s] 31it [00:07, 4.33it/s] 32it [00:07, 4.26it/s] 33it [00:07, 4.30it/s] 34it [00:07, 4.28it/s] 35it [00:08, 4.13it/s] 36it [00:08, 4.14it/s] 37it [00:08, 4.17it/s] 38it [00:08, 4.29it/s] 39it [00:09, 4.25it/s] 40it [00:09, 4.31it/s] 41it [00:09, 4.30it/s] 42it [00:09, 4.32it/s] 43it [00:10, 4.37it/s] 44it [00:10, 4.34it/s] 45it [00:10, 4.31it/s] 46it [00:10, 4.25it/s] 47it [00:10, 4.34it/s] 48it [00:11, 4.39it/s] 49it [00:11, 4.44it/s] 50it [00:11, 4.39it/s]2025-05-26 00:06:02,926 - INFO - [Epoch 097 | Batch 0050] IWAE-loss 1236.9264 | mean log_px -0.0168 | KL -931.44 + 51it [00:11, 4.26it/s] 52it [00:12, 4.23it/s] 53it [00:12, 4.21it/s] 54it [00:12, 4.32it/s] 55it [00:12, 4.41it/s] 56it [00:13, 4.47it/s] 57it [00:13, 4.37it/s] 58it [00:13, 4.18it/s] 59it [00:13, 4.30it/s] 60it [00:14, 4.28it/s] 61it [00:14, 4.24it/s] 62it [00:14, 4.23it/s] 63it [00:14, 4.25it/s] 64it [00:14, 4.34it/s] 65it [00:15, 4.33it/s] 66it [00:15, 3.98it/s] 67it [00:15, 4.13it/s] 68it [00:15, 4.25it/s] 69it [00:16, 4.36it/s] 70it [00:16, 4.44it/s] 71it [00:16, 4.47it/s] 72it [00:16, 4.22it/s] 73it [00:17, 4.23it/s] 74it [00:17, 4.36it/s] 75it [00:17, 4.40it/s] 76it [00:17, 4.34it/s] 77it [00:17, 4.31it/s] 78it [00:18, 4.32it/s] 79it [00:18, 4.30it/s] 80it [00:18, 4.28it/s] 81it [00:18, 4.29it/s] 82it [00:19, 4.29it/s] 83it [00:19, 4.27it/s] 84it [00:19, 4.22it/s] 85it [00:19, 4.29it/s] 86it [00:20, 4.38it/s] 87it [00:20, 4.43it/s] 88it [00:20, 4.36it/s] 89it [00:20, 4.29it/s] 90it [00:20, 4.39it/s] 91it [00:21, 4.42it/s] 92it [00:21, 4.32it/s] 93it [00:21, 4.31it/s] 94it [00:21, 4.19it/s] 95it [00:22, 4.30it/s] 96it [00:22, 4.30it/s] 97it [00:22, 4.27it/s] 98it [00:22, 4.25it/s] 99it [00:23, 4.24it/s] 100it [00:23, 4.25it/s]2025-05-26 00:06:14,590 - INFO - [Epoch 097 | Batch 0100] IWAE-loss 1532.8635 | mean log_px -0.0209 | KL -929.81 + 101it [00:23, 4.29it/s] 102it [00:23, 4.30it/s] 103it [00:24, 4.31it/s] 104it [00:24, 4.30it/s] 105it [00:24, 4.29it/s] 106it [00:24, 4.17it/s] 107it [00:24, 4.18it/s] 108it [00:25, 4.30it/s] 109it [00:25, 4.40it/s] 110it [00:25, 4.48it/s] 111it [00:25, 4.49it/s] 112it [00:26, 4.41it/s] 113it [00:26, 4.49it/s] 114it [00:26, 4.25it/s] 115it [00:26, 4.24it/s] 116it [00:27, 4.22it/s] 117it [00:27, 4.24it/s] 118it [00:27, 4.25it/s] 119it [00:27, 4.24it/s] 120it [00:27, 4.25it/s] 121it [00:28, 4.22it/s] 122it [00:28, 4.30it/s] 123it [00:28, 4.31it/s] 124it [00:28, 4.37it/s] 125it [00:29, 4.38it/s] 126it [00:29, 4.33it/s] 127it [00:29, 4.35it/s] 128it [00:29, 4.29it/s] 129it [00:30, 4.39it/s] 130it [00:30, 4.43it/s] 131it [00:30, 4.50it/s] 132it [00:30, 4.54it/s] 133it [00:30, 4.56it/s] 134it [00:31, 4.60it/s] 135it [00:31, 4.61it/s] 136it [00:31, 4.60it/s] 137it [00:31, 4.46it/s] 138it [00:32, 4.48it/s] 139it [00:32, 4.53it/s] 140it [00:32, 4.54it/s] 141it [00:32, 4.56it/s] 142it [00:32, 4.58it/s] 143it [00:33, 4.40it/s] 144it [00:33, 4.33it/s] 145it [00:33, 4.38it/s] 146it [00:33, 4.38it/s] 147it [00:34, 4.44it/s] 148it [00:34, 4.35it/s] 149it [00:34, 4.31it/s] 150it [00:34, 4.24it/s]2025-05-26 00:06:26,024 - INFO - [Epoch 097 | Batch 0150] IWAE-loss 995.0831 | mean log_px -0.0014 | KL -931.08 + 151it [00:34, 4.28it/s] 152it [00:35, 4.31it/s] 153it [00:35, 4.37it/s] 154it [00:35, 4.46it/s] 155it [00:35, 4.37it/s] 156it [00:36, 4.30it/s] 157it [00:36, 4.27it/s] 158it [00:36, 4.27it/s] 159it [00:36, 4.37it/s] 160it [00:37, 4.28it/s] 161it [00:37, 4.24it/s] 162it [00:37, 4.24it/s] 163it [00:37, 4.22it/s] 164it [00:38, 4.21it/s] 165it [00:38, 4.23it/s] 166it [00:38, 4.29it/s] 167it [00:38, 4.25it/s] 168it [00:38, 4.09it/s] 169it [00:39, 4.07it/s] 170it [00:39, 4.16it/s] 171it [00:39, 4.16it/s] 172it [00:39, 4.25it/s] 173it [00:40, 4.27it/s] 174it [00:40, 4.11it/s] 175it [00:40, 4.18it/s] 176it [00:40, 4.13it/s] 177it [00:41, 4.10it/s] 178it [00:41, 4.13it/s] 179it [00:41, 4.19it/s] 180it [00:41, 4.19it/s] 181it [00:42, 4.04it/s] 182it [00:42, 4.09it/s] 183it [00:42, 4.09it/s] 184it [00:42, 4.15it/s] 185it [00:43, 4.17it/s] 186it [00:43, 4.28it/s] 187it [00:43, 4.37it/s] 188it [00:43, 4.24it/s] 189it [00:43, 4.29it/s] 190it [00:44, 4.30it/s] 191it [00:44, 4.36it/s] 192it [00:44, 4.34it/s] 193it [00:44, 4.41it/s] 194it [00:45, 4.33it/s] 195it [00:45, 4.30it/s] 196it [00:45, 4.34it/s] 196it [00:45, 4.29it/s] +2025-05-26 00:06:36,767 - INFO - Epoch: 97, Objective: tensor([1209.1625], device='cuda:0', grad_fn=), Loss: 0.0060317241586744785, KL/n: 19.005821228027344 + 0it [00:00, ?it/s]2025-05-26 00:06:37,361 - INFO - [Epoch 098 | Batch 0000] IWAE-loss 1119.8661 | mean log_px -0.0051 | KL -930.75 + 1it [00:00, 2.82it/s] 2it [00:00, 3.48it/s] 3it [00:00, 3.77it/s] 4it [00:01, 3.89it/s] 5it [00:01, 4.05it/s] 6it [00:01, 4.22it/s] 7it [00:01, 4.35it/s] 8it [00:01, 4.33it/s] 9it [00:02, 4.24it/s] 10it [00:02, 4.33it/s] 11it [00:02, 4.42it/s] 12it [00:02, 4.47it/s] 13it [00:03, 4.52it/s] 14it [00:03, 4.42it/s] 15it [00:03, 4.44it/s] 16it [00:03, 4.45it/s] 17it [00:03, 4.50it/s] 18it [00:04, 4.28it/s] 19it [00:04, 4.33it/s] 20it [00:04, 4.39it/s] 21it [00:04, 4.30it/s] 22it [00:05, 4.18it/s] 23it [00:05, 4.22it/s] 24it [00:05, 4.27it/s] 25it [00:05, 4.39it/s] 26it [00:06, 4.43it/s] 27it [00:06, 4.33it/s] 28it [00:06, 4.43it/s] 29it [00:06, 4.49it/s] 30it [00:06, 4.54it/s] 31it [00:07, 4.43it/s] 32it [00:07, 4.48it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.50it/s] 35it [00:08, 4.29it/s] 36it [00:08, 4.30it/s] 37it [00:08, 4.40it/s] 38it [00:08, 4.45it/s] 39it [00:09, 4.51it/s] 40it [00:09, 4.54it/s] 41it [00:09, 4.57it/s] 42it [00:09, 4.53it/s] 43it [00:09, 4.56it/s] 44it [00:10, 4.44it/s] 45it [00:10, 4.50it/s] 46it [00:10, 4.33it/s] 47it [00:10, 4.30it/s] 48it [00:11, 4.39it/s] 49it [00:11, 4.41it/s] 50it [00:11, 4.48it/s]2025-05-26 00:06:48,752 - INFO - [Epoch 098 | Batch 0050] IWAE-loss 1496.3966 | mean log_px -0.0128 | KL -928.12 + 51it [00:11, 4.21it/s] 52it [00:11, 4.22it/s] 53it [00:12, 4.33it/s] 54it [00:12, 4.39it/s] 55it [00:12, 4.45it/s] 56it [00:12, 4.50it/s] 57it [00:13, 4.38it/s] 58it [00:13, 4.18it/s] 59it [00:13, 4.26it/s] 60it [00:13, 4.35it/s] 61it [00:14, 4.43it/s] 62it [00:14, 4.43it/s] 63it [00:14, 4.50it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.57it/s] 66it [00:15, 4.46it/s] 67it [00:15, 4.53it/s] 68it [00:15, 4.40it/s] 69it [00:15, 4.46it/s] 70it [00:16, 4.51it/s] 71it [00:16, 4.56it/s] 72it [00:16, 4.42it/s] 73it [00:16, 4.32it/s] 74it [00:16, 4.29it/s] 75it [00:17, 4.38it/s] 76it [00:17, 4.28it/s] 77it [00:17, 4.21it/s] 78it [00:17, 4.22it/s] 79it [00:18, 4.32it/s] 80it [00:18, 4.37it/s] 81it [00:18, 4.33it/s] 82it [00:18, 4.26it/s] 83it [00:19, 4.24it/s] 84it [00:19, 4.28it/s] 85it [00:19, 4.15it/s] 86it [00:19, 4.14it/s] 87it [00:20, 4.27it/s] 88it [00:20, 4.13it/s] 89it [00:20, 4.24it/s] 90it [00:20, 4.28it/s] 91it [00:20, 4.31it/s] 92it [00:21, 4.20it/s] 93it [00:21, 4.30it/s] 94it [00:21, 4.38it/s] 95it [00:21, 4.44it/s] 96it [00:22, 4.42it/s] 97it [00:22, 4.49it/s] 98it [00:22, 4.45it/s] 99it [00:22, 4.41it/s] 100it [00:22, 4.47it/s]2025-05-26 00:07:00,246 - INFO - [Epoch 098 | Batch 0100] IWAE-loss 1277.2687 | mean log_px -0.0050 | KL -925.47 + 101it [00:23, 4.36it/s] 102it [00:23, 4.41it/s] 103it [00:23, 4.45it/s] 104it [00:23, 4.50it/s] 105it [00:24, 4.39it/s] 106it [00:24, 4.47it/s] 107it [00:24, 4.51it/s] 108it [00:24, 4.43it/s] 109it [00:25, 4.34it/s] 110it [00:25, 4.28it/s] 111it [00:25, 4.31it/s] 112it [00:25, 4.27it/s] 113it [00:25, 4.22it/s] 114it [00:26, 4.10it/s] 115it [00:26, 4.15it/s] 116it [00:26, 4.23it/s] 117it [00:26, 4.23it/s] 118it [00:27, 4.31it/s] 119it [00:27, 4.28it/s] 120it [00:27, 4.25it/s] 121it [00:27, 4.36it/s] 122it [00:28, 4.44it/s] 123it [00:28, 4.47it/s] 124it [00:28, 4.39it/s] 125it [00:28, 4.38it/s] 126it [00:28, 4.38it/s] 127it [00:29, 4.45it/s] 128it [00:29, 4.50it/s] 129it [00:29, 4.46it/s] 130it [00:29, 4.41it/s] 131it [00:30, 4.28it/s] 132it [00:30, 4.29it/s] 133it [00:30, 4.23it/s] 134it [00:30, 4.35it/s] 135it [00:31, 4.39it/s] 136it [00:31, 4.42it/s] 137it [00:31, 4.47it/s] 138it [00:31, 4.47it/s] 139it [00:31, 4.48it/s] 140it [00:32, 4.48it/s] 141it [00:32, 4.52it/s] 142it [00:32, 4.46it/s] 143it [00:32, 4.47it/s] 144it [00:33, 4.50it/s] 145it [00:33, 4.46it/s] 146it [00:33, 4.43it/s] 147it [00:33, 4.49it/s] 148it [00:33, 4.44it/s] 149it [00:34, 4.40it/s] 150it [00:34, 4.26it/s]2025-05-26 00:07:11,675 - INFO - [Epoch 098 | Batch 0150] IWAE-loss 1349.3285 | mean log_px -0.0118 | KL -923.47 + 151it [00:34, 4.32it/s] 152it [00:34, 4.41it/s] 153it [00:35, 4.45it/s] 154it [00:35, 4.50it/s] 155it [00:35, 4.49it/s] 156it [00:35, 4.50it/s] 157it [00:35, 4.55it/s] 158it [00:36, 4.53it/s] 159it [00:36, 4.36it/s] 160it [00:36, 4.43it/s] 161it [00:36, 4.49it/s] 162it [00:37, 4.52it/s] 163it [00:37, 4.54it/s] 164it [00:37, 4.52it/s] 165it [00:37, 4.56it/s] 166it [00:37, 4.57it/s] 167it [00:38, 4.42it/s] 168it [00:38, 4.46it/s] 169it [00:38, 4.46it/s] 170it [00:38, 4.47it/s] 171it [00:39, 4.50it/s] 172it [00:39, 4.52it/s] 173it [00:39, 4.56it/s] 174it [00:39, 4.58it/s] 175it [00:39, 4.60it/s] 176it [00:40, 4.62it/s] 177it [00:40, 4.63it/s] 178it [00:40, 4.64it/s] 179it [00:40, 4.50it/s] 180it [00:41, 4.56it/s] 181it [00:41, 4.59it/s] 182it [00:41, 4.61it/s] 183it [00:41, 4.56it/s] 184it [00:41, 4.60it/s] 185it [00:42, 4.55it/s] 186it [00:42, 4.38it/s] 187it [00:42, 4.44it/s] 188it [00:42, 4.48it/s] 189it [00:43, 4.41it/s] 190it [00:43, 4.42it/s] 191it [00:43, 4.48it/s] 192it [00:43, 4.45it/s] 193it [00:43, 4.37it/s] 194it [00:44, 4.45it/s] 195it [00:44, 4.37it/s] 196it [00:44, 4.41it/s] 196it [00:44, 4.38it/s] +2025-05-26 00:07:21,803 - INFO - Epoch: 98, Objective: tensor([995.9705], device='cuda:0', grad_fn=), Loss: 0.005432826466858387, KL/n: 18.876163482666016 + 0it [00:00, ?it/s]2025-05-26 00:07:22,223 - INFO - [Epoch 099 | Batch 0000] IWAE-loss 1048.8071 | mean log_px -0.0020 | KL -923.30 + 1it [00:00, 2.92it/s] 2it [00:00, 3.61it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.23it/s] 5it [00:01, 4.20it/s] 6it [00:01, 4.34it/s] 7it [00:01, 4.44it/s] 8it [00:01, 4.47it/s] 9it [00:02, 4.52it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.52it/s] 12it [00:02, 4.54it/s] 13it [00:02, 4.52it/s] 14it [00:03, 4.54it/s] 15it [00:03, 4.56it/s] 16it [00:03, 4.58it/s] 17it [00:03, 4.43it/s] 18it [00:04, 4.50it/s] 19it [00:04, 4.54it/s] 20it [00:04, 4.55it/s] 21it [00:04, 4.54it/s] 22it [00:04, 4.54it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.46it/s] 25it [00:05, 4.52it/s] 26it [00:05, 4.54it/s] 27it [00:06, 4.56it/s] 28it [00:06, 4.57it/s] 29it [00:06, 4.59it/s] 30it [00:06, 4.59it/s] 31it [00:06, 4.47it/s] 32it [00:07, 4.52it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.57it/s] 35it [00:07, 4.58it/s] 36it [00:08, 4.59it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.58it/s] 39it [00:08, 4.59it/s] 40it [00:08, 4.57it/s] 41it [00:09, 4.45it/s] 42it [00:09, 4.49it/s] 43it [00:09, 4.53it/s] 44it [00:09, 4.55it/s] 45it [00:10, 4.57it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.53it/s] 49it [00:10, 4.56it/s] 50it [00:11, 4.41it/s]2025-05-26 00:07:33,259 - INFO - [Epoch 099 | Batch 0050] IWAE-loss 1050.6475 | mean log_px -0.0048 | KL -926.41 + 51it [00:11, 4.48it/s] 52it [00:11, 4.42it/s] 53it [00:11, 4.45it/s] 54it [00:12, 4.48it/s] 55it [00:12, 4.51it/s] 56it [00:12, 4.50it/s] 57it [00:12, 4.54it/s] 58it [00:12, 4.33it/s] 59it [00:13, 4.37it/s] 60it [00:13, 4.43it/s] 61it [00:13, 4.48it/s] 62it [00:13, 4.53it/s] 63it [00:14, 4.57it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.63it/s] 68it [00:15, 4.50it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.60it/s] 71it [00:15, 4.63it/s] 72it [00:15, 4.65it/s] 73it [00:16, 4.65it/s] 74it [00:16, 4.66it/s] 75it [00:16, 4.68it/s] 76it [00:16, 4.68it/s] 77it [00:17, 3.59it/s] 78it [00:17, 3.86it/s] 79it [00:17, 4.06it/s] 80it [00:17, 4.22it/s] 81it [00:18, 4.36it/s] 82it [00:18, 4.45it/s] 83it [00:18, 4.53it/s] 84it [00:18, 4.57it/s] 85it [00:18, 4.61it/s] 86it [00:19, 4.51it/s] 87it [00:19, 4.56it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.59it/s] 90it [00:20, 4.60it/s] 91it [00:20, 4.52it/s] 92it [00:20, 4.57it/s] 93it [00:20, 4.60it/s] 94it [00:20, 4.63it/s] 95it [00:21, 4.59it/s] 96it [00:21, 4.62it/s] 97it [00:21, 4.65it/s] 98it [00:21, 4.66it/s] 99it [00:22, 4.67it/s] 100it [00:22, 4.67it/s]2025-05-26 00:07:44,339 - INFO - [Epoch 099 | Batch 0100] IWAE-loss 1040.0406 | mean log_px -0.0042 | KL -928.02 + 101it [00:22, 4.68it/s] 102it [00:22, 4.69it/s] 103it [00:22, 4.69it/s] 104it [00:23, 4.50it/s] 105it [00:23, 4.56it/s] 106it [00:23, 4.59it/s] 107it [00:23, 4.62it/s] 108it [00:23, 4.64it/s] 109it [00:24, 4.66it/s] 110it [00:24, 4.67it/s] 111it [00:24, 4.69it/s] 112it [00:24, 4.69it/s] 113it [00:25, 4.68it/s] 114it [00:25, 4.66it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.65it/s] 117it [00:25, 4.67it/s] 118it [00:26, 4.67it/s] 119it [00:26, 4.64it/s] 120it [00:26, 4.65it/s] 121it [00:26, 4.65it/s] 122it [00:26, 4.67it/s] 123it [00:27, 4.51it/s] 124it [00:27, 4.57it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.64it/s] 127it [00:28, 4.66it/s] 128it [00:28, 4.67it/s] 129it [00:28, 4.68it/s] 130it [00:28, 4.69it/s] 131it [00:28, 4.69it/s] 132it [00:29, 4.51it/s] 133it [00:29, 4.59it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.64it/s] 136it [00:30, 4.65it/s] 137it [00:30, 4.65it/s] 138it [00:30, 4.66it/s] 139it [00:30, 4.67it/s] 140it [00:30, 4.66it/s] 141it [00:31, 4.67it/s] 142it [00:31, 4.52it/s] 143it [00:31, 4.58it/s] 144it [00:31, 4.61it/s] 145it [00:31, 4.64it/s] 146it [00:32, 4.65it/s] 147it [00:32, 4.51it/s] 148it [00:32, 4.53it/s] 149it [00:32, 4.57it/s] 150it [00:33, 4.61it/s]2025-05-26 00:07:55,144 - INFO - [Epoch 099 | Batch 0150] IWAE-loss 1044.7759 | mean log_px -0.0017 | KL -930.69 + 151it [00:33, 4.64it/s] 152it [00:33, 4.66it/s] 153it [00:33, 4.66it/s] 154it [00:33, 4.50it/s] 155it [00:34, 4.39it/s] 156it [00:34, 4.32it/s] 157it [00:34, 4.24it/s] 158it [00:34, 4.35it/s] 159it [00:35, 4.44it/s] 160it [00:35, 4.40it/s] 161it [00:35, 4.49it/s] 162it [00:35, 4.39it/s] 163it [00:36, 4.33it/s] 164it [00:36, 4.42it/s] 165it [00:36, 4.50it/s] 166it [00:36, 4.38it/s] 167it [00:36, 4.30it/s] 168it [00:37, 4.26it/s] 169it [00:37, 4.37it/s] 170it [00:37, 4.32it/s] 171it [00:37, 4.23it/s] 172it [00:38, 4.18it/s] 173it [00:38, 4.10it/s] 174it [00:38, 4.24it/s] 175it [00:38, 4.34it/s] 176it [00:39, 4.42it/s] 177it [00:39, 4.47it/s] 178it [00:39, 4.52it/s] 179it [00:39, 4.55it/s] 180it [00:39, 4.57it/s] 181it [00:40, 4.40it/s] 182it [00:40, 4.45it/s] 183it [00:40, 4.50it/s] 184it [00:40, 4.38it/s] 185it [00:41, 4.28it/s] 186it [00:41, 4.36it/s] 187it [00:41, 4.28it/s] 188it [00:41, 4.36it/s] 189it [00:41, 4.45it/s] 190it [00:42, 4.44it/s] 191it [00:42, 4.34it/s] 192it [00:42, 4.41it/s] 193it [00:42, 4.47it/s] 194it [00:43, 4.51it/s] 195it [00:43, 4.42it/s] 196it [00:43, 4.49it/s] 196it [00:43, 4.50it/s] +2025-05-26 00:08:05,540 - INFO - Epoch: 99, Objective: tensor([1112.6666], device='cuda:0', grad_fn=), Loss: 0.0035745336208492517, KL/n: 18.98943328857422 +2025-05-26 00:08:05,552 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 2it [00:00, 15.39it/s] 5it [00:00, 21.76it/s] 8it [00:00, 24.76it/s] 12it [00:00, 26.61it/s] 15it [00:00, 26.07it/s] 18it [00:00, 26.51it/s] 21it [00:00, 26.48it/s] 24it [00:00, 27.30it/s] 27it [00:01, 27.72it/s] 30it [00:01, 28.38it/s] 33it [00:01, 28.70it/s] 36it [00:01, 28.90it/s] 39it [00:01, 28.96it/s] 43it [00:01, 29.09it/s] 46it [00:01, 29.11it/s] 49it [00:01, 29.09it/s] 53it [00:01, 29.10it/s] 56it [00:02, 29.11it/s] 60it [00:02, 29.28it/s] 63it [00:02, 28.28it/s] 67it [00:02, 29.74it/s] 70it [00:02, 29.64it/s] 73it [00:02, 28.95it/s] 77it [00:02, 29.29it/s] 80it [00:02, 29.08it/s] 84it [00:02, 29.40it/s] 87it [00:03, 29.06it/s] 91it [00:03, 29.08it/s] 95it [00:03, 29.43it/s] 99it [00:03, 29.67it/s] 102it [00:03, 29.03it/s] 106it [00:03, 29.35it/s] 109it [00:03, 29.11it/s] 113it [00:03, 29.35it/s] 116it [00:04, 29.17it/s] 120it [00:04, 29.39it/s] 123it [00:04, 29.14it/s] 126it [00:04, 29.16it/s] 129it [00:04, 29.18it/s] 132it [00:04, 29.18it/s] 136it [00:04, 29.56it/s] 139it [00:04, 29.24it/s] 143it [00:04, 29.50it/s] 146it [00:05, 29.21it/s] 150it [00:05, 29.47it/s] 153it [00:05, 29.18it/s] 157it [00:05, 29.42it/s] 160it [00:05, 29.19it/s] 164it [00:05, 29.43it/s] 167it [00:05, 29.16it/s] 171it [00:05, 29.66it/s] 174it [00:06, 29.39it/s] 177it [00:06, 29.06it/s] 180it [00:06, 28.33it/s] 183it [00:06, 28.14it/s] 187it [00:06, 28.99it/s] 190it [00:06, 29.04it/s] 193it [00:06, 28.16it/s] 196it [00:06, 28.52it/s] 199it [00:06, 28.50it/s] 202it [00:07, 28.28it/s] 206it [00:07, 28.60it/s] 209it [00:07, 28.18it/s] 213it [00:07, 28.56it/s] 216it [00:07, 28.31it/s] 219it [00:07, 28.70it/s] 222it [00:07, 28.29it/s] 226it [00:07, 28.18it/s] 230it [00:08, 28.68it/s] 233it [00:08, 27.84it/s] 236it [00:08, 28.26it/s] 239it [00:08, 28.03it/s] 243it [00:08, 28.37it/s] 246it [00:08, 28.00it/s] 249it [00:08, 27.58it/s] 252it [00:08, 27.82it/s] 255it [00:08, 27.68it/s] 258it [00:09, 27.93it/s] 261it [00:09, 27.87it/s] 264it [00:09, 27.95it/s] 268it [00:09, 28.61it/s] 271it [00:09, 28.66it/s] 275it [00:09, 28.81it/s] 279it [00:09, 27.11it/s] 280it [00:09, 28.38it/s] +2025-05-26 00:08:15,572 - INFO - Epoch: 0, Objective: 0.012997487559914589, Loss: 0.004764337092638016, KL/n: 0.008233150467276573 + 0it [00:00, ?it/s] 2it [00:00, 16.22it/s] 5it [00:00, 22.62it/s] 8it [00:00, 25.51it/s] 11it [00:00, 26.97it/s] 14it [00:00, 27.84it/s] 17it [00:00, 28.11it/s] 21it [00:00, 28.71it/s] 25it [00:00, 29.23it/s] 28it [00:01, 28.92it/s] 31it [00:01, 29.16it/s] 34it [00:01, 29.27it/s] 37it [00:01, 29.21it/s] 40it [00:01, 29.31it/s] 43it [00:01, 29.23it/s] 46it [00:01, 29.44it/s] 49it [00:01, 29.28it/s] 53it [00:01, 29.52it/s] 57it [00:02, 29.03it/s] 60it [00:02, 29.05it/s] 63it [00:02, 27.40it/s] 67it [00:02, 28.84it/s] 70it [00:02, 28.40it/s] 74it [00:02, 28.92it/s] 77it [00:02, 28.82it/s] 80it [00:02, 29.01it/s] 83it [00:02, 28.90it/s] 87it [00:03, 29.05it/s] 91it [00:03, 29.13it/s] 95it [00:03, 29.57it/s] 98it [00:03, 28.92it/s] 102it [00:03, 29.10it/s] 105it [00:03, 29.09it/s] 108it [00:03, 28.72it/s] 112it [00:03, 29.24it/s] 115it [00:04, 28.77it/s] 118it [00:04, 29.09it/s] 121it [00:04, 29.21it/s] 124it [00:04, 29.24it/s] 127it [00:04, 29.05it/s] 131it [00:04, 28.89it/s] 135it [00:04, 29.68it/s] 138it [00:04, 29.02it/s] 142it [00:04, 29.41it/s] 145it [00:05, 29.19it/s] 149it [00:05, 29.53it/s] 152it [00:05, 29.32it/s] 156it [00:05, 29.29it/s] 160it [00:05, 29.64it/s] 163it [00:05, 29.37it/s] 167it [00:05, 29.39it/s] 171it [00:05, 29.92it/s] 174it [00:06, 29.36it/s] 178it [00:06, 29.63it/s] 181it [00:06, 29.35it/s] 185it [00:06, 29.34it/s] 189it [00:06, 29.39it/s] 193it [00:06, 29.99it/s] 196it [00:06, 29.32it/s] 200it [00:06, 29.56it/s] 203it [00:07, 29.33it/s] 206it [00:07, 29.34it/s] 210it [00:07, 29.67it/s] 213it [00:07, 29.40it/s] 217it [00:07, 29.60it/s] 220it [00:07, 29.35it/s] 224it [00:07, 29.94it/s] 227it [00:07, 29.32it/s] 231it [00:07, 29.35it/s] 235it [00:08, 29.86it/s] 238it [00:08, 29.29it/s] 242it [00:08, 29.88it/s] 245it [00:08, 29.23it/s] 249it [00:08, 29.95it/s] 252it [00:08, 29.29it/s] 256it [00:08, 29.22it/s] 260it [00:08, 29.55it/s] 264it [00:09, 29.71it/s] 267it [00:09, 29.16it/s] 271it [00:09, 29.51it/s] 275it [00:09, 29.72it/s] 278it [00:09, 29.74it/s] 280it [00:09, 28.90it/s] +2025-05-26 00:08:25,609 - INFO - Epoch: 1, Objective: 0.02253018133342266, Loss: 0.011764063499867916, KL/n: 0.010766117833554745 + 0it [00:00, ?it/s] 1it [00:00, 9.56it/s] 4it [00:00, 20.26it/s] 8it [00:00, 25.40it/s] 11it [00:00, 25.96it/s] 15it [00:00, 27.40it/s] 18it [00:00, 27.73it/s] 21it [00:00, 27.84it/s] 24it [00:00, 26.98it/s] 27it [00:01, 27.13it/s] 30it [00:01, 27.04it/s] 33it [00:01, 27.03it/s] 36it [00:01, 27.31it/s] 39it [00:01, 27.53it/s] 42it [00:01, 27.64it/s] 46it [00:01, 28.00it/s] 49it [00:01, 27.58it/s] 52it [00:01, 27.66it/s] 55it [00:02, 27.46it/s] 58it [00:02, 27.63it/s] 61it [00:02, 27.87it/s] 64it [00:02, 27.97it/s] 67it [00:02, 28.18it/s] 70it [00:02, 28.20it/s] 73it [00:02, 28.33it/s] 76it [00:02, 28.38it/s] 79it [00:02, 28.43it/s] 82it [00:02, 28.46it/s] 85it [00:03, 28.47it/s] 88it [00:03, 28.34it/s] 91it [00:03, 28.43it/s] 94it [00:03, 28.41it/s] 97it [00:03, 28.44it/s] 100it [00:03, 28.88it/s] 103it [00:03, 28.64it/s] 106it [00:03, 28.04it/s] 109it [00:03, 28.11it/s] 112it [00:04, 28.08it/s] 115it [00:04, 28.55it/s] 118it [00:04, 28.49it/s] 121it [00:04, 28.51it/s] 124it [00:04, 28.17it/s] 127it [00:04, 28.60it/s] 130it [00:04, 28.77it/s] 133it [00:04, 28.17it/s] 136it [00:04, 28.11it/s] 139it [00:05, 27.97it/s] 142it [00:05, 27.82it/s] 145it [00:05, 28.11it/s] 148it [00:05, 28.47it/s] 151it [00:05, 28.48it/s] 154it [00:05, 28.38it/s] 157it [00:05, 28.46it/s] 160it [00:05, 28.47it/s] 163it [00:05, 28.56it/s] 166it [00:05, 28.61it/s] 169it [00:06, 28.67it/s] 172it [00:06, 28.70it/s] 175it [00:06, 28.66it/s] 178it [00:06, 28.65it/s] 181it [00:06, 28.65it/s] 184it [00:06, 28.68it/s] 187it [00:06, 28.67it/s] 190it [00:06, 28.54it/s] 193it [00:06, 28.47it/s] 196it [00:07, 28.56it/s] 199it [00:07, 28.58it/s] 202it [00:07, 28.60it/s] 205it [00:07, 28.73it/s] 208it [00:07, 28.69it/s] 211it [00:07, 28.69it/s] 214it [00:07, 28.87it/s] 217it [00:07, 29.03it/s] 220it [00:07, 28.69it/s] 223it [00:07, 28.44it/s] 226it [00:08, 28.54it/s] 229it [00:08, 28.54it/s] 232it [00:08, 28.58it/s] 235it [00:08, 28.48it/s] 238it [00:08, 28.46it/s] 241it [00:08, 28.59it/s] 244it [00:08, 28.62it/s] 247it [00:08, 28.79it/s] 251it [00:08, 28.80it/s] 254it [00:09, 28.76it/s] 257it [00:09, 28.38it/s] 260it [00:09, 28.81it/s] 263it [00:09, 28.63it/s] 266it [00:09, 28.82it/s] 269it [00:09, 28.53it/s] 272it [00:09, 28.43it/s] 275it [00:09, 27.48it/s] 278it [00:09, 27.66it/s] 280it [00:10, 27.89it/s] +2025-05-26 00:08:36,009 - INFO - Epoch: 2, Objective: 0.0173969529569149, Loss: 0.010943357832729816, KL/n: 0.006453594658523798 + 0%| | 0/84 [00:00), Loss: 0.12093358486890793, KL/n: 71.92169952392578 + 0it [00:00, ?it/s]2025-05-26 00:50:25,022 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 13690.8154 | mean log_px -0.1453 | KL -3523.02 + 1it [00:00, 7.31it/s] 4it [00:00, 15.77it/s] 7it [00:00, 18.47it/s] 10it [00:00, 19.89it/s] 13it [00:00, 20.75it/s] 16it [00:00, 21.25it/s] 19it [00:00, 21.19it/s] 22it [00:01, 21.42it/s] 25it [00:01, 21.61it/s] 28it [00:01, 21.50it/s] 31it [00:01, 21.65it/s] 34it [00:01, 21.68it/s] 37it [00:01, 21.25it/s] 40it [00:01, 21.29it/s] 43it [00:02, 21.48it/s] 46it [00:02, 21.53it/s] 49it [00:02, 21.58it/s]2025-05-26 00:50:27,332 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 15761.3760 | mean log_px -0.1751 | KL -3505.56 + 52it [00:02, 21.65it/s] 55it [00:02, 21.75it/s] 58it [00:02, 21.78it/s] 61it [00:02, 21.86it/s] 64it [00:03, 21.94it/s] 67it [00:03, 22.00it/s] 70it [00:03, 22.02it/s] 73it [00:03, 21.97it/s] 76it [00:03, 22.00it/s] 79it [00:03, 21.99it/s] 82it [00:03, 21.93it/s] 85it [00:03, 21.97it/s] 88it [00:04, 21.96it/s] 91it [00:04, 22.03it/s] 94it [00:04, 21.72it/s] 97it [00:04, 21.74it/s] 100it [00:04, 21.60it/s]2025-05-26 00:50:29,617 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 8625.5391 | mean log_px -0.0734 | KL -3488.73 + 103it [00:04, 21.67it/s] 106it [00:04, 21.74it/s] 109it [00:05, 21.74it/s] 112it [00:05, 21.84it/s] 115it [00:05, 21.78it/s] 118it [00:05, 21.84it/s] 121it [00:05, 21.40it/s] 124it [00:05, 21.43it/s] 127it [00:05, 21.58it/s] 130it [00:06, 21.52it/s] 133it [00:06, 21.62it/s] 136it [00:06, 21.38it/s] 139it [00:06, 21.35it/s] 142it [00:06, 21.39it/s] 145it [00:06, 21.43it/s] 148it [00:06, 21.54it/s]2025-05-26 00:50:31,938 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 12978.5107 | mean log_px -0.1358 | KL -3474.39 + 151it [00:07, 21.46it/s] 154it [00:07, 21.24it/s] 157it [00:07, 21.31it/s] 160it [00:07, 21.33it/s] 163it [00:07, 21.33it/s] 166it [00:07, 21.30it/s] 169it [00:07, 21.31it/s] 172it [00:08, 21.51it/s] 175it [00:08, 21.52it/s] 178it [00:08, 21.70it/s] 181it [00:08, 21.74it/s] 184it [00:08, 21.72it/s] 187it [00:08, 21.68it/s] 190it [00:08, 21.75it/s] 193it [00:08, 21.82it/s] 196it [00:09, 21.19it/s] 196it [00:09, 21.28it/s] +2025-05-26 00:50:34,123 - INFO - Epoch: 1, Objective: tensor([7917.6831], device='cuda:0', grad_fn=), Loss: 0.06973542273044586, KL/n: 70.5917739868164 + 0it [00:00, ?it/s]2025-05-26 00:50:34,370 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 9796.9766 | mean log_px -0.0906 | KL -3455.17 + 1it [00:00, 6.75it/s] 4it [00:00, 15.06it/s] 7it [00:00, 18.01it/s] 10it [00:00, 19.46it/s] 13it [00:00, 20.41it/s] 16it [00:00, 20.91it/s] 19it [00:00, 21.35it/s] 22it [00:01, 21.21it/s] 25it [00:01, 20.93it/s] 28it [00:01, 21.27it/s] 31it [00:01, 21.63it/s] 34it [00:01, 21.76it/s] 37it [00:01, 21.89it/s] 40it [00:01, 22.00it/s] 43it [00:02, 21.88it/s] 46it [00:02, 21.95it/s] 49it [00:02, 21.57it/s]2025-05-26 00:50:36,674 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 10460.7930 | mean log_px -0.1003 | KL -3439.36 + 52it [00:02, 21.62it/s] 55it [00:02, 21.70it/s] 58it [00:02, 21.86it/s] 61it [00:02, 21.96it/s] 64it [00:03, 21.99it/s] 67it [00:03, 22.06it/s] 70it [00:03, 22.14it/s] 73it [00:03, 22.19it/s] 76it [00:03, 21.97it/s] 79it [00:03, 21.59it/s] 82it [00:03, 21.64it/s] 85it [00:04, 21.74it/s] 88it [00:04, 21.86it/s] 91it [00:04, 21.88it/s] 94it [00:04, 21.85it/s] 97it [00:04, 21.90it/s] 100it [00:04, 22.00it/s]2025-05-26 00:50:38,952 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 8140.4873 | mean log_px -0.0674 | KL -3422.42 + 103it [00:04, 22.03it/s] 106it [00:04, 21.77it/s] 109it [00:05, 21.93it/s] 112it [00:05, 21.99it/s] 115it [00:05, 21.82it/s] 118it [00:05, 21.45it/s] 121it [00:05, 21.63it/s] 124it [00:05, 21.62it/s] 127it [00:05, 21.32it/s] 130it [00:06, 21.55it/s] 133it [00:06, 21.71it/s] 136it [00:06, 21.92it/s] 139it [00:06, 21.87it/s] 142it [00:06, 21.94it/s] 145it [00:06, 22.07it/s] 148it [00:06, 21.83it/s]2025-05-26 00:50:41,252 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 7733.3540 | mean log_px -0.0618 | KL -3408.06 + 151it [00:07, 21.79it/s] 154it [00:07, 21.97it/s] 157it [00:07, 22.03it/s] 160it [00:07, 21.57it/s] 163it [00:07, 21.70it/s] 166it [00:07, 21.68it/s] 169it [00:07, 21.73it/s] 172it [00:07, 21.82it/s] 175it [00:08, 21.88it/s] 178it [00:08, 21.88it/s] 181it [00:08, 21.75it/s] 184it [00:08, 21.74it/s] 187it [00:08, 21.28it/s] 190it [00:08, 21.52it/s] 193it [00:08, 21.69it/s] 196it [00:09, 21.16it/s] 196it [00:09, 21.37it/s] +2025-05-26 00:50:43,418 - INFO - Epoch: 2, Objective: tensor([7370.5742], device='cuda:0', grad_fn=), Loss: 0.06012947857379913, KL/n: 69.19798278808594 + 0it [00:00, ?it/s]2025-05-26 00:50:43,792 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 5602.7324 | mean log_px -0.0317 | KL -3385.35 + 1it [00:00, 9.70it/s] 4it [00:00, 17.86it/s] 7it [00:00, 19.99it/s] 10it [00:00, 20.85it/s] 13it [00:00, 21.19it/s] 16it [00:00, 21.55it/s] 19it [00:00, 21.76it/s] 22it [00:01, 21.92it/s] 25it [00:01, 22.00it/s] 28it [00:01, 22.06it/s] 31it [00:01, 22.05it/s] 34it [00:01, 22.10it/s] 37it [00:01, 22.15it/s] 40it [00:01, 22.21it/s] 43it [00:01, 22.18it/s] 46it [00:02, 22.21it/s] 49it [00:02, 22.21it/s]2025-05-26 00:50:46,049 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 8468.1914 | mean log_px -0.0728 | KL -3369.91 + 52it [00:02, 22.18it/s] 55it [00:02, 22.19it/s] 58it [00:02, 22.23it/s] 61it [00:02, 22.17it/s] 64it [00:02, 22.18it/s] 67it [00:03, 22.26it/s] 70it [00:03, 22.30it/s] 73it [00:03, 22.32it/s] 76it [00:03, 22.28it/s] 79it [00:03, 22.34it/s] 82it [00:03, 22.33it/s] 85it [00:03, 22.36it/s] 88it [00:04, 22.35it/s] 91it [00:04, 22.33it/s] 94it [00:04, 22.31it/s] 97it [00:04, 22.28it/s] 100it [00:04, 22.31it/s]2025-05-26 00:50:48,292 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 5962.8643 | mean log_px -0.0373 | KL -3352.94 + 103it [00:04, 22.28it/s] 106it [00:04, 22.31it/s] 109it [00:04, 22.33it/s] 112it [00:05, 22.35it/s] 115it [00:05, 22.34it/s] 118it [00:05, 22.38it/s] 121it [00:05, 22.38it/s] 124it [00:05, 22.37it/s] 127it [00:05, 22.22it/s] 130it [00:05, 22.10it/s] 133it [00:06, 22.02it/s] 136it [00:06, 21.98it/s] 139it [00:06, 21.85it/s] 142it [00:06, 21.99it/s] 145it [00:06, 22.10it/s] 148it [00:06, 22.14it/s]2025-05-26 00:50:50,546 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 7306.3408 | mean log_px -0.0568 | KL -3329.74 + 151it [00:06, 22.19it/s] 154it [00:06, 22.25it/s] 157it [00:07, 22.29it/s] 160it [00:07, 22.33it/s] 163it [00:07, 22.31it/s] 166it [00:07, 22.32it/s] 169it [00:07, 22.19it/s] 172it [00:07, 22.74it/s] 175it [00:07, 23.02it/s] 178it [00:08, 23.23it/s] 181it [00:08, 23.36it/s] 184it [00:08, 23.47it/s] 187it [00:08, 23.59it/s] 190it [00:08, 23.64it/s] 193it [00:08, 23.63it/s] 196it [00:08, 22.79it/s] 196it [00:08, 22.07it/s] +2025-05-26 00:50:52,596 - INFO - Epoch: 3, Objective: tensor([7772.2793], device='cuda:0', grad_fn=), Loss: 0.0681769996881485, KL/n: 67.7220458984375 + 0it [00:00, ?it/s]2025-05-26 00:50:52,834 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 4399.7803 | mean log_px -0.0155 | KL -3312.68 + 1it [00:00, 7.53it/s] 4it [00:00, 16.72it/s] 7it [00:00, 19.72it/s] 10it [00:00, 21.13it/s] 13it [00:00, 21.98it/s] 16it [00:00, 22.46it/s] 19it [00:00, 22.68it/s] 22it [00:01, 22.94it/s] 25it [00:01, 23.06it/s] 28it [00:01, 23.13it/s] 31it [00:01, 23.23it/s] 34it [00:01, 23.28it/s] 37it [00:01, 23.33it/s] 40it [00:01, 23.40it/s] 43it [00:01, 23.44it/s] 46it [00:02, 23.48it/s] 49it [00:02, 23.44it/s]2025-05-26 00:50:54,975 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 5235.7969 | mean log_px -0.0277 | KL -3297.28 + 52it [00:02, 23.30it/s] 55it [00:02, 23.30it/s] 58it [00:02, 23.31it/s] 61it [00:02, 23.38it/s] 64it [00:02, 23.47it/s] 67it [00:02, 23.45it/s] 70it [00:03, 23.44it/s] 73it [00:03, 23.47it/s] 76it [00:03, 23.40it/s] 79it [00:03, 23.38it/s] 82it [00:03, 23.42it/s] 85it [00:03, 23.44it/s] 88it [00:03, 23.41it/s] 91it [00:03, 23.44it/s] 94it [00:04, 23.41it/s] 97it [00:04, 23.38it/s] 100it [00:04, 23.37it/s]2025-05-26 00:50:57,112 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 6412.3574 | mean log_px -0.0448 | KL -3279.16 + 103it [00:04, 23.33it/s] 106it [00:04, 23.43it/s] 109it [00:04, 23.43it/s] 112it [00:04, 23.37it/s] 115it [00:05, 23.34it/s] 118it [00:05, 23.41it/s] 121it [00:05, 23.32it/s] 124it [00:05, 23.43it/s] 127it [00:05, 23.51it/s] 130it [00:05, 23.21it/s] 133it [00:05, 22.84it/s] 136it [00:05, 22.58it/s] 139it [00:06, 22.46it/s] 142it [00:06, 22.37it/s] 145it [00:06, 22.28it/s] 148it [00:06, 22.28it/s]2025-05-26 00:50:59,301 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 6559.6768 | mean log_px -0.0472 | KL -3257.82 + 151it [00:06, 22.20it/s] 154it [00:06, 22.08it/s] 157it [00:06, 21.91it/s] 160it [00:07, 21.96it/s] 163it [00:07, 22.07it/s] 166it [00:07, 22.13it/s] 169it [00:07, 22.16it/s] 172it [00:07, 22.21it/s] 175it [00:07, 22.23it/s] 178it [00:07, 22.26it/s] 181it [00:07, 22.25it/s] 184it [00:08, 22.31it/s] 187it [00:08, 22.33it/s] 190it [00:08, 22.32it/s] 193it [00:08, 22.14it/s] 196it [00:08, 21.39it/s] 196it [00:08, 22.51it/s] +2025-05-26 00:51:01,429 - INFO - Epoch: 4, Objective: tensor([4521.8008], device='cuda:0', grad_fn=), Loss: 0.014925037510693073, KL/n: 66.19470977783203 + 0it [00:00, ?it/s]2025-05-26 00:51:01,839 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 4365.7705 | mean log_px -0.0160 | KL -3246.27 + 1it [00:00, 7.43it/s] 4it [00:00, 15.93it/s] 7it [00:00, 18.87it/s] 10it [00:00, 20.10it/s] 13it [00:00, 20.84it/s] 16it [00:00, 21.20it/s] 19it [00:00, 21.20it/s] 22it [00:01, 20.90it/s] 25it [00:01, 21.24it/s] 28it [00:01, 21.46it/s] 31it [00:01, 21.56it/s] 34it [00:01, 21.33it/s] 37it [00:01, 21.36it/s] 40it [00:01, 21.48it/s] 43it [00:02, 21.56it/s] 46it [00:02, 21.52it/s] 49it [00:02, 21.62it/s]2025-05-26 00:51:04,151 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 6463.9565 | mean log_px -0.0463 | KL -3222.36 + 52it [00:02, 21.74it/s] 55it [00:02, 21.86it/s] 58it [00:02, 21.95it/s] 61it [00:02, 22.01it/s] 64it [00:03, 22.04it/s] 67it [00:03, 22.00it/s] 70it [00:03, 21.72it/s] 73it [00:03, 21.60it/s] 76it [00:03, 21.65it/s] 79it [00:03, 21.83it/s] 82it [00:03, 21.55it/s] 85it [00:04, 21.68it/s] 88it [00:04, 21.84it/s] 91it [00:04, 21.96it/s] 94it [00:04, 22.07it/s] 97it [00:04, 22.17it/s] 100it [00:04, 22.04it/s]2025-05-26 00:51:06,432 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 5583.0811 | mean log_px -0.0340 | KL -3205.42 + 103it [00:04, 21.69it/s] 106it [00:04, 21.81it/s] 109it [00:05, 21.92it/s] 112it [00:05, 22.01it/s] 115it [00:05, 21.95it/s] 118it [00:05, 22.02it/s] 121it [00:05, 21.85it/s] 124it [00:05, 21.91it/s] 127it [00:05, 22.04it/s] 130it [00:06, 21.96it/s] 133it [00:06, 22.03it/s] 136it [00:06, 21.85it/s] 139it [00:06, 21.86it/s] 142it [00:06, 22.02it/s] 145it [00:06, 21.95it/s] 148it [00:06, 22.05it/s]2025-05-26 00:51:08,713 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 4417.1646 | mean log_px -0.0177 | KL -3177.87 + 151it [00:07, 21.94it/s] 154it [00:07, 21.96it/s] 157it [00:07, 22.05it/s] 160it [00:07, 22.11it/s] 163it [00:07, 22.15it/s] 166it [00:07, 21.91it/s] 169it [00:07, 21.81it/s] 172it [00:07, 21.62it/s] 175it [00:08, 21.67it/s] 178it [00:08, 21.72it/s] 181it [00:08, 21.64it/s] 184it [00:08, 21.72it/s] 187it [00:08, 21.92it/s] 190it [00:08, 22.04it/s] 193it [00:08, 22.12it/s] 196it [00:09, 21.24it/s] 196it [00:09, 21.44it/s] +2025-05-26 00:51:10,873 - INFO - Epoch: 5, Objective: tensor([4335.2500], device='cuda:0', grad_fn=), Loss: 0.015179956331849098, KL/n: 64.59697723388672 + 0it [00:00, ?it/s]2025-05-26 00:51:11,115 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 7553.4102 | mean log_px -0.0627 | KL -3165.42 + 1it [00:00, 7.11it/s] 4it [00:00, 15.69it/s] 7it [00:00, 18.66it/s] 10it [00:00, 20.12it/s] 13it [00:00, 20.77it/s] 16it [00:00, 20.82it/s] 19it [00:00, 20.83it/s] 22it [00:01, 21.17it/s] 25it [00:01, 21.52it/s] 28it [00:01, 21.64it/s] 31it [00:01, 21.17it/s] 34it [00:01, 21.42it/s] 37it [00:01, 21.68it/s] 40it [00:01, 21.70it/s] 43it [00:02, 21.88it/s] 46it [00:02, 21.81it/s] 49it [00:02, 21.90it/s]2025-05-26 00:51:13,416 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 6326.8926 | mean log_px -0.0454 | KL -3147.69 + 52it [00:02, 21.96it/s] 55it [00:02, 21.79it/s] 58it [00:02, 21.91it/s] 61it [00:02, 22.04it/s] 64it [00:03, 22.11it/s] 67it [00:03, 22.08it/s] 70it [00:03, 21.99it/s] 73it [00:03, 21.95it/s] 76it [00:03, 21.64it/s] 79it [00:03, 21.64it/s] 82it [00:03, 21.81it/s] 85it [00:03, 21.71it/s] 88it [00:04, 21.85it/s] 91it [00:04, 21.90it/s] 94it [00:04, 21.97it/s] 97it [00:04, 22.07it/s] 100it [00:04, 22.16it/s]2025-05-26 00:51:15,694 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 5364.2666 | mean log_px -0.0320 | KL -3122.95 + 103it [00:04, 22.20it/s] 106it [00:04, 22.23it/s] 109it [00:05, 22.02it/s] 112it [00:05, 22.09it/s] 115it [00:05, 21.89it/s] 118it [00:05, 22.01it/s] 121it [00:05, 21.97it/s] 124it [00:05, 22.05it/s] 127it [00:05, 22.13it/s] 130it [00:06, 22.18it/s] 133it [00:06, 22.23it/s] 136it [00:06, 22.15it/s] 139it [00:06, 22.19it/s] 142it [00:06, 22.26it/s] 145it [00:06, 22.02it/s] 148it [00:06, 21.98it/s]2025-05-26 00:51:17,958 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 4960.6333 | mean log_px -0.0265 | KL -3102.87 + 151it [00:06, 22.05it/s] 154it [00:07, 22.12it/s] 157it [00:07, 22.18it/s] 160it [00:07, 22.25it/s] 163it [00:07, 22.19it/s] 166it [00:07, 22.07it/s] 169it [00:07, 22.14it/s] 172it [00:07, 22.18it/s] 175it [00:08, 22.21it/s] 178it [00:08, 21.91it/s] 181it [00:08, 21.90it/s] 184it [00:08, 21.97it/s] 187it [00:08, 22.01it/s] 190it [00:08, 21.92it/s] 193it [00:08, 22.01it/s] 196it [00:09, 21.22it/s] 196it [00:09, 21.55it/s] +2025-05-26 00:51:20,096 - INFO - Epoch: 6, Objective: tensor([4002.5366], device='cuda:0', grad_fn=), Loss: 0.014043943025171757, KL/n: 63.04303741455078 + 0it [00:00, ?it/s]2025-05-26 00:51:20,508 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 4168.6924 | mean log_px -0.0154 | KL -3089.99 + 1it [00:00, 7.75it/s] 4it [00:00, 15.96it/s] 7it [00:00, 18.73it/s] 10it [00:00, 20.06it/s] 13it [00:00, 20.88it/s] 16it [00:00, 21.40it/s] 19it [00:00, 21.75it/s] 22it [00:01, 21.96it/s] 25it [00:01, 22.12it/s] 28it [00:01, 22.18it/s] 31it [00:01, 22.22it/s] 34it [00:01, 22.28it/s] 37it [00:01, 22.25it/s] 40it [00:01, 22.29it/s] 43it [00:02, 22.27it/s] 46it [00:02, 22.29it/s] 49it [00:02, 22.31it/s]2025-05-26 00:51:22,763 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 5024.4258 | mean log_px -0.0279 | KL -3069.91 + 52it [00:02, 22.22it/s] 55it [00:02, 22.21it/s] 58it [00:02, 22.23it/s] 61it [00:02, 22.28it/s] 64it [00:02, 22.30it/s] 67it [00:03, 22.33it/s] 70it [00:03, 22.30it/s] 73it [00:03, 22.28it/s] 76it [00:03, 22.28it/s] 79it [00:03, 22.03it/s] 82it [00:03, 22.02it/s] 85it [00:03, 22.08it/s] 88it [00:04, 22.10it/s] 91it [00:04, 22.12it/s] 94it [00:04, 22.08it/s] 97it [00:04, 22.07it/s] 100it [00:04, 22.11it/s]2025-05-26 00:51:25,020 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 7533.5576 | mean log_px -0.0640 | KL -3050.10 + 103it [00:04, 22.12it/s] 106it [00:04, 22.08it/s] 109it [00:04, 22.13it/s] 112it [00:05, 22.15it/s] 115it [00:05, 22.16it/s] 118it [00:05, 22.17it/s] 121it [00:05, 22.21it/s] 124it [00:05, 22.23it/s] 127it [00:05, 22.22it/s] 130it [00:05, 22.15it/s] 133it [00:06, 22.17it/s] 136it [00:06, 22.20it/s] 139it [00:06, 22.16it/s] 142it [00:06, 22.18it/s] 145it [00:06, 22.18it/s] 148it [00:06, 22.16it/s]2025-05-26 00:51:27,274 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 3631.8569 | mean log_px -0.0086 | KL -3031.87 + 151it [00:06, 22.17it/s] 154it [00:07, 22.14it/s] 157it [00:07, 22.17it/s] 160it [00:07, 22.18it/s] 163it [00:07, 22.20it/s] 166it [00:07, 22.13it/s] 169it [00:07, 22.14it/s] 172it [00:07, 22.14it/s] 175it [00:07, 22.17it/s] 178it [00:08, 22.23it/s] 181it [00:08, 22.24it/s] 184it [00:08, 22.23it/s] 187it [00:08, 22.18it/s] 190it [00:08, 22.12it/s] 193it [00:08, 22.14it/s] 196it [00:08, 21.38it/s] 196it [00:09, 21.77it/s] +2025-05-26 00:51:29,412 - INFO - Epoch: 7, Objective: tensor([4562.2344], device='cuda:0', grad_fn=), Loss: 0.01897793635725975, KL/n: 61.56135559082031 + 0it [00:00, ?it/s]2025-05-26 00:51:29,650 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 4630.2363 | mean log_px -0.0231 | KL -3012.64 + 1it [00:00, 7.36it/s] 4it [00:00, 16.10it/s] 7it [00:00, 19.00it/s] 10it [00:00, 20.34it/s] 13it [00:00, 21.07it/s] 16it [00:00, 21.52it/s] 19it [00:00, 21.84it/s] 22it [00:01, 22.04it/s] 25it [00:01, 22.11it/s] 28it [00:01, 22.16it/s] 31it [00:01, 22.22it/s] 34it [00:01, 22.23it/s] 37it [00:01, 22.28it/s] 40it [00:01, 22.34it/s] 43it [00:02, 22.39it/s] 46it [00:02, 22.39it/s] 49it [00:02, 22.38it/s]2025-05-26 00:51:31,888 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 5133.2124 | mean log_px -0.0305 | KL -3000.24 + 52it [00:02, 22.31it/s] 55it [00:02, 22.38it/s] 58it [00:02, 22.41it/s] 61it [00:02, 22.35it/s] 64it [00:02, 22.39it/s] 67it [00:03, 22.36it/s] 70it [00:03, 22.37it/s] 73it [00:03, 22.37it/s] 76it [00:03, 22.27it/s] 79it [00:03, 22.28it/s] 82it [00:03, 22.25it/s] 85it [00:03, 22.25it/s] 88it [00:04, 22.23it/s] 91it [00:04, 22.23it/s] 94it [00:04, 22.25it/s] 97it [00:04, 22.23it/s] 100it [00:04, 22.32it/s]2025-05-26 00:51:34,132 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 4019.6748 | mean log_px -0.0149 | KL -2976.74 + 103it [00:04, 21.90it/s] 106it [00:04, 21.72it/s] 109it [00:04, 21.70it/s] 112it [00:05, 21.74it/s] 115it [00:05, 21.78it/s] 118it [00:05, 21.81it/s] 121it [00:05, 21.81it/s] 124it [00:05, 21.70it/s] 127it [00:05, 21.76it/s] 130it [00:05, 21.82it/s] 133it [00:06, 21.86it/s] 136it [00:06, 22.09it/s] 139it [00:06, 21.98it/s] 142it [00:06, 22.11it/s] 145it [00:06, 22.22it/s] 148it [00:06, 22.30it/s]2025-05-26 00:51:36,412 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 4051.5142 | mean log_px -0.0157 | KL -2953.42 + 151it [00:06, 22.27it/s] 154it [00:07, 22.30it/s] 157it [00:07, 22.35it/s] 160it [00:07, 22.34it/s] 163it [00:07, 22.38it/s] 166it [00:07, 22.41it/s] 169it [00:07, 22.39it/s] 172it [00:07, 22.40it/s] 175it [00:07, 22.42it/s] 178it [00:08, 22.43it/s] 181it [00:08, 22.42it/s] 184it [00:08, 22.47it/s] 187it [00:08, 22.47it/s] 190it [00:08, 22.49it/s] 193it [00:08, 22.46it/s] 196it [00:08, 21.61it/s] 196it [00:08, 21.84it/s] +2025-05-26 00:51:38,513 - INFO - Epoch: 8, Objective: tensor([5165.6943], device='cuda:0', grad_fn=), Loss: 0.03255581110715866, KL/n: 59.97182083129883 + 0it [00:00, ?it/s]2025-05-26 00:51:38,929 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 4720.2944 | mean log_px -0.0254 | KL -2938.85 + 1it [00:00, 7.23it/s] 4it [00:00, 15.73it/s] 7it [00:00, 18.58it/s] 10it [00:00, 19.66it/s] 13it [00:00, 20.02it/s] 16it [00:00, 20.65it/s] 19it [00:00, 20.98it/s] 22it [00:01, 21.28it/s] 25it [00:01, 21.47it/s] 28it [00:01, 21.29it/s] 31it [00:01, 21.13it/s] 34it [00:01, 21.05it/s] 37it [00:01, 20.93it/s] 40it [00:01, 20.99it/s] 43it [00:02, 21.04it/s] 46it [00:02, 21.17it/s] 49it [00:02, 21.41it/s]2025-05-26 00:51:41,274 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 4931.5698 | mean log_px -0.0289 | KL -2910.87 + 52it [00:02, 21.44it/s] 55it [00:02, 21.58it/s] 58it [00:02, 21.70it/s] 61it [00:02, 21.83it/s] 64it [00:03, 21.77it/s] 67it [00:03, 21.42it/s] 70it [00:03, 21.44it/s] 73it [00:03, 21.62it/s] 76it [00:03, 21.62it/s] 79it [00:03, 21.72it/s] 82it [00:03, 21.77it/s] 85it [00:04, 21.64it/s] 88it [00:04, 21.63it/s] 91it [00:04, 21.32it/s] 94it [00:04, 21.24it/s] 97it [00:04, 21.39it/s] 100it [00:04, 21.55it/s]2025-05-26 00:51:43,591 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 3226.4368 | mean log_px -0.0049 | KL -2883.32 + 103it [00:04, 21.41it/s] 106it [00:05, 21.58it/s] 109it [00:05, 21.63it/s] 112it [00:05, 21.17it/s] 115it [00:05, 21.14it/s] 118it [00:05, 21.12it/s] 121it [00:05, 21.34it/s] 124it [00:05, 21.20it/s] 127it [00:06, 21.28it/s] 130it [00:06, 21.05it/s] 133it [00:06, 21.25it/s] 136it [00:06, 21.51it/s] 139it [00:06, 21.35it/s] 142it [00:06, 21.34it/s] 145it [00:06, 20.86it/s] 148it [00:07, 21.13it/s]2025-05-26 00:51:45,945 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 4148.7690 | mean log_px -0.0183 | KL -2865.70 + 151it [00:07, 21.33it/s] 154it [00:07, 21.46it/s] 157it [00:07, 21.60it/s] 160it [00:07, 21.70it/s] 163it [00:07, 21.68it/s] 166it [00:07, 21.73it/s] 169it [00:07, 21.86it/s] 172it [00:08, 21.88it/s] 175it [00:08, 21.58it/s] 178it [00:08, 21.42it/s] 181it [00:08, 21.41it/s] 184it [00:08, 21.26it/s] 187it [00:08, 21.04it/s] 190it [00:08, 21.29it/s] 193it [00:09, 21.17it/s] 196it [00:09, 20.34it/s] 196it [00:09, 21.00it/s] +2025-05-26 00:51:48,151 - INFO - Epoch: 9, Objective: tensor([6045.8955], device='cuda:0', grad_fn=), Loss: 0.04524506628513336, KL/n: 58.223628997802734 + 0it [00:00, ?it/s]2025-05-26 00:51:48,386 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 4079.0732 | mean log_px -0.0176 | KL -2849.20 + 1it [00:00, 7.58it/s] 4it [00:00, 15.99it/s] 7it [00:00, 18.75it/s] 10it [00:00, 19.73it/s] 13it [00:00, 20.03it/s] 16it [00:00, 20.40it/s] 19it [00:00, 20.76it/s] 22it [00:01, 21.00it/s] 25it [00:01, 21.06it/s] 28it [00:01, 21.12it/s] 31it [00:01, 21.24it/s] 34it [00:01, 21.31it/s] 37it [00:01, 21.22it/s] 40it [00:01, 21.40it/s] 43it [00:02, 21.60it/s] 46it [00:02, 21.45it/s] 49it [00:02, 21.53it/s]2025-05-26 00:51:50,722 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 3398.4265 | mean log_px -0.0081 | KL -2830.84 + 52it [00:02, 21.61it/s] 55it [00:02, 21.67it/s] 58it [00:02, 21.76it/s] 61it [00:02, 21.65it/s] 64it [00:03, 21.49it/s] 67it [00:03, 21.52it/s] 70it [00:03, 21.63it/s] 73it [00:03, 21.66it/s] 76it [00:03, 21.75it/s] 79it [00:03, 21.81it/s] 82it [00:03, 21.84it/s] 85it [00:04, 21.90it/s] 88it [00:04, 21.93it/s] 91it [00:04, 21.96it/s] 94it [00:04, 21.91it/s] 97it [00:04, 21.93it/s] 100it [00:04, 22.02it/s]2025-05-26 00:51:53,013 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 4126.5190 | mean log_px -0.0187 | KL -2819.67 + 103it [00:04, 21.93it/s] 106it [00:04, 21.98it/s] 109it [00:05, 21.92it/s] 112it [00:05, 21.91it/s] 115it [00:05, 21.94it/s] 118it [00:05, 22.02it/s] 121it [00:05, 22.04it/s] 124it [00:05, 22.09it/s] 127it [00:05, 22.09it/s] 130it [00:06, 22.07it/s] 133it [00:06, 22.02it/s] 136it [00:06, 22.03it/s] 139it [00:06, 22.06it/s] 142it [00:06, 22.05it/s] 145it [00:06, 22.09it/s] 148it [00:06, 22.11it/s]2025-05-26 00:51:55,282 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 3436.2886 | mean log_px -0.0092 | KL -2791.42 + 151it [00:07, 22.04it/s] 154it [00:07, 22.03it/s] 157it [00:07, 22.07it/s] 160it [00:07, 22.06it/s] 163it [00:07, 22.07it/s] 166it [00:07, 22.03it/s] 169it [00:07, 21.82it/s] 172it [00:07, 21.90it/s] 175it [00:08, 21.90it/s] 178it [00:08, 21.91it/s] 181it [00:08, 21.82it/s] 184it [00:08, 21.89it/s] 187it [00:08, 21.87it/s] 190it [00:08, 21.88it/s] 193it [00:08, 21.91it/s] 196it [00:09, 20.96it/s] 196it [00:09, 21.40it/s] +2025-05-26 00:51:57,440 - INFO - Epoch: 10, Objective: tensor([3808.8560], device='cuda:0', grad_fn=), Loss: 0.012912021018564701, KL/n: 56.78377914428711 + 0it [00:00, ?it/s]2025-05-26 00:51:57,847 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 3735.8105 | mean log_px -0.0137 | KL -2778.63 + 1it [00:00, 7.34it/s] 4it [00:00, 15.79it/s] 7it [00:00, 18.41it/s] 10it [00:00, 19.28it/s] 13it [00:00, 19.40it/s] 16it [00:00, 19.74it/s] 19it [00:01, 20.18it/s] 22it [00:01, 20.54it/s] 25it [00:01, 20.99it/s] 28it [00:01, 21.33it/s] 31it [00:01, 21.24it/s] 34it [00:01, 21.32it/s] 37it [00:01, 21.08it/s] 40it [00:01, 21.37it/s] 43it [00:02, 21.49it/s] 46it [00:02, 21.60it/s] 49it [00:02, 21.61it/s]2025-05-26 00:52:00,199 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 3468.8289 | mean log_px -0.0101 | KL -2763.26 + 52it [00:02, 21.42it/s] 55it [00:02, 21.42it/s] 58it [00:02, 21.59it/s] 61it [00:02, 21.74it/s] 64it [00:03, 21.65it/s] 67it [00:03, 21.71it/s] 70it [00:03, 21.83it/s] 73it [00:03, 21.75it/s] 76it [00:03, 21.42it/s] 79it [00:03, 21.54it/s] 82it [00:03, 21.27it/s] 85it [00:04, 21.30it/s] 88it [00:04, 21.49it/s] 91it [00:04, 21.61it/s] 94it [00:04, 21.59it/s] 97it [00:04, 21.35it/s] 100it [00:04, 21.45it/s]2025-05-26 00:52:02,526 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 3982.6140 | mean log_px -0.0177 | KL -2743.38 + 103it [00:04, 21.38it/s] 106it [00:05, 21.53it/s] 109it [00:05, 21.33it/s] 112it [00:05, 21.26it/s] 115it [00:05, 21.37it/s] 118it [00:05, 21.35it/s] 121it [00:05, 21.29it/s] 124it [00:05, 21.38it/s] 127it [00:06, 21.41it/s] 130it [00:06, 21.51it/s] 133it [00:06, 21.48it/s] 136it [00:06, 21.58it/s] 139it [00:06, 21.49it/s] 142it [00:06, 21.20it/s] 145it [00:06, 21.26it/s] 148it [00:07, 21.33it/s]2025-05-26 00:52:04,864 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 3325.7747 | mean log_px -0.0087 | KL -2718.81 + 151it [00:07, 21.32it/s] 154it [00:07, 21.30it/s] 157it [00:07, 21.37it/s] 160it [00:07, 21.35it/s] 163it [00:07, 21.37it/s] 166it [00:07, 21.16it/s] 169it [00:08, 20.89it/s] 172it [00:08, 20.96it/s] 175it [00:08, 20.59it/s] 178it [00:08, 20.83it/s] 181it [00:08, 21.04it/s] 184it [00:08, 21.17it/s] 187it [00:08, 21.21it/s] 190it [00:09, 20.97it/s] 193it [00:09, 20.67it/s] 196it [00:09, 19.59it/s] 196it [00:09, 20.86it/s] +2025-05-26 00:52:07,133 - INFO - Epoch: 11, Objective: tensor([2998.2891], device='cuda:0', grad_fn=), Loss: 0.004003533162176609, KL/n: 55.1986083984375 + 0it [00:00, ?it/s]2025-05-26 00:52:07,374 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 2995.9968 | mean log_px -0.0042 | KL -2700.89 + 1it [00:00, 7.00it/s] 4it [00:00, 15.15it/s] 7it [00:00, 17.86it/s] 10it [00:00, 19.44it/s] 13it [00:00, 20.01it/s] 16it [00:00, 20.50it/s] 19it [00:00, 20.96it/s] 22it [00:01, 20.77it/s] 25it [00:01, 20.92it/s] 28it [00:01, 21.06it/s] 31it [00:01, 21.01it/s] 34it [00:01, 21.10it/s] 37it [00:01, 21.37it/s] 40it [00:01, 21.56it/s] 43it [00:02, 21.63it/s] 46it [00:02, 21.74it/s] 49it [00:02, 21.80it/s]2025-05-26 00:52:09,709 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 4000.0366 | mean log_px -0.0189 | KL -2676.46 + 52it [00:02, 21.81it/s] 55it [00:02, 21.81it/s] 58it [00:02, 21.53it/s] 61it [00:02, 21.58it/s] 64it [00:03, 21.48it/s] 67it [00:03, 21.59it/s] 70it [00:03, 21.06it/s] 73it [00:03, 21.32it/s] 76it [00:03, 21.15it/s] 79it [00:03, 21.00it/s] 82it [00:03, 20.94it/s] 85it [00:04, 21.03it/s] 88it [00:04, 21.30it/s] 91it [00:04, 21.35it/s] 94it [00:04, 21.54it/s] 97it [00:04, 21.51it/s] 100it [00:04, 21.10it/s]2025-05-26 00:52:12,063 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 3031.4114 | mean log_px -0.0053 | KL -2658.19 + 103it [00:04, 21.33it/s] 106it [00:05, 21.04it/s] 109it [00:05, 21.29it/s] 112it [00:05, 21.21it/s] 115it [00:05, 21.22it/s] 118it [00:05, 20.80it/s] 121it [00:05, 20.97it/s] 124it [00:05, 21.19it/s] 127it [00:06, 21.23it/s] 130it [00:06, 20.90it/s] 133it [00:06, 20.92it/s] 136it [00:06, 21.16it/s] 139it [00:06, 21.41it/s] 142it [00:06, 21.52it/s] 145it [00:06, 21.30it/s] 148it [00:07, 21.39it/s]2025-05-26 00:52:14,424 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 2994.6003 | mean log_px -0.0050 | KL -2644.78 + 151it [00:07, 21.05it/s] 154it [00:07, 20.82it/s] 157it [00:07, 21.06it/s] 160it [00:07, 21.16it/s] 163it [00:07, 21.34it/s] 166it [00:07, 21.55it/s] 169it [00:08, 21.17it/s] 172it [00:08, 21.17it/s] 175it [00:08, 20.88it/s] 178it [00:08, 20.78it/s] 181it [00:08, 20.78it/s] 184it [00:08, 20.52it/s] 187it [00:08, 20.62it/s] 190it [00:09, 21.00it/s] 193it [00:09, 21.27it/s] 196it [00:09, 20.49it/s] 196it [00:09, 20.84it/s] +2025-05-26 00:52:16,664 - INFO - Epoch: 12, Objective: tensor([3960.7383], device='cuda:0', grad_fn=), Loss: 0.01998310349881649, KL/n: 53.71847915649414 + 0it [00:00, ?it/s]2025-05-26 00:52:17,067 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 3197.8167 | mean log_px -0.0081 | KL -2630.15 + 1it [00:00, 7.56it/s] 4it [00:00, 15.99it/s] 7it [00:00, 18.72it/s] 10it [00:00, 20.06it/s] 13it [00:00, 20.77it/s] 16it [00:00, 21.17it/s] 19it [00:00, 21.44it/s] 22it [00:01, 21.62it/s] 25it [00:01, 21.78it/s] 28it [00:01, 21.91it/s] 31it [00:01, 21.96it/s] 34it [00:01, 21.99it/s] 37it [00:01, 21.90it/s] 40it [00:01, 21.95it/s] 43it [00:02, 21.99it/s] 46it [00:02, 21.91it/s] 49it [00:02, 21.97it/s]2025-05-26 00:52:19,344 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 2726.6543 | mean log_px -0.0018 | KL -2601.42 + 52it [00:02, 21.91it/s] 55it [00:02, 21.93it/s] 58it [00:02, 21.80it/s] 61it [00:02, 21.82it/s] 64it [00:03, 21.82it/s] 67it [00:03, 21.83it/s] 70it [00:03, 21.85it/s] 73it [00:03, 21.87it/s] 76it [00:03, 21.74it/s] 79it [00:03, 21.68it/s] 82it [00:03, 21.70it/s] 85it [00:03, 21.67it/s] 88it [00:04, 21.73it/s] 91it [00:04, 21.65it/s] 94it [00:04, 21.62it/s] 97it [00:04, 21.62it/s] 100it [00:04, 21.69it/s]2025-05-26 00:52:21,646 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 3399.8081 | mean log_px -0.0117 | KL -2581.37 + 103it [00:04, 21.76it/s] 106it [00:04, 21.77it/s] 109it [00:05, 21.82it/s] 112it [00:05, 21.87it/s] 115it [00:05, 21.93it/s] 118it [00:05, 21.95it/s] 121it [00:05, 21.91it/s] 124it [00:05, 21.88it/s] 127it [00:05, 21.92it/s] 130it [00:06, 21.92it/s] 133it [00:06, 21.94it/s] 136it [00:06, 21.89it/s] 139it [00:06, 21.88it/s] 142it [00:06, 21.91it/s] 145it [00:06, 21.94it/s] 148it [00:06, 21.95it/s]2025-05-26 00:52:23,925 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 3674.1050 | mean log_px -0.0158 | KL -2566.51 + 151it [00:06, 21.93it/s] 154it [00:07, 21.95it/s] 157it [00:07, 22.01it/s] 160it [00:07, 21.99it/s] 163it [00:07, 21.98it/s] 166it [00:07, 21.96it/s] 169it [00:07, 21.97it/s] 172it [00:07, 21.96it/s] 175it [00:08, 21.97it/s] 178it [00:08, 21.98it/s] 181it [00:08, 21.91it/s] 184it [00:08, 21.95it/s] 187it [00:08, 21.92it/s] 190it [00:08, 21.94it/s] 193it [00:08, 21.96it/s] 196it [00:09, 20.83it/s] 196it [00:09, 21.47it/s] +2025-05-26 00:52:26,089 - INFO - Epoch: 13, Objective: tensor([2922.7834], device='cuda:0', grad_fn=), Loss: 0.0051163192838430405, KL/n: 52.190059661865234 + 0it [00:00, ?it/s]2025-05-26 00:52:26,321 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 3112.4670 | mean log_px -0.0079 | KL -2556.17 + 1it [00:00, 7.72it/s] 4it [00:00, 16.07it/s] 7it [00:00, 18.77it/s] 10it [00:00, 19.71it/s] 13it [00:00, 20.52it/s] 16it [00:00, 21.04it/s] 19it [00:00, 21.34it/s] 22it [00:01, 21.57it/s] 25it [00:01, 21.70it/s] 28it [00:01, 21.81it/s] 31it [00:01, 21.90it/s] 34it [00:01, 21.93it/s] 37it [00:01, 21.92it/s] 40it [00:01, 21.89it/s] 43it [00:02, 21.77it/s] 46it [00:02, 21.64it/s] 49it [00:02, 21.73it/s]2025-05-26 00:52:28,614 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 3027.8662 | mean log_px -0.0070 | KL -2534.50 + 52it [00:02, 21.77it/s] 55it [00:02, 21.68it/s] 58it [00:02, 21.76it/s] 61it [00:02, 21.80it/s] 64it [00:03, 21.74it/s] 67it [00:03, 21.78it/s] 70it [00:03, 21.82it/s] 73it [00:03, 21.78it/s] 76it [00:03, 21.73it/s] 79it [00:03, 21.83it/s] 82it [00:03, 21.90it/s] 85it [00:03, 22.01it/s] 88it [00:04, 22.07it/s] 91it [00:04, 22.14it/s] 94it [00:04, 22.17it/s] 97it [00:04, 22.05it/s] 100it [00:04, 22.11it/s]2025-05-26 00:52:30,893 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 2848.7947 | mean log_px -0.0048 | KL -2512.65 + 103it [00:04, 22.14it/s] 106it [00:04, 22.20it/s] 109it [00:05, 22.26it/s] 112it [00:05, 22.25it/s] 115it [00:05, 22.29it/s] 118it [00:05, 22.33it/s] 121it [00:05, 22.29it/s] 124it [00:05, 22.28it/s] 127it [00:05, 22.29it/s] 130it [00:05, 22.31it/s] 133it [00:06, 22.30it/s] 136it [00:06, 22.28it/s] 139it [00:06, 22.28it/s] 142it [00:06, 22.29it/s] 145it [00:06, 22.05it/s] 148it [00:06, 22.08it/s]2025-05-26 00:52:33,143 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 3240.1421 | mean log_px -0.0107 | KL -2489.80 + 151it [00:06, 21.94it/s] 154it [00:07, 21.67it/s] 157it [00:07, 21.77it/s] 160it [00:07, 21.96it/s] 163it [00:07, 22.01it/s] 166it [00:07, 22.11it/s] 169it [00:07, 22.17it/s] 172it [00:07, 22.21it/s] 175it [00:08, 22.26it/s] 178it [00:08, 22.23it/s] 181it [00:08, 22.19it/s] 184it [00:08, 22.16it/s] 187it [00:08, 22.15it/s] 190it [00:08, 22.19it/s] 193it [00:08, 22.20it/s] 196it [00:09, 21.17it/s] 196it [00:09, 21.62it/s] +2025-05-26 00:52:35,282 - INFO - Epoch: 14, Objective: tensor([3565.1533], device='cuda:0', grad_fn=), Loss: 0.01591213047504425, KL/n: 50.55557632446289 + 0it [00:00, ?it/s]2025-05-26 00:52:35,687 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 3555.1313 | mean log_px -0.0154 | KL -2474.84 + 1it [00:00, 7.60it/s] 4it [00:00, 16.21it/s] 7it [00:00, 18.85it/s] 10it [00:00, 20.11it/s] 13it [00:00, 20.85it/s] 16it [00:00, 21.04it/s] 19it [00:00, 21.20it/s] 22it [00:01, 21.37it/s] 25it [00:01, 21.40it/s] 28it [00:01, 21.30it/s] 31it [00:01, 21.02it/s] 34it [00:01, 21.24it/s] 37it [00:01, 21.48it/s] 40it [00:01, 21.65it/s] 43it [00:02, 21.78it/s] 46it [00:02, 21.88it/s] 49it [00:02, 21.93it/s]2025-05-26 00:52:37,988 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 2982.5161 | mean log_px -0.0075 | KL -2454.98 + 52it [00:02, 21.96it/s] 55it [00:02, 21.95it/s] 58it [00:02, 21.98it/s] 61it [00:02, 21.96it/s] 64it [00:03, 21.97it/s] 67it [00:03, 21.97it/s] 70it [00:03, 21.97it/s] 73it [00:03, 22.01it/s] 76it [00:03, 22.02it/s] 79it [00:03, 21.99it/s] 82it [00:03, 22.01it/s] 85it [00:03, 21.87it/s] 88it [00:04, 21.88it/s] 91it [00:04, 21.88it/s] 94it [00:04, 21.96it/s] 97it [00:04, 21.99it/s] 100it [00:04, 22.03it/s]2025-05-26 00:52:40,264 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 3035.9165 | mean log_px -0.0087 | KL -2423.99 + 103it [00:04, 18.72it/s] 106it [00:05, 19.55it/s] 109it [00:05, 20.23it/s] 112it [00:05, 20.73it/s] 115it [00:05, 21.12it/s] 118it [00:05, 21.39it/s] 121it [00:05, 21.61it/s] 124it [00:05, 21.79it/s] 127it [00:05, 21.83it/s] 130it [00:06, 21.91it/s] 133it [00:06, 21.77it/s] 136it [00:06, 21.86it/s] 139it [00:06, 21.92it/s] 142it [00:06, 21.93it/s] 145it [00:06, 21.84it/s] 148it [00:06, 21.90it/s]2025-05-26 00:52:42,620 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 4138.2979 | mean log_px -0.0247 | KL -2406.70 + 151it [00:07, 21.90it/s] 154it [00:07, 21.95it/s] 157it [00:07, 21.86it/s] 160it [00:07, 21.84it/s] 163it [00:07, 21.96it/s] 166it [00:07, 22.00it/s] 169it [00:07, 22.04it/s] 172it [00:08, 22.07it/s] 175it [00:08, 22.08it/s] 178it [00:08, 22.02it/s] 181it [00:08, 21.96it/s] 184it [00:08, 21.97it/s] 187it [00:08, 21.78it/s] 190it [00:08, 21.83it/s] 193it [00:08, 21.94it/s] 196it [00:09, 21.25it/s] 196it [00:09, 21.32it/s] +2025-05-26 00:52:44,775 - INFO - Epoch: 15, Objective: tensor([4852.7734], device='cuda:0', grad_fn=), Loss: 0.029993919655680656, KL/n: 49.00598907470703 + 0it [00:00, ?it/s]2025-05-26 00:52:45,194 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 4055.9983 | mean log_px -0.0237 | KL -2396.10 + 1it [00:00, 7.46it/s] 4it [00:00, 16.12it/s] 7it [00:00, 18.82it/s] 10it [00:00, 20.12it/s] 13it [00:00, 20.84it/s] 16it [00:00, 21.23it/s] 19it [00:00, 21.49it/s] 22it [00:01, 21.69it/s] 25it [00:01, 21.82it/s] 28it [00:01, 21.59it/s] 31it [00:01, 21.69it/s] 34it [00:01, 21.78it/s] 37it [00:01, 21.84it/s] 40it [00:01, 21.85it/s] 43it [00:02, 21.93it/s] 46it [00:02, 21.94it/s] 49it [00:02, 21.74it/s]2025-05-26 00:52:47,480 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 2688.3638 | mean log_px -0.0044 | KL -2381.70 + 52it [00:02, 21.70it/s] 55it [00:02, 21.76it/s] 58it [00:02, 21.84it/s] 61it [00:02, 21.90it/s] 64it [00:03, 21.97it/s] 67it [00:03, 21.98it/s] 70it [00:03, 21.98it/s] 73it [00:03, 21.86it/s] 76it [00:03, 21.93it/s] 79it [00:03, 21.97it/s] 82it [00:03, 21.98it/s] 85it [00:03, 21.98it/s] 88it [00:04, 21.98it/s] 91it [00:04, 21.88it/s] 94it [00:04, 22.00it/s] 97it [00:04, 21.99it/s] 100it [00:04, 22.03it/s]2025-05-26 00:52:49,755 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 2744.5737 | mean log_px -0.0053 | KL -2370.17 + 103it [00:04, 22.00it/s] 106it [00:04, 22.02it/s] 109it [00:05, 22.02it/s] 112it [00:05, 22.01it/s] 115it [00:05, 22.04it/s] 118it [00:05, 22.08it/s] 121it [00:05, 22.07it/s] 124it [00:05, 22.06it/s] 127it [00:05, 21.94it/s] 130it [00:06, 21.91it/s] 133it [00:06, 21.79it/s] 136it [00:06, 21.85it/s] 139it [00:06, 21.77it/s] 142it [00:06, 21.85it/s] 145it [00:06, 21.78it/s] 148it [00:06, 21.50it/s]2025-05-26 00:52:52,044 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 2623.0906 | mean log_px -0.0038 | KL -2354.26 + 151it [00:06, 21.53it/s] 154it [00:07, 21.66it/s] 157it [00:07, 21.78it/s] 160it [00:07, 21.87it/s] 163it [00:07, 21.85it/s] 166it [00:07, 21.94it/s] 169it [00:07, 21.96it/s] 172it [00:07, 21.98it/s] 175it [00:08, 21.99it/s] 178it [00:08, 22.00it/s] 181it [00:08, 22.00it/s] 184it [00:08, 22.02it/s] 187it [00:08, 22.01it/s] 190it [00:08, 22.05it/s] 193it [00:08, 22.05it/s] 196it [00:09, 21.27it/s] 196it [00:09, 21.54it/s] +2025-05-26 00:52:54,185 - INFO - Epoch: 16, Objective: tensor([3663.0530], device='cuda:0', grad_fn=), Loss: 0.02340436913073063, KL/n: 47.64633560180664 + 0it [00:00, ?it/s]2025-05-26 00:52:54,433 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 2511.8545 | mean log_px -0.0025 | KL -2335.61 + 1it [00:00, 7.36it/s] 4it [00:00, 16.04it/s] 7it [00:00, 18.63it/s] 10it [00:00, 19.98it/s] 13it [00:00, 20.78it/s] 16it [00:00, 21.25it/s] 19it [00:00, 21.49it/s] 22it [00:01, 21.68it/s] 25it [00:01, 21.77it/s] 28it [00:01, 21.67it/s] 31it [00:01, 21.78it/s] 34it [00:01, 21.88it/s] 37it [00:01, 21.95it/s] 40it [00:01, 21.97it/s] 43it [00:02, 22.01it/s] 46it [00:02, 22.05it/s] 49it [00:02, 22.11it/s]2025-05-26 00:52:56,705 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 2662.0015 | mean log_px -0.0050 | KL -2309.66 + 52it [00:02, 22.05it/s] 55it [00:02, 22.08it/s] 58it [00:02, 22.09it/s] 61it [00:02, 22.10it/s] 64it [00:02, 22.00it/s] 67it [00:03, 22.06it/s] 70it [00:03, 21.89it/s] 73it [00:03, 21.98it/s] 76it [00:03, 21.96it/s] 79it [00:03, 21.93it/s] 82it [00:03, 21.88it/s] 85it [00:03, 21.96it/s] 88it [00:04, 22.02it/s] 91it [00:04, 22.09it/s] 94it [00:04, 22.13it/s] 97it [00:04, 22.16it/s] 100it [00:04, 22.18it/s]2025-05-26 00:52:58,973 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 2909.8647 | mean log_px -0.0087 | KL -2298.74 + 103it [00:04, 22.17it/s] 106it [00:04, 22.17it/s] 109it [00:05, 22.17it/s] 112it [00:05, 22.15it/s] 115it [00:05, 22.17it/s] 118it [00:05, 22.20it/s] 121it [00:05, 22.16it/s] 124it [00:05, 22.16it/s] 127it [00:05, 22.18it/s] 130it [00:05, 22.18it/s] 133it [00:06, 22.19it/s] 136it [00:06, 22.19it/s] 139it [00:06, 22.17it/s] 142it [00:06, 22.10it/s] 145it [00:06, 22.11it/s] 148it [00:06, 22.10it/s]2025-05-26 00:53:01,234 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 2803.2908 | mean log_px -0.0075 | KL -2279.56 + 151it [00:06, 21.92it/s] 154it [00:07, 22.01it/s] 157it [00:07, 22.04it/s] 160it [00:07, 22.07it/s] 163it [00:07, 22.08it/s] 166it [00:07, 22.15it/s] 169it [00:07, 22.19it/s] 172it [00:07, 22.22it/s] 175it [00:08, 22.21it/s] 178it [00:08, 22.21it/s] 181it [00:08, 22.17it/s] 184it [00:08, 22.18it/s] 187it [00:08, 22.16it/s] 190it [00:08, 22.16it/s] 193it [00:08, 22.16it/s] 196it [00:08, 21.29it/s] 196it [00:09, 21.68it/s] +2025-05-26 00:53:03,364 - INFO - Epoch: 17, Objective: tensor([3045.7505], device='cuda:0', grad_fn=), Loss: 0.01564677245914936, KL/n: 46.48301696777344 + 0it [00:00, ?it/s]2025-05-26 00:53:03,604 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 2555.6826 | mean log_px -0.0040 | KL -2275.75 + 1it [00:00, 7.32it/s] 4it [00:00, 15.67it/s] 7it [00:00, 18.40it/s] 10it [00:00, 19.79it/s] 13it [00:00, 20.49it/s] 16it [00:00, 21.08it/s] 19it [00:00, 21.21it/s] 22it [00:01, 21.27it/s] 25it [00:01, 21.18it/s] 28it [00:01, 20.84it/s] 31it [00:01, 20.97it/s] 34it [00:01, 21.22it/s] 37it [00:01, 21.05it/s] 40it [00:01, 21.02it/s] 43it [00:02, 21.10it/s] 46it [00:02, 21.17it/s] 49it [00:02, 21.30it/s]2025-05-26 00:53:05,952 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 3222.3081 | mean log_px -0.0138 | KL -2257.99 + 52it [00:02, 21.08it/s] 55it [00:02, 21.16it/s] 58it [00:02, 21.38it/s] 61it [00:02, 21.20it/s] 64it [00:03, 21.47it/s] 67it [00:03, 21.49it/s] 70it [00:03, 21.67it/s] 73it [00:03, 21.79it/s] 76it [00:03, 21.81it/s] 79it [00:03, 21.35it/s] 82it [00:03, 21.56it/s] 85it [00:04, 21.67it/s] 88it [00:04, 21.75it/s] 91it [00:04, 21.81it/s] 94it [00:04, 21.86it/s] 97it [00:04, 21.88it/s] 100it [00:04, 21.95it/s]2025-05-26 00:53:08,259 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 2693.7666 | mean log_px -0.0064 | KL -2243.76 + 103it [00:04, 21.45it/s] 106it [00:05, 21.22it/s] 109it [00:05, 21.37it/s] 112it [00:05, 21.44it/s] 115it [00:05, 21.36it/s] 118it [00:05, 21.44it/s] 121it [00:05, 21.29it/s] 124it [00:05, 21.17it/s] 127it [00:06, 21.36it/s] 130it [00:06, 21.15it/s] 133it [00:06, 21.01it/s] 136it [00:06, 20.40it/s] 139it [00:06, 20.51it/s] 142it [00:06, 20.82it/s] 145it [00:06, 20.70it/s] 148it [00:07, 21.07it/s]2025-05-26 00:53:10,641 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 2936.1733 | mean log_px -0.0101 | KL -2229.50 + 151it [00:07, 21.00it/s] 154it [00:07, 20.95it/s] 157it [00:07, 20.91it/s] 160it [00:07, 20.93it/s] 163it [00:07, 21.23it/s] 166it [00:07, 21.40it/s] 169it [00:08, 21.59it/s] 172it [00:08, 21.24it/s] 175it [00:08, 21.15it/s] 178it [00:08, 21.37it/s] 181it [00:08, 21.16it/s] 184it [00:08, 21.21it/s] 187it [00:08, 21.39it/s] 190it [00:08, 21.54it/s] 193it [00:09, 21.68it/s] 196it [00:09, 20.70it/s] 196it [00:09, 20.94it/s] +2025-05-26 00:53:12,852 - INFO - Epoch: 18, Objective: tensor([3906.1919], device='cuda:0', grad_fn=), Loss: 0.014312856830656528, KL/n: 45.337520599365234 + 0it [00:00, ?it/s]2025-05-26 00:53:13,410 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 2821.6208 | mean log_px -0.0086 | KL -2218.33 + 1it [00:00, 3.54it/s] 4it [00:00, 11.02it/s] 7it [00:00, 15.38it/s] 10it [00:00, 18.04it/s] 13it [00:00, 19.69it/s] 16it [00:00, 20.76it/s] 19it [00:01, 21.47it/s] 22it [00:01, 21.96it/s] 25it [00:01, 22.15it/s] 28it [00:01, 22.34it/s] 31it [00:01, 22.53it/s] 34it [00:01, 22.54it/s] 37it [00:01, 22.68it/s] 40it [00:01, 22.74it/s] 43it [00:02, 22.79it/s] 46it [00:02, 22.87it/s] 49it [00:02, 22.87it/s]2025-05-26 00:53:15,600 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 2389.0754 | mean log_px -0.0026 | KL -2206.68 + 52it [00:02, 22.78it/s] 55it [00:02, 22.87it/s] 58it [00:02, 22.88it/s] 61it [00:02, 22.91it/s] 64it [00:03, 22.97it/s] 67it [00:03, 22.92it/s] 70it [00:03, 22.95it/s] 73it [00:03, 22.95it/s] 76it [00:03, 22.89it/s] 79it [00:03, 22.98it/s] 82it [00:03, 22.97it/s] 85it [00:03, 23.02it/s] 88it [00:04, 23.10it/s] 91it [00:04, 22.90it/s] 94it [00:04, 22.50it/s] 97it [00:04, 22.20it/s] 100it [00:04, 21.95it/s]2025-05-26 00:53:17,806 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 2718.6865 | mean log_px -0.0075 | KL -2191.54 + 103it [00:04, 21.81it/s] 106it [00:04, 21.72it/s] 109it [00:05, 21.58it/s] 112it [00:05, 21.63it/s] 115it [00:05, 21.57it/s] 118it [00:05, 21.48it/s] 121it [00:05, 21.60it/s] 124it [00:05, 21.62it/s] 127it [00:05, 21.70it/s] 130it [00:06, 21.54it/s] 133it [00:06, 21.50it/s] 136it [00:06, 21.65it/s] 139it [00:06, 21.52it/s] 142it [00:06, 21.54it/s] 145it [00:06, 21.54it/s] 148it [00:06, 21.43it/s]2025-05-26 00:53:20,129 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 2556.6614 | mean log_px -0.0055 | KL -2170.81 + 151it [00:07, 21.37it/s] 154it [00:07, 21.33it/s] 157it [00:07, 21.25it/s] 160it [00:07, 21.41it/s] 163it [00:07, 21.34it/s] 166it [00:07, 21.36it/s] 169it [00:07, 21.45it/s] 172it [00:07, 21.44it/s] 175it [00:08, 21.47it/s] 178it [00:08, 21.47it/s] 181it [00:08, 21.37it/s] 184it [00:08, 21.79it/s] 187it [00:08, 21.96it/s] 190it [00:08, 22.06it/s] 193it [00:08, 22.13it/s] 196it [00:09, 21.09it/s] 196it [00:09, 21.38it/s] +2025-05-26 00:53:22,320 - INFO - Epoch: 19, Objective: tensor([2655.0557], device='cuda:0', grad_fn=), Loss: 0.007992914877831936, KL/n: 44.176509857177734 + 0it [00:00, ?it/s]2025-05-26 00:53:22,746 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 2871.7065 | mean log_px -0.0101 | KL -2165.24 + 1it [00:00, 7.17it/s] 4it [00:00, 15.58it/s] 7it [00:00, 18.56it/s] 10it [00:00, 20.05it/s] 13it [00:00, 20.85it/s] 16it [00:00, 21.16it/s] 19it [00:00, 21.03it/s] 22it [00:01, 21.45it/s] 25it [00:01, 21.66it/s] 28it [00:01, 21.83it/s] 31it [00:01, 21.96it/s] 34it [00:01, 21.91it/s] 37it [00:01, 21.82it/s] 40it [00:01, 21.93it/s] 43it [00:02, 21.94it/s] 46it [00:02, 21.96it/s] 49it [00:02, 21.95it/s]2025-05-26 00:53:25,028 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 2456.0024 | mean log_px -0.0044 | KL -2149.74 + 52it [00:02, 21.93it/s] 55it [00:02, 21.98it/s] 58it [00:02, 22.09it/s] 61it [00:02, 22.08it/s] 64it [00:03, 22.05it/s] 67it [00:03, 22.01it/s] 70it [00:03, 21.91it/s] 73it [00:03, 21.91it/s] 76it [00:03, 21.95it/s] 79it [00:03, 21.97it/s] 82it [00:03, 22.04it/s] 85it [00:03, 22.09it/s] 88it [00:04, 22.14it/s] 91it [00:04, 22.16it/s] 94it [00:04, 22.08it/s] 97it [00:04, 22.07it/s] 100it [00:04, 22.08it/s]2025-05-26 00:53:27,295 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 2405.5493 | mean log_px -0.0039 | KL -2131.52 + 103it [00:04, 22.11it/s] 106it [00:04, 22.04it/s] 109it [00:05, 21.84it/s] 112it [00:05, 21.63it/s] 115it [00:05, 21.62it/s] 118it [00:05, 21.78it/s] 121it [00:05, 21.80it/s] 124it [00:05, 21.87it/s] 127it [00:05, 21.88it/s] 130it [00:06, 21.97it/s] 133it [00:06, 21.94it/s] 136it [00:06, 21.94it/s] 139it [00:06, 22.02it/s] 142it [00:06, 22.08it/s] 145it [00:06, 22.00it/s] 148it [00:06, 22.02it/s]2025-05-26 00:53:29,578 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 2737.5073 | mean log_px -0.0090 | KL -2106.61 + 151it [00:06, 21.99it/s] 154it [00:07, 21.81it/s] 157it [00:07, 21.93it/s] 160it [00:07, 21.82it/s] 163it [00:07, 21.77it/s] 166it [00:07, 21.87it/s] 169it [00:07, 21.97it/s] 172it [00:07, 21.91it/s] 175it [00:08, 21.99it/s] 178it [00:08, 22.08it/s] 181it [00:08, 22.08it/s] 184it [00:08, 21.90it/s] 187it [00:08, 21.77it/s] 190it [00:08, 21.91it/s] 193it [00:08, 21.85it/s] 196it [00:09, 21.02it/s] 196it [00:09, 21.51it/s] +2025-05-26 00:53:31,743 - INFO - Epoch: 20, Objective: tensor([2731.3196], device='cuda:0', grad_fn=), Loss: 0.009444555267691612, KL/n: 42.8438606262207 + 0it [00:00, ?it/s]2025-05-26 00:53:31,976 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 3213.7173 | mean log_px -0.0160 | KL -2096.78 + 1it [00:00, 7.65it/s] 4it [00:00, 16.25it/s] 7it [00:00, 18.97it/s] 10it [00:00, 20.21it/s] 13it [00:00, 20.94it/s] 16it [00:00, 21.35it/s] 19it [00:00, 21.56it/s] 22it [00:01, 21.76it/s] 25it [00:01, 21.88it/s] 28it [00:01, 22.00it/s] 31it [00:01, 22.08it/s] 34it [00:01, 22.17it/s] 37it [00:01, 22.20it/s] 40it [00:01, 22.24it/s] 43it [00:02, 22.25it/s] 46it [00:02, 22.25it/s] 49it [00:02, 22.24it/s]2025-05-26 00:53:34,231 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 2267.6536 | mean log_px -0.0027 | KL -2079.66 + 52it [00:02, 22.24it/s] 55it [00:02, 22.21it/s] 58it [00:02, 22.24it/s] 61it [00:02, 22.28it/s] 64it [00:02, 22.28it/s] 67it [00:03, 22.28it/s] 70it [00:03, 22.27it/s] 73it [00:03, 22.28it/s] 76it [00:03, 22.23it/s] 79it [00:03, 22.22it/s] 82it [00:03, 22.13it/s] 85it [00:03, 22.05it/s] 88it [00:04, 22.07it/s] 91it [00:04, 22.05it/s] 94it [00:04, 21.95it/s] 97it [00:04, 21.97it/s] 100it [00:04, 21.99it/s]2025-05-26 00:53:36,491 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 2419.1885 | mean log_px -0.0051 | KL -2063.60 + 103it [00:04, 21.98it/s] 106it [00:04, 21.99it/s] 109it [00:05, 21.94it/s] 112it [00:05, 22.02it/s] 115it [00:05, 22.05it/s] 118it [00:05, 22.05it/s] 121it [00:05, 22.03it/s] 124it [00:05, 22.06it/s] 127it [00:05, 22.06it/s] 130it [00:05, 22.08it/s] 133it [00:06, 22.06it/s] 136it [00:06, 21.93it/s] 139it [00:06, 21.96it/s] 142it [00:06, 21.97it/s] 145it [00:06, 22.00it/s] 148it [00:06, 22.05it/s]2025-05-26 00:53:38,761 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 2773.1694 | mean log_px -0.0102 | KL -2061.54 + 151it [00:06, 22.03it/s] 154it [00:07, 22.06it/s] 157it [00:07, 22.07it/s] 160it [00:07, 22.06it/s] 163it [00:07, 22.07it/s] 166it [00:07, 22.13it/s] 169it [00:07, 22.09it/s] 172it [00:07, 21.50it/s] 175it [00:08, 21.29it/s] 178it [00:08, 21.37it/s] 181it [00:08, 21.51it/s] 184it [00:08, 21.66it/s] 187it [00:08, 21.82it/s] 190it [00:08, 21.86it/s] 193it [00:08, 21.89it/s] 196it [00:08, 21.08it/s] 196it [00:09, 21.63it/s] +2025-05-26 00:53:40,931 - INFO - Epoch: 21, Objective: tensor([3309.0674], device='cuda:0', grad_fn=), Loss: 0.013829287141561508, KL/n: 41.89488220214844 + 0it [00:00, ?it/s]2025-05-26 00:53:41,174 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 2669.3140 | mean log_px -0.0088 | KL -2052.18 + 1it [00:00, 7.16it/s] 4it [00:00, 15.62it/s] 7it [00:00, 18.61it/s] 10it [00:00, 20.09it/s] 13it [00:00, 20.91it/s] 16it [00:00, 21.33it/s] 19it [00:00, 21.65it/s] 22it [00:01, 21.89it/s] 25it [00:01, 22.05it/s] 28it [00:01, 22.15it/s] 31it [00:01, 22.24it/s] 34it [00:01, 22.19it/s] 37it [00:01, 22.26it/s] 40it [00:01, 22.18it/s] 43it [00:02, 22.24it/s] 46it [00:02, 22.14it/s] 49it [00:02, 22.22it/s]2025-05-26 00:53:43,425 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 2385.3784 | mean log_px -0.0049 | KL -2040.35 + 52it [00:02, 22.20it/s] 55it [00:02, 22.23it/s] 58it [00:02, 22.21it/s] 61it [00:02, 22.16it/s] 64it [00:02, 22.20it/s] 67it [00:03, 22.27it/s] 70it [00:03, 22.15it/s] 73it [00:03, 22.04it/s] 76it [00:03, 22.14it/s] 79it [00:03, 22.18it/s] 82it [00:03, 22.17it/s] 85it [00:03, 22.23it/s] 88it [00:04, 22.14it/s] 91it [00:04, 22.19it/s] 94it [00:04, 22.13it/s] 97it [00:04, 22.17it/s] 100it [00:04, 22.20it/s]2025-05-26 00:53:45,680 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 2369.6106 | mean log_px -0.0049 | KL -2027.23 + 103it [00:04, 22.21it/s] 106it [00:04, 22.20it/s] 109it [00:05, 22.15it/s] 112it [00:05, 22.09it/s] 115it [00:05, 22.01it/s] 118it [00:05, 22.07it/s] 121it [00:05, 22.14it/s] 124it [00:05, 22.18it/s] 127it [00:05, 22.19it/s] 130it [00:05, 22.22it/s] 133it [00:06, 22.10it/s] 136it [00:06, 22.00it/s] 139it [00:06, 22.06it/s] 142it [00:06, 21.99it/s] 145it [00:06, 22.11it/s] 148it [00:06, 22.09it/s]2025-05-26 00:53:47,942 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 2397.6382 | mean log_px -0.0056 | KL -2005.85 + 151it [00:06, 22.08it/s] 154it [00:07, 22.16it/s] 157it [00:07, 22.24it/s] 160it [00:07, 22.30it/s] 163it [00:07, 22.29it/s] 166it [00:07, 22.28it/s] 169it [00:07, 22.10it/s] 172it [00:07, 22.13it/s] 175it [00:07, 22.05it/s] 178it [00:08, 22.00it/s] 181it [00:08, 22.12it/s] 184it [00:08, 22.07it/s] 187it [00:08, 22.14it/s] 190it [00:08, 22.21it/s] 193it [00:08, 22.24it/s] 196it [00:08, 21.40it/s] 196it [00:09, 21.75it/s] +2025-05-26 00:53:50,070 - INFO - Epoch: 22, Objective: tensor([2646.2366], device='cuda:0', grad_fn=), Loss: 0.005156413186341524, KL/n: 40.68004608154297 + 0it [00:00, ?it/s]2025-05-26 00:53:50,479 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 2158.3704 | mean log_px -0.0024 | KL -1992.97 + 1it [00:00, 7.50it/s] 4it [00:00, 16.13it/s] 7it [00:00, 18.60it/s] 10it [00:00, 20.04it/s] 13it [00:00, 20.76it/s] 16it [00:00, 20.95it/s] 19it [00:00, 21.24it/s] 22it [00:01, 21.46it/s] 25it [00:01, 21.64it/s] 28it [00:01, 21.81it/s] 31it [00:01, 21.78it/s] 34it [00:01, 21.68it/s] 37it [00:01, 21.56it/s] 40it [00:01, 21.74it/s] 43it [00:02, 21.74it/s] 46it [00:02, 21.88it/s] 49it [00:02, 21.91it/s]2025-05-26 00:53:52,776 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 2239.9358 | mean log_px -0.0038 | KL -1976.39 + 52it [00:02, 21.70it/s] 55it [00:02, 21.69it/s] 58it [00:02, 21.83it/s] 61it [00:02, 21.78it/s] 64it [00:03, 21.62it/s] 67it [00:03, 21.79it/s] 70it [00:03, 21.89it/s] 73it [00:03, 21.73it/s] 76it [00:03, 21.58it/s] 79it [00:03, 21.78it/s] 82it [00:03, 21.90it/s] 85it [00:03, 21.98it/s] 88it [00:04, 22.08it/s] 91it [00:04, 21.76it/s] 94it [00:04, 21.80it/s] 97it [00:04, 21.95it/s] 100it [00:04, 21.59it/s]2025-05-26 00:53:55,073 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 2226.4197 | mean log_px -0.0037 | KL -1964.17 + 103it [00:04, 21.74it/s] 106it [00:04, 21.90it/s] 109it [00:05, 21.87it/s] 112it [00:05, 21.68it/s] 115it [00:05, 21.70it/s] 118it [00:05, 21.88it/s] 121it [00:05, 21.98it/s] 124it [00:05, 22.01it/s] 127it [00:05, 22.03it/s] 130it [00:06, 22.09it/s] 133it [00:06, 22.14it/s] 136it [00:06, 22.19it/s] 139it [00:06, 22.22it/s] 142it [00:06, 22.23it/s] 145it [00:06, 22.09it/s] 148it [00:06, 21.84it/s]2025-05-26 00:53:57,347 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 2445.9546 | mean log_px -0.0070 | KL -1956.57 + 151it [00:06, 21.74it/s] 154it [00:07, 21.90it/s] 157it [00:07, 21.83it/s] 160it [00:07, 21.76it/s] 163it [00:07, 21.79it/s] 166it [00:07, 21.83it/s] 169it [00:07, 21.79it/s] 172it [00:07, 21.88it/s] 175it [00:08, 21.60it/s] 178it [00:08, 21.41it/s] 181it [00:08, 21.67it/s] 184it [00:08, 21.81it/s] 187it [00:08, 21.84it/s] 190it [00:08, 21.62it/s] 193it [00:08, 21.39it/s] 196it [00:09, 20.64it/s] 196it [00:09, 21.40it/s] +2025-05-26 00:53:59,533 - INFO - Epoch: 23, Objective: tensor([2979.9739], device='cuda:0', grad_fn=), Loss: 0.012888900004327297, KL/n: 39.74480056762695 + 0it [00:00, ?it/s]2025-05-26 00:53:59,752 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 2332.5344 | mean log_px -0.0055 | KL -1946.88 + 1it [00:00, 8.80it/s] 4it [00:00, 17.08it/s] 7it [00:00, 19.48it/s] 10it [00:00, 20.61it/s] 13it [00:00, 21.24it/s] 16it [00:00, 21.56it/s] 19it [00:00, 21.72it/s] 22it [00:01, 21.84it/s] 25it [00:01, 21.99it/s] 28it [00:01, 22.14it/s] 31it [00:01, 22.10it/s] 34it [00:01, 21.69it/s] 37it [00:01, 21.69it/s] 40it [00:01, 21.71it/s] 43it [00:02, 21.81it/s] 46it [00:02, 21.82it/s] 49it [00:02, 21.81it/s]2025-05-26 00:54:02,032 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 2115.7051 | mean log_px -0.0025 | KL -1938.88 + 52it [00:02, 21.78it/s] 55it [00:02, 21.72it/s] 58it [00:02, 21.65it/s] 61it [00:02, 21.70it/s] 64it [00:02, 21.77it/s] 67it [00:03, 21.78it/s] 70it [00:03, 21.83it/s] 73it [00:03, 21.78it/s] 76it [00:03, 21.80it/s] 79it [00:03, 21.84it/s] 82it [00:03, 21.85it/s] 85it [00:03, 21.85it/s] 88it [00:04, 21.84it/s] 91it [00:04, 21.79it/s] 94it [00:04, 21.65it/s] 97it [00:04, 21.55it/s] 100it [00:04, 20.92it/s]2025-05-26 00:54:04,354 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 1992.0907 | mean log_px -0.0009 | KL -1925.89 + 103it [00:04, 20.51it/s] 106it [00:04, 20.88it/s] 109it [00:05, 21.01it/s] 112it [00:05, 21.14it/s] 115it [00:05, 20.96it/s] 118it [00:05, 21.28it/s] 121it [00:05, 21.40it/s] 124it [00:05, 21.51it/s] 127it [00:05, 21.64it/s] 130it [00:06, 21.75it/s] 133it [00:06, 21.89it/s] 136it [00:06, 21.89it/s] 139it [00:06, 21.97it/s] 142it [00:06, 22.03it/s] 145it [00:06, 22.06it/s] 148it [00:06, 22.10it/s]2025-05-26 00:54:06,654 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 1991.2052 | mean log_px -0.0011 | KL -1913.71 + 151it [00:07, 22.09it/s] 154it [00:07, 22.15it/s] 157it [00:07, 22.12it/s] 160it [00:07, 22.11it/s] 163it [00:07, 22.17it/s] 166it [00:07, 22.12it/s] 169it [00:07, 22.08it/s] 172it [00:07, 22.14it/s] 175it [00:08, 22.15it/s] 178it [00:08, 22.15it/s] 181it [00:08, 22.14it/s] 184it [00:08, 22.18it/s] 187it [00:08, 22.17it/s] 190it [00:08, 22.21it/s] 193it [00:08, 22.24it/s] 196it [00:09, 20.83it/s] 196it [00:09, 21.46it/s] +2025-05-26 00:54:08,796 - INFO - Epoch: 24, Objective: tensor([2168.9478], device='cuda:0', grad_fn=), Loss: 0.002955142641440034, KL/n: 38.92694854736328 + 0it [00:00, ?it/s]2025-05-26 00:54:09,344 - INFO - [Epoch 025 | Batch 0000] IWAE-loss 2098.3188 | mean log_px -0.0027 | KL -1907.81 + 1it [00:00, 3.54it/s] 4it [00:00, 10.81it/s] 7it [00:00, 14.52it/s] 10it [00:00, 17.00it/s] 13it [00:00, 18.62it/s] 16it [00:00, 19.28it/s] 19it [00:01, 20.00it/s] 22it [00:01, 20.55it/s] 25it [00:01, 20.97it/s] 28it [00:01, 21.20it/s] 31it [00:01, 21.41it/s] 34it [00:01, 21.56it/s] 37it [00:01, 21.55it/s] 40it [00:02, 20.81it/s] 43it [00:02, 19.89it/s] 46it [00:02, 20.12it/s] 49it [00:02, 20.53it/s]2025-05-26 00:54:11,726 - INFO - [Epoch 025 | Batch 0050] IWAE-loss 2453.8760 | mean log_px -0.0080 | KL -1890.65 + 52it [00:02, 20.67it/s] 55it [00:02, 20.82it/s] 58it [00:02, 20.86it/s] 61it [00:03, 20.80it/s] 64it [00:03, 20.55it/s] 67it [00:03, 20.82it/s] 70it [00:03, 21.05it/s] 73it [00:03, 20.94it/s] 76it [00:03, 21.24it/s] 79it [00:03, 21.74it/s] 82it [00:04, 21.92it/s] 85it [00:04, 21.96it/s] 88it [00:04, 22.16it/s] 91it [00:04, 22.33it/s] 94it [00:04, 22.17it/s] 97it [00:04, 22.30it/s] 100it [00:04, 22.43it/s]2025-05-26 00:54:14,028 - INFO - [Epoch 025 | Batch 0100] IWAE-loss 2108.8333 | mean log_px -0.0033 | KL -1878.15 + 103it [00:05, 22.52it/s] 106it [00:05, 22.68it/s] 109it [00:05, 22.74it/s] 112it [00:05, 22.89it/s] 115it [00:05, 22.62it/s] 118it [00:05, 22.25it/s] 121it [00:05, 22.40it/s] 124it [00:05, 22.44it/s] 127it [00:06, 22.38it/s] 130it [00:06, 22.42it/s] 133it [00:06, 22.58it/s] 136it [00:06, 22.24it/s] 139it [00:06, 22.37it/s] 142it [00:06, 22.27it/s] 145it [00:06, 22.35it/s] 148it [00:07, 22.43it/s]2025-05-26 00:54:16,250 - INFO - [Epoch 025 | Batch 0150] IWAE-loss 2450.2883 | mean log_px -0.0084 | KL -1860.54 + 151it [00:07, 22.58it/s] 154it [00:07, 22.68it/s] 157it [00:07, 22.76it/s] 160it [00:07, 22.64it/s] 163it [00:07, 22.62it/s] 166it [00:07, 22.74it/s] 169it [00:07, 22.80it/s] 172it [00:08, 22.85it/s] 175it [00:08, 22.91it/s] 178it [00:08, 22.93it/s] 181it [00:08, 22.96it/s] 184it [00:08, 22.94it/s] 187it [00:08, 22.96it/s] 190it [00:08, 22.62it/s] 193it [00:09, 22.61it/s] 196it [00:09, 21.56it/s] 196it [00:09, 21.20it/s] +2025-05-26 00:54:18,338 - INFO - Epoch: 25, Objective: tensor([2734.2681], device='cuda:0', grad_fn=), Loss: 0.00301891821436584, KL/n: 37.86283874511719 + 0it [00:00, ?it/s]2025-05-26 00:54:18,773 - INFO - [Epoch 026 | Batch 0000] IWAE-loss 2116.1985 | mean log_px -0.0037 | KL -1853.98 + 1it [00:00, 7.23it/s] 4it [00:00, 15.82it/s] 7it [00:00, 18.56it/s] 10it [00:00, 19.83it/s] 13it [00:00, 20.57it/s] 16it [00:00, 20.90it/s] 19it [00:00, 20.85it/s] 22it [00:01, 21.13it/s] 25it [00:01, 21.39it/s] 28it [00:01, 21.55it/s] 31it [00:01, 21.63it/s] 34it [00:01, 21.67it/s] 37it [00:01, 21.45it/s] 40it [00:01, 21.46it/s] 43it [00:02, 21.60it/s] 46it [00:02, 21.53it/s] 49it [00:02, 21.57it/s]2025-05-26 00:54:21,088 - INFO - [Epoch 026 | Batch 0050] IWAE-loss 3788.1353 | mean log_px -0.0278 | KL -1842.97 + 52it [00:02, 21.51it/s] 55it [00:02, 21.52it/s] 58it [00:02, 21.59it/s] 61it [00:02, 21.72it/s] 64it [00:03, 21.76it/s] 67it [00:03, 21.44it/s] 70it [00:03, 21.55it/s] 73it [00:03, 21.52it/s] 76it [00:03, 21.62it/s] 79it [00:03, 21.69it/s] 82it [00:03, 21.78it/s] 85it [00:04, 21.85it/s] 88it [00:04, 21.87it/s] 91it [00:04, 21.89it/s] 94it [00:04, 21.63it/s] 97it [00:04, 21.18it/s] 100it [00:04, 21.29it/s]2025-05-26 00:54:23,405 - INFO - [Epoch 026 | Batch 0100] IWAE-loss 2104.5164 | mean log_px -0.0038 | KL -1838.11 + 103it [00:04, 21.34it/s] 106it [00:04, 21.47it/s] 109it [00:05, 21.52it/s] 112it [00:05, 21.59it/s] 115it [00:05, 21.56it/s] 118it [00:05, 21.49it/s] 121it [00:05, 21.52it/s] 124it [00:05, 21.58it/s] 127it [00:05, 21.60it/s] 130it [00:06, 21.72it/s] 133it [00:06, 21.77it/s] 136it [00:06, 21.77it/s] 139it [00:06, 21.82it/s] 142it [00:06, 21.79it/s] 145it [00:06, 21.83it/s] 148it [00:06, 21.87it/s]2025-05-26 00:54:25,705 - INFO - [Epoch 026 | Batch 0150] IWAE-loss 3128.1956 | mean log_px -0.0185 | KL -1830.64 + 151it [00:07, 21.80it/s] 154it [00:07, 21.86it/s] 157it [00:07, 21.90it/s] 160it [00:07, 21.84it/s] 163it [00:07, 21.90it/s] 166it [00:07, 21.91it/s] 169it [00:07, 21.94it/s] 172it [00:08, 21.92it/s] 175it [00:08, 21.92it/s] 178it [00:08, 21.62it/s] 181it [00:08, 21.53it/s] 184it [00:08, 21.63it/s] 187it [00:08, 21.67it/s] 190it [00:08, 21.68it/s] 193it [00:08, 21.70it/s] 196it [00:09, 20.60it/s] 196it [00:09, 21.23it/s] +2025-05-26 00:54:27,891 - INFO - Epoch: 26, Objective: tensor([2102.4189], device='cuda:0', grad_fn=), Loss: 0.0038671556394547224, KL/n: 37.17778396606445 + 0it [00:00, ?it/s]2025-05-26 00:54:28,125 - INFO - [Epoch 027 | Batch 0000] IWAE-loss 2036.8278 | mean log_px -0.0030 | KL -1823.89 + 1it [00:00, 7.72it/s] 4it [00:00, 16.33it/s] 7it [00:00, 18.93it/s] 10it [00:00, 19.82it/s] 13it [00:00, 20.54it/s] 16it [00:00, 20.91it/s] 19it [00:00, 21.26it/s] 22it [00:01, 21.50it/s] 25it [00:01, 21.46it/s] 28it [00:01, 21.61it/s] 31it [00:01, 21.61it/s] 34it [00:01, 21.69it/s] 37it [00:01, 21.83it/s] 40it [00:01, 22.05it/s] 43it [00:02, 22.17it/s] 46it [00:02, 22.35it/s] 49it [00:02, 22.46it/s]2025-05-26 00:54:30,402 - INFO - [Epoch 027 | Batch 0050] IWAE-loss 2012.3339 | mean log_px -0.0028 | KL -1813.62 + 52it [00:02, 22.30it/s] 55it [00:02, 22.19it/s] 58it [00:02, 22.18it/s] 61it [00:02, 22.29it/s] 64it [00:02, 22.44it/s] 67it [00:03, 22.45it/s] 70it [00:03, 22.19it/s] 73it [00:03, 22.15it/s] 76it [00:03, 21.99it/s] 79it [00:03, 22.07it/s] 82it [00:03, 22.13it/s] 85it [00:03, 22.30it/s] 88it [00:04, 22.43it/s] 91it [00:04, 22.46it/s] 94it [00:04, 22.54it/s] 97it [00:04, 22.59it/s] 100it [00:04, 22.67it/s]2025-05-26 00:54:32,638 - INFO - [Epoch 027 | Batch 0100] IWAE-loss 1961.9465 | mean log_px -0.0024 | KL -1796.23 + 103it [00:04, 22.68it/s] 106it [00:04, 22.74it/s] 109it [00:04, 22.76it/s] 112it [00:05, 22.89it/s] 115it [00:05, 23.00it/s] 118it [00:05, 23.02it/s] 121it [00:05, 22.79it/s] 124it [00:05, 22.58it/s] 127it [00:05, 22.41it/s] 130it [00:05, 22.44it/s] 133it [00:06, 22.34it/s] 136it [00:06, 22.40it/s] 139it [00:06, 22.47it/s] 142it [00:06, 22.36it/s] 145it [00:06, 22.38it/s] 148it [00:06, 22.39it/s]2025-05-26 00:54:34,857 - INFO - [Epoch 027 | Batch 0150] IWAE-loss 2219.3000 | mean log_px -0.0061 | KL -1792.08 + 151it [00:06, 22.29it/s] 154it [00:06, 22.30it/s] 157it [00:07, 22.20it/s] 160it [00:07, 22.13it/s] 163it [00:07, 21.99it/s] 166it [00:07, 21.93it/s] 169it [00:07, 21.83it/s] 172it [00:07, 21.96it/s] 175it [00:07, 22.17it/s] 178it [00:08, 22.37it/s] 181it [00:08, 22.44it/s] 184it [00:08, 22.47it/s] 187it [00:08, 22.55it/s] 190it [00:08, 22.22it/s] 193it [00:08, 22.19it/s] 196it [00:08, 21.23it/s] 196it [00:08, 21.86it/s] +2025-05-26 00:54:36,985 - INFO - Epoch: 27, Objective: tensor([1918.6759], device='cuda:0', grad_fn=), Loss: 0.0018985853530466557, KL/n: 36.49961471557617 + 0it [00:00, ?it/s]2025-05-26 00:54:37,392 - INFO - [Epoch 028 | Batch 0000] IWAE-loss 2179.4561 | mean log_px -0.0056 | KL -1788.02 + 1it [00:00, 8.31it/s] 4it [00:00, 16.73it/s] 7it [00:00, 19.14it/s] 10it [00:00, 20.33it/s] 13it [00:00, 21.13it/s] 16it [00:00, 21.57it/s] 19it [00:00, 21.89it/s] 22it [00:01, 22.11it/s] 25it [00:01, 21.85it/s] 28it [00:01, 21.79it/s] 31it [00:01, 21.73it/s] 34it [00:01, 21.84it/s] 37it [00:01, 21.95it/s] 40it [00:01, 21.94it/s] 43it [00:02, 22.03it/s] 46it [00:02, 22.09it/s] 49it [00:02, 22.15it/s]2025-05-26 00:54:39,657 - INFO - [Epoch 028 | Batch 0050] IWAE-loss 2144.2183 | mean log_px -0.0053 | KL -1774.67 + 52it [00:02, 22.23it/s] 55it [00:02, 22.25it/s] 58it [00:02, 22.26it/s] 61it [00:02, 22.26it/s] 64it [00:02, 22.30it/s] 67it [00:03, 22.29it/s] 70it [00:03, 22.30it/s] 73it [00:03, 22.31it/s] 76it [00:03, 22.27it/s] 79it [00:03, 22.28it/s] 82it [00:03, 22.28it/s] 85it [00:03, 22.26it/s] 88it [00:04, 22.24it/s] 91it [00:04, 22.22it/s] 94it [00:04, 21.98it/s] 97it [00:04, 21.55it/s] 100it [00:04, 21.56it/s]2025-05-26 00:54:41,923 - INFO - [Epoch 028 | Batch 0100] IWAE-loss 1951.3558 | mean log_px -0.0026 | KL -1766.03 + 103it [00:04, 21.60it/s] 106it [00:04, 21.34it/s] 109it [00:05, 20.91it/s] 112it [00:05, 20.78it/s] 115it [00:05, 21.08it/s] 118it [00:05, 21.20it/s] 121it [00:05, 21.42it/s] 124it [00:05, 21.61it/s] 127it [00:05, 21.50it/s] 130it [00:06, 21.65it/s] 133it [00:06, 21.71it/s] 136it [00:06, 21.65it/s] 139it [00:06, 21.39it/s] 142it [00:06, 21.29it/s] 145it [00:06, 20.86it/s] 148it [00:06, 21.23it/s]2025-05-26 00:54:44,270 - INFO - [Epoch 028 | Batch 0150] IWAE-loss 2483.1685 | mean log_px -0.0105 | KL -1751.18 + 151it [00:06, 21.38it/s] 154it [00:07, 21.45it/s] 157it [00:07, 21.50it/s] 160it [00:07, 21.53it/s] 163it [00:07, 21.43it/s] 166it [00:07, 21.39it/s] 169it [00:07, 21.52it/s] 172it [00:07, 21.69it/s] 175it [00:08, 21.65it/s] 178it [00:08, 21.60it/s] 181it [00:08, 21.70it/s] 184it [00:08, 21.77it/s] 187it [00:08, 21.85it/s] 190it [00:08, 21.85it/s] 193it [00:08, 21.81it/s] 196it [00:09, 20.78it/s] 196it [00:09, 21.40it/s] +2025-05-26 00:54:46,457 - INFO - Epoch: 28, Objective: tensor([2011.8058], device='cuda:0', grad_fn=), Loss: 0.003983728121966124, KL/n: 35.76288986206055 + 0it [00:00, ?it/s]2025-05-26 00:54:46,691 - INFO - [Epoch 029 | Batch 0000] IWAE-loss 2052.3093 | mean log_px -0.0043 | KL -1753.30 + 1it [00:00, 7.34it/s] 4it [00:00, 15.33it/s] 7it [00:00, 18.30it/s] 10it [00:00, 19.51it/s] 13it [00:00, 20.02it/s] 16it [00:00, 20.49it/s] 19it [00:00, 20.85it/s] 22it [00:01, 21.19it/s] 25it [00:01, 21.32it/s] 28it [00:01, 21.27it/s] 31it [00:01, 21.48it/s] 34it [00:01, 21.56it/s] 37it [00:01, 21.69it/s] 40it [00:01, 21.61it/s] 43it [00:02, 21.71it/s] 46it [00:02, 21.50it/s] 49it [00:02, 21.49it/s]2025-05-26 00:54:49,024 - INFO - [Epoch 029 | Batch 0050] IWAE-loss 2241.0840 | mean log_px -0.0070 | KL -1748.66 + 52it [00:02, 21.53it/s] 55it [00:02, 21.50it/s] 58it [00:02, 21.06it/s] 61it [00:02, 21.14it/s] 64it [00:03, 20.79it/s] 67it [00:03, 21.04it/s] 70it [00:03, 21.18it/s] 73it [00:03, 21.44it/s] 76it [00:03, 21.26it/s] 79it [00:03, 21.55it/s] 82it [00:03, 21.45it/s] 85it [00:04, 21.02it/s] 88it [00:04, 20.57it/s] 91it [00:04, 20.52it/s] 94it [00:04, 20.52it/s] 97it [00:04, 20.84it/s] 100it [00:04, 21.13it/s]2025-05-26 00:54:51,405 - INFO - [Epoch 029 | Batch 0100] IWAE-loss 2311.3848 | mean log_px -0.0083 | KL -1732.33 + 103it [00:04, 21.25it/s] 106it [00:05, 21.13it/s] 109it [00:05, 21.37it/s] 112it [00:05, 21.49it/s] 115it [00:05, 21.40it/s] 118it [00:05, 21.22it/s] 121it [00:05, 21.47it/s] 124it [00:05, 21.63it/s] 127it [00:06, 22.07it/s] 130it [00:06, 22.31it/s] 133it [00:06, 22.58it/s] 136it [00:06, 22.52it/s] 139it [00:06, 22.71it/s] 142it [00:06, 22.90it/s] 145it [00:06, 22.92it/s] 148it [00:06, 22.72it/s]2025-05-26 00:54:53,653 - INFO - [Epoch 029 | Batch 0150] IWAE-loss 1927.2134 | mean log_px -0.0028 | KL -1728.49 + 151it [00:07, 22.75it/s] 154it [00:07, 22.54it/s] 157it [00:07, 22.41it/s] 160it [00:07, 22.64it/s] 163it [00:07, 22.35it/s] 166it [00:07, 22.61it/s] 169it [00:07, 22.70it/s] 172it [00:08, 22.44it/s] 175it [00:08, 22.27it/s] 178it [00:08, 22.51it/s] 181it [00:08, 22.69it/s] 184it [00:08, 22.75it/s] 187it [00:08, 22.85it/s] 190it [00:08, 22.53it/s] 193it [00:08, 22.75it/s] 196it [00:09, 21.86it/s] 196it [00:09, 21.40it/s] +2025-05-26 00:54:55,746 - INFO - Epoch: 29, Objective: tensor([3088.2554], device='cuda:0', grad_fn=), Loss: 0.024811862036585808, KL/n: 35.21946716308594 + 0it [00:00, ?it/s]2025-05-26 00:54:55,983 - INFO - [Epoch 030 | Batch 0000] IWAE-loss 1867.4896 | mean log_px -0.0021 | KL -1722.31 + 1it [00:00, 8.16it/s] 4it [00:00, 17.45it/s] 7it [00:00, 20.13it/s] 10it [00:00, 21.37it/s] 13it [00:00, 21.92it/s] 16it [00:00, 22.13it/s] 19it [00:00, 22.42it/s] 22it [00:01, 22.70it/s] 25it [00:01, 22.85it/s] 28it [00:01, 22.75it/s] 31it [00:01, 22.74it/s] 34it [00:01, 22.34it/s] 37it [00:01, 22.18it/s] 40it [00:01, 22.05it/s] 43it [00:01, 22.01it/s] 46it [00:02, 21.93it/s] 49it [00:02, 21.94it/s]2025-05-26 00:54:58,201 - INFO - [Epoch 030 | Batch 0050] IWAE-loss 1927.4747 | mean log_px -0.0030 | KL -1716.35 + 52it [00:02, 21.88it/s] 55it [00:02, 21.72it/s] 58it [00:02, 21.74it/s] 61it [00:02, 21.82it/s] 64it [00:02, 21.82it/s] 67it [00:03, 21.74it/s] 70it [00:03, 21.76it/s] 73it [00:03, 21.60it/s] 76it [00:03, 21.66it/s] 79it [00:03, 21.73it/s] 82it [00:03, 21.73it/s] 85it [00:03, 21.78it/s] 88it [00:04, 21.73it/s] 91it [00:04, 21.72it/s] 94it [00:04, 21.73it/s] 97it [00:04, 21.77it/s] 100it [00:04, 21.78it/s]2025-05-26 00:55:00,504 - INFO - [Epoch 030 | Batch 0100] IWAE-loss 2074.9089 | mean log_px -0.0052 | KL -1708.55 + 103it [00:04, 21.68it/s] 106it [00:04, 21.72it/s] 109it [00:05, 21.72it/s] 112it [00:05, 21.76it/s] 115it [00:05, 21.71it/s] 118it [00:05, 21.58it/s] 121it [00:05, 21.43it/s] 124it [00:05, 21.34it/s] 127it [00:05, 21.51it/s] 130it [00:05, 21.58it/s] 133it [00:06, 21.68it/s] 136it [00:06, 21.67it/s] 139it [00:06, 20.94it/s] 142it [00:06, 20.99it/s] 145it [00:06, 21.05it/s] 148it [00:06, 20.78it/s]2025-05-26 00:55:02,854 - INFO - [Epoch 030 | Batch 0150] IWAE-loss 2048.0806 | mean log_px -0.0050 | KL -1701.15 + 151it [00:06, 20.82it/s] 154it [00:07, 21.06it/s] 157it [00:07, 21.37it/s] 160it [00:07, 21.61it/s] 163it [00:07, 21.81it/s] 166it [00:07, 21.96it/s] 169it [00:07, 22.06it/s] 172it [00:07, 21.95it/s] 175it [00:08, 21.96it/s] 178it [00:08, 21.95it/s] 181it [00:08, 21.94it/s] 184it [00:08, 21.89it/s] 187it [00:08, 21.98it/s] 190it [00:08, 22.07it/s] 193it [00:08, 21.81it/s] 196it [00:09, 20.80it/s] 196it [00:09, 21.47it/s] +2025-05-26 00:55:05,010 - INFO - Epoch: 30, Objective: tensor([2465.2122], device='cuda:0', grad_fn=), Loss: 0.007316778413951397, KL/n: 34.54081344604492 + 0it [00:00, ?it/s]2025-05-26 00:55:05,416 - INFO - [Epoch 031 | Batch 0000] IWAE-loss 2152.2412 | mean log_px -0.0066 | KL -1691.27 + 1it [00:00, 7.45it/s] 4it [00:00, 15.45it/s] 7it [00:00, 17.90it/s] 10it [00:00, 19.33it/s] 13it [00:00, 19.82it/s] 16it [00:00, 20.36it/s] 19it [00:00, 20.31it/s] 22it [00:01, 20.57it/s] 25it [00:01, 20.92it/s] 28it [00:01, 21.08it/s] 31it [00:01, 21.37it/s] 34it [00:01, 21.18it/s] 37it [00:01, 21.33it/s] 40it [00:01, 21.15it/s] 43it [00:02, 21.14it/s] 46it [00:02, 20.95it/s] 49it [00:02, 21.01it/s]2025-05-26 00:55:07,795 - INFO - [Epoch 031 | Batch 0050] IWAE-loss 1977.2633 | mean log_px -0.0042 | KL -1681.93 + 52it [00:02, 20.98it/s] 55it [00:02, 21.13it/s] 58it [00:02, 21.38it/s] 61it [00:02, 21.45it/s] 64it [00:03, 21.36it/s] 67it [00:03, 21.34it/s] 70it [00:03, 21.55it/s] 73it [00:03, 21.62it/s] 76it [00:03, 21.41it/s] 79it [00:03, 21.34it/s] 82it [00:03, 21.44it/s] 85it [00:04, 20.92it/s] 88it [00:04, 21.11it/s] 91it [00:04, 21.00it/s] 94it [00:04, 21.10it/s] 97it [00:04, 21.29it/s] 100it [00:04, 21.42it/s]2025-05-26 00:55:10,134 - INFO - [Epoch 031 | Batch 0100] IWAE-loss 2953.2319 | mean log_px -0.0183 | KL -1674.79 + 103it [00:04, 21.18it/s] 106it [00:05, 21.23it/s] 109it [00:05, 21.41it/s] 112it [00:05, 21.52it/s] 115it [00:05, 21.23it/s] 118it [00:05, 21.22it/s] 121it [00:05, 21.46it/s] 124it [00:05, 21.55it/s] 127it [00:06, 21.68it/s] 130it [00:06, 21.17it/s] 133it [00:06, 21.01it/s] 136it [00:06, 20.65it/s] 139it [00:06, 20.71it/s] 142it [00:06, 20.58it/s] 145it [00:06, 20.79it/s] 148it [00:07, 20.73it/s]2025-05-26 00:55:12,514 - INFO - [Epoch 031 | Batch 0150] IWAE-loss 1856.3757 | mean log_px -0.0027 | KL -1664.40 + 151it [00:07, 20.74it/s] 154it [00:07, 21.10it/s] 157it [00:07, 21.53it/s] 160it [00:07, 21.71it/s] 163it [00:07, 22.12it/s] 166it [00:07, 22.37it/s] 169it [00:08, 22.55it/s] 172it [00:08, 22.79it/s] 175it [00:08, 22.44it/s] 178it [00:08, 22.61it/s] 181it [00:08, 22.86it/s] 184it [00:08, 22.98it/s] 187it [00:08, 23.06it/s] 190it [00:08, 23.06it/s] 193it [00:09, 23.04it/s] 196it [00:09, 21.46it/s] 196it [00:09, 21.08it/s] +2025-05-26 00:55:14,607 - INFO - Epoch: 31, Objective: tensor([1728.7632], device='cuda:0', grad_fn=), Loss: 0.00145659688860178, KL/n: 33.89814758300781 + 0it [00:00, ?it/s]2025-05-26 00:55:14,843 - INFO - [Epoch 032 | Batch 0000] IWAE-loss 1853.4015 | mean log_px -0.0028 | KL -1659.10 + 1it [00:00, 7.48it/s] 4it [00:00, 15.63it/s] 7it [00:00, 17.57it/s] 9it [00:00, 18.27it/s] 12it [00:00, 19.42it/s] 15it [00:00, 20.20it/s] 18it [00:00, 20.62it/s] 21it [00:01, 20.98it/s] 24it [00:01, 21.09it/s] 27it [00:01, 21.32it/s] 30it [00:01, 21.45it/s] 33it [00:01, 21.48it/s] 36it [00:01, 21.12it/s] 39it [00:01, 20.74it/s] 42it [00:02, 20.98it/s] 45it [00:02, 21.07it/s] 48it [00:02, 21.23it/s]2025-05-26 00:55:17,226 - INFO - [Epoch 032 | Batch 0050] IWAE-loss 1850.7280 | mean log_px -0.0029 | KL -1645.28 + 51it [00:02, 20.61it/s] 54it [00:02, 20.62it/s] 57it [00:02, 20.76it/s] 60it [00:02, 21.07it/s] 63it [00:03, 21.10it/s] 66it [00:03, 21.52it/s] 69it [00:03, 22.02it/s] 72it [00:03, 21.99it/s] 75it [00:03, 22.38it/s] 78it [00:03, 22.55it/s] 81it [00:03, 22.63it/s] 84it [00:04, 22.67it/s] 87it [00:04, 22.70it/s] 90it [00:04, 22.76it/s] 93it [00:04, 22.82it/s] 96it [00:04, 22.86it/s] 99it [00:04, 22.17it/s]2025-05-26 00:55:19,477 - INFO - [Epoch 032 | Batch 0100] IWAE-loss 2404.4751 | mean log_px -0.0109 | KL -1642.57 + 102it [00:04, 22.39it/s] 105it [00:04, 22.63it/s] 108it [00:05, 22.87it/s] 111it [00:05, 23.04it/s] 114it [00:05, 23.14it/s] 117it [00:05, 22.88it/s] 120it [00:05, 22.82it/s] 123it [00:05, 22.98it/s] 126it [00:05, 22.99it/s] 129it [00:05, 23.09it/s] 132it [00:06, 23.04it/s] 135it [00:06, 23.04it/s] 138it [00:06, 22.80it/s] 141it [00:06, 22.69it/s] 144it [00:06, 22.94it/s] 147it [00:06, 22.95it/s] 150it [00:06, 23.04it/s]2025-05-26 00:55:21,647 - INFO - [Epoch 032 | Batch 0150] IWAE-loss 1971.9681 | mean log_px -0.0048 | KL -1637.03 + 153it [00:07, 23.02it/s] 156it [00:07, 23.04it/s] 159it [00:07, 23.04it/s] 162it [00:07, 23.18it/s] 165it [00:07, 23.26it/s] 168it [00:07, 23.29it/s] 171it [00:07, 23.04it/s] 174it [00:07, 23.17it/s] 177it [00:08, 23.23it/s] 180it [00:08, 23.32it/s] 183it [00:08, 23.34it/s] 186it [00:08, 23.40it/s] 189it [00:08, 23.33it/s] 192it [00:08, 23.32it/s] 195it [00:08, 22.39it/s] 196it [00:08, 21.92it/s] +2025-05-26 00:55:23,677 - INFO - Epoch: 32, Objective: tensor([2710.9407], device='cuda:0', grad_fn=), Loss: 0.007914373651146889, KL/n: 33.389076232910156 + 0it [00:00, ?it/s]2025-05-26 00:55:24,063 - INFO - [Epoch 033 | Batch 0000] IWAE-loss 1848.1572 | mean log_px -0.0031 | KL -1634.18 + 1it [00:00, 9.33it/s] 4it [00:00, 18.08it/s] 7it [00:00, 20.50it/s] 10it [00:00, 21.55it/s] 13it [00:00, 22.10it/s] 16it [00:00, 22.40it/s] 19it [00:00, 22.54it/s] 22it [00:01, 22.69it/s] 25it [00:01, 22.84it/s] 28it [00:01, 22.91it/s] 31it [00:01, 23.03it/s] 34it [00:01, 23.07it/s] 37it [00:01, 23.02it/s] 40it [00:01, 23.03it/s] 43it [00:01, 23.09it/s] 46it [00:02, 23.08it/s] 49it [00:02, 23.07it/s]2025-05-26 00:55:26,236 - INFO - [Epoch 033 | Batch 0050] IWAE-loss 2684.5029 | mean log_px -0.0151 | KL -1626.44 + 52it [00:02, 23.00it/s] 55it [00:02, 23.01it/s] 58it [00:02, 23.03it/s] 61it [00:02, 23.02it/s] 64it [00:02, 22.92it/s] 67it [00:02, 22.95it/s] 70it [00:03, 23.02it/s] 73it [00:03, 22.97it/s] 76it [00:03, 22.93it/s] 79it [00:03, 22.20it/s] 82it [00:03, 22.09it/s] 85it [00:03, 21.86it/s] 88it [00:03, 21.83it/s] 91it [00:04, 21.68it/s] 94it [00:04, 21.76it/s] 97it [00:04, 21.79it/s] 100it [00:04, 21.73it/s]2025-05-26 00:55:28,482 - INFO - [Epoch 033 | Batch 0100] IWAE-loss 2151.1846 | mean log_px -0.0076 | KL -1619.63 + 103it [00:04, 21.74it/s] 106it [00:04, 21.74it/s] 109it [00:04, 21.74it/s] 112it [00:05, 21.80it/s] 115it [00:05, 21.87it/s] 118it [00:05, 21.89it/s] 121it [00:05, 21.88it/s] 124it [00:05, 21.87it/s] 127it [00:05, 21.57it/s] 130it [00:05, 21.58it/s] 133it [00:05, 21.77it/s] 136it [00:06, 21.89it/s] 139it [00:06, 21.91it/s] 142it [00:06, 22.00it/s] 145it [00:06, 22.04it/s] 148it [00:06, 22.10it/s]2025-05-26 00:55:30,765 - INFO - [Epoch 033 | Batch 0150] IWAE-loss 2086.4846 | mean log_px -0.0067 | KL -1615.08 + 151it [00:06, 22.05it/s] 154it [00:06, 22.11it/s] 157it [00:07, 22.13it/s] 160it [00:07, 22.19it/s] 163it [00:07, 22.20it/s] 166it [00:07, 22.19it/s] 169it [00:07, 22.08it/s] 172it [00:07, 22.12it/s] 175it [00:07, 22.10it/s] 178it [00:08, 22.12it/s] 181it [00:08, 22.02it/s] 184it [00:08, 22.02it/s] 187it [00:08, 22.00it/s] 190it [00:08, 22.03it/s] 193it [00:08, 21.99it/s] 196it [00:08, 21.11it/s] 196it [00:08, 21.94it/s] +2025-05-26 00:55:32,913 - INFO - Epoch: 33, Objective: tensor([2171.1729], device='cuda:0', grad_fn=), Loss: 0.003731202334165573, KL/n: 32.8597297668457 + 0it [00:00, ?it/s]2025-05-26 00:55:33,148 - INFO - [Epoch 034 | Batch 0000] IWAE-loss 1849.3541 | mean log_px -0.0034 | KL -1610.28 + 1it [00:00, 7.46it/s] 4it [00:00, 15.91it/s] 7it [00:00, 18.67it/s] 10it [00:00, 20.35it/s] 13it [00:00, 21.19it/s] 16it [00:00, 21.71it/s] 19it [00:00, 22.04it/s] 22it [00:01, 22.31it/s] 25it [00:01, 22.48it/s] 28it [00:01, 22.54it/s] 31it [00:01, 22.41it/s] 34it [00:01, 22.35it/s] 37it [00:01, 22.31it/s] 40it [00:01, 22.39it/s] 43it [00:02, 22.47it/s] 46it [00:02, 22.35it/s] 49it [00:02, 22.16it/s]2025-05-26 00:55:35,386 - INFO - [Epoch 034 | Batch 0050] IWAE-loss 1982.8550 | mean log_px -0.0054 | KL -1602.26 + 52it [00:02, 22.25it/s] 55it [00:02, 22.28it/s] 58it [00:02, 22.33it/s] 61it [00:02, 22.52it/s] 64it [00:02, 22.54it/s] 67it [00:03, 22.70it/s] 70it [00:03, 22.66it/s] 73it [00:03, 22.64it/s] 76it [00:03, 22.61it/s] 79it [00:03, 22.66it/s] 82it [00:03, 22.61it/s] 85it [00:03, 22.74it/s] 88it [00:04, 22.43it/s] 91it [00:04, 22.56it/s] 94it [00:04, 22.61it/s] 97it [00:04, 22.61it/s] 100it [00:04, 22.76it/s]2025-05-26 00:55:37,595 - INFO - [Epoch 034 | Batch 0100] IWAE-loss 2323.5063 | mean log_px -0.0104 | KL -1593.44 + 103it [00:04, 22.79it/s] 106it [00:04, 22.89it/s] 109it [00:04, 22.87it/s] 112it [00:05, 22.58it/s] 115it [00:05, 22.56it/s] 118it [00:05, 22.69it/s] 121it [00:05, 22.73it/s] 124it [00:05, 22.81it/s] 127it [00:05, 22.90it/s] 130it [00:05, 22.78it/s] 133it [00:05, 22.48it/s] 136it [00:06, 22.29it/s] 139it [00:06, 22.46it/s] 142it [00:06, 22.61it/s] 145it [00:06, 22.72it/s] 148it [00:06, 22.76it/s]2025-05-26 00:55:39,799 - INFO - [Epoch 034 | Batch 0150] IWAE-loss 1896.9507 | mean log_px -0.0044 | KL -1590.16 + 151it [00:06, 22.75it/s] 154it [00:06, 22.75it/s] 157it [00:07, 22.77it/s] 160it [00:07, 22.50it/s] 163it [00:07, 22.39it/s] 166it [00:07, 22.56it/s] 169it [00:07, 22.20it/s] 172it [00:07, 22.08it/s] 175it [00:07, 21.81it/s] 178it [00:08, 21.71it/s] 181it [00:08, 21.63it/s] 184it [00:08, 21.58it/s] 187it [00:08, 21.60it/s] 190it [00:08, 21.11it/s] 193it [00:08, 21.26it/s] 196it [00:08, 20.54it/s] 196it [00:08, 21.96it/s] +2025-05-26 00:55:41,970 - INFO - Epoch: 34, Objective: tensor([1753.0587], device='cuda:0', grad_fn=), Loss: 0.007030913140624762, KL/n: 32.41107177734375 + 0it [00:00, ?it/s]2025-05-26 00:55:42,521 - INFO - [Epoch 035 | Batch 0000] IWAE-loss 1725.0901 | mean log_px -0.0020 | KL -1586.56 + 1it [00:00, 3.57it/s] 4it [00:00, 10.86it/s] 7it [00:00, 14.60it/s] 9it [00:00, 16.07it/s] 12it [00:00, 17.82it/s] 15it [00:00, 19.11it/s] 18it [00:01, 19.94it/s] 21it [00:01, 20.39it/s] 24it [00:01, 20.85it/s] 27it [00:01, 20.92it/s] 30it [00:01, 20.83it/s] 33it [00:01, 21.05it/s] 36it [00:01, 20.86it/s] 39it [00:02, 20.74it/s] 42it [00:02, 20.90it/s] 45it [00:02, 21.16it/s] 48it [00:02, 21.42it/s]2025-05-26 00:55:44,883 - INFO - [Epoch 035 | Batch 0050] IWAE-loss 1760.3423 | mean log_px -0.0026 | KL -1578.82 + 51it [00:02, 21.35it/s] 54it [00:02, 21.24it/s] 57it [00:02, 21.43it/s] 60it [00:03, 21.49it/s] 63it [00:03, 21.68it/s] 66it [00:03, 21.63it/s] 69it [00:03, 21.71it/s] 72it [00:03, 21.41it/s] 75it [00:03, 21.30it/s] 78it [00:03, 21.54it/s] 81it [00:04, 21.57it/s] 84it [00:04, 21.67it/s] 87it [00:04, 21.35it/s] 90it [00:04, 20.83it/s] 93it [00:04, 21.08it/s] 96it [00:04, 20.99it/s] 99it [00:04, 21.08it/s]2025-05-26 00:55:47,228 - INFO - [Epoch 035 | Batch 0100] IWAE-loss 2038.8901 | mean log_px -0.0066 | KL -1573.97 + 102it [00:05, 21.25it/s] 105it [00:05, 21.48it/s] 108it [00:05, 21.47it/s] 111it [00:05, 21.39it/s] 114it [00:05, 21.36it/s] 117it [00:05, 21.49it/s] 120it [00:05, 21.32it/s] 123it [00:06, 21.17it/s] 126it [00:06, 20.82it/s] 129it [00:06, 21.18it/s] 132it [00:06, 21.27it/s] 135it [00:06, 21.47it/s] 138it [00:06, 21.27it/s] 141it [00:06, 21.21it/s] 144it [00:06, 21.43it/s] 147it [00:07, 21.34it/s] 150it [00:07, 20.73it/s]2025-05-26 00:55:49,590 - INFO - [Epoch 035 | Batch 0150] IWAE-loss 1973.0468 | mean log_px -0.0058 | KL -1570.39 + 153it [00:07, 20.84it/s] 156it [00:07, 21.15it/s] 159it [00:07, 21.34it/s] 162it [00:07, 21.41it/s] 165it [00:07, 21.56it/s] 168it [00:08, 21.35it/s] 171it [00:08, 21.59it/s] 174it [00:08, 21.77it/s] 177it [00:08, 22.00it/s] 180it [00:08, 22.01it/s] 183it [00:08, 21.91it/s] 186it [00:08, 21.90it/s] 189it [00:09, 21.65it/s] 192it [00:09, 21.36it/s] 195it [00:09, 20.49it/s] 196it [00:09, 20.61it/s] +2025-05-26 00:55:51,776 - INFO - Epoch: 35, Objective: tensor([1721.1652], device='cuda:0', grad_fn=), Loss: 0.002412135247141123, KL/n: 32.01908493041992 + 0it [00:00, ?it/s]2025-05-26 00:55:52,193 - INFO - [Epoch 036 | Batch 0000] IWAE-loss 1753.4949 | mean log_px -0.0027 | KL -1567.70 + 1it [00:00, 7.37it/s] 4it [00:00, 15.54it/s] 7it [00:00, 18.48it/s] 10it [00:00, 19.66it/s] 13it [00:00, 20.19it/s] 16it [00:00, 20.62it/s] 19it [00:00, 21.11it/s] 22it [00:01, 21.38it/s] 25it [00:01, 21.06it/s] 28it [00:01, 21.29it/s] 31it [00:01, 21.49it/s] 34it [00:01, 21.44it/s] 37it [00:01, 21.02it/s] 40it [00:01, 21.27it/s] 43it [00:02, 21.31it/s] 46it [00:02, 21.07it/s] 49it [00:02, 20.74it/s]2025-05-26 00:55:54,549 - INFO - [Epoch 036 | Batch 0050] IWAE-loss 1824.7357 | mean log_px -0.0037 | KL -1563.47 + 52it [00:02, 20.76it/s] 55it [00:02, 20.95it/s] 58it [00:02, 20.95it/s] 61it [00:02, 21.23it/s] 64it [00:03, 21.25it/s] 67it [00:03, 21.01it/s] 70it [00:03, 21.01it/s] 73it [00:03, 20.93it/s] 76it [00:03, 21.08it/s] 79it [00:03, 21.27it/s] 82it [00:03, 21.33it/s] 85it [00:04, 21.55it/s] 88it [00:04, 21.47it/s] 91it [00:04, 21.57it/s] 94it [00:04, 21.47it/s] 97it [00:04, 21.33it/s] 100it [00:04, 21.28it/s]2025-05-26 00:55:56,901 - INFO - [Epoch 036 | Batch 0100] IWAE-loss 1762.3829 | mean log_px -0.0030 | KL -1552.42 + 103it [00:04, 20.96it/s] 106it [00:05, 21.00it/s] 109it [00:05, 21.15it/s] 112it [00:05, 21.31it/s] 115it [00:05, 21.45it/s] 118it [00:05, 21.22it/s] 121it [00:05, 21.18it/s] 124it [00:05, 20.99it/s] 127it [00:06, 20.89it/s] 130it [00:06, 21.31it/s] 133it [00:06, 21.38it/s] 136it [00:06, 21.50it/s] 139it [00:06, 21.67it/s] 142it [00:06, 21.63it/s] 145it [00:06, 21.68it/s] 148it [00:07, 21.47it/s]2025-05-26 00:55:59,239 - INFO - [Epoch 036 | Batch 0150] IWAE-loss 2007.6768 | mean log_px -0.0065 | KL -1553.06 + 151it [00:07, 21.47it/s] 154it [00:07, 21.34it/s] 157it [00:07, 21.21it/s] 160it [00:07, 21.19it/s] 163it [00:07, 21.14it/s] 166it [00:07, 21.12it/s] 169it [00:08, 21.25it/s] 172it [00:08, 21.49it/s] 175it [00:08, 21.63it/s] 178it [00:08, 21.63it/s] 181it [00:08, 21.71it/s] 184it [00:08, 21.31it/s] 187it [00:08, 21.41it/s] 190it [00:09, 21.52it/s] 193it [00:09, 21.48it/s] 196it [00:09, 20.43it/s] 196it [00:09, 20.90it/s] +2025-05-26 00:56:01,459 - INFO - Epoch: 36, Objective: tensor([1793.2395], device='cuda:0', grad_fn=), Loss: 0.003322906093671918, KL/n: 31.67546844482422 + 0it [00:00, ?it/s]2025-05-26 00:56:01,703 - INFO - [Epoch 037 | Batch 0000] IWAE-loss 1980.2297 | mean log_px -0.0061 | KL -1553.80 + 1it [00:00, 7.25it/s] 4it [00:00, 15.87it/s] 7it [00:00, 18.50it/s] 10it [00:00, 19.73it/s] 13it [00:00, 20.37it/s] 16it [00:00, 20.80it/s] 19it [00:00, 21.11it/s] 22it [00:01, 21.29it/s] 25it [00:01, 21.42it/s] 28it [00:01, 21.37it/s] 31it [00:01, 21.32it/s] 34it [00:01, 21.37it/s] 37it [00:01, 21.62it/s] 40it [00:01, 21.72it/s] 43it [00:02, 21.84it/s] 46it [00:02, 21.95it/s] 49it [00:02, 21.96it/s]2025-05-26 00:56:04,005 - INFO - [Epoch 037 | Batch 0050] IWAE-loss 1743.4265 | mean log_px -0.0028 | KL -1545.66 + 52it [00:02, 21.92it/s] 55it [00:02, 21.96it/s] 58it [00:02, 21.97it/s] 61it [00:02, 21.91it/s] 64it [00:03, 21.94it/s] 67it [00:03, 21.96it/s] 70it [00:03, 21.85it/s] 73it [00:03, 21.86it/s] 76it [00:03, 21.85it/s] 79it [00:03, 21.92it/s] 82it [00:03, 21.92it/s] 85it [00:03, 21.87it/s] 88it [00:04, 21.82it/s] 91it [00:04, 21.89it/s] 94it [00:04, 21.95it/s] 97it [00:04, 21.99it/s] 100it [00:04, 22.00it/s]2025-05-26 00:56:06,286 - INFO - [Epoch 037 | Batch 0100] IWAE-loss 1922.7817 | mean log_px -0.0055 | KL -1536.46 + 103it [00:04, 21.94it/s] 106it [00:04, 21.96it/s] 109it [00:05, 21.98it/s] 112it [00:05, 21.99it/s] 115it [00:05, 22.01it/s] 118it [00:05, 21.99it/s] 121it [00:05, 21.96it/s] 124it [00:05, 21.95it/s] 127it [00:05, 21.90it/s] 130it [00:06, 21.88it/s] 133it [00:06, 21.93it/s] 136it [00:06, 21.92it/s] 139it [00:06, 21.91it/s] 142it [00:06, 21.94it/s] 145it [00:06, 22.00it/s] 148it [00:06, 22.00it/s]2025-05-26 00:56:08,564 - INFO - [Epoch 037 | Batch 0150] IWAE-loss 1774.1985 | mean log_px -0.0034 | KL -1537.65 + 151it [00:06, 21.88it/s] 154it [00:07, 21.93it/s] 157it [00:07, 21.88it/s] 160it [00:07, 21.92it/s] 163it [00:07, 21.98it/s] 166it [00:07, 22.00it/s] 169it [00:07, 21.99it/s] 172it [00:07, 21.93it/s] 175it [00:08, 21.94it/s] 178it [00:08, 22.00it/s] 181it [00:08, 21.99it/s] 184it [00:08, 21.99it/s] 187it [00:08, 21.97it/s] 190it [00:08, 21.99it/s] 193it [00:08, 21.96it/s] 196it [00:09, 20.91it/s] 196it [00:09, 21.46it/s] +2025-05-26 00:56:10,724 - INFO - Epoch: 37, Objective: tensor([2016.8008], device='cuda:0', grad_fn=), Loss: 0.009269584901630878, KL/n: 31.395700454711914 + 0it [00:00, ?it/s]2025-05-26 00:56:10,976 - INFO - [Epoch 038 | Batch 0000] IWAE-loss 1965.4436 | mean log_px -0.0061 | KL -1537.61 + 1it [00:00, 7.19it/s] 4it [00:00, 15.62it/s] 7it [00:00, 18.83it/s] 10it [00:00, 20.06it/s] 13it [00:00, 20.76it/s] 16it [00:00, 21.15it/s] 19it [00:00, 21.26it/s] 22it [00:01, 21.42it/s] 25it [00:01, 21.59it/s] 28it [00:01, 21.58it/s] 31it [00:01, 21.55it/s] 34it [00:01, 21.60it/s] 37it [00:01, 21.76it/s] 40it [00:01, 21.87it/s] 43it [00:02, 21.95it/s] 46it [00:02, 22.06it/s] 49it [00:02, 22.18it/s]2025-05-26 00:56:13,256 - INFO - [Epoch 038 | Batch 0050] IWAE-loss 1686.9346 | mean log_px -0.0022 | KL -1531.69 + 52it [00:02, 22.22it/s] 55it [00:02, 22.22it/s] 58it [00:02, 22.25it/s] 61it [00:02, 22.31it/s] 64it [00:02, 22.22it/s] 67it [00:03, 22.02it/s] 70it [00:03, 21.84it/s] 73it [00:03, 21.87it/s] 76it [00:03, 22.00it/s] 79it [00:03, 22.10it/s] 82it [00:03, 22.01it/s] 85it [00:03, 22.00it/s] 88it [00:04, 21.92it/s] 91it [00:04, 21.88it/s] 94it [00:04, 21.88it/s] 97it [00:04, 21.97it/s] 100it [00:04, 22.07it/s]2025-05-26 00:56:15,527 - INFO - [Epoch 038 | Batch 0100] IWAE-loss 1852.7317 | mean log_px -0.0046 | KL -1529.51 + 103it [00:04, 22.08it/s] 106it [00:04, 22.16it/s] 109it [00:05, 22.02it/s] 112it [00:05, 21.99it/s] 115it [00:05, 21.96it/s] 118it [00:05, 21.96it/s] 121it [00:05, 22.05it/s] 124it [00:05, 22.12it/s] 127it [00:05, 22.22it/s] 130it [00:05, 22.20it/s] 133it [00:06, 22.08it/s] 136it [00:06, 22.01it/s] 139it [00:06, 22.10it/s] 142it [00:06, 22.10it/s] 145it [00:06, 22.20it/s] 148it [00:06, 22.24it/s]2025-05-26 00:56:17,787 - INFO - [Epoch 038 | Batch 0150] IWAE-loss 2156.8225 | mean log_px -0.0090 | KL -1524.95 + 151it [00:06, 22.20it/s] 154it [00:07, 21.92it/s] 157it [00:07, 21.50it/s] 160it [00:07, 21.60it/s] 163it [00:07, 21.62it/s] 166it [00:07, 21.69it/s] 169it [00:07, 21.76it/s] 172it [00:07, 21.76it/s] 175it [00:08, 21.71it/s] 178it [00:08, 21.64it/s] 181it [00:08, 21.72it/s] 184it [00:08, 21.85it/s] 187it [00:08, 21.97it/s] 190it [00:08, 22.09it/s] 193it [00:08, 22.10it/s] 196it [00:09, 21.01it/s] 196it [00:09, 21.55it/s] +2025-05-26 00:56:19,960 - INFO - Epoch: 38, Objective: tensor([1890.7566], device='cuda:0', grad_fn=), Loss: 0.005462957546114922, KL/n: 31.092975616455078 + 0it [00:00, ?it/s]2025-05-26 00:56:20,394 - INFO - [Epoch 039 | Batch 0000] IWAE-loss 1657.1321 | mean log_px -0.0019 | KL -1521.62 + 1it [00:00, 6.79it/s] 4it [00:00, 15.76it/s] 7it [00:00, 18.82it/s] 10it [00:00, 20.33it/s] 13it [00:00, 20.89it/s] 16it [00:00, 21.26it/s] 19it [00:00, 21.53it/s] 22it [00:01, 21.68it/s] 25it [00:01, 21.75it/s] 28it [00:01, 21.85it/s] 31it [00:01, 21.54it/s] 34it [00:01, 21.70it/s] 37it [00:01, 21.89it/s] 40it [00:01, 21.80it/s] 43it [00:02, 21.96it/s] 46it [00:02, 22.13it/s] 49it [00:02, 22.10it/s]2025-05-26 00:56:22,656 - INFO - [Epoch 039 | Batch 0050] IWAE-loss 2213.8079 | mean log_px -0.0100 | KL -1510.99 + 52it [00:02, 22.03it/s] 55it [00:02, 22.01it/s] 58it [00:02, 22.12it/s] 61it [00:02, 22.25it/s] 64it [00:02, 22.49it/s] 67it [00:03, 22.75it/s] 70it [00:03, 22.90it/s] 73it [00:03, 22.97it/s] 76it [00:03, 23.05it/s] 79it [00:03, 23.11it/s] 82it [00:03, 23.16it/s] 85it [00:03, 23.17it/s] 88it [00:04, 23.20it/s] 91it [00:04, 23.21it/s] 94it [00:04, 23.22it/s] 97it [00:04, 22.94it/s] 100it [00:04, 22.55it/s]2025-05-26 00:56:24,846 - INFO - [Epoch 039 | Batch 0100] IWAE-loss 2000.8184 | mean log_px -0.0071 | KL -1506.69 + 103it [00:04, 22.18it/s] 106it [00:04, 22.03it/s] 109it [00:04, 22.01it/s] 112it [00:05, 21.92it/s] 115it [00:05, 21.92it/s] 118it [00:05, 21.92it/s] 121it [00:05, 21.98it/s] 124it [00:05, 21.97it/s] 127it [00:05, 21.94it/s] 130it [00:05, 21.88it/s] 133it [00:06, 21.82it/s] 136it [00:06, 21.78it/s] 139it [00:06, 21.87it/s] 142it [00:06, 21.94it/s] 145it [00:06, 21.92it/s] 148it [00:06, 21.89it/s]2025-05-26 00:56:27,134 - INFO - [Epoch 039 | Batch 0150] IWAE-loss 2544.7124 | mean log_px -0.0149 | KL -1501.78 + 151it [00:06, 21.83it/s] 154it [00:07, 21.84it/s] 157it [00:07, 21.83it/s] 160it [00:07, 21.82it/s] 163it [00:07, 21.60it/s] 166it [00:07, 21.72it/s] 169it [00:07, 21.84it/s] 172it [00:07, 21.96it/s] 175it [00:07, 22.04it/s] 178it [00:08, 21.97it/s] 181it [00:08, 21.96it/s] 184it [00:08, 21.94it/s] 187it [00:08, 21.86it/s] 190it [00:08, 21.90it/s] 193it [00:08, 21.91it/s] 196it [00:08, 20.80it/s] 196it [00:09, 21.69it/s] +2025-05-26 00:56:29,304 - INFO - Epoch: 39, Objective: tensor([1875.9635], device='cuda:0', grad_fn=), Loss: 0.007261547725647688, KL/n: 30.549692153930664 + 0it [00:00, ?it/s]2025-05-26 00:56:29,542 - INFO - [Epoch 040 | Batch 0000] IWAE-loss 1842.3949 | mean log_px -0.0049 | KL -1497.21 + 1it [00:00, 7.50it/s] 4it [00:00, 15.78it/s] 7it [00:00, 18.02it/s] 10it [00:00, 19.27it/s] 13it [00:00, 19.74it/s] 16it [00:00, 20.09it/s] 19it [00:00, 20.46it/s] 22it [00:01, 20.58it/s] 25it [00:01, 20.68it/s] 28it [00:01, 20.48it/s] 31it [00:01, 20.79it/s] 34it [00:01, 21.10it/s] 37it [00:01, 21.22it/s] 40it [00:01, 21.43it/s] 43it [00:02, 21.60it/s] 46it [00:02, 21.58it/s] 49it [00:02, 21.35it/s]2025-05-26 00:56:31,909 - INFO - [Epoch 040 | Batch 0050] IWAE-loss 1698.6771 | mean log_px -0.0029 | KL -1494.70 + 52it [00:02, 21.46it/s] 55it [00:02, 21.61it/s] 58it [00:02, 21.61it/s] 61it [00:02, 21.72it/s] 64it [00:03, 21.24it/s] 67it [00:03, 21.27it/s] 70it [00:03, 21.18it/s] 73it [00:03, 20.93it/s] 76it [00:03, 20.90it/s] 79it [00:03, 21.23it/s] 82it [00:03, 21.45it/s] 85it [00:04, 21.69it/s] 88it [00:04, 21.71it/s] 91it [00:04, 21.67it/s] 94it [00:04, 21.98it/s] 97it [00:04, 22.20it/s] 100it [00:04, 22.08it/s]2025-05-26 00:56:34,223 - INFO - [Epoch 040 | Batch 0100] IWAE-loss 1793.5496 | mean log_px -0.0044 | KL -1482.38 + 103it [00:04, 22.20it/s] 106it [00:05, 21.85it/s] 109it [00:05, 21.51it/s] 112it [00:05, 21.52it/s] 115it [00:05, 21.52it/s] 118it [00:05, 21.10it/s] 121it [00:05, 21.20it/s] 124it [00:05, 21.30it/s] 127it [00:06, 21.09it/s] 130it [00:06, 21.07it/s] 133it [00:06, 20.70it/s] 136it [00:06, 21.02it/s] 139it [00:06, 21.07it/s] 142it [00:06, 21.13it/s] 145it [00:06, 21.26it/s] 148it [00:07, 21.09it/s]2025-05-26 00:56:36,584 - INFO - [Epoch 040 | Batch 0150] IWAE-loss 4117.7095 | mean log_px -0.0376 | KL -1484.14 + 151it [00:07, 21.18it/s] 154it [00:07, 20.81it/s] 157it [00:07, 20.82it/s] 160it [00:07, 20.80it/s] 163it [00:07, 21.00it/s] 166it [00:07, 21.12it/s] 169it [00:08, 21.31it/s] 172it [00:08, 21.42it/s] 175it [00:08, 21.43it/s] 178it [00:08, 21.44it/s] 181it [00:08, 21.47it/s] 184it [00:08, 21.62it/s] 187it [00:08, 21.67it/s] 190it [00:08, 21.67it/s] 193it [00:09, 21.74it/s] 196it [00:09, 20.76it/s] 196it [00:09, 20.95it/s] +2025-05-26 00:56:38,792 - INFO - Epoch: 40, Objective: tensor([1690.6498], device='cuda:0', grad_fn=), Loss: 0.004622005857527256, KL/n: 30.239253997802734 + 0it [00:00, ?it/s]2025-05-26 00:56:39,346 - INFO - [Epoch 041 | Batch 0000] IWAE-loss 1677.8485 | mean log_px -0.0028 | KL -1480.47 + 1it [00:00, 3.50it/s] 4it [00:00, 10.77it/s] 7it [00:00, 14.77it/s] 10it [00:00, 17.13it/s] 13it [00:00, 18.60it/s] 16it [00:00, 19.43it/s] 19it [00:01, 20.06it/s] 22it [00:01, 19.97it/s] 25it [00:01, 20.07it/s] 28it [00:01, 20.48it/s] 31it [00:01, 20.54it/s] 34it [00:01, 20.58it/s] 37it [00:02, 20.66it/s] 40it [00:02, 20.95it/s] 43it [00:02, 21.16it/s] 46it [00:02, 21.20it/s] 49it [00:02, 21.06it/s]2025-05-26 00:56:41,722 - INFO - [Epoch 041 | Batch 0050] IWAE-loss 2171.2034 | mean log_px -0.0100 | KL -1473.00 + 52it [00:02, 21.15it/s] 55it [00:02, 21.10it/s] 58it [00:02, 21.02it/s] 61it [00:03, 21.01it/s] 64it [00:03, 21.03it/s] 67it [00:03, 20.84it/s] 70it [00:03, 20.87it/s] 73it [00:03, 21.10it/s] 76it [00:03, 21.06it/s] 79it [00:03, 21.01it/s] 82it [00:04, 21.20it/s] 85it [00:04, 20.95it/s] 88it [00:04, 21.17it/s] 91it [00:04, 21.36it/s] 94it [00:04, 21.34it/s] 97it [00:04, 21.44it/s] 100it [00:04, 21.22it/s]2025-05-26 00:56:44,091 - INFO - [Epoch 041 | Batch 0100] IWAE-loss 1999.5659 | mean log_px -0.0076 | KL -1466.32 + 103it [00:05, 21.04it/s] 106it [00:05, 20.98it/s] 109it [00:05, 21.17it/s] 112it [00:05, 20.93it/s] 115it [00:05, 20.91it/s] 118it [00:05, 21.00it/s] 121it [00:05, 21.11it/s] 124it [00:06, 20.54it/s] 127it [00:06, 20.76it/s] 130it [00:06, 20.92it/s] 133it [00:06, 21.18it/s] 136it [00:06, 21.27it/s] 139it [00:06, 21.01it/s] 142it [00:06, 21.08it/s] 145it [00:07, 21.20it/s] 148it [00:07, 21.28it/s]2025-05-26 00:56:46,464 - INFO - [Epoch 041 | Batch 0150] IWAE-loss 2395.8970 | mean log_px -0.0134 | KL -1456.24 + 151it [00:07, 21.36it/s] 154it [00:07, 21.49it/s] 157it [00:07, 21.37it/s] 160it [00:07, 20.82it/s] 163it [00:07, 20.17it/s] 166it [00:08, 20.14it/s] 169it [00:08, 20.28it/s] 172it [00:08, 20.66it/s] 175it [00:08, 20.91it/s] 178it [00:08, 21.14it/s] 181it [00:08, 21.31it/s] 184it [00:08, 21.44it/s] 187it [00:09, 21.40it/s] 190it [00:09, 21.42it/s] 193it [00:09, 21.48it/s] 196it [00:09, 20.72it/s] 196it [00:09, 20.37it/s] +2025-05-26 00:56:48,712 - INFO - Epoch: 41, Objective: tensor([1823.1604], device='cuda:0', grad_fn=), Loss: 0.007570958696305752, KL/n: 29.72381019592285 + 0it [00:00, ?it/s]2025-05-26 00:56:49,136 - INFO - [Epoch 042 | Batch 0000] IWAE-loss 1591.7466 | mean log_px -0.0019 | KL -1456.50 + 1it [00:00, 7.14it/s] 4it [00:00, 15.46it/s] 7it [00:00, 17.82it/s] 10it [00:00, 19.30it/s] 13it [00:00, 20.12it/s] 16it [00:00, 20.59it/s] 19it [00:00, 20.85it/s] 22it [00:01, 21.04it/s] 25it [00:01, 21.19it/s] 28it [00:01, 21.26it/s] 31it [00:01, 20.71it/s] 34it [00:01, 20.91it/s] 37it [00:01, 21.18it/s] 40it [00:01, 21.18it/s] 43it [00:02, 21.35it/s] 46it [00:02, 21.41it/s] 49it [00:02, 21.41it/s]2025-05-26 00:56:51,488 - INFO - [Epoch 042 | Batch 0050] IWAE-loss 1625.7894 | mean log_px -0.0025 | KL -1450.46 + 52it [00:02, 21.47it/s] 55it [00:02, 21.58it/s] 58it [00:02, 21.57it/s] 61it [00:02, 21.54it/s] 64it [00:03, 21.36it/s] 67it [00:03, 21.49it/s] 70it [00:03, 21.45it/s] 73it [00:03, 21.37it/s] 76it [00:03, 21.46it/s] 79it [00:03, 21.54it/s] 82it [00:03, 21.57it/s] 85it [00:04, 21.55it/s] 88it [00:04, 21.58it/s] 91it [00:04, 21.63it/s] 94it [00:04, 21.73it/s] 97it [00:04, 21.75it/s] 100it [00:04, 21.70it/s]2025-05-26 00:56:53,806 - INFO - [Epoch 042 | Batch 0100] IWAE-loss 2281.2720 | mean log_px -0.0119 | KL -1445.24 + 103it [00:04, 21.37it/s] 106it [00:05, 21.38it/s] 109it [00:05, 21.50it/s] 112it [00:05, 21.58it/s] 115it [00:05, 21.66it/s] 118it [00:05, 21.69it/s] 121it [00:05, 21.72it/s] 124it [00:05, 21.73it/s] 127it [00:06, 21.78it/s] 130it [00:06, 21.73it/s] 133it [00:06, 21.62it/s] 136it [00:06, 21.57it/s] 139it [00:06, 21.52it/s] 142it [00:06, 21.42it/s] 145it [00:06, 21.43it/s] 148it [00:06, 21.43it/s]2025-05-26 00:56:56,126 - INFO - [Epoch 042 | Batch 0150] IWAE-loss 1771.2439 | mean log_px -0.0046 | KL -1446.79 + 151it [00:07, 21.49it/s] 154it [00:07, 21.43it/s] 157it [00:07, 21.44it/s] 160it [00:07, 21.42it/s] 163it [00:07, 21.13it/s] 166it [00:07, 21.14it/s] 169it [00:07, 21.34it/s] 172it [00:08, 21.49it/s] 175it [00:08, 21.62it/s] 178it [00:08, 21.48it/s] 181it [00:08, 21.55it/s] 184it [00:08, 21.63it/s] 187it [00:08, 21.67it/s] 190it [00:08, 21.71it/s] 193it [00:09, 21.69it/s] 196it [00:09, 20.67it/s] 196it [00:09, 21.06it/s] +2025-05-26 00:56:58,332 - INFO - Epoch: 42, Objective: tensor([2071.3540], device='cuda:0', grad_fn=), Loss: 0.014108674600720406, KL/n: 29.50428009033203 + 0it [00:00, ?it/s]2025-05-26 00:56:58,586 - INFO - [Epoch 043 | Batch 0000] IWAE-loss 2471.4727 | mean log_px -0.0146 | KL -1446.35 + 1it [00:00, 6.53it/s] 4it [00:00, 14.60it/s] 7it [00:00, 17.70it/s] 10it [00:00, 19.21it/s] 13it [00:00, 20.00it/s] 16it [00:00, 20.55it/s] 19it [00:00, 20.87it/s] 22it [00:01, 21.16it/s] 25it [00:01, 21.34it/s] 28it [00:01, 21.50it/s] 31it [00:01, 21.60it/s] 34it [00:01, 21.61it/s] 37it [00:01, 21.32it/s] 40it [00:01, 21.29it/s] 43it [00:02, 21.44it/s] 46it [00:02, 21.50it/s] 49it [00:02, 21.58it/s]2025-05-26 00:57:00,914 - INFO - [Epoch 043 | Batch 0050] IWAE-loss 1602.5768 | mean log_px -0.0023 | KL -1443.20 + 52it [00:02, 21.68it/s] 55it [00:02, 21.72it/s] 58it [00:02, 21.76it/s] 61it [00:02, 21.71it/s] 64it [00:03, 21.75it/s] 67it [00:03, 21.52it/s] 70it [00:03, 21.45it/s] 73it [00:03, 21.50it/s] 76it [00:03, 21.57it/s] 79it [00:03, 21.60it/s] 82it [00:03, 21.64it/s] 85it [00:04, 21.48it/s] 88it [00:04, 21.52it/s] 91it [00:04, 21.60it/s] 94it [00:04, 21.56it/s] 97it [00:04, 21.57it/s] 100it [00:04, 21.55it/s]2025-05-26 00:57:03,230 - INFO - [Epoch 043 | Batch 0100] IWAE-loss 2544.3938 | mean log_px -0.0158 | KL -1437.81 + 103it [00:04, 21.55it/s] 106it [00:05, 21.56it/s] 109it [00:05, 21.55it/s] 112it [00:05, 21.62it/s] 115it [00:05, 21.56it/s] 118it [00:05, 21.58it/s] 121it [00:05, 21.61it/s] 124it [00:05, 21.69it/s] 127it [00:05, 21.70it/s] 130it [00:06, 21.75it/s] 133it [00:06, 21.84it/s] 136it [00:06, 21.89it/s] 139it [00:06, 21.89it/s] 142it [00:06, 21.89it/s] 145it [00:06, 21.97it/s] 148it [00:06, 21.90it/s]2025-05-26 00:57:05,527 - INFO - [Epoch 043 | Batch 0150] IWAE-loss 2123.0671 | mean log_px -0.0099 | KL -1432.95 + 151it [00:07, 21.84it/s] 154it [00:07, 21.90it/s] 157it [00:07, 21.82it/s] 160it [00:07, 21.84it/s] 163it [00:07, 21.77it/s] 166it [00:07, 21.78it/s] 169it [00:07, 21.88it/s] 172it [00:08, 21.90it/s] 175it [00:08, 21.91it/s] 178it [00:08, 21.93it/s] 181it [00:08, 21.96it/s] 184it [00:08, 21.88it/s] 187it [00:08, 21.89it/s] 190it [00:08, 21.84it/s] 193it [00:09, 21.86it/s] 196it [00:09, 20.70it/s] 196it [00:09, 21.22it/s] +2025-05-26 00:57:07,696 - INFO - Epoch: 43, Objective: tensor([1849.3069], device='cuda:0', grad_fn=), Loss: 0.004115985706448555, KL/n: 29.187782287597656 + 0it [00:00, ?it/s]2025-05-26 00:57:08,129 - INFO - [Epoch 044 | Batch 0000] IWAE-loss 1622.7651 | mean log_px -0.0028 | KL -1428.05 + 1it [00:00, 6.97it/s] 4it [00:00, 15.36it/s] 7it [00:00, 18.73it/s] 10it [00:00, 20.22it/s] 13it [00:00, 20.42it/s] 16it [00:00, 20.39it/s] 19it [00:00, 20.88it/s] 22it [00:01, 21.22it/s] 25it [00:01, 21.46it/s] 28it [00:01, 21.52it/s] 31it [00:01, 21.55it/s] 34it [00:01, 21.58it/s] 37it [00:01, 21.69it/s] 40it [00:01, 21.83it/s] 43it [00:02, 21.90it/s] 46it [00:02, 21.96it/s] 49it [00:02, 21.97it/s]2025-05-26 00:57:10,419 - INFO - [Epoch 044 | Batch 0050] IWAE-loss 1785.8911 | mean log_px -0.0052 | KL -1424.84 + 52it [00:02, 21.92it/s] 55it [00:02, 21.89it/s] 58it [00:02, 21.99it/s] 61it [00:02, 21.99it/s] 64it [00:03, 21.96it/s] 67it [00:03, 21.97it/s] 70it [00:03, 21.97it/s] 73it [00:03, 21.99it/s] 76it [00:03, 22.02it/s] 79it [00:03, 21.98it/s] 82it [00:03, 21.99it/s] 85it [00:03, 21.97it/s] 88it [00:04, 22.03it/s] 91it [00:04, 21.83it/s] 94it [00:04, 21.85it/s] 97it [00:04, 21.91it/s] 100it [00:04, 21.92it/s]2025-05-26 00:57:12,698 - INFO - [Epoch 044 | Batch 0100] IWAE-loss 1799.6758 | mean log_px -0.0055 | KL -1414.32 + 103it [00:04, 21.86it/s] 106it [00:04, 21.90it/s] 109it [00:05, 21.95it/s] 112it [00:05, 21.95it/s] 115it [00:05, 21.97it/s] 118it [00:05, 22.02it/s] 121it [00:05, 22.05it/s] 124it [00:05, 22.04it/s] 127it [00:05, 22.05it/s] 130it [00:06, 22.03it/s] 133it [00:06, 22.05it/s] 136it [00:06, 21.97it/s] 139it [00:06, 21.95it/s] 142it [00:06, 21.32it/s] 145it [00:06, 20.90it/s] 148it [00:06, 21.09it/s]2025-05-26 00:57:15,006 - INFO - [Epoch 044 | Batch 0150] IWAE-loss 1856.3705 | mean log_px -0.0064 | KL -1408.81 + 151it [00:07, 21.11it/s] 154it [00:07, 21.24it/s] 157it [00:07, 21.41it/s] 160it [00:07, 21.46it/s] 163it [00:07, 21.56it/s] 166it [00:07, 21.64it/s] 169it [00:07, 21.70it/s] 172it [00:07, 21.74it/s] 175it [00:08, 21.57it/s] 178it [00:08, 21.69it/s] 181it [00:08, 22.03it/s] 184it [00:08, 22.27it/s] 187it [00:08, 21.74it/s] 190it [00:08, 21.68it/s] 193it [00:08, 21.61it/s] 196it [00:09, 20.15it/s] 196it [00:09, 21.31it/s] +2025-05-26 00:57:17,203 - INFO - Epoch: 44, Objective: tensor([1650.4667], device='cuda:0', grad_fn=), Loss: 0.0043082693591713905, KL/n: 28.803646087646484 + 0it [00:00, ?it/s]2025-05-26 00:57:17,453 - INFO - [Epoch 045 | Batch 0000] IWAE-loss 1637.3373 | mean log_px -0.0032 | KL -1411.23 + 1it [00:00, 6.79it/s] 4it [00:00, 14.98it/s] 7it [00:00, 17.95it/s] 10it [00:00, 19.53it/s] 13it [00:00, 20.72it/s] 16it [00:00, 21.57it/s] 19it [00:00, 22.09it/s] 22it [00:01, 22.38it/s] 25it [00:01, 22.39it/s] 28it [00:01, 22.45it/s] 31it [00:01, 22.42it/s] 34it [00:01, 22.31it/s] 37it [00:01, 22.49it/s] 40it [00:01, 22.57it/s] 43it [00:02, 22.68it/s] 46it [00:02, 22.59it/s] 49it [00:02, 22.77it/s]2025-05-26 00:57:19,676 - INFO - [Epoch 045 | Batch 0050] IWAE-loss 2104.2029 | mean log_px -0.0099 | KL -1408.87 + 52it [00:02, 22.77it/s] 55it [00:02, 22.89it/s] 58it [00:02, 22.95it/s] 61it [00:02, 22.96it/s] 64it [00:02, 22.98it/s] 67it [00:03, 23.01it/s] 70it [00:03, 22.99it/s] 73it [00:03, 22.92it/s] 76it [00:03, 22.69it/s] 79it [00:03, 22.40it/s] 82it [00:03, 22.54it/s] 85it [00:03, 22.68it/s] 88it [00:03, 22.73it/s] 91it [00:04, 22.90it/s] 94it [00:04, 22.80it/s] 97it [00:04, 22.79it/s] 100it [00:04, 22.85it/s]2025-05-26 00:57:21,867 - INFO - [Epoch 045 | Batch 0100] IWAE-loss 1605.4434 | mean log_px -0.0029 | KL -1402.01 + 103it [00:04, 22.83it/s] 106it [00:04, 22.77it/s] 109it [00:04, 22.90it/s] 112it [00:05, 22.95it/s] 115it [00:05, 22.98it/s] 118it [00:05, 23.05it/s] 121it [00:05, 23.04it/s] 124it [00:05, 23.02it/s] 127it [00:05, 23.04it/s] 130it [00:05, 22.99it/s] 133it [00:05, 23.06it/s] 136it [00:06, 23.14it/s] 139it [00:06, 23.15it/s] 142it [00:06, 23.23it/s] 145it [00:06, 22.97it/s] 148it [00:06, 22.92it/s]2025-05-26 00:57:24,040 - INFO - [Epoch 045 | Batch 0150] IWAE-loss 2139.8701 | mean log_px -0.0107 | KL -1391.61 + 151it [00:06, 22.90it/s] 154it [00:06, 22.45it/s] 157it [00:07, 22.23it/s] 160it [00:07, 21.81it/s] 163it [00:07, 21.76it/s] 166it [00:07, 21.73it/s] 169it [00:07, 21.73it/s] 172it [00:07, 21.75it/s] 175it [00:07, 21.66it/s] 178it [00:07, 21.63it/s] 181it [00:08, 21.67it/s] 184it [00:08, 21.69it/s] 187it [00:08, 21.63it/s] 190it [00:08, 21.66it/s] 193it [00:08, 21.76it/s] 196it [00:08, 20.64it/s] 196it [00:08, 22.07it/s] +2025-05-26 00:57:26,212 - INFO - Epoch: 45, Objective: tensor([1448.7209], device='cuda:0', grad_fn=), Loss: 0.0009417841793037951, KL/n: 28.448556900024414 + 0it [00:00, ?it/s]2025-05-26 00:57:26,463 - INFO - [Epoch 046 | Batch 0000] IWAE-loss 2507.5264 | mean log_px -0.0159 | KL -1395.98 + 1it [00:00, 7.09it/s] 4it [00:00, 15.05it/s] 7it [00:00, 18.00it/s] 10it [00:00, 19.47it/s] 13it [00:00, 20.00it/s] 16it [00:00, 20.63it/s] 19it [00:00, 21.02it/s] 22it [00:01, 21.20it/s] 25it [00:01, 21.46it/s] 28it [00:01, 21.70it/s] 31it [00:01, 21.93it/s] 34it [00:01, 21.78it/s] 37it [00:01, 21.83it/s] 40it [00:01, 21.75it/s] 43it [00:02, 21.62it/s] 46it [00:02, 21.30it/s] 49it [00:02, 20.91it/s]2025-05-26 00:57:28,793 - INFO - [Epoch 046 | Batch 0050] IWAE-loss 1671.3993 | mean log_px -0.0041 | KL -1383.41 + 52it [00:02, 21.11it/s] 55it [00:02, 21.07it/s] 58it [00:02, 20.98it/s] 61it [00:02, 20.94it/s] 64it [00:03, 21.21it/s] 67it [00:03, 21.43it/s] 70it [00:03, 21.60it/s] 73it [00:03, 21.60it/s] 76it [00:03, 21.55it/s] 79it [00:03, 21.61it/s] 82it [00:03, 21.24it/s] 85it [00:04, 20.72it/s] 88it [00:04, 20.65it/s] 91it [00:04, 20.97it/s] 94it [00:04, 21.08it/s] 97it [00:04, 21.03it/s] 100it [00:04, 21.25it/s]2025-05-26 00:57:31,152 - INFO - [Epoch 046 | Batch 0100] IWAE-loss 1902.7402 | mean log_px -0.0074 | KL -1382.97 + 103it [00:04, 20.97it/s] 106it [00:05, 21.09it/s] 109it [00:05, 21.28it/s] 112it [00:05, 21.46it/s] 115it [00:05, 21.44it/s] 118it [00:05, 21.36it/s] 121it [00:05, 21.05it/s] 124it [00:05, 21.12it/s] 127it [00:06, 20.98it/s] 130it [00:06, 20.92it/s] 133it [00:06, 21.15it/s] 136it [00:06, 21.19it/s] 139it [00:06, 21.29it/s] 142it [00:06, 20.93it/s] 145it [00:06, 21.09it/s] 148it [00:07, 21.21it/s]2025-05-26 00:57:33,511 - INFO - [Epoch 046 | Batch 0150] IWAE-loss 1636.1058 | mean log_px -0.0036 | KL -1382.20 + 151it [00:07, 21.33it/s] 154it [00:07, 21.25it/s] 157it [00:07, 20.88it/s] 160it [00:07, 21.06it/s] 163it [00:07, 21.10it/s] 166it [00:07, 21.29it/s] 169it [00:08, 20.93it/s] 172it [00:08, 21.01it/s] 175it [00:08, 21.09it/s] 178it [00:08, 21.35it/s] 181it [00:08, 21.50it/s] 184it [00:08, 21.60it/s] 187it [00:08, 21.22it/s] 190it [00:09, 21.11it/s] 193it [00:09, 21.00it/s] 196it [00:09, 19.86it/s] 196it [00:09, 20.85it/s] +2025-05-26 00:57:35,749 - INFO - Epoch: 46, Objective: tensor([1802.6743], device='cuda:0', grad_fn=), Loss: 0.006433203816413879, KL/n: 28.203641891479492 + 0it [00:00, ?it/s]2025-05-26 00:57:36,169 - INFO - [Epoch 047 | Batch 0000] IWAE-loss 2782.5513 | mean log_px -0.0200 | KL -1383.00 + 1it [00:00, 7.62it/s] 4it [00:00, 15.79it/s] 7it [00:00, 18.22it/s] 10it [00:00, 19.29it/s] 13it [00:00, 19.80it/s] 16it [00:00, 20.02it/s] 19it [00:00, 20.30it/s] 22it [00:01, 20.62it/s] 25it [00:01, 20.92it/s] 28it [00:01, 21.06it/s] 31it [00:01, 20.97it/s] 34it [00:01, 21.22it/s] 37it [00:01, 21.21it/s] 40it [00:01, 21.34it/s] 43it [00:02, 21.43it/s] 46it [00:02, 21.48it/s] 49it [00:02, 21.58it/s]2025-05-26 00:57:38,527 - INFO - [Epoch 047 | Batch 0050] IWAE-loss 1485.3203 | mean log_px -0.0015 | KL -1377.35 + 52it [00:02, 21.42it/s] 55it [00:02, 21.42it/s] 58it [00:02, 21.35it/s] 61it [00:02, 21.36it/s] 64it [00:03, 21.48it/s] 67it [00:03, 21.31it/s] 70it [00:03, 21.28it/s] 73it [00:03, 21.33it/s] 76it [00:03, 21.37it/s] 79it [00:03, 21.40it/s] 82it [00:03, 21.46it/s] 85it [00:04, 21.49it/s] 88it [00:04, 21.37it/s] 91it [00:04, 21.17it/s] 94it [00:04, 21.15it/s] 97it [00:04, 21.36it/s] 100it [00:04, 21.49it/s]2025-05-26 00:57:40,869 - INFO - [Epoch 047 | Batch 0100] IWAE-loss 1822.8883 | mean log_px -0.0064 | KL -1371.89 + 103it [00:04, 21.53it/s] 106it [00:05, 21.63it/s] 109it [00:05, 21.73it/s] 112it [00:05, 21.75it/s] 115it [00:05, 21.75it/s] 118it [00:05, 21.72it/s] 121it [00:05, 21.75it/s] 124it [00:05, 21.66it/s] 127it [00:06, 21.47it/s] 130it [00:06, 21.07it/s] 133it [00:06, 20.89it/s] 136it [00:06, 21.06it/s] 139it [00:06, 20.99it/s] 142it [00:06, 21.11it/s] 145it [00:06, 21.28it/s] 148it [00:07, 21.43it/s]2025-05-26 00:57:43,205 - INFO - [Epoch 047 | Batch 0150] IWAE-loss 1521.3999 | mean log_px -0.0022 | KL -1370.30 + 151it [00:07, 21.35it/s] 154it [00:07, 21.34it/s] 157it [00:07, 21.48it/s] 160it [00:07, 21.44it/s] 163it [00:07, 21.52it/s] 166it [00:07, 21.18it/s] 169it [00:08, 21.30it/s] 172it [00:08, 21.24it/s] 175it [00:08, 21.07it/s] 178it [00:08, 21.27it/s] 181it [00:08, 21.39it/s] 184it [00:08, 21.42it/s] 187it [00:08, 21.52it/s] 190it [00:08, 21.60it/s] 193it [00:09, 21.58it/s] 196it [00:09, 20.54it/s] 196it [00:09, 20.95it/s] +2025-05-26 00:57:45,422 - INFO - Epoch: 47, Objective: tensor([1651.9421], device='cuda:0', grad_fn=), Loss: 0.005090292543172836, KL/n: 27.957805633544922 + 0it [00:00, ?it/s]2025-05-26 00:57:45,660 - INFO - [Epoch 048 | Batch 0000] IWAE-loss 1497.5374 | mean log_px -0.0018 | KL -1369.39 + 1it [00:00, 7.29it/s] 4it [00:00, 15.37it/s] 7it [00:00, 18.14it/s] 10it [00:00, 19.37it/s] 13it [00:00, 20.20it/s] 16it [00:00, 20.66it/s] 19it [00:00, 20.98it/s] 22it [00:01, 21.16it/s] 25it [00:01, 21.21it/s] 28it [00:01, 21.23it/s] 31it [00:01, 21.16it/s] 34it [00:01, 21.35it/s] 37it [00:01, 21.11it/s] 40it [00:01, 20.91it/s] 43it [00:02, 21.09it/s] 46it [00:02, 21.18it/s] 49it [00:02, 21.21it/s]2025-05-26 00:57:48,019 - INFO - [Epoch 048 | Batch 0050] IWAE-loss 1616.6787 | mean log_px -0.0036 | KL -1363.86 + 52it [00:02, 20.68it/s] 55it [00:02, 20.85it/s] 58it [00:02, 21.13it/s] 61it [00:02, 21.34it/s] 64it [00:03, 21.21it/s] 67it [00:03, 21.36it/s] 70it [00:03, 21.45it/s] 73it [00:03, 21.51it/s] 76it [00:03, 21.55it/s] 79it [00:03, 21.54it/s] 82it [00:03, 21.50it/s] 85it [00:04, 21.04it/s] 88it [00:04, 21.06it/s] 91it [00:04, 20.95it/s] 94it [00:04, 21.18it/s] 97it [00:04, 21.03it/s] 100it [00:04, 21.25it/s]2025-05-26 00:57:50,374 - INFO - [Epoch 048 | Batch 0100] IWAE-loss 1722.9374 | mean log_px -0.0051 | KL -1362.57 + 103it [00:04, 21.25it/s] 106it [00:05, 21.30it/s] 109it [00:05, 21.17it/s] 112it [00:05, 20.71it/s] 115it [00:05, 20.97it/s] 118it [00:05, 21.29it/s] 121it [00:05, 21.11it/s] 124it [00:05, 21.39it/s] 127it [00:06, 21.58it/s] 130it [00:06, 21.72it/s] 133it [00:06, 21.78it/s] 136it [00:06, 21.84it/s] 139it [00:06, 21.63it/s] 142it [00:06, 20.99it/s] 145it [00:06, 20.98it/s] 148it [00:07, 21.05it/s]2025-05-26 00:57:52,720 - INFO - [Epoch 048 | Batch 0150] IWAE-loss 2112.1748 | mean log_px -0.0107 | KL -1362.66 + 151it [00:07, 21.34it/s] 154it [00:07, 21.26it/s] 157it [00:07, 20.94it/s] 160it [00:07, 20.87it/s] 163it [00:07, 20.83it/s] 166it [00:07, 20.55it/s] 169it [00:08, 20.78it/s] 172it [00:08, 21.02it/s] 175it [00:08, 20.77it/s] 178it [00:08, 20.95it/s] 181it [00:08, 21.03it/s] 184it [00:08, 21.24it/s] 187it [00:08, 21.23it/s] 190it [00:09, 21.41it/s] 193it [00:09, 21.25it/s] 196it [00:09, 20.35it/s] 196it [00:09, 20.82it/s] +2025-05-26 00:57:54,968 - INFO - Epoch: 48, Objective: tensor([1470.6415], device='cuda:0', grad_fn=), Loss: 0.0013338052667677402, KL/n: 27.79652976989746 + 0it [00:00, ?it/s]2025-05-26 00:57:55,386 - INFO - [Epoch 049 | Batch 0000] IWAE-loss 1419.2751 | mean log_px -0.0009 | KL -1359.16 + 1it [00:00, 7.05it/s] 4it [00:00, 15.77it/s] 7it [00:00, 18.40it/s] 10it [00:00, 19.88it/s] 13it [00:00, 20.66it/s] 16it [00:00, 21.13it/s] 19it [00:00, 21.43it/s] 22it [00:01, 21.48it/s] 25it [00:01, 21.67it/s] 28it [00:01, 21.79it/s] 31it [00:01, 21.87it/s] 34it [00:01, 21.92it/s] 37it [00:01, 22.00it/s] 40it [00:01, 21.60it/s] 43it [00:02, 21.74it/s] 46it [00:02, 21.64it/s] 49it [00:02, 21.80it/s]2025-05-26 00:57:57,674 - INFO - [Epoch 049 | Batch 0050] IWAE-loss 1543.2958 | mean log_px -0.0027 | KL -1355.80 + 52it [00:02, 21.79it/s] 55it [00:02, 21.46it/s] 58it [00:02, 21.59it/s] 61it [00:02, 21.57it/s] 64it [00:03, 21.45it/s] 67it [00:03, 21.34it/s] 70it [00:03, 21.53it/s] 73it [00:03, 21.70it/s] 76it [00:03, 21.78it/s] 79it [00:03, 21.44it/s] 82it [00:03, 21.63it/s] 85it [00:04, 21.74it/s] 88it [00:04, 21.84it/s] 91it [00:04, 21.95it/s] 94it [00:04, 21.85it/s] 97it [00:04, 21.61it/s] 100it [00:04, 21.61it/s]2025-05-26 00:57:59,988 - INFO - [Epoch 049 | Batch 0100] IWAE-loss 1606.1241 | mean log_px -0.0037 | KL -1346.07 + 103it [00:04, 21.68it/s] 106it [00:04, 21.65it/s] 109it [00:05, 21.76it/s] 112it [00:05, 21.86it/s] 115it [00:05, 21.93it/s] 118it [00:05, 21.99it/s] 121it [00:05, 21.70it/s] 124it [00:05, 21.42it/s] 127it [00:05, 21.60it/s] 130it [00:06, 21.65it/s] 133it [00:06, 21.80it/s] 136it [00:06, 21.87it/s] 139it [00:06, 21.40it/s] 142it [00:06, 21.22it/s] 145it [00:06, 21.51it/s] 148it [00:06, 21.74it/s]2025-05-26 00:58:02,295 - INFO - [Epoch 049 | Batch 0150] IWAE-loss 1674.8267 | mean log_px -0.0048 | KL -1340.20 + 151it [00:07, 21.69it/s] 154it [00:07, 21.90it/s] 157it [00:07, 22.30it/s] 160it [00:07, 22.73it/s] 163it [00:07, 22.66it/s] 166it [00:07, 22.96it/s] 169it [00:07, 23.03it/s] 172it [00:07, 23.14it/s] 175it [00:08, 23.21it/s] 178it [00:08, 23.22it/s] 181it [00:08, 23.30it/s] 184it [00:08, 23.39it/s] 187it [00:08, 22.90it/s] 190it [00:08, 23.05it/s] 193it [00:08, 23.15it/s] 196it [00:09, 22.25it/s] 196it [00:09, 21.61it/s] +2025-05-26 00:58:04,343 - INFO - Epoch: 49, Objective: tensor([1618.0193], device='cuda:0', grad_fn=), Loss: 0.00431447196751833, KL/n: 27.343738555908203 + 0it [00:00, ?it/s]2025-05-26 00:58:04,596 - INFO - [Epoch 050 | Batch 0000] IWAE-loss 1586.2008 | mean log_px -0.0035 | KL -1339.42 + 1it [00:00, 6.84it/s] 4it [00:00, 15.18it/s] 7it [00:00, 18.14it/s] 10it [00:00, 19.48it/s] 13it [00:00, 20.19it/s] 16it [00:00, 20.79it/s] 19it [00:00, 21.22it/s] 22it [00:01, 21.52it/s] 25it [00:01, 21.35it/s] 28it [00:01, 21.44it/s] 31it [00:01, 21.29it/s] 34it [00:01, 21.34it/s] 37it [00:01, 21.24it/s] 40it [00:01, 21.35it/s] 43it [00:02, 21.58it/s] 46it [00:02, 21.73it/s] 49it [00:02, 21.75it/s]2025-05-26 00:58:06,909 - INFO - [Epoch 050 | Batch 0050] IWAE-loss 1525.3423 | mean log_px -0.0027 | KL -1336.66 + 52it [00:02, 21.84it/s] 55it [00:02, 21.94it/s] 58it [00:02, 21.99it/s] 61it [00:02, 21.99it/s] 64it [00:03, 21.53it/s] 67it [00:03, 21.55it/s] 70it [00:03, 21.21it/s] 73it [00:03, 21.49it/s] 76it [00:03, 21.24it/s] 79it [00:03, 21.45it/s] 82it [00:03, 21.56it/s] 85it [00:04, 21.58it/s] 88it [00:04, 21.72it/s] 91it [00:04, 21.81it/s] 94it [00:04, 21.90it/s] 97it [00:04, 21.55it/s] 100it [00:04, 21.70it/s]2025-05-26 00:58:09,220 - INFO - [Epoch 050 | Batch 0100] IWAE-loss 1826.6475 | mean log_px -0.0070 | KL -1333.85 + 103it [00:04, 21.65it/s] 106it [00:05, 21.36it/s] 109it [00:05, 21.36it/s] 112it [00:05, 21.50it/s] 115it [00:05, 21.62it/s] 118it [00:05, 21.35it/s] 121it [00:05, 21.35it/s] 124it [00:05, 21.40it/s] 127it [00:05, 21.51it/s] 130it [00:06, 21.35it/s] 133it [00:06, 20.99it/s] 136it [00:06, 21.33it/s] 139it [00:06, 21.51it/s] 142it [00:06, 21.66it/s] 145it [00:06, 21.42it/s] 148it [00:06, 21.40it/s]2025-05-26 00:58:11,563 - INFO - [Epoch 050 | Batch 0150] IWAE-loss 1705.2615 | mean log_px -0.0053 | KL -1331.09 + 151it [00:07, 21.13it/s] 154it [00:07, 21.41it/s] 157it [00:07, 21.59it/s] 160it [00:07, 21.78it/s] 163it [00:07, 21.70it/s] 166it [00:07, 21.80it/s] 169it [00:07, 21.73it/s] 172it [00:08, 21.42it/s] 175it [00:08, 21.42it/s] 178it [00:08, 21.56it/s] 181it [00:08, 21.56it/s] 184it [00:08, 21.63it/s] 187it [00:08, 21.55it/s] 190it [00:08, 21.52it/s] 193it [00:09, 21.35it/s] 196it [00:09, 20.41it/s] 196it [00:09, 21.11it/s] +2025-05-26 00:58:13,757 - INFO - Epoch: 50, Objective: tensor([1748.8579], device='cuda:0', grad_fn=), Loss: 0.0034362648148089647, KL/n: 27.15498924255371 + 0it [00:00, ?it/s]2025-05-26 00:58:14,311 - INFO - [Epoch 051 | Batch 0000] IWAE-loss 1500.6370 | mean log_px -0.0024 | KL -1332.47 + 1it [00:00, 3.53it/s] 3it [00:00, 9.01it/s] 6it [00:00, 13.90it/s] 9it [00:00, 16.58it/s] 12it [00:00, 18.38it/s] 15it [00:00, 19.47it/s] 18it [00:01, 20.10it/s] 21it [00:01, 20.65it/s] 24it [00:01, 21.05it/s] 27it [00:01, 21.20it/s] 30it [00:01, 21.39it/s] 33it [00:01, 21.35it/s] 36it [00:01, 21.26it/s] 39it [00:02, 21.60it/s] 42it [00:02, 21.44it/s] 45it [00:02, 21.00it/s] 48it [00:02, 20.85it/s]2025-05-26 00:58:16,663 - INFO - [Epoch 051 | Batch 0050] IWAE-loss 1433.8640 | mean log_px -0.0015 | KL -1325.81 + 51it [00:02, 20.75it/s] 54it [00:02, 20.78it/s] 57it [00:02, 20.86it/s] 60it [00:03, 20.81it/s] 63it [00:03, 21.13it/s] 66it [00:03, 21.37it/s] 69it [00:03, 21.62it/s] 72it [00:03, 21.74it/s] 75it [00:03, 21.81it/s] 78it [00:03, 21.80it/s] 81it [00:04, 21.38it/s] 84it [00:04, 21.29it/s] 87it [00:04, 21.48it/s] 90it [00:04, 21.39it/s] 93it [00:04, 21.25it/s] 96it [00:04, 21.18it/s] 99it [00:04, 21.27it/s]2025-05-26 00:58:19,000 - INFO - [Epoch 051 | Batch 0100] IWAE-loss 1984.5623 | mean log_px -0.0094 | KL -1325.75 + 102it [00:05, 21.49it/s] 105it [00:05, 21.71it/s] 108it [00:05, 21.87it/s] 111it [00:05, 21.95it/s] 114it [00:05, 22.06it/s] 117it [00:05, 21.96it/s] 120it [00:05, 21.85it/s] 123it [00:05, 21.26it/s] 126it [00:06, 21.49it/s] 129it [00:06, 21.62it/s] 132it [00:06, 21.78it/s] 135it [00:06, 21.84it/s] 138it [00:06, 21.81it/s] 141it [00:06, 21.85it/s] 144it [00:06, 21.94it/s] 147it [00:07, 21.52it/s] 150it [00:07, 20.82it/s]2025-05-26 00:58:21,314 - INFO - [Epoch 051 | Batch 0150] IWAE-loss 1504.7230 | mean log_px -0.0026 | KL -1323.70 + 153it [00:07, 20.94it/s] 156it [00:07, 20.81it/s] 159it [00:07, 21.08it/s] 162it [00:07, 21.30it/s] 165it [00:07, 21.53it/s] 168it [00:08, 21.50it/s] 171it [00:08, 21.35it/s] 174it [00:08, 21.41it/s] 177it [00:08, 21.62it/s] 180it [00:08, 21.76it/s] 183it [00:08, 21.87it/s] 186it [00:08, 21.93it/s] 189it [00:09, 21.75it/s] 192it [00:09, 21.25it/s] 195it [00:09, 20.36it/s] 196it [00:09, 20.70it/s] +2025-05-26 00:58:23,523 - INFO - Epoch: 51, Objective: tensor([1614.4099], device='cuda:0', grad_fn=), Loss: 0.003150055417791009, KL/n: 26.94906997680664 + 0it [00:00, ?it/s]2025-05-26 00:58:23,946 - INFO - [Epoch 052 | Batch 0000] IWAE-loss 1623.8162 | mean log_px -0.0043 | KL -1321.24 + 1it [00:00, 7.44it/s] 4it [00:00, 15.65it/s] 7it [00:00, 18.48it/s] 10it [00:00, 19.78it/s] 13it [00:00, 20.57it/s] 16it [00:00, 20.85it/s] 19it [00:00, 21.01it/s] 22it [00:01, 21.23it/s] 25it [00:01, 21.48it/s] 28it [00:01, 21.66it/s] 31it [00:01, 21.67it/s] 34it [00:01, 21.74it/s] 37it [00:01, 21.79it/s] 40it [00:01, 21.82it/s] 43it [00:02, 21.89it/s] 46it [00:02, 21.91it/s] 49it [00:02, 21.85it/s]2025-05-26 00:58:26,248 - INFO - [Epoch 052 | Batch 0050] IWAE-loss 1479.0861 | mean log_px -0.0024 | KL -1313.58 + 52it [00:02, 21.76it/s] 55it [00:02, 21.91it/s] 58it [00:02, 21.92it/s] 61it [00:02, 21.98it/s] 64it [00:03, 22.05it/s] 67it [00:03, 22.08it/s] 70it [00:03, 22.15it/s] 73it [00:03, 22.21it/s] 76it [00:03, 22.23it/s] 79it [00:03, 22.22it/s] 82it [00:03, 22.24it/s] 85it [00:03, 22.25it/s] 88it [00:04, 22.21it/s] 91it [00:04, 22.20it/s] 94it [00:04, 22.24it/s] 97it [00:04, 22.20it/s] 100it [00:04, 22.17it/s]2025-05-26 00:58:28,504 - INFO - [Epoch 052 | Batch 0100] IWAE-loss 1882.7440 | mean log_px -0.0082 | KL -1309.20 + 103it [00:04, 22.18it/s] 106it [00:04, 22.25it/s] 109it [00:05, 22.25it/s] 112it [00:05, 22.23it/s] 115it [00:05, 22.24it/s] 118it [00:05, 22.17it/s] 121it [00:05, 22.13it/s] 124it [00:05, 22.23it/s] 127it [00:05, 22.09it/s] 130it [00:05, 22.10it/s] 133it [00:06, 22.14it/s] 136it [00:06, 22.13it/s] 139it [00:06, 22.16it/s] 142it [00:06, 22.20it/s] 145it [00:06, 22.18it/s] 148it [00:06, 22.14it/s]2025-05-26 00:58:30,761 - INFO - [Epoch 052 | Batch 0150] IWAE-loss 1388.5631 | mean log_px -0.0011 | KL -1308.61 + 151it [00:06, 22.03it/s] 154it [00:07, 22.07it/s] 157it [00:07, 22.03it/s] 160it [00:07, 22.00it/s] 163it [00:07, 21.91it/s] 166it [00:07, 21.90it/s] 169it [00:07, 21.89it/s] 172it [00:07, 21.98it/s] 175it [00:08, 21.90it/s] 178it [00:08, 21.83it/s] 181it [00:08, 21.97it/s] 184it [00:08, 21.94it/s] 187it [00:08, 22.02it/s] 190it [00:08, 22.10it/s] 193it [00:08, 22.16it/s] 196it [00:09, 21.36it/s] 196it [00:09, 21.60it/s] +2025-05-26 00:58:32,912 - INFO - Epoch: 52, Objective: tensor([2569.8589], device='cuda:0', grad_fn=), Loss: 0.02012932486832142, KL/n: 26.71076011657715 + 0it [00:00, ?it/s]2025-05-26 00:58:33,152 - INFO - [Epoch 053 | Batch 0000] IWAE-loss 1411.0377 | mean log_px -0.0015 | KL -1308.46 + 1it [00:00, 7.38it/s] 4it [00:00, 16.18it/s] 7it [00:00, 18.95it/s] 10it [00:00, 20.25it/s] 13it [00:00, 20.95it/s] 16it [00:00, 21.36it/s] 19it [00:00, 21.58it/s] 22it [00:01, 21.75it/s] 25it [00:01, 21.85it/s] 28it [00:01, 21.85it/s] 31it [00:01, 21.75it/s] 34it [00:01, 21.50it/s] 37it [00:01, 21.37it/s] 40it [00:01, 21.42it/s] 43it [00:02, 21.50it/s] 46it [00:02, 21.60it/s] 49it [00:02, 21.61it/s]2025-05-26 00:58:35,444 - INFO - [Epoch 053 | Batch 0050] IWAE-loss 1491.8326 | mean log_px -0.0027 | KL -1302.58 + 52it [00:02, 21.59it/s] 55it [00:02, 21.67it/s] 58it [00:02, 21.60it/s] 61it [00:02, 21.63it/s] 64it [00:03, 21.76it/s] 67it [00:03, 21.70it/s] 70it [00:03, 21.85it/s] 73it [00:03, 21.86it/s] 76it [00:03, 21.96it/s] 79it [00:03, 22.01it/s] 82it [00:03, 21.98it/s] 85it [00:03, 21.91it/s] 88it [00:04, 21.94it/s] 91it [00:04, 21.56it/s] 94it [00:04, 21.61it/s] 97it [00:04, 21.66it/s] 100it [00:04, 21.73it/s]2025-05-26 00:58:37,739 - INFO - [Epoch 053 | Batch 0100] IWAE-loss 1390.0989 | mean log_px -0.0013 | KL -1297.10 + 103it [00:04, 21.78it/s] 106it [00:04, 21.85it/s] 109it [00:05, 21.70it/s] 112it [00:05, 21.64it/s] 115it [00:05, 21.71it/s] 118it [00:05, 21.67it/s] 121it [00:05, 21.77it/s] 124it [00:05, 21.69it/s] 127it [00:05, 21.81it/s] 130it [00:06, 21.93it/s] 133it [00:06, 21.91it/s] 136it [00:06, 21.89it/s] 139it [00:06, 21.70it/s] 142it [00:06, 21.79it/s] 145it [00:06, 21.87it/s] 148it [00:06, 21.93it/s]2025-05-26 00:58:40,029 - INFO - [Epoch 053 | Batch 0150] IWAE-loss 1513.5092 | mean log_px -0.0031 | KL -1296.66 + 151it [00:07, 21.94it/s] 154it [00:07, 22.00it/s] 157it [00:07, 22.00it/s] 160it [00:07, 22.02it/s] 163it [00:07, 22.06it/s] 166it [00:07, 22.06it/s] 169it [00:07, 22.07it/s] 172it [00:07, 22.06it/s] 175it [00:08, 22.06it/s] 178it [00:08, 22.07it/s] 181it [00:08, 22.06it/s] 184it [00:08, 22.07it/s] 187it [00:08, 22.06it/s] 190it [00:08, 22.05it/s] 193it [00:08, 22.07it/s] 196it [00:09, 20.94it/s] 196it [00:09, 21.46it/s] +2025-05-26 00:58:42,176 - INFO - Epoch: 53, Objective: tensor([1650.0601], device='cuda:0', grad_fn=), Loss: 0.00238289637491107, KL/n: 26.484121322631836 + 0it [00:00, ?it/s]2025-05-26 00:58:42,416 - INFO - [Epoch 054 | Batch 0000] IWAE-loss 1821.5071 | mean log_px -0.0075 | KL -1298.44 + 1it [00:00, 7.21it/s] 4it [00:00, 16.08it/s] 7it [00:00, 18.72it/s] 10it [00:00, 20.10it/s] 13it [00:00, 20.83it/s] 16it [00:00, 21.18it/s] 19it [00:00, 21.45it/s] 22it [00:01, 21.71it/s] 25it [00:01, 21.64it/s] 28it [00:01, 21.45it/s] 31it [00:01, 21.64it/s] 34it [00:01, 21.84it/s] 37it [00:01, 21.75it/s] 40it [00:01, 21.58it/s] 43it [00:02, 21.58it/s] 46it [00:02, 21.67it/s] 49it [00:02, 21.72it/s]2025-05-26 00:58:44,714 - INFO - [Epoch 054 | Batch 0050] IWAE-loss 1482.0979 | mean log_px -0.0028 | KL -1284.78 + 52it [00:02, 21.31it/s] 55it [00:02, 21.48it/s] 58it [00:02, 21.69it/s] 61it [00:02, 21.82it/s] 64it [00:03, 21.73it/s] 67it [00:03, 21.84it/s] 70it [00:03, 21.57it/s] 73it [00:03, 21.47it/s] 76it [00:03, 21.61it/s] 79it [00:03, 21.55it/s] 82it [00:03, 21.39it/s] 85it [00:04, 21.32it/s] 88it [00:04, 21.32it/s] 91it [00:04, 21.37it/s] 94it [00:04, 21.40it/s] 97it [00:04, 21.62it/s] 100it [00:04, 21.73it/s]2025-05-26 00:58:47,031 - INFO - [Epoch 054 | Batch 0100] IWAE-loss 1503.4625 | mean log_px -0.0031 | KL -1284.76 + 103it [00:04, 21.58it/s] 106it [00:04, 21.36it/s] 109it [00:05, 21.60it/s] 112it [00:05, 21.73it/s] 115it [00:05, 21.87it/s] 118it [00:05, 22.00it/s] 121it [00:05, 22.00it/s] 124it [00:05, 21.75it/s] 127it [00:05, 21.66it/s] 130it [00:06, 21.77it/s] 133it [00:06, 21.87it/s] 136it [00:06, 21.83it/s] 139it [00:06, 21.74it/s] 142it [00:06, 21.57it/s] 145it [00:06, 21.49it/s] 148it [00:06, 21.55it/s]2025-05-26 00:58:49,335 - INFO - [Epoch 054 | Batch 0150] IWAE-loss 1470.8281 | mean log_px -0.0026 | KL -1287.35 + 151it [00:07, 21.70it/s] 154it [00:07, 21.82it/s] 157it [00:07, 21.93it/s] 160it [00:07, 21.90it/s] 163it [00:07, 21.87it/s] 166it [00:07, 21.84it/s] 169it [00:07, 21.62it/s] 172it [00:08, 21.64it/s] 175it [00:08, 21.68it/s] 178it [00:08, 21.84it/s] 181it [00:08, 21.94it/s] 184it [00:08, 21.62it/s] 187it [00:08, 21.50it/s] 190it [00:08, 21.67it/s] 193it [00:08, 21.46it/s] 196it [00:09, 20.69it/s] 196it [00:09, 21.29it/s] +2025-05-26 00:58:51,512 - INFO - Epoch: 54, Objective: tensor([1502.0303], device='cuda:0', grad_fn=), Loss: 0.0024223646614700556, KL/n: 26.179628372192383 + 0it [00:00, ?it/s]2025-05-26 00:58:51,920 - INFO - [Epoch 055 | Batch 0000] IWAE-loss 2042.4064 | mean log_px -0.0109 | KL -1281.15 + 1it [00:00, 7.68it/s] 4it [00:00, 15.96it/s] 7it [00:00, 18.59it/s] 10it [00:00, 19.60it/s] 13it [00:00, 20.24it/s] 16it [00:00, 20.63it/s] 19it [00:00, 21.02it/s] 22it [00:01, 21.14it/s] 25it [00:01, 20.84it/s] 28it [00:01, 21.04it/s] 31it [00:01, 21.25it/s] 34it [00:01, 21.42it/s] 37it [00:01, 21.44it/s] 40it [00:01, 21.44it/s] 43it [00:02, 21.58it/s] 46it [00:02, 21.60it/s] 49it [00:02, 21.41it/s]2025-05-26 00:58:54,260 - INFO - [Epoch 055 | Batch 0050] IWAE-loss 1769.1973 | mean log_px -0.0070 | KL -1279.47 + 52it [00:02, 21.40it/s] 55it [00:02, 21.19it/s] 58it [00:02, 21.33it/s] 61it [00:02, 21.52it/s] 64it [00:03, 21.05it/s] 67it [00:03, 20.32it/s] 70it [00:03, 20.12it/s] 73it [00:03, 20.17it/s] 76it [00:03, 20.85it/s] 79it [00:03, 21.35it/s] 82it [00:03, 21.74it/s] 85it [00:04, 22.03it/s] 88it [00:04, 22.27it/s] 91it [00:04, 22.37it/s] 94it [00:04, 22.59it/s] 97it [00:04, 22.96it/s] 100it [00:04, 23.16it/s]2025-05-26 00:58:56,557 - INFO - [Epoch 055 | Batch 0100] IWAE-loss 1415.7883 | mean log_px -0.0020 | KL -1274.69 + 103it [00:04, 23.29it/s] 106it [00:04, 23.27it/s] 109it [00:05, 23.05it/s] 112it [00:05, 23.17it/s] 115it [00:05, 23.21it/s] 118it [00:05, 23.17it/s] 121it [00:05, 22.99it/s] 124it [00:05, 22.84it/s] 127it [00:05, 23.12it/s] 130it [00:06, 23.32it/s] 133it [00:06, 23.29it/s] 136it [00:06, 23.40it/s] 139it [00:06, 23.24it/s] 142it [00:06, 23.06it/s] 145it [00:06, 23.16it/s] 148it [00:06, 23.28it/s]2025-05-26 00:58:58,717 - INFO - [Epoch 055 | Batch 0150] IWAE-loss 1552.6018 | mean log_px -0.0040 | KL -1274.03 + 151it [00:06, 22.94it/s] 154it [00:07, 23.04it/s] 157it [00:07, 23.23it/s] 160it [00:07, 23.44it/s] 163it [00:07, 23.13it/s] 166it [00:07, 22.79it/s] 169it [00:07, 22.28it/s] 172it [00:07, 21.78it/s] 175it [00:07, 21.64it/s] 178it [00:08, 21.86it/s] 181it [00:08, 21.98it/s] 184it [00:08, 22.18it/s] 187it [00:08, 21.96it/s] 190it [00:08, 21.71it/s] 193it [00:08, 21.18it/s] 196it [00:08, 20.49it/s] 196it [00:09, 21.64it/s] +2025-05-26 00:59:00,873 - INFO - Epoch: 55, Objective: tensor([1506.3440], device='cuda:0', grad_fn=), Loss: 0.002600246574729681, KL/n: 25.974912643432617 + 0it [00:00, ?it/s]2025-05-26 00:59:01,087 - INFO - [Epoch 056 | Batch 0000] IWAE-loss 1480.3961 | mean log_px -0.0030 | KL -1272.85 + 1it [00:00, 9.14it/s] 4it [00:00, 16.86it/s] 7it [00:00, 19.37it/s] 10it [00:00, 20.53it/s] 13it [00:00, 21.09it/s] 16it [00:00, 21.49it/s] 19it [00:00, 21.87it/s] 22it [00:01, 22.05it/s] 25it [00:01, 21.90it/s] 28it [00:01, 21.35it/s] 31it [00:01, 21.42it/s] 34it [00:01, 21.63it/s] 37it [00:01, 21.82it/s] 40it [00:01, 22.06it/s] 43it [00:02, 22.14it/s] 46it [00:02, 22.16it/s] 49it [00:02, 21.68it/s]2025-05-26 00:59:03,378 - INFO - [Epoch 056 | Batch 0050] IWAE-loss 1559.5785 | mean log_px -0.0041 | KL -1269.48 + 52it [00:02, 21.63it/s] 55it [00:02, 21.81it/s] 58it [00:02, 21.77it/s] 61it [00:02, 21.28it/s] 64it [00:03, 21.24it/s] 67it [00:03, 21.35it/s] 70it [00:03, 21.43it/s] 73it [00:03, 21.18it/s] 76it [00:03, 20.95it/s] 79it [00:03, 21.16it/s] 82it [00:03, 21.42it/s] 85it [00:03, 21.46it/s] 88it [00:04, 21.54it/s] 91it [00:04, 21.53it/s] 94it [00:04, 21.63it/s] 97it [00:04, 21.87it/s] 100it [00:04, 21.48it/s]2025-05-26 00:59:05,711 - INFO - [Epoch 056 | Batch 0100] IWAE-loss 1584.8795 | mean log_px -0.0046 | KL -1266.03 + 103it [00:04, 21.65it/s] 106it [00:04, 21.63it/s] 109it [00:05, 21.76it/s] 112it [00:05, 21.76it/s] 115it [00:05, 21.89it/s] 118it [00:05, 21.95it/s] 121it [00:05, 22.04it/s] 124it [00:05, 22.13it/s] 127it [00:05, 22.13it/s] 130it [00:06, 21.92it/s] 133it [00:06, 21.66it/s] 136it [00:06, 21.54it/s] 139it [00:06, 21.56it/s] 142it [00:06, 21.76it/s] 145it [00:06, 21.45it/s] 148it [00:06, 21.67it/s]2025-05-26 00:59:08,001 - INFO - [Epoch 056 | Batch 0150] IWAE-loss 1295.5978 | mean log_px -0.0004 | KL -1265.24 + 151it [00:07, 21.77it/s] 154it [00:07, 21.62it/s] 157it [00:07, 21.67it/s] 160it [00:07, 21.78it/s] 163it [00:07, 21.39it/s] 166it [00:07, 21.63it/s] 169it [00:07, 21.78it/s] 172it [00:07, 21.88it/s] 175it [00:08, 21.95it/s] 178it [00:08, 21.91it/s] 181it [00:08, 22.01it/s] 184it [00:08, 22.08it/s] 187it [00:08, 21.94it/s] 190it [00:08, 21.70it/s] 193it [00:08, 21.74it/s] 196it [00:09, 20.73it/s] 196it [00:09, 21.38it/s] +2025-05-26 00:59:10,172 - INFO - Epoch: 56, Objective: tensor([1870.7029], device='cuda:0', grad_fn=), Loss: 0.009725436568260193, KL/n: 25.758514404296875 + 0it [00:00, ?it/s]2025-05-26 00:59:10,698 - INFO - [Epoch 057 | Batch 0000] IWAE-loss 1536.2001 | mean log_px -0.0040 | KL -1258.14 + 1it [00:00, 3.94it/s] 4it [00:00, 11.87it/s] 7it [00:00, 15.83it/s] 10it [00:00, 18.11it/s] 13it [00:00, 19.52it/s] 16it [00:00, 20.42it/s] 19it [00:01, 20.96it/s] 22it [00:01, 21.40it/s] 25it [00:01, 21.61it/s] 28it [00:01, 21.79it/s] 31it [00:01, 21.92it/s] 34it [00:01, 22.02it/s] 37it [00:01, 22.09it/s] 40it [00:02, 22.12it/s] 43it [00:02, 22.19it/s] 46it [00:02, 22.20it/s] 49it [00:02, 22.20it/s]2025-05-26 00:59:12,948 - INFO - [Epoch 057 | Batch 0050] IWAE-loss 1459.7440 | mean log_px -0.0029 | KL -1259.14 + 52it [00:02, 22.17it/s] 55it [00:02, 22.19it/s] 58it [00:02, 22.24it/s] 61it [00:02, 22.19it/s] 64it [00:03, 22.12it/s] 67it [00:03, 22.06it/s] 70it [00:03, 21.83it/s] 73it [00:03, 21.90it/s] 76it [00:03, 22.00it/s] 79it [00:03, 21.99it/s] 82it [00:03, 22.03it/s] 85it [00:04, 21.94it/s] 88it [00:04, 21.96it/s] 91it [00:04, 21.91it/s] 94it [00:04, 21.84it/s] 97it [00:04, 21.88it/s] 100it [00:04, 21.91it/s]2025-05-26 00:59:15,224 - INFO - [Epoch 057 | Batch 0100] IWAE-loss 1495.4443 | mean log_px -0.0034 | KL -1256.31 + 103it [00:04, 21.94it/s] 106it [00:05, 21.97it/s] 109it [00:05, 21.97it/s] 112it [00:05, 22.01it/s] 115it [00:05, 22.04it/s] 118it [00:05, 22.09it/s] 121it [00:05, 22.09it/s] 124it [00:05, 22.11it/s] 127it [00:05, 22.16it/s] 130it [00:06, 22.17it/s] 133it [00:06, 22.18it/s] 136it [00:06, 22.15it/s] 139it [00:06, 22.17it/s] 142it [00:06, 22.11it/s] 145it [00:06, 22.08it/s] 148it [00:06, 22.60it/s]2025-05-26 00:59:17,470 - INFO - [Epoch 057 | Batch 0150] IWAE-loss 1394.5524 | mean log_px -0.0020 | KL -1254.82 + 151it [00:07, 22.82it/s] 154it [00:07, 23.08it/s] 157it [00:07, 22.91it/s] 160it [00:07, 22.73it/s] 163it [00:07, 22.54it/s] 166it [00:07, 22.41it/s] 169it [00:07, 22.33it/s] 172it [00:07, 22.28it/s] 175it [00:08, 22.21it/s] 178it [00:08, 22.16it/s] 181it [00:08, 22.15it/s] 184it [00:08, 22.13it/s] 187it [00:08, 22.04it/s] 190it [00:08, 22.03it/s] 193it [00:08, 22.05it/s] 196it [00:09, 21.07it/s] 196it [00:09, 21.49it/s] +2025-05-26 00:59:19,589 - INFO - Epoch: 57, Objective: tensor([1602.6106], device='cuda:0', grad_fn=), Loss: 0.002222305629402399, KL/n: 25.651405334472656 + 0it [00:00, ?it/s]2025-05-26 00:59:20,018 - INFO - [Epoch 058 | Batch 0000] IWAE-loss 2159.9016 | mean log_px -0.0129 | KL -1260.20 + 1it [00:00, 7.34it/s] 4it [00:00, 16.01it/s] 7it [00:00, 18.64it/s] 10it [00:00, 19.91it/s] 13it [00:00, 20.61it/s] 16it [00:00, 20.53it/s] 19it [00:00, 20.50it/s] 22it [00:01, 20.78it/s] 25it [00:01, 21.17it/s] 28it [00:01, 21.23it/s] 31it [00:01, 21.47it/s] 34it [00:01, 21.66it/s] 37it [00:01, 21.38it/s] 40it [00:01, 21.61it/s] 43it [00:02, 21.73it/s] 46it [00:02, 21.66it/s] 49it [00:02, 21.49it/s]2025-05-26 00:59:22,347 - INFO - [Epoch 058 | Batch 0050] IWAE-loss 1791.6669 | mean log_px -0.0077 | KL -1254.69 + 52it [00:02, 21.37it/s] 55it [00:02, 21.44it/s] 58it [00:02, 21.51it/s] 61it [00:02, 21.62it/s] 64it [00:03, 21.76it/s] 67it [00:03, 21.39it/s] 70it [00:03, 21.60it/s] 73it [00:03, 21.75it/s] 76it [00:03, 21.70it/s] 79it [00:03, 21.76it/s] 82it [00:03, 21.82it/s] 85it [00:04, 21.45it/s] 88it [00:04, 21.62it/s] 91it [00:04, 21.67it/s] 94it [00:04, 21.60it/s] 97it [00:04, 21.37it/s] 100it [00:04, 21.05it/s]2025-05-26 00:59:24,670 - INFO - [Epoch 058 | Batch 0100] IWAE-loss 1466.7124 | mean log_px -0.0031 | KL -1246.37 + 103it [00:04, 21.05it/s] 106it [00:05, 21.33it/s] 109it [00:05, 21.13it/s] 112it [00:05, 20.96it/s] 115it [00:05, 21.12it/s] 118it [00:05, 21.37it/s] 121it [00:05, 21.44it/s] 124it [00:05, 21.37it/s] 127it [00:06, 21.07it/s] 130it [00:06, 21.21it/s] 133it [00:06, 21.13it/s] 136it [00:06, 20.98it/s] 139it [00:06, 20.72it/s] 142it [00:06, 20.99it/s] 145it [00:06, 20.79it/s] 148it [00:07, 20.85it/s]2025-05-26 00:59:27,045 - INFO - [Epoch 058 | Batch 0150] IWAE-loss 2742.2402 | mean log_px -0.0214 | KL -1245.30 + 151it [00:07, 20.86it/s] 154it [00:07, 21.15it/s] 157it [00:07, 20.93it/s] 160it [00:07, 21.00it/s] 163it [00:07, 20.99it/s] 166it [00:07, 20.98it/s] 169it [00:08, 21.14it/s] 172it [00:08, 21.37it/s] 175it [00:08, 21.30it/s] 178it [00:08, 21.30it/s] 181it [00:08, 21.34it/s] 184it [00:08, 21.28it/s] 187it [00:08, 21.46it/s] 190it [00:08, 21.60it/s] 193it [00:09, 21.52it/s] 196it [00:09, 20.53it/s] 196it [00:09, 20.95it/s] +2025-05-26 00:59:29,265 - INFO - Epoch: 58, Objective: tensor([1529.1616], device='cuda:0', grad_fn=), Loss: 0.004334802273660898, KL/n: 25.400850296020508 + 0it [00:00, ?it/s]2025-05-26 00:59:29,506 - INFO - [Epoch 059 | Batch 0000] IWAE-loss 1488.2743 | mean log_px -0.0035 | KL -1241.31 + 1it [00:00, 7.26it/s] 4it [00:00, 15.42it/s] 7it [00:00, 18.36it/s] 10it [00:00, 19.78it/s] 12it [00:00, 19.83it/s] 15it [00:00, 20.38it/s] 18it [00:00, 20.55it/s] 21it [00:01, 20.83it/s] 24it [00:01, 21.16it/s] 27it [00:01, 21.10it/s] 30it [00:01, 21.00it/s] 33it [00:01, 21.33it/s] 36it [00:01, 21.34it/s] 39it [00:01, 21.55it/s] 42it [00:02, 21.70it/s] 45it [00:02, 21.30it/s] 48it [00:02, 21.51it/s]2025-05-26 00:59:31,845 - INFO - [Epoch 059 | Batch 0050] IWAE-loss 1340.4985 | mean log_px -0.0014 | KL -1240.31 + 51it [00:02, 21.45it/s] 54it [00:02, 21.62it/s] 57it [00:02, 21.57it/s] 60it [00:02, 21.49it/s] 63it [00:03, 21.48it/s] 66it [00:03, 21.62it/s] 69it [00:03, 21.69it/s] 72it [00:03, 21.75it/s] 75it [00:03, 21.79it/s] 78it [00:03, 21.85it/s] 81it [00:03, 21.53it/s] 84it [00:04, 21.23it/s] 87it [00:04, 21.41it/s] 90it [00:04, 21.11it/s] 93it [00:04, 21.36it/s] 96it [00:04, 21.37it/s] 99it [00:04, 21.23it/s]2025-05-26 00:59:34,176 - INFO - [Epoch 059 | Batch 0100] IWAE-loss 1408.7993 | mean log_px -0.0024 | KL -1237.44 + 102it [00:04, 21.30it/s] 105it [00:04, 21.48it/s] 108it [00:05, 21.79it/s] 111it [00:05, 22.01it/s] 114it [00:05, 22.29it/s] 117it [00:05, 22.41it/s] 120it [00:05, 22.13it/s] 123it [00:05, 22.28it/s] 126it [00:05, 22.37it/s] 129it [00:06, 22.18it/s] 132it [00:06, 22.42it/s] 135it [00:06, 22.59it/s] 138it [00:06, 22.72it/s] 141it [00:06, 22.78it/s] 144it [00:06, 22.78it/s] 147it [00:06, 22.81it/s] 150it [00:06, 22.75it/s]2025-05-26 00:59:36,397 - INFO - [Epoch 059 | Batch 0150] IWAE-loss 1331.0359 | mean log_px -0.0013 | KL -1237.22 + 153it [00:07, 22.81it/s] 156it [00:07, 22.33it/s] 159it [00:07, 22.64it/s] 162it [00:07, 22.37it/s] 165it [00:07, 22.34it/s] 168it [00:07, 22.61it/s] 171it [00:07, 22.69it/s] 174it [00:08, 22.49it/s] 177it [00:08, 22.46it/s] 180it [00:08, 22.63it/s] 183it [00:08, 22.62it/s] 186it [00:08, 22.74it/s] 189it [00:08, 22.45it/s] 192it [00:08, 22.58it/s] 195it [00:09, 21.36it/s] 196it [00:09, 21.53it/s] +2025-05-26 00:59:38,499 - INFO - Epoch: 59, Objective: tensor([1505.4119], device='cuda:0', grad_fn=), Loss: 0.0057054548524320126, KL/n: 25.26158905029297 + 0it [00:00, ?it/s]2025-05-26 00:59:38,920 - INFO - [Epoch 060 | Batch 0000] IWAE-loss 1366.1249 | mean log_px -0.0018 | KL -1237.08 + 1it [00:00, 7.85it/s] 4it [00:00, 15.76it/s] 7it [00:00, 18.50it/s] 10it [00:00, 20.43it/s] 13it [00:00, 21.36it/s] 16it [00:00, 21.42it/s] 19it [00:00, 21.51it/s] 22it [00:01, 21.55it/s] 25it [00:01, 21.71it/s] 28it [00:01, 21.66it/s] 31it [00:01, 21.67it/s] 34it [00:01, 21.66it/s] 37it [00:01, 21.62it/s] 40it [00:01, 21.66it/s] 43it [00:02, 21.75it/s] 46it [00:02, 21.71it/s] 49it [00:02, 21.81it/s]2025-05-26 00:59:41,211 - INFO - [Epoch 060 | Batch 0050] IWAE-loss 1476.7156 | mean log_px -0.0035 | KL -1233.95 + 52it [00:02, 21.83it/s] 55it [00:02, 21.75it/s] 58it [00:02, 21.80it/s] 61it [00:02, 21.88it/s] 64it [00:03, 21.83it/s] 67it [00:03, 21.90it/s] 70it [00:03, 21.72it/s] 73it [00:03, 21.71it/s] 76it [00:03, 21.74it/s] 79it [00:03, 21.72it/s] 82it [00:03, 21.71it/s] 85it [00:03, 21.73it/s] 88it [00:04, 21.73it/s] 91it [00:04, 21.64it/s] 94it [00:04, 21.66it/s] 97it [00:04, 21.76it/s] 100it [00:04, 21.65it/s]2025-05-26 00:59:43,512 - INFO - [Epoch 060 | Batch 0100] IWAE-loss 1488.0596 | mean log_px -0.0037 | KL -1231.67 + 103it [00:04, 21.72it/s] 106it [00:04, 21.58it/s] 109it [00:05, 21.71it/s] 112it [00:05, 21.80it/s] 115it [00:05, 21.87it/s] 118it [00:05, 21.68it/s] 121it [00:05, 21.78it/s] 124it [00:05, 21.89it/s] 127it [00:05, 21.76it/s] 130it [00:06, 21.68it/s] 133it [00:06, 21.79it/s] 136it [00:06, 21.86it/s] 139it [00:06, 21.97it/s] 142it [00:06, 22.00it/s] 145it [00:06, 21.99it/s] 148it [00:06, 21.94it/s]2025-05-26 00:59:45,799 - INFO - [Epoch 060 | Batch 0150] IWAE-loss 1706.6774 | mean log_px -0.0068 | KL -1232.75 + 151it [00:07, 21.94it/s] 154it [00:07, 22.00it/s] 157it [00:07, 21.87it/s] 160it [00:07, 21.67it/s] 163it [00:07, 21.79it/s] 166it [00:07, 21.90it/s] 169it [00:07, 21.94it/s] 172it [00:07, 22.02it/s] 175it [00:08, 21.95it/s] 178it [00:08, 21.99it/s] 181it [00:08, 21.91it/s] 184it [00:08, 21.97it/s] 187it [00:08, 22.01it/s] 190it [00:08, 21.74it/s] 193it [00:08, 21.82it/s] 196it [00:09, 20.85it/s] 196it [00:09, 21.42it/s] +2025-05-26 00:59:47,967 - INFO - Epoch: 60, Objective: tensor([2637.8342], device='cuda:0', grad_fn=), Loss: 0.009155135601758957, KL/n: 25.116397857666016 + 0it [00:00, ?it/s]2025-05-26 00:59:48,204 - INFO - [Epoch 061 | Batch 0000] IWAE-loss 1339.3209 | mean log_px -0.0016 | KL -1229.84 + 1it [00:00, 7.42it/s] 4it [00:00, 16.24it/s] 7it [00:00, 18.99it/s] 10it [00:00, 20.30it/s] 13it [00:00, 20.96it/s] 16it [00:00, 21.39it/s] 19it [00:00, 21.67it/s] 22it [00:01, 21.87it/s] 25it [00:01, 21.96it/s] 28it [00:01, 22.05it/s] 31it [00:01, 22.07it/s] 34it [00:01, 22.08it/s] 37it [00:01, 22.14it/s] 40it [00:01, 21.98it/s] 43it [00:02, 22.07it/s] 46it [00:02, 22.11it/s] 49it [00:02, 22.15it/s]2025-05-26 00:59:50,464 - INFO - [Epoch 061 | Batch 0050] IWAE-loss 1501.5515 | mean log_px -0.0039 | KL -1230.01 + 52it [00:02, 22.11it/s] 55it [00:02, 22.13it/s] 58it [00:02, 22.05it/s] 61it [00:02, 22.08it/s] 64it [00:02, 21.94it/s] 67it [00:03, 22.04it/s] 70it [00:03, 22.13it/s] 73it [00:03, 22.14it/s] 76it [00:03, 21.92it/s] 79it [00:03, 21.86it/s] 82it [00:03, 21.92it/s] 85it [00:03, 22.00it/s] 88it [00:04, 22.08it/s] 91it [00:04, 22.12it/s] 94it [00:04, 22.16it/s] 97it [00:04, 22.14it/s] 100it [00:04, 22.19it/s]2025-05-26 00:59:52,731 - INFO - [Epoch 061 | Batch 0100] IWAE-loss 1362.8021 | mean log_px -0.0020 | KL -1221.67 + 103it [00:04, 22.16it/s] 106it [00:04, 22.18it/s] 109it [00:05, 22.24it/s] 112it [00:05, 22.24it/s] 115it [00:05, 22.23it/s] 118it [00:05, 22.25it/s] 121it [00:05, 22.24it/s] 124it [00:05, 22.22it/s] 127it [00:05, 22.21it/s] 130it [00:05, 22.23it/s] 133it [00:06, 22.25it/s] 136it [00:06, 22.23it/s] 139it [00:06, 22.10it/s] 142it [00:06, 22.01it/s] 145it [00:06, 21.72it/s] 148it [00:06, 21.70it/s]2025-05-26 00:59:54,997 - INFO - [Epoch 061 | Batch 0150] IWAE-loss 1680.8140 | mean log_px -0.0066 | KL -1219.91 + 151it [00:06, 21.71it/s] 154it [00:07, 21.65it/s] 157it [00:07, 21.69it/s] 160it [00:07, 21.63it/s] 163it [00:07, 21.51it/s] 166it [00:07, 21.73it/s] 169it [00:07, 21.82it/s] 172it [00:07, 21.97it/s] 175it [00:08, 22.06it/s] 178it [00:08, 21.94it/s] 181it [00:08, 21.99it/s] 184it [00:08, 22.04it/s] 187it [00:08, 22.10it/s] 190it [00:08, 22.10it/s] 193it [00:08, 22.08it/s] 196it [00:08, 21.04it/s] 196it [00:09, 21.63it/s] +2025-05-26 00:59:57,158 - INFO - Epoch: 61, Objective: tensor([1729.2206], device='cuda:0', grad_fn=), Loss: 0.004181381314992905, KL/n: 24.9349308013916 + 0it [00:00, ?it/s]2025-05-26 00:59:57,409 - INFO - [Epoch 062 | Batch 0000] IWAE-loss 1279.5305 | mean log_px -0.0008 | KL -1223.57 + 1it [00:00, 6.82it/s] 4it [00:00, 15.36it/s] 7it [00:00, 18.01it/s] 10it [00:00, 19.23it/s] 13it [00:00, 20.20it/s] 16it [00:00, 20.82it/s] 19it [00:00, 21.26it/s] 22it [00:01, 21.53it/s] 25it [00:01, 21.67it/s] 28it [00:01, 21.83it/s] 31it [00:01, 21.95it/s] 34it [00:01, 21.77it/s] 37it [00:01, 21.82it/s] 40it [00:01, 21.88it/s] 43it [00:02, 21.56it/s] 46it [00:02, 21.72it/s] 49it [00:02, 21.63it/s]2025-05-26 00:59:59,707 - INFO - [Epoch 062 | Batch 0050] IWAE-loss 1681.4735 | mean log_px -0.0067 | KL -1215.36 + 52it [00:02, 21.51it/s] 55it [00:02, 21.60it/s] 58it [00:02, 21.77it/s] 61it [00:02, 21.90it/s] 64it [00:03, 21.98it/s] 67it [00:03, 22.07it/s] 70it [00:03, 22.03it/s] 73it [00:03, 22.03it/s] 76it [00:03, 22.03it/s] 79it [00:03, 22.06it/s] 82it [00:03, 22.06it/s] 85it [00:03, 22.09it/s] 88it [00:04, 21.68it/s] 91it [00:04, 21.78it/s] 94it [00:04, 21.91it/s] 97it [00:04, 21.47it/s] 100it [00:04, 21.50it/s]2025-05-26 01:00:01,998 - INFO - [Epoch 062 | Batch 0100] IWAE-loss 1706.2766 | mean log_px -0.0071 | KL -1210.85 + 103it [00:04, 21.32it/s] 106it [00:04, 21.20it/s] 109it [00:05, 21.25it/s] 112it [00:05, 21.24it/s] 115it [00:05, 21.36it/s] 118it [00:05, 21.40it/s] 121it [00:05, 21.55it/s] 124it [00:05, 21.68it/s] 127it [00:05, 21.75it/s] 130it [00:06, 21.82it/s] 133it [00:06, 21.87it/s] 136it [00:06, 21.91it/s] 139it [00:06, 21.87it/s] 142it [00:06, 21.92it/s] 145it [00:06, 21.96it/s] 148it [00:06, 22.04it/s]2025-05-26 01:00:04,298 - INFO - [Epoch 062 | Batch 0150] IWAE-loss 1398.4180 | mean log_px -0.0027 | KL -1210.68 + 151it [00:07, 22.05it/s] 154it [00:07, 22.06it/s] 157it [00:07, 22.07it/s] 160it [00:07, 22.14it/s] 163it [00:07, 22.13it/s] 166it [00:07, 22.09it/s] 169it [00:07, 22.11it/s] 172it [00:07, 22.15it/s] 175it [00:08, 22.14it/s] 178it [00:08, 22.14it/s] 181it [00:08, 22.10it/s] 184it [00:08, 22.13it/s] 187it [00:08, 22.12it/s] 190it [00:08, 22.04it/s] 193it [00:08, 22.02it/s] 196it [00:09, 21.13it/s] 196it [00:09, 21.41it/s] +2025-05-26 01:00:06,440 - INFO - Epoch: 62, Objective: tensor([1797.6357], device='cuda:0', grad_fn=), Loss: 0.005861968267709017, KL/n: 24.735652923583984 + 0it [00:00, ?it/s]2025-05-26 01:00:06,852 - INFO - [Epoch 063 | Batch 0000] IWAE-loss 1477.4492 | mean log_px -0.0038 | KL -1211.48 + 1it [00:00, 7.30it/s] 4it [00:00, 15.74it/s] 7it [00:00, 18.66it/s] 10it [00:00, 19.31it/s] 13it [00:00, 20.30it/s] 16it [00:00, 20.81it/s] 19it [00:00, 21.26it/s] 22it [00:01, 21.16it/s] 25it [00:01, 21.24it/s] 28it [00:01, 21.52it/s] 31it [00:01, 21.18it/s] 34it [00:01, 21.46it/s] 37it [00:01, 21.55it/s] 40it [00:01, 21.37it/s] 43it [00:02, 21.40it/s] 46it [00:02, 21.34it/s] 49it [00:02, 21.55it/s]2025-05-26 01:00:09,176 - INFO - [Epoch 063 | Batch 0050] IWAE-loss 1315.3348 | mean log_px -0.0016 | KL -1203.62 + 52it [00:02, 21.62it/s] 55it [00:02, 21.35it/s] 58it [00:02, 21.30it/s] 61it [00:02, 21.29it/s] 64it [00:03, 21.27it/s] 67it [00:03, 20.96it/s] 70it [00:03, 21.04it/s] 73it [00:03, 21.34it/s] 76it [00:03, 21.45it/s] 79it [00:03, 21.56it/s] 82it [00:03, 21.43it/s] 85it [00:04, 20.92it/s] 88it [00:04, 20.58it/s] 91it [00:04, 20.45it/s] 94it [00:04, 20.70it/s] 97it [00:04, 20.95it/s] 100it [00:04, 21.01it/s]2025-05-26 01:00:11,556 - INFO - [Epoch 063 | Batch 0100] IWAE-loss 1711.5524 | mean log_px -0.0073 | KL -1201.99 + 103it [00:04, 20.81it/s] 106it [00:05, 21.05it/s] 109it [00:05, 21.08it/s] 112it [00:05, 21.16it/s] 115it [00:05, 20.87it/s] 118it [00:05, 20.90it/s] 121it [00:05, 20.96it/s] 124it [00:05, 20.75it/s] 127it [00:06, 20.99it/s] 130it [00:06, 21.30it/s] 133it [00:06, 20.98it/s] 136it [00:06, 21.34it/s] 139it [00:06, 21.14it/s] 142it [00:06, 21.32it/s] 145it [00:06, 21.53it/s] 148it [00:07, 21.30it/s]2025-05-26 01:00:13,920 - INFO - [Epoch 063 | Batch 0150] IWAE-loss 1332.5717 | mean log_px -0.0019 | KL -1202.94 + 151it [00:07, 21.27it/s] 154it [00:07, 21.40it/s] 157it [00:07, 21.13it/s] 160it [00:07, 21.44it/s] 163it [00:07, 21.62it/s] 166it [00:07, 21.66it/s] 169it [00:08, 21.85it/s] 172it [00:08, 21.86it/s] 175it [00:08, 21.96it/s] 178it [00:08, 21.52it/s] 181it [00:08, 21.22it/s] 184it [00:08, 21.50it/s] 187it [00:08, 21.58it/s] 190it [00:09, 21.77it/s] 193it [00:09, 21.89it/s] 196it [00:09, 20.91it/s] 196it [00:09, 20.93it/s] +2025-05-26 01:00:16,105 - INFO - Epoch: 63, Objective: tensor([1625.1566], device='cuda:0', grad_fn=), Loss: 0.013803411275148392, KL/n: 24.550966262817383 + 0it [00:00, ?it/s]2025-05-26 01:00:16,347 - INFO - [Epoch 064 | Batch 0000] IWAE-loss 1406.9927 | mean log_px -0.0029 | KL -1202.86 + 1it [00:00, 7.06it/s] 4it [00:00, 15.48it/s] 7it [00:00, 18.44it/s] 10it [00:00, 19.49it/s] 13it [00:00, 20.25it/s] 16it [00:00, 20.87it/s] 19it [00:00, 21.20it/s] 22it [00:01, 21.50it/s] 25it [00:01, 21.70it/s] 28it [00:01, 21.85it/s] 31it [00:01, 21.92it/s] 34it [00:01, 21.99it/s] 37it [00:01, 22.03it/s] 40it [00:01, 22.05it/s] 43it [00:02, 22.03it/s] 46it [00:02, 22.06it/s] 49it [00:02, 21.89it/s]2025-05-26 01:00:18,637 - INFO - [Epoch 064 | Batch 0050] IWAE-loss 1443.6868 | mean log_px -0.0035 | KL -1198.06 + 52it [00:02, 21.73it/s] 55it [00:02, 21.82it/s] 58it [00:02, 21.42it/s] 61it [00:02, 21.55it/s] 64it [00:03, 21.66it/s] 67it [00:03, 21.77it/s] 70it [00:03, 21.86it/s] 73it [00:03, 21.65it/s] 76it [00:03, 21.46it/s] 79it [00:03, 21.44it/s] 82it [00:03, 21.48it/s] 85it [00:04, 21.59it/s] 88it [00:04, 21.64it/s] 91it [00:04, 21.77it/s] 94it [00:04, 21.58it/s] 97it [00:04, 21.53it/s] 100it [00:04, 21.52it/s]2025-05-26 01:00:20,958 - INFO - [Epoch 064 | Batch 0100] IWAE-loss 1428.4519 | mean log_px -0.0033 | KL -1198.55 + 103it [00:04, 21.21it/s] 106it [00:04, 21.35it/s] 109it [00:05, 21.56it/s] 112it [00:05, 21.71it/s] 115it [00:05, 21.80it/s] 118it [00:05, 21.84it/s] 121it [00:05, 21.87it/s] 124it [00:05, 21.76it/s] 127it [00:05, 21.90it/s] 130it [00:06, 21.93it/s] 133it [00:06, 21.87it/s] 136it [00:06, 21.91it/s] 139it [00:06, 21.90it/s] 142it [00:06, 21.98it/s] 145it [00:06, 21.95it/s] 148it [00:06, 21.96it/s]2025-05-26 01:00:23,243 - INFO - [Epoch 064 | Batch 0150] IWAE-loss 1627.3311 | mean log_px -0.0062 | KL -1194.62 + 151it [00:07, 21.88it/s] 154it [00:07, 21.97it/s] 157it [00:07, 21.98it/s] 160it [00:07, 22.01it/s] 163it [00:07, 21.61it/s] 166it [00:07, 21.53it/s] 169it [00:07, 21.38it/s] 172it [00:08, 20.65it/s] 175it [00:08, 20.58it/s] 178it [00:08, 20.64it/s] 181it [00:08, 20.58it/s] 184it [00:08, 20.74it/s] 187it [00:08, 21.01it/s] 190it [00:08, 21.07it/s] 193it [00:09, 21.18it/s] 196it [00:09, 20.30it/s] 196it [00:09, 21.19it/s] +2025-05-26 01:00:25,483 - INFO - Epoch: 64, Objective: tensor([1443.9932], device='cuda:0', grad_fn=), Loss: 0.004126382526010275, KL/n: 24.36599349975586 + 0it [00:00, ?it/s]2025-05-26 01:00:25,882 - INFO - [Epoch 065 | Batch 0000] IWAE-loss 1399.9071 | mean log_px -0.0029 | KL -1194.03 + 1it [00:00, 7.46it/s] 4it [00:00, 15.65it/s] 7it [00:00, 18.35it/s] 10it [00:00, 19.63it/s] 13it [00:00, 19.99it/s] 16it [00:00, 20.58it/s] 19it [00:00, 20.54it/s] 22it [00:01, 20.64it/s] 25it [00:01, 20.99it/s] 28it [00:01, 21.36it/s] 31it [00:01, 21.58it/s] 34it [00:01, 21.30it/s] 37it [00:01, 20.93it/s] 40it [00:01, 21.28it/s] 43it [00:02, 21.11it/s] 46it [00:02, 21.34it/s] 49it [00:02, 21.41it/s]2025-05-26 01:00:28,233 - INFO - [Epoch 065 | Batch 0050] IWAE-loss 1613.8787 | mean log_px -0.0061 | KL -1189.74 + 52it [00:02, 21.31it/s] 55it [00:02, 21.20it/s] 58it [00:02, 21.21it/s] 61it [00:02, 20.79it/s] 64it [00:03, 20.74it/s] 67it [00:03, 20.74it/s] 70it [00:03, 20.44it/s] 73it [00:03, 20.41it/s] 76it [00:03, 20.55it/s] 79it [00:03, 20.89it/s] 82it [00:03, 21.13it/s] 85it [00:04, 21.26it/s] 88it [00:04, 20.93it/s] 91it [00:04, 20.96it/s] 94it [00:04, 20.92it/s] 97it [00:04, 21.17it/s] 100it [00:04, 21.48it/s]2025-05-26 01:00:30,620 - INFO - [Epoch 065 | Batch 0100] IWAE-loss 1943.8273 | mean log_px -0.0108 | KL -1187.84 + 103it [00:04, 21.49it/s] 106it [00:05, 21.29it/s] 109it [00:05, 20.99it/s] 112it [00:05, 21.27it/s] 115it [00:05, 21.23it/s] 118it [00:05, 21.36it/s] 121it [00:05, 21.49it/s] 124it [00:05, 21.40it/s] 127it [00:06, 21.05it/s] 130it [00:06, 21.25it/s] 133it [00:06, 21.54it/s] 136it [00:06, 21.77it/s] 139it [00:06, 21.88it/s] 142it [00:06, 21.97it/s] 145it [00:06, 21.94it/s] 148it [00:07, 22.05it/s]2025-05-26 01:00:32,934 - INFO - [Epoch 065 | Batch 0150] IWAE-loss 1562.8031 | mean log_px -0.0055 | KL -1179.59 + 151it [00:07, 22.10it/s] 154it [00:07, 21.80it/s] 157it [00:07, 21.52it/s] 160it [00:07, 21.55it/s] 163it [00:07, 21.74it/s] 166it [00:07, 21.31it/s] 169it [00:08, 21.39it/s] 172it [00:08, 21.67it/s] 175it [00:08, 21.78it/s] 178it [00:08, 21.78it/s] 181it [00:08, 21.90it/s] 184it [00:08, 22.00it/s] 187it [00:08, 21.39it/s] 190it [00:08, 21.51it/s] 193it [00:09, 21.63it/s] 196it [00:09, 20.84it/s] 196it [00:09, 20.96it/s] +2025-05-26 01:00:35,127 - INFO - Epoch: 65, Objective: tensor([1244.6835], device='cuda:0', grad_fn=), Loss: 0.0031122725922614336, KL/n: 24.138437271118164 + 0it [00:00, ?it/s]2025-05-26 01:00:35,366 - INFO - [Epoch 066 | Batch 0000] IWAE-loss 1505.4709 | mean log_px -0.0046 | KL -1183.38 + 1it [00:00, 7.16it/s] 4it [00:00, 15.45it/s] 7it [00:00, 18.13it/s] 10it [00:00, 19.48it/s] 13it [00:00, 20.39it/s] 16it [00:00, 20.90it/s] 19it [00:00, 21.30it/s] 22it [00:01, 21.46it/s] 25it [00:01, 21.66it/s] 28it [00:01, 21.73it/s] 31it [00:01, 21.77it/s] 34it [00:01, 21.81it/s] 37it [00:01, 21.85it/s] 40it [00:01, 21.91it/s] 43it [00:02, 21.91it/s] 46it [00:02, 21.94it/s] 49it [00:02, 21.95it/s]2025-05-26 01:00:37,661 - INFO - [Epoch 066 | Batch 0050] IWAE-loss 2979.2026 | mean log_px -0.0257 | KL -1180.59 + 52it [00:02, 21.88it/s] 55it [00:02, 21.83it/s] 58it [00:02, 21.87it/s] 61it [00:02, 21.85it/s] 64it [00:03, 21.88it/s] 67it [00:03, 21.89it/s] 70it [00:03, 21.81it/s] 73it [00:03, 21.77it/s] 76it [00:03, 21.79it/s] 79it [00:03, 21.75it/s] 82it [00:03, 21.52it/s] 85it [00:03, 21.43it/s] 88it [00:04, 21.58it/s] 91it [00:04, 21.35it/s] 94it [00:04, 21.36it/s] 97it [00:04, 21.28it/s] 100it [00:04, 21.44it/s]2025-05-26 01:00:39,980 - INFO - [Epoch 066 | Batch 0100] IWAE-loss 1724.2590 | mean log_px -0.0078 | KL -1176.66 + 103it [00:04, 21.21it/s] 106it [00:04, 21.30it/s] 109it [00:05, 21.48it/s] 112it [00:05, 21.64it/s] 115it [00:05, 21.65it/s] 118it [00:05, 21.73it/s] 121it [00:05, 21.76it/s] 124it [00:05, 21.77it/s] 127it [00:05, 21.83it/s] 130it [00:06, 21.86it/s] 133it [00:06, 21.86it/s] 136it [00:06, 21.85it/s] 139it [00:06, 21.83it/s] 142it [00:06, 21.82it/s] 145it [00:06, 21.74it/s] 148it [00:06, 21.70it/s]2025-05-26 01:00:42,279 - INFO - [Epoch 066 | Batch 0150] IWAE-loss 1492.8876 | mean log_px -0.0045 | KL -1177.77 + 151it [00:07, 21.58it/s] 154it [00:07, 21.47it/s] 157it [00:07, 21.69it/s] 160it [00:07, 21.66it/s] 163it [00:07, 21.46it/s] 166it [00:07, 21.43it/s] 169it [00:07, 21.42it/s] 172it [00:08, 21.41it/s] 175it [00:08, 21.65it/s] 178it [00:08, 21.54it/s] 181it [00:08, 21.60it/s] 184it [00:08, 21.64it/s] 187it [00:08, 21.58it/s] 190it [00:08, 21.36it/s] 193it [00:09, 21.26it/s] 196it [00:09, 20.65it/s] 196it [00:09, 21.26it/s] +2025-05-26 01:00:44,477 - INFO - Epoch: 66, Objective: tensor([1309.9202], device='cuda:0', grad_fn=), Loss: 0.0016545935068279505, KL/n: 24.009193420410156 + 0it [00:00, ?it/s]2025-05-26 01:00:45,026 - INFO - [Epoch 067 | Batch 0000] IWAE-loss 1319.7920 | mean log_px -0.0021 | KL -1174.74 + 1it [00:00, 3.63it/s] 4it [00:00, 11.23it/s] 7it [00:00, 15.27it/s] 10it [00:00, 17.65it/s] 13it [00:00, 19.20it/s] 16it [00:00, 20.13it/s] 19it [00:01, 20.61it/s] 22it [00:01, 21.00it/s] 25it [00:01, 21.42it/s] 28it [00:01, 21.67it/s] 31it [00:01, 21.88it/s] 34it [00:01, 22.07it/s] 37it [00:01, 22.17it/s] 40it [00:02, 22.16it/s] 43it [00:02, 22.16it/s] 46it [00:02, 22.21it/s] 49it [00:02, 22.13it/s]2025-05-26 01:00:47,286 - INFO - [Epoch 067 | Batch 0050] IWAE-loss 1239.9298 | mean log_px -0.0010 | KL -1171.70 + 52it [00:02, 22.13it/s] 55it [00:02, 22.13it/s] 58it [00:02, 22.10it/s] 61it [00:02, 22.19it/s] 64it [00:03, 22.25it/s] 67it [00:03, 22.25it/s] 70it [00:03, 22.29it/s] 73it [00:03, 22.27it/s] 76it [00:03, 22.27it/s] 79it [00:03, 22.29it/s] 82it [00:03, 22.32it/s] 85it [00:04, 22.34it/s] 88it [00:04, 22.32it/s] 91it [00:04, 22.27it/s] 94it [00:04, 22.28it/s] 97it [00:04, 22.62it/s] 100it [00:04, 22.89it/s]2025-05-26 01:00:49,519 - INFO - [Epoch 067 | Batch 0100] IWAE-loss 1385.4918 | mean log_px -0.0031 | KL -1171.60 + 103it [00:04, 23.07it/s] 106it [00:04, 23.18it/s] 109it [00:05, 23.32it/s] 112it [00:05, 23.39it/s] 115it [00:05, 23.43it/s] 118it [00:05, 23.49it/s] 121it [00:05, 23.46it/s] 124it [00:05, 23.51it/s] 127it [00:05, 23.55it/s] 130it [00:05, 23.56it/s] 133it [00:06, 23.60it/s] 136it [00:06, 23.65it/s] 139it [00:06, 23.53it/s] 142it [00:06, 23.54it/s] 145it [00:06, 23.67it/s] 148it [00:06, 23.64it/s]2025-05-26 01:00:51,639 - INFO - [Epoch 067 | Batch 0150] IWAE-loss 1414.0454 | mean log_px -0.0034 | KL -1174.03 + 151it [00:06, 23.57it/s] 154it [00:07, 23.50it/s] 157it [00:07, 23.50it/s] 160it [00:07, 23.48it/s] 163it [00:07, 23.46it/s] 166it [00:07, 23.46it/s] 169it [00:07, 23.44it/s] 172it [00:07, 23.40it/s] 175it [00:07, 23.38it/s] 178it [00:08, 23.39it/s] 181it [00:08, 23.39it/s] 184it [00:08, 23.41it/s] 187it [00:08, 23.36it/s] 190it [00:08, 23.35it/s] 193it [00:08, 23.36it/s] 196it [00:08, 22.63it/s] 196it [00:08, 22.05it/s] +2025-05-26 01:00:53,665 - INFO - Epoch: 67, Objective: tensor([1395.9412], device='cuda:0', grad_fn=), Loss: 0.0017220848239958286, KL/n: 23.956453323364258 + 0it [00:00, ?it/s]2025-05-26 01:00:54,085 - INFO - [Epoch 068 | Batch 0000] IWAE-loss 1417.4214 | mean log_px -0.0035 | KL -1171.02 + 1it [00:00, 7.68it/s] 4it [00:00, 16.71it/s] 7it [00:00, 19.90it/s] 10it [00:00, 21.27it/s] 13it [00:00, 21.72it/s] 16it [00:00, 21.95it/s] 19it [00:00, 22.15it/s] 22it [00:01, 22.36it/s] 25it [00:01, 22.49it/s] 28it [00:01, 22.70it/s] 31it [00:01, 22.74it/s] 34it [00:01, 22.96it/s] 37it [00:01, 23.08it/s] 40it [00:01, 23.25it/s] 43it [00:01, 23.16it/s] 46it [00:02, 23.29it/s] 49it [00:02, 22.86it/s]2025-05-26 01:00:56,266 - INFO - [Epoch 068 | Batch 0050] IWAE-loss 1651.8307 | mean log_px -0.0069 | KL -1171.39 + 52it [00:02, 22.57it/s] 55it [00:02, 22.28it/s] 58it [00:02, 22.52it/s] 61it [00:02, 22.72it/s] 64it [00:02, 23.01it/s] 67it [00:03, 23.21it/s] 70it [00:03, 23.22it/s] 73it [00:03, 23.05it/s] 76it [00:03, 22.76it/s] 79it [00:03, 22.42it/s] 82it [00:03, 22.15it/s] 85it [00:03, 21.99it/s] 88it [00:03, 22.01it/s] 91it [00:04, 22.03it/s] 94it [00:04, 22.03it/s] 97it [00:04, 21.92it/s] 100it [00:04, 21.62it/s]2025-05-26 01:00:58,512 - INFO - [Epoch 068 | Batch 0100] IWAE-loss 1244.1145 | mean log_px -0.0011 | KL -1169.49 + 103it [00:04, 21.62it/s] 106it [00:04, 21.83it/s] 109it [00:04, 21.57it/s] 112it [00:05, 21.26it/s] 115it [00:05, 21.39it/s] 118it [00:05, 21.08it/s] 121it [00:05, 21.29it/s] 124it [00:05, 21.38it/s] 127it [00:05, 20.97it/s] 130it [00:05, 21.27it/s] 133it [00:06, 21.46it/s] 136it [00:06, 21.67it/s] 139it [00:06, 21.85it/s] 142it [00:06, 21.96it/s] 145it [00:06, 21.36it/s] 148it [00:06, 20.85it/s]2025-05-26 01:01:00,862 - INFO - [Epoch 068 | Batch 0150] IWAE-loss 1535.0297 | mean log_px -0.0053 | KL -1165.77 + 151it [00:06, 20.64it/s] 154it [00:07, 20.68it/s] 157it [00:07, 20.58it/s] 160it [00:07, 20.61it/s] 163it [00:07, 20.77it/s] 166it [00:07, 20.91it/s] 169it [00:07, 20.95it/s] 172it [00:07, 21.12it/s] 175it [00:08, 21.42it/s] 178it [00:08, 21.63it/s] 181it [00:08, 21.79it/s] 184it [00:08, 21.82it/s] 187it [00:08, 21.86it/s] 190it [00:08, 21.87it/s] 193it [00:08, 21.53it/s] 196it [00:09, 20.50it/s] 196it [00:09, 21.52it/s] +2025-05-26 01:01:03,084 - INFO - Epoch: 68, Objective: tensor([1231.7466], device='cuda:0', grad_fn=), Loss: 0.0006337575032375753, KL/n: 23.857040405273438 + 0it [00:00, ?it/s]2025-05-26 01:01:03,320 - INFO - [Epoch 069 | Batch 0000] IWAE-loss 1756.9629 | mean log_px -0.0084 | KL -1171.36 + 1it [00:00, 7.46it/s] 4it [00:00, 15.97it/s] 7it [00:00, 18.74it/s] 10it [00:00, 20.14it/s] 13it [00:00, 20.92it/s] 16it [00:00, 21.17it/s] 19it [00:00, 21.03it/s] 22it [00:01, 21.35it/s] 25it [00:01, 21.58it/s] 28it [00:01, 21.64it/s] 31it [00:01, 21.38it/s] 34it [00:01, 21.59it/s] 37it [00:01, 21.65it/s] 40it [00:01, 21.38it/s] 43it [00:02, 21.59it/s] 46it [00:02, 21.65it/s] 49it [00:02, 21.81it/s]2025-05-26 01:01:05,626 - INFO - [Epoch 069 | Batch 0050] IWAE-loss 1267.2472 | mean log_px -0.0014 | KL -1167.82 + 52it [00:02, 21.59it/s] 55it [00:02, 21.62it/s] 58it [00:02, 21.80it/s] 61it [00:02, 21.96it/s] 64it [00:03, 21.99it/s] 67it [00:03, 21.88it/s] 70it [00:03, 22.03it/s] 73it [00:03, 22.10it/s] 76it [00:03, 22.17it/s] 79it [00:03, 22.15it/s] 82it [00:03, 22.16it/s] 85it [00:03, 22.19it/s] 88it [00:04, 22.31it/s] 91it [00:04, 21.97it/s] 94it [00:04, 21.88it/s] 97it [00:04, 21.81it/s] 100it [00:04, 21.89it/s]2025-05-26 01:01:07,897 - INFO - [Epoch 069 | Batch 0100] IWAE-loss 1318.6864 | mean log_px -0.0022 | KL -1163.78 + 103it [00:04, 21.60it/s] 106it [00:04, 21.69it/s] 109it [00:05, 21.81it/s] 112it [00:05, 21.66it/s] 115it [00:05, 21.69it/s] 118it [00:05, 21.86it/s] 121it [00:05, 21.57it/s] 124it [00:05, 21.77it/s] 127it [00:05, 21.71it/s] 130it [00:06, 21.65it/s] 133it [00:06, 21.77it/s] 136it [00:06, 21.49it/s] 139it [00:06, 21.67it/s] 142it [00:06, 21.84it/s] 145it [00:06, 21.95it/s] 148it [00:06, 21.84it/s]2025-05-26 01:01:10,204 - INFO - [Epoch 069 | Batch 0150] IWAE-loss 1337.0706 | mean log_px -0.0026 | KL -1157.92 + 151it [00:07, 21.61it/s] 154it [00:07, 21.66it/s] 157it [00:07, 21.80it/s] 160it [00:07, 21.89it/s] 163it [00:07, 21.95it/s] 166it [00:07, 22.07it/s] 169it [00:07, 22.14it/s] 172it [00:07, 22.10it/s] 175it [00:08, 21.96it/s] 178it [00:08, 21.91it/s] 181it [00:08, 21.71it/s] 184it [00:08, 21.58it/s] 187it [00:08, 21.75it/s] 190it [00:08, 21.47it/s] 193it [00:08, 21.53it/s] 196it [00:09, 20.89it/s] 196it [00:09, 21.42it/s] +2025-05-26 01:01:12,366 - INFO - Epoch: 69, Objective: tensor([1499.0780], device='cuda:0', grad_fn=), Loss: 0.0031943165231496096, KL/n: 23.625442504882812 + 0it [00:00, ?it/s]2025-05-26 01:01:12,597 - INFO - [Epoch 070 | Batch 0000] IWAE-loss 1227.1208 | mean log_px -0.0010 | KL -1158.62 + 1it [00:00, 7.66it/s] 4it [00:00, 16.34it/s] 7it [00:00, 18.64it/s] 10it [00:00, 20.01it/s] 13it [00:00, 20.79it/s] 16it [00:00, 20.66it/s] 19it [00:00, 21.08it/s] 22it [00:01, 21.08it/s] 25it [00:01, 21.17it/s] 28it [00:01, 21.15it/s] 31it [00:01, 20.83it/s] 34it [00:01, 20.68it/s] 37it [00:01, 20.88it/s] 40it [00:01, 21.19it/s] 43it [00:02, 21.47it/s] 46it [00:02, 21.22it/s] 49it [00:02, 21.08it/s]2025-05-26 01:01:14,949 - INFO - [Epoch 070 | Batch 0050] IWAE-loss 1339.5062 | mean log_px -0.0027 | KL -1152.80 + 52it [00:02, 21.26it/s] 55it [00:02, 21.05it/s] 58it [00:02, 21.02it/s] 61it [00:02, 21.29it/s] 64it [00:03, 21.55it/s] 67it [00:03, 21.76it/s] 70it [00:03, 21.65it/s] 73it [00:03, 21.52it/s] 76it [00:03, 21.70it/s] 79it [00:03, 21.16it/s] 82it [00:03, 21.30it/s] 85it [00:04, 21.06it/s] 88it [00:04, 21.39it/s] 91it [00:04, 21.60it/s] 94it [00:04, 21.77it/s] 97it [00:04, 21.92it/s] 100it [00:04, 21.97it/s]2025-05-26 01:01:17,264 - INFO - [Epoch 070 | Batch 0100] IWAE-loss 1315.9856 | mean log_px -0.0024 | KL -1151.35 + 103it [00:04, 21.98it/s] 106it [00:05, 22.06it/s] 109it [00:05, 22.11it/s] 112it [00:05, 21.48it/s] 115it [00:05, 21.52it/s] 118it [00:05, 21.68it/s] 121it [00:05, 21.80it/s] 124it [00:05, 21.40it/s] 127it [00:06, 21.15it/s] 130it [00:06, 20.73it/s] 133it [00:06, 20.99it/s] 136it [00:06, 21.17it/s] 139it [00:06, 21.15it/s] 142it [00:06, 21.07it/s] 145it [00:06, 21.06it/s] 148it [00:06, 21.41it/s]2025-05-26 01:01:19,607 - INFO - [Epoch 070 | Batch 0150] IWAE-loss 1323.5460 | mean log_px -0.0024 | KL -1154.05 + 151it [00:07, 21.41it/s] 154it [00:07, 21.15it/s] 157it [00:07, 21.29it/s] 160it [00:07, 21.41it/s] 163it [00:07, 21.08it/s] 166it [00:07, 21.39it/s] 169it [00:07, 21.14it/s] 172it [00:08, 21.22it/s] 175it [00:08, 21.11it/s] 178it [00:08, 20.96it/s] 181it [00:08, 20.78it/s] 184it [00:08, 20.92it/s] 187it [00:08, 21.27it/s] 190it [00:08, 21.55it/s] 193it [00:09, 21.77it/s] 196it [00:09, 21.00it/s] 196it [00:09, 21.02it/s] +2025-05-26 01:01:21,818 - INFO - Epoch: 70, Objective: tensor([2284.2085], device='cuda:0', grad_fn=), Loss: 0.006363144144415855, KL/n: 23.562253952026367 + 0it [00:00, ?it/s]2025-05-26 01:01:22,224 - INFO - [Epoch 071 | Batch 0000] IWAE-loss 1722.5839 | mean log_px -0.0081 | KL -1153.26 + 1it [00:00, 7.66it/s] 4it [00:00, 16.51it/s] 7it [00:00, 19.72it/s] 10it [00:00, 21.20it/s] 13it [00:00, 22.07it/s] 16it [00:00, 22.56it/s] 19it [00:00, 22.96it/s] 22it [00:01, 23.12it/s] 25it [00:01, 23.24it/s] 28it [00:01, 23.35it/s] 31it [00:01, 23.38it/s] 34it [00:01, 23.50it/s] 37it [00:01, 23.51it/s] 40it [00:01, 23.48it/s] 43it [00:01, 23.48it/s] 46it [00:02, 23.44it/s] 49it [00:02, 23.42it/s]2025-05-26 01:01:24,359 - INFO - [Epoch 071 | Batch 0050] IWAE-loss 1585.7119 | mean log_px -0.0062 | KL -1153.17 + 52it [00:02, 23.31it/s] 55it [00:02, 22.87it/s] 58it [00:02, 22.03it/s] 61it [00:02, 22.28it/s] 64it [00:02, 22.51it/s] 67it [00:02, 22.75it/s] 70it [00:03, 22.77it/s] 73it [00:03, 22.86it/s] 76it [00:03, 22.86it/s] 79it [00:03, 22.97it/s] 82it [00:03, 23.06it/s] 85it [00:03, 23.11it/s] 88it [00:03, 23.14it/s] 91it [00:04, 23.16it/s] 94it [00:04, 23.17it/s] 97it [00:04, 23.15it/s] 100it [00:04, 23.01it/s]2025-05-26 01:01:26,551 - INFO - [Epoch 071 | Batch 0100] IWAE-loss 1716.2581 | mean log_px -0.0081 | KL -1146.16 + 103it [00:04, 22.91it/s] 106it [00:04, 22.96it/s] 109it [00:04, 22.94it/s] 112it [00:04, 23.01it/s] 115it [00:05, 23.02it/s] 118it [00:05, 23.06it/s] 121it [00:05, 23.07it/s] 124it [00:05, 23.12it/s] 127it [00:05, 23.11it/s] 130it [00:05, 23.14it/s] 133it [00:05, 23.20it/s] 136it [00:05, 23.19it/s] 139it [00:06, 23.13it/s] 142it [00:06, 23.10it/s] 145it [00:06, 23.12it/s] 148it [00:06, 23.13it/s]2025-05-26 01:01:28,716 - INFO - [Epoch 071 | Batch 0150] IWAE-loss 1415.4498 | mean log_px -0.0038 | KL -1146.60 + 151it [00:06, 23.07it/s] 154it [00:06, 23.10it/s] 157it [00:06, 23.13it/s] 160it [00:07, 23.13it/s] 163it [00:07, 23.01it/s] 166it [00:07, 23.00it/s] 169it [00:07, 23.06it/s] 172it [00:07, 23.07it/s] 175it [00:07, 22.98it/s] 178it [00:07, 22.91it/s] 181it [00:07, 22.95it/s] 184it [00:08, 23.03it/s] 187it [00:08, 23.08it/s] 190it [00:08, 23.04it/s] 193it [00:08, 23.08it/s] 196it [00:08, 21.57it/s] 196it [00:08, 22.64it/s] +2025-05-26 01:01:30,773 - INFO - Epoch: 71, Objective: tensor([1199.2096], device='cuda:0', grad_fn=), Loss: 0.0014096980448812246, KL/n: 23.376096725463867 + 0it [00:00, ?it/s]2025-05-26 01:01:31,012 - INFO - [Epoch 072 | Batch 0000] IWAE-loss 1707.1000 | mean log_px -0.0080 | KL -1145.44 + 1it [00:00, 7.49it/s] 4it [00:00, 16.19it/s] 7it [00:00, 18.89it/s] 10it [00:00, 20.12it/s] 13it [00:00, 20.81it/s] 16it [00:00, 21.22it/s] 19it [00:00, 21.39it/s] 22it [00:01, 21.34it/s] 25it [00:01, 21.04it/s] 28it [00:01, 20.99it/s] 31it [00:01, 21.12it/s] 34it [00:01, 21.17it/s] 37it [00:01, 21.36it/s] 40it [00:01, 21.47it/s] 43it [00:02, 21.57it/s] 46it [00:02, 21.67it/s] 49it [00:02, 21.60it/s]2025-05-26 01:01:33,326 - INFO - [Epoch 072 | Batch 0050] IWAE-loss 1334.2335 | mean log_px -0.0028 | KL -1138.06 + 52it [00:02, 21.63it/s] 55it [00:02, 21.72it/s] 58it [00:02, 21.76it/s] 61it [00:02, 21.75it/s] 64it [00:03, 21.76it/s] 67it [00:03, 21.79it/s] 70it [00:03, 21.81it/s] 73it [00:03, 21.81it/s] 76it [00:03, 21.79it/s] 79it [00:03, 21.83it/s] 82it [00:03, 21.85it/s] 85it [00:04, 21.84it/s] 88it [00:04, 21.84it/s] 91it [00:04, 21.87it/s] 94it [00:04, 21.88it/s] 97it [00:04, 21.86it/s] 100it [00:04, 21.86it/s]2025-05-26 01:01:35,615 - INFO - [Epoch 072 | Batch 0100] IWAE-loss 1416.9973 | mean log_px -0.0040 | KL -1136.52 + 103it [00:04, 21.82it/s] 106it [00:04, 21.80it/s] 109it [00:05, 21.81it/s] 112it [00:05, 21.82it/s] 115it [00:05, 21.86it/s] 118it [00:05, 21.87it/s] 121it [00:05, 21.85it/s] 124it [00:05, 21.86it/s] 127it [00:05, 21.82it/s] 130it [00:06, 21.80it/s] 133it [00:06, 21.81it/s] 136it [00:06, 21.82it/s] 139it [00:06, 21.81it/s] 142it [00:06, 21.77it/s] 145it [00:06, 21.77it/s] 148it [00:06, 21.76it/s]2025-05-26 01:01:37,909 - INFO - [Epoch 072 | Batch 0150] IWAE-loss 1384.1274 | mean log_px -0.0035 | KL -1140.45 + 151it [00:07, 21.75it/s] 154it [00:07, 21.76it/s] 157it [00:07, 21.77it/s] 160it [00:07, 21.72it/s] 163it [00:07, 21.76it/s] 166it [00:07, 21.77it/s] 169it [00:07, 21.81it/s] 172it [00:07, 21.80it/s] 175it [00:08, 21.81it/s] 178it [00:08, 21.81it/s] 181it [00:08, 21.83it/s] 184it [00:08, 21.85it/s] 187it [00:08, 21.85it/s] 190it [00:08, 21.84it/s] 193it [00:08, 21.79it/s] 196it [00:09, 20.86it/s] 196it [00:09, 21.36it/s] +2025-05-26 01:01:40,078 - INFO - Epoch: 72, Objective: tensor([1491.2115], device='cuda:0', grad_fn=), Loss: 0.003671560902148485, KL/n: 23.28042221069336 + 0it [00:00, ?it/s]2025-05-26 01:01:40,619 - INFO - [Epoch 073 | Batch 0000] IWAE-loss 1321.8411 | mean log_px -0.0025 | KL -1143.41 + 1it [00:00, 3.76it/s] 4it [00:00, 11.46it/s] 7it [00:00, 15.05it/s] 10it [00:00, 17.42it/s] 13it [00:00, 18.78it/s] 16it [00:00, 19.61it/s] 19it [00:01, 20.12it/s] 22it [00:01, 20.53it/s] 25it [00:01, 20.96it/s] 28it [00:01, 21.10it/s] 31it [00:01, 21.38it/s] 34it [00:01, 21.39it/s] 37it [00:01, 21.60it/s] 40it [00:02, 21.74it/s] 43it [00:02, 21.82it/s] 46it [00:02, 21.85it/s] 49it [00:02, 21.91it/s]2025-05-26 01:01:42,926 - INFO - [Epoch 073 | Batch 0050] IWAE-loss 1394.0846 | mean log_px -0.0037 | KL -1137.44 + 52it [00:02, 21.91it/s] 55it [00:02, 21.97it/s] 58it [00:02, 21.93it/s] 61it [00:03, 21.93it/s] 64it [00:03, 21.95it/s] 67it [00:03, 21.98it/s] 70it [00:03, 21.97it/s] 73it [00:03, 21.82it/s] 76it [00:03, 21.86it/s] 79it [00:03, 21.88it/s] 82it [00:03, 21.87it/s] 85it [00:04, 21.83it/s] 88it [00:04, 21.72it/s] 91it [00:04, 21.65it/s] 94it [00:04, 21.70it/s] 97it [00:04, 21.73it/s] 100it [00:04, 21.55it/s]2025-05-26 01:01:45,222 - INFO - [Epoch 073 | Batch 0100] IWAE-loss 1657.8174 | mean log_px -0.0074 | KL -1137.26 + 103it [00:04, 21.66it/s] 106it [00:05, 21.78it/s] 109it [00:05, 21.84it/s] 112it [00:05, 21.90it/s] 115it [00:05, 21.96it/s] 118it [00:05, 21.93it/s] 121it [00:05, 21.73it/s] 124it [00:05, 21.81it/s] 127it [00:06, 21.86it/s] 130it [00:06, 21.91it/s] 133it [00:06, 21.96it/s] 136it [00:06, 21.97it/s] 139it [00:06, 21.97it/s] 142it [00:06, 21.97it/s] 145it [00:06, 21.94it/s] 148it [00:07, 21.96it/s]2025-05-26 01:01:47,501 - INFO - [Epoch 073 | Batch 0150] IWAE-loss 1873.5570 | mean log_px -0.0106 | KL -1133.77 + 151it [00:07, 21.87it/s] 154it [00:07, 21.76it/s] 157it [00:07, 21.69it/s] 160it [00:07, 21.65it/s] 163it [00:07, 21.63it/s] 166it [00:07, 21.50it/s] 169it [00:07, 21.48it/s] 172it [00:08, 21.49it/s] 175it [00:08, 21.47it/s] 178it [00:08, 21.49it/s] 181it [00:08, 21.61it/s] 184it [00:08, 21.42it/s] 187it [00:08, 21.46it/s] 190it [00:08, 21.49it/s] 193it [00:09, 21.65it/s] 196it [00:09, 20.69it/s] 196it [00:09, 21.01it/s] +2025-05-26 01:01:49,706 - INFO - Epoch: 73, Objective: tensor([1197.7738], device='cuda:0', grad_fn=), Loss: 0.0008110225899145007, KL/n: 23.13855743408203 + 0it [00:00, ?it/s]2025-05-26 01:01:50,126 - INFO - [Epoch 074 | Batch 0000] IWAE-loss 1708.7070 | mean log_px -0.0082 | KL -1131.42 + 1it [00:00, 7.69it/s] 4it [00:00, 16.33it/s] 7it [00:00, 19.00it/s] 10it [00:00, 20.36it/s] 13it [00:00, 20.65it/s] 16it [00:00, 21.13it/s] 19it [00:00, 21.56it/s] 22it [00:01, 21.42it/s] 25it [00:01, 21.72it/s] 28it [00:01, 21.79it/s] 31it [00:01, 21.97it/s] 34it [00:01, 21.84it/s] 37it [00:01, 21.90it/s] 40it [00:01, 22.07it/s] 43it [00:02, 22.19it/s] 46it [00:02, 22.25it/s] 49it [00:02, 22.08it/s]2025-05-26 01:01:52,397 - INFO - [Epoch 074 | Batch 0050] IWAE-loss 1200.7642 | mean log_px -0.0010 | KL -1129.92 + 52it [00:02, 21.75it/s] 55it [00:02, 21.80it/s] 58it [00:02, 22.00it/s] 61it [00:02, 22.01it/s] 64it [00:02, 21.87it/s] 67it [00:03, 21.81it/s] 70it [00:03, 22.00it/s] 73it [00:03, 22.03it/s] 76it [00:03, 21.96it/s] 79it [00:03, 22.00it/s] 82it [00:03, 22.11it/s] 85it [00:03, 22.21it/s] 88it [00:04, 22.26it/s] 91it [00:04, 22.30it/s] 94it [00:04, 21.97it/s] 97it [00:04, 22.04it/s] 100it [00:04, 22.08it/s]2025-05-26 01:01:54,670 - INFO - [Epoch 074 | Batch 0100] IWAE-loss 1299.4302 | mean log_px -0.0025 | KL -1123.19 + 103it [00:04, 22.15it/s] 106it [00:04, 22.17it/s] 109it [00:05, 22.20it/s] 112it [00:05, 22.22it/s] 115it [00:05, 22.10it/s] 118it [00:05, 21.79it/s] 121it [00:05, 21.85it/s] 124it [00:05, 21.84it/s] 127it [00:05, 22.00it/s] 130it [00:05, 21.72it/s] 133it [00:06, 21.93it/s] 136it [00:06, 21.92it/s] 139it [00:06, 22.04it/s] 142it [00:06, 22.15it/s] 145it [00:06, 22.22it/s] 148it [00:06, 22.29it/s]2025-05-26 01:01:56,934 - INFO - [Epoch 074 | Batch 0150] IWAE-loss 1433.4456 | mean log_px -0.0044 | KL -1128.54 + 151it [00:06, 22.29it/s] 154it [00:07, 22.34it/s] 157it [00:07, 22.08it/s] 160it [00:07, 22.06it/s] 163it [00:07, 22.07it/s] 166it [00:07, 22.03it/s] 169it [00:07, 22.15it/s] 172it [00:07, 22.21it/s] 175it [00:08, 22.24it/s] 178it [00:08, 21.90it/s] 181it [00:08, 22.03it/s] 184it [00:08, 22.12it/s] 187it [00:08, 22.22it/s] 190it [00:08, 22.11it/s] 193it [00:08, 21.68it/s] 196it [00:08, 21.04it/s] 196it [00:09, 21.62it/s] +2025-05-26 01:01:59,086 - INFO - Epoch: 74, Objective: tensor([1393.6099], device='cuda:0', grad_fn=), Loss: 0.002161072799935937, KL/n: 23.03531265258789 + 0it [00:00, ?it/s]2025-05-26 01:01:59,321 - INFO - [Epoch 075 | Batch 0000] IWAE-loss 1360.9983 | mean log_px -0.0033 | KL -1128.02 + 1it [00:00, 7.50it/s] 4it [00:00, 15.89it/s] 7it [00:00, 18.33it/s] 10it [00:00, 19.47it/s] 13it [00:00, 20.37it/s] 16it [00:00, 20.99it/s] 19it [00:00, 21.35it/s] 22it [00:01, 21.16it/s] 25it [00:01, 21.13it/s] 28it [00:01, 21.47it/s] 31it [00:01, 21.38it/s] 34it [00:01, 21.42it/s] 37it [00:01, 21.24it/s] 40it [00:01, 21.40it/s] 43it [00:02, 21.60it/s] 46it [00:02, 21.29it/s] 49it [00:02, 21.49it/s]2025-05-26 01:02:01,648 - INFO - [Epoch 075 | Batch 0050] IWAE-loss 1446.0620 | mean log_px -0.0046 | KL -1123.09 + 52it [00:02, 21.71it/s] 55it [00:02, 21.76it/s] 58it [00:02, 21.87it/s] 61it [00:02, 21.85it/s] 64it [00:03, 21.68it/s] 67it [00:03, 21.68it/s] 70it [00:03, 21.73it/s] 73it [00:03, 21.84it/s] 76it [00:03, 21.82it/s] 79it [00:03, 21.80it/s] 82it [00:03, 21.84it/s] 85it [00:04, 21.96it/s] 88it [00:04, 21.67it/s] 91it [00:04, 21.48it/s] 94it [00:04, 20.93it/s] 97it [00:04, 20.93it/s] 100it [00:04, 21.28it/s]2025-05-26 01:02:03,964 - INFO - [Epoch 075 | Batch 0100] IWAE-loss 1414.4138 | mean log_px -0.0042 | KL -1119.46 + 103it [00:04, 21.50it/s] 106it [00:04, 21.69it/s] 109it [00:05, 21.39it/s] 112it [00:05, 21.60it/s] 115it [00:05, 21.63it/s] 118it [00:05, 21.75it/s] 121it [00:05, 21.38it/s] 124it [00:05, 21.39it/s] 127it [00:05, 21.46it/s] 130it [00:06, 21.01it/s] 133it [00:06, 21.31it/s] 136it [00:06, 21.57it/s] 139it [00:06, 21.66it/s] 142it [00:06, 21.44it/s] 145it [00:06, 21.33it/s] 148it [00:06, 21.24it/s]2025-05-26 01:02:06,292 - INFO - [Epoch 075 | Batch 0150] IWAE-loss 1359.6471 | mean log_px -0.0034 | KL -1122.78 + 151it [00:07, 21.48it/s] 154it [00:07, 21.34it/s] 157it [00:07, 21.32it/s] 160it [00:07, 21.21it/s] 163it [00:07, 21.29it/s] 166it [00:07, 21.54it/s] 169it [00:07, 21.75it/s] 172it [00:08, 21.80it/s] 175it [00:08, 21.56it/s] 178it [00:08, 21.12it/s] 181it [00:08, 20.65it/s] 184it [00:08, 21.03it/s] 187it [00:08, 21.13it/s] 190it [00:08, 21.04it/s] 193it [00:09, 21.17it/s] 196it [00:09, 20.49it/s] 196it [00:09, 21.10it/s] +2025-05-26 01:02:08,504 - INFO - Epoch: 75, Objective: tensor([1397.3792], device='cuda:0', grad_fn=), Loss: 0.004019514657557011, KL/n: 22.936187744140625 + 0it [00:00, ?it/s]2025-05-26 01:02:08,930 - INFO - [Epoch 076 | Batch 0000] IWAE-loss 1434.4915 | mean log_px -0.0044 | KL -1125.38 + 1it [00:00, 7.49it/s] 4it [00:00, 15.63it/s] 7it [00:00, 18.45it/s] 10it [00:00, 19.85it/s] 13it [00:00, 20.63it/s] 16it [00:00, 20.87it/s] 19it [00:00, 20.71it/s] 22it [00:01, 21.24it/s] 25it [00:01, 21.52it/s] 28it [00:01, 21.74it/s] 31it [00:01, 21.70it/s] 34it [00:01, 21.83it/s] 37it [00:01, 21.45it/s] 40it [00:01, 21.41it/s] 43it [00:02, 21.55it/s] 46it [00:02, 21.60it/s] 49it [00:02, 21.75it/s]2025-05-26 01:02:11,240 - INFO - [Epoch 076 | Batch 0050] IWAE-loss 1421.8232 | mean log_px -0.0043 | KL -1121.69 + 52it [00:02, 21.85it/s] 55it [00:02, 21.86it/s] 58it [00:02, 21.91it/s] 61it [00:02, 21.98it/s] 64it [00:03, 22.12it/s] 67it [00:03, 21.66it/s] 70it [00:03, 21.83it/s] 73it [00:03, 21.77it/s] 76it [00:03, 21.87it/s] 79it [00:03, 21.94it/s] 82it [00:03, 21.78it/s] 85it [00:04, 21.39it/s] 88it [00:04, 21.61it/s] 91it [00:04, 21.77it/s] 94it [00:04, 21.83it/s] 97it [00:04, 21.92it/s] 100it [00:04, 22.01it/s]2025-05-26 01:02:13,528 - INFO - [Epoch 076 | Batch 0100] IWAE-loss 1293.9081 | mean log_px -0.0024 | KL -1124.54 + 103it [00:04, 22.03it/s] 106it [00:04, 22.06it/s] 109it [00:05, 22.09it/s] 112it [00:05, 21.96it/s] 115it [00:05, 21.71it/s] 118it [00:05, 21.54it/s] 121it [00:05, 21.46it/s] 124it [00:05, 21.64it/s] 127it [00:05, 21.48it/s] 130it [00:06, 21.79it/s] 133it [00:06, 21.98it/s] 136it [00:06, 22.01it/s] 139it [00:06, 22.04it/s] 142it [00:06, 21.56it/s] 145it [00:06, 21.69it/s] 148it [00:06, 21.81it/s]2025-05-26 01:02:15,823 - INFO - [Epoch 076 | Batch 0150] IWAE-loss 1400.8945 | mean log_px -0.0040 | KL -1124.15 + 151it [00:07, 21.92it/s] 154it [00:07, 22.09it/s] 157it [00:07, 21.95it/s] 160it [00:07, 21.96it/s] 163it [00:07, 21.97it/s] 166it [00:07, 21.70it/s] 169it [00:07, 21.26it/s] 172it [00:07, 21.19it/s] 175it [00:08, 21.24it/s] 178it [00:08, 21.27it/s] 181it [00:08, 21.49it/s] 184it [00:08, 21.38it/s] 187it [00:08, 21.38it/s] 190it [00:08, 21.30it/s] 193it [00:08, 21.36it/s] 196it [00:09, 20.75it/s] 196it [00:09, 21.30it/s] +2025-05-26 01:02:18,025 - INFO - Epoch: 76, Objective: tensor([1490.7167], device='cuda:0', grad_fn=), Loss: 0.004884535912424326, KL/n: 22.962539672851562 + 0it [00:00, ?it/s]2025-05-26 01:02:18,272 - INFO - [Epoch 077 | Batch 0000] IWAE-loss 1659.8582 | mean log_px -0.0077 | KL -1123.49 + 1it [00:00, 6.76it/s] 4it [00:00, 15.26it/s] 7it [00:00, 18.31it/s] 10it [00:00, 19.62it/s] 13it [00:00, 20.32it/s] 16it [00:00, 20.91it/s] 19it [00:00, 21.28it/s] 22it [00:01, 21.55it/s] 25it [00:01, 21.37it/s] 28it [00:01, 21.37it/s] 31it [00:01, 21.61it/s] 34it [00:01, 21.64it/s] 37it [00:01, 21.78it/s] 40it [00:01, 21.90it/s] 43it [00:02, 21.96it/s] 46it [00:02, 21.98it/s] 49it [00:02, 21.72it/s]2025-05-26 01:02:20,574 - INFO - [Epoch 077 | Batch 0050] IWAE-loss 1243.6547 | mean log_px -0.0017 | KL -1122.64 + 52it [00:02, 21.46it/s] 55it [00:02, 21.62it/s] 58it [00:02, 21.76it/s] 61it [00:02, 21.73it/s] 64it [00:03, 21.67it/s] 67it [00:03, 21.80it/s] 70it [00:03, 21.89it/s] 73it [00:03, 21.93it/s] 76it [00:03, 21.65it/s] 79it [00:03, 21.76it/s] 82it [00:03, 21.40it/s] 85it [00:04, 21.58it/s] 88it [00:04, 21.55it/s] 91it [00:04, 21.57it/s] 94it [00:04, 21.27it/s] 97it [00:04, 21.02it/s] 100it [00:04, 21.33it/s]2025-05-26 01:02:22,893 - INFO - [Epoch 077 | Batch 0100] IWAE-loss 1202.0288 | mean log_px -0.0012 | KL -1117.81 + 103it [00:04, 21.18it/s] 106it [00:05, 21.14it/s] 109it [00:05, 21.22it/s] 112it [00:05, 20.92it/s] 115it [00:05, 21.12it/s] 118it [00:05, 21.27it/s] 121it [00:05, 20.99it/s] 124it [00:05, 21.09it/s] 127it [00:05, 21.20it/s] 130it [00:06, 21.16it/s] 133it [00:06, 21.34it/s] 136it [00:06, 21.08it/s] 139it [00:06, 21.20it/s] 142it [00:06, 21.38it/s] 145it [00:06, 21.54it/s] 148it [00:06, 21.71it/s]2025-05-26 01:02:25,241 - INFO - [Epoch 077 | Batch 0150] IWAE-loss 1338.6127 | mean log_px -0.0031 | KL -1119.92 + 151it [00:07, 21.76it/s] 154it [00:07, 21.79it/s] 157it [00:07, 21.84it/s] 160it [00:07, 21.86it/s] 163it [00:07, 21.75it/s] 166it [00:07, 21.82it/s] 169it [00:07, 21.87it/s] 172it [00:08, 21.53it/s] 175it [00:08, 21.20it/s] 178it [00:08, 21.42it/s] 181it [00:08, 21.31it/s] 184it [00:08, 21.05it/s] 187it [00:08, 21.32it/s] 190it [00:08, 21.49it/s] 193it [00:09, 21.63it/s] 196it [00:09, 20.41it/s] 196it [00:09, 21.11it/s] +2025-05-26 01:02:27,439 - INFO - Epoch: 77, Objective: tensor([1241.5527], device='cuda:0', grad_fn=), Loss: 0.0019206739962100983, KL/n: 22.899856567382812 + 0it [00:00, ?it/s]2025-05-26 01:02:27,677 - INFO - [Epoch 078 | Batch 0000] IWAE-loss 1261.1355 | mean log_px -0.0020 | KL -1121.20 + 1it [00:00, 7.35it/s] 4it [00:00, 15.78it/s] 7it [00:00, 18.31it/s] 10it [00:00, 19.48it/s] 13it [00:00, 20.27it/s] 16it [00:00, 20.44it/s] 19it [00:00, 20.81it/s] 22it [00:01, 20.78it/s] 25it [00:01, 20.61it/s] 28it [00:01, 20.60it/s] 31it [00:01, 20.49it/s] 34it [00:01, 20.31it/s] 37it [00:01, 20.32it/s] 40it [00:02, 20.19it/s] 43it [00:02, 20.59it/s] 46it [00:02, 20.71it/s] 49it [00:02, 20.83it/s]2025-05-26 01:02:30,081 - INFO - [Epoch 078 | Batch 0050] IWAE-loss 1870.1661 | mean log_px -0.0107 | KL -1118.39 + 52it [00:02, 20.96it/s] 55it [00:02, 20.96it/s] 58it [00:02, 20.86it/s] 61it [00:03, 20.92it/s] 64it [00:03, 20.44it/s] 67it [00:03, 20.66it/s] 70it [00:03, 20.69it/s] 73it [00:03, 20.50it/s] 76it [00:03, 20.76it/s] 79it [00:03, 21.05it/s] 82it [00:04, 21.11it/s] 85it [00:04, 21.01it/s] 88it [00:04, 20.90it/s] 91it [00:04, 20.74it/s] 94it [00:04, 20.35it/s] 97it [00:04, 20.34it/s] 100it [00:04, 20.06it/s]2025-05-26 01:02:32,508 - INFO - [Epoch 078 | Batch 0100] IWAE-loss 1455.6832 | mean log_px -0.0049 | KL -1113.79 + 103it [00:05, 20.17it/s] 106it [00:05, 19.92it/s] 109it [00:05, 20.38it/s] 112it [00:05, 20.71it/s] 115it [00:05, 20.89it/s] 118it [00:05, 20.87it/s] 121it [00:05, 20.78it/s] 124it [00:06, 20.69it/s] 127it [00:06, 20.75it/s] 130it [00:06, 20.62it/s] 133it [00:06, 20.75it/s] 136it [00:06, 20.67it/s] 139it [00:06, 20.89it/s] 142it [00:06, 21.19it/s] 145it [00:07, 21.25it/s] 148it [00:07, 21.29it/s]2025-05-26 01:02:34,902 - INFO - [Epoch 078 | Batch 0150] IWAE-loss 1443.4268 | mean log_px -0.0048 | KL -1108.14 + 151it [00:07, 20.99it/s] 154it [00:07, 20.52it/s] 157it [00:07, 20.74it/s] 160it [00:07, 20.96it/s] 163it [00:07, 21.16it/s] 166it [00:08, 21.32it/s] 169it [00:08, 21.41it/s] 172it [00:08, 21.46it/s] 175it [00:08, 21.54it/s] 178it [00:08, 21.16it/s] 181it [00:08, 21.38it/s] 184it [00:08, 21.43it/s] 187it [00:09, 21.39it/s] 190it [00:09, 21.49it/s] 193it [00:09, 21.73it/s] 196it [00:09, 20.71it/s] 196it [00:09, 20.55it/s] +2025-05-26 01:02:37,110 - INFO - Epoch: 78, Objective: tensor([1191.6497], device='cuda:0', grad_fn=), Loss: 0.0007883315556682646, KL/n: 22.69881248474121 + 0it [00:00, ?it/s]2025-05-26 01:02:37,526 - INFO - [Epoch 079 | Batch 0000] IWAE-loss 1465.2747 | mean log_px -0.0051 | KL -1110.43 + 1it [00:00, 7.27it/s] 4it [00:00, 15.63it/s] 7it [00:00, 18.38it/s] 10it [00:00, 19.89it/s] 13it [00:00, 20.57it/s] 16it [00:00, 20.54it/s] 19it [00:00, 21.03it/s] 22it [00:01, 21.46it/s] 25it [00:01, 21.57it/s] 28it [00:01, 21.76it/s] 31it [00:01, 21.33it/s] 34it [00:01, 21.54it/s] 37it [00:01, 21.13it/s] 40it [00:01, 21.10it/s] 43it [00:02, 21.14it/s] 46it [00:02, 21.09it/s] 49it [00:02, 21.32it/s]2025-05-26 01:02:39,861 - INFO - [Epoch 079 | Batch 0050] IWAE-loss 1269.3641 | mean log_px -0.0023 | KL -1106.26 + 52it [00:02, 21.40it/s] 55it [00:02, 21.50it/s] 58it [00:02, 21.33it/s] 61it [00:02, 21.44it/s] 64it [00:03, 21.69it/s] 67it [00:03, 21.51it/s] 70it [00:03, 21.76it/s] 73it [00:03, 21.78it/s] 76it [00:03, 21.51it/s] 79it [00:03, 21.65it/s] 82it [00:03, 21.84it/s] 85it [00:04, 21.59it/s] 88it [00:04, 21.50it/s] 91it [00:04, 21.63it/s] 94it [00:04, 21.40it/s] 97it [00:04, 21.65it/s] 100it [00:04, 21.49it/s]2025-05-26 01:02:42,176 - INFO - [Epoch 079 | Batch 0100] IWAE-loss 1869.3672 | mean log_px -0.0109 | KL -1103.50 + 103it [00:04, 21.48it/s] 106it [00:05, 21.59it/s] 109it [00:05, 21.58it/s] 112it [00:05, 21.55it/s] 115it [00:05, 21.32it/s] 118it [00:05, 21.55it/s] 121it [00:05, 21.36it/s] 124it [00:05, 21.40it/s] 127it [00:05, 21.30it/s] 130it [00:06, 21.24it/s] 133it [00:06, 21.28it/s] 136it [00:06, 21.43it/s] 139it [00:06, 21.62it/s] 142it [00:06, 21.76it/s] 145it [00:06, 21.80it/s] 148it [00:06, 21.87it/s]2025-05-26 01:02:44,493 - INFO - [Epoch 079 | Batch 0150] IWAE-loss 2335.6721 | mean log_px -0.0176 | KL -1105.85 + 151it [00:07, 21.90it/s] 154it [00:07, 21.60it/s] 157it [00:07, 21.60it/s] 160it [00:07, 21.48it/s] 163it [00:07, 21.07it/s] 166it [00:07, 21.13it/s] 169it [00:07, 20.93it/s] 172it [00:08, 21.02it/s] 175it [00:08, 21.24it/s] 178it [00:08, 21.14it/s] 181it [00:08, 20.55it/s] 184it [00:08, 20.20it/s] 187it [00:08, 20.40it/s] 190it [00:08, 20.58it/s] 193it [00:09, 20.34it/s] 196it [00:09, 19.73it/s] 196it [00:09, 20.94it/s] +2025-05-26 01:02:46,776 - INFO - Epoch: 79, Objective: tensor([1304.4983], device='cuda:0', grad_fn=), Loss: 0.003032541833817959, KL/n: 22.560514450073242 + 0it [00:00, ?it/s]2025-05-26 01:02:47,026 - INFO - [Epoch 080 | Batch 0000] IWAE-loss 1448.7809 | mean log_px -0.0049 | KL -1104.65 + 1it [00:00, 6.88it/s] 4it [00:00, 15.37it/s] 7it [00:00, 18.21it/s] 10it [00:00, 19.60it/s] 13it [00:00, 20.42it/s] 16it [00:00, 20.85it/s] 19it [00:00, 21.07it/s] 22it [00:01, 21.30it/s] 25it [00:01, 21.36it/s] 28it [00:01, 21.51it/s] 31it [00:01, 21.56it/s] 34it [00:01, 21.62it/s] 37it [00:01, 21.55it/s] 40it [00:01, 21.52it/s] 43it [00:02, 21.59it/s] 46it [00:02, 21.50it/s] 49it [00:02, 21.48it/s]2025-05-26 01:02:49,340 - INFO - [Epoch 080 | Batch 0050] IWAE-loss 1250.5239 | mean log_px -0.0021 | KL -1104.49 + 52it [00:02, 21.56it/s] 55it [00:02, 21.63it/s] 58it [00:02, 21.69it/s] 61it [00:02, 21.75it/s] 64it [00:03, 21.80it/s] 67it [00:03, 21.73it/s] 70it [00:03, 21.61it/s] 73it [00:03, 21.58it/s] 76it [00:03, 21.54it/s] 79it [00:03, 21.91it/s] 82it [00:03, 21.96it/s] 85it [00:04, 22.18it/s] 88it [00:04, 22.45it/s] 91it [00:04, 22.56it/s] 94it [00:04, 22.65it/s] 97it [00:04, 22.65it/s] 100it [00:04, 22.57it/s]2025-05-26 01:02:51,601 - INFO - [Epoch 080 | Batch 0100] IWAE-loss 1352.5112 | mean log_px -0.0035 | KL -1105.57 + 103it [00:04, 22.67it/s] 106it [00:04, 22.79it/s] 109it [00:05, 22.90it/s] 112it [00:05, 22.96it/s] 115it [00:05, 22.98it/s] 118it [00:05, 22.78it/s] 121it [00:05, 22.64it/s] 124it [00:05, 22.82it/s] 127it [00:05, 22.93it/s] 130it [00:05, 22.93it/s] 133it [00:06, 22.97it/s] 136it [00:06, 23.04it/s] 139it [00:06, 23.02it/s] 142it [00:06, 22.62it/s] 145it [00:06, 22.41it/s] 148it [00:06, 22.25it/s]2025-05-26 01:02:53,801 - INFO - [Epoch 080 | Batch 0150] IWAE-loss 1357.4445 | mean log_px -0.0036 | KL -1105.70 + 151it [00:06, 22.05it/s] 154it [00:07, 21.91it/s] 157it [00:07, 21.79it/s] 160it [00:07, 21.82it/s] 163it [00:07, 21.76it/s] 166it [00:07, 21.71it/s] 169it [00:07, 21.73it/s] 172it [00:07, 21.67it/s] 175it [00:08, 21.61it/s] 178it [00:08, 21.61it/s] 181it [00:08, 21.62it/s] 184it [00:08, 21.55it/s] 187it [00:08, 21.58it/s] 190it [00:08, 21.69it/s] 193it [00:08, 21.69it/s] 196it [00:09, 20.66it/s] 196it [00:09, 21.58it/s] +2025-05-26 01:02:55,991 - INFO - Epoch: 80, Objective: tensor([1351.9658], device='cuda:0', grad_fn=), Loss: 0.0016598873771727085, KL/n: 22.529890060424805 + 0it [00:00, ?it/s]2025-05-26 01:02:56,403 - INFO - [Epoch 081 | Batch 0000] IWAE-loss 1600.7882 | mean log_px -0.0071 | KL -1105.29 + 1it [00:00, 7.09it/s] 4it [00:00, 15.68it/s] 7it [00:00, 18.38it/s] 10it [00:00, 19.79it/s] 13it [00:00, 20.57it/s] 16it [00:00, 21.02it/s] 19it [00:00, 21.21it/s] 22it [00:01, 21.33it/s] 25it [00:01, 21.29it/s] 28it [00:01, 21.45it/s] 31it [00:01, 21.21it/s] 34it [00:01, 20.96it/s] 37it [00:01, 20.99it/s] 40it [00:01, 21.23it/s] 43it [00:02, 21.37it/s] 46it [00:02, 21.48it/s] 49it [00:02, 21.28it/s]2025-05-26 01:02:58,738 - INFO - [Epoch 081 | Batch 0050] IWAE-loss 1251.4117 | mean log_px -0.0022 | KL -1098.32 + 52it [00:02, 21.07it/s] 55it [00:02, 21.32it/s] 58it [00:02, 21.39it/s] 61it [00:02, 21.47it/s] 64it [00:03, 21.52it/s] 67it [00:03, 21.24it/s] 70it [00:03, 21.26it/s] 73it [00:03, 21.46it/s] 76it [00:03, 21.46it/s] 79it [00:03, 21.26it/s] 82it [00:03, 21.26it/s] 85it [00:04, 21.45it/s] 88it [00:04, 21.49it/s] 91it [00:04, 21.63it/s] 94it [00:04, 21.60it/s] 97it [00:04, 21.17it/s] 100it [00:04, 21.38it/s]2025-05-26 01:03:01,075 - INFO - [Epoch 081 | Batch 0100] IWAE-loss 1582.2231 | mean log_px -0.0070 | KL -1094.54 + 103it [00:04, 21.33it/s] 106it [00:05, 21.44it/s] 109it [00:05, 21.14it/s] 112it [00:05, 21.22it/s] 115it [00:05, 21.44it/s] 118it [00:05, 21.56it/s] 121it [00:05, 21.28it/s] 124it [00:05, 21.07it/s] 127it [00:06, 21.19it/s] 130it [00:06, 21.20it/s] 133it [00:06, 21.16it/s] 136it [00:06, 21.25it/s] 139it [00:06, 21.45it/s] 142it [00:06, 21.44it/s] 145it [00:06, 21.51it/s] 148it [00:07, 21.62it/s]2025-05-26 01:03:03,411 - INFO - [Epoch 081 | Batch 0150] IWAE-loss 1250.8032 | mean log_px -0.0022 | KL -1098.59 + 151it [00:07, 21.68it/s] 154it [00:07, 21.71it/s] 157it [00:07, 21.78it/s] 160it [00:07, 21.63it/s] 163it [00:07, 21.73it/s] 166it [00:07, 21.11it/s] 169it [00:07, 21.26it/s] 172it [00:08, 21.41it/s] 175it [00:08, 21.56it/s] 178it [00:08, 21.27it/s] 181it [00:08, 21.30it/s] 184it [00:08, 21.01it/s] 187it [00:08, 21.19it/s] 190it [00:08, 21.28it/s] 193it [00:09, 21.30it/s] 196it [00:09, 20.22it/s] 196it [00:09, 20.97it/s] +2025-05-26 01:03:05,638 - INFO - Epoch: 81, Objective: tensor([1537.8092], device='cuda:0', grad_fn=), Loss: 0.006072376389056444, KL/n: 22.388904571533203 + 0it [00:00, ?it/s]2025-05-26 01:03:05,876 - INFO - [Epoch 082 | Batch 0000] IWAE-loss 1251.9319 | mean log_px -0.0022 | KL -1100.45 + 1it [00:00, 7.34it/s] 4it [00:00, 15.77it/s] 7it [00:00, 18.43it/s] 10it [00:00, 18.91it/s] 12it [00:00, 18.84it/s] 14it [00:00, 18.86it/s] 16it [00:00, 19.04it/s] 18it [00:00, 19.20it/s] 20it [00:01, 19.29it/s] 22it [00:01, 19.39it/s] 24it [00:01, 19.41it/s] 26it [00:01, 19.45it/s] 28it [00:01, 19.50it/s] 30it [00:01, 19.49it/s] 32it [00:01, 19.52it/s] 34it [00:01, 19.46it/s] 36it [00:01, 19.49it/s] 39it [00:02, 20.42it/s] 42it [00:02, 20.53it/s] 45it [00:02, 20.23it/s] 48it [00:02, 20.40it/s]2025-05-26 01:03:08,370 - INFO - [Epoch 082 | Batch 0050] IWAE-loss 1256.3951 | mean log_px -0.0023 | KL -1097.95 + 51it [00:02, 20.68it/s] 54it [00:02, 20.98it/s] 57it [00:02, 21.08it/s] 60it [00:03, 20.84it/s] 63it [00:03, 21.02it/s] 66it [00:03, 21.20it/s] 69it [00:03, 21.23it/s] 72it [00:03, 21.38it/s] 75it [00:03, 21.43it/s] 78it [00:03, 21.42it/s] 81it [00:04, 21.33it/s] 84it [00:04, 21.48it/s] 87it [00:04, 21.56it/s] 90it [00:04, 21.64it/s] 93it [00:04, 21.76it/s] 96it [00:04, 22.00it/s] 99it [00:04, 21.97it/s]2025-05-26 01:03:10,687 - INFO - [Epoch 082 | Batch 0100] IWAE-loss 1347.2388 | mean log_px -0.0036 | KL -1096.69 + 102it [00:04, 21.86it/s] 105it [00:05, 21.94it/s] 108it [00:05, 21.97it/s] 111it [00:05, 21.50it/s] 114it [00:05, 21.34it/s] 117it [00:05, 21.18it/s] 120it [00:05, 21.22it/s] 123it [00:05, 21.37it/s] 126it [00:06, 21.21it/s] 129it [00:06, 21.51it/s] 132it [00:06, 21.57it/s] 135it [00:06, 21.73it/s] 138it [00:06, 21.81it/s] 141it [00:06, 21.84it/s] 144it [00:06, 21.85it/s] 147it [00:07, 21.93it/s] 150it [00:07, 21.72it/s]2025-05-26 01:03:13,008 - INFO - [Epoch 082 | Batch 0150] IWAE-loss 1190.9883 | mean log_px -0.0014 | KL -1095.24 + 153it [00:07, 21.28it/s] 156it [00:07, 21.54it/s] 159it [00:07, 21.68it/s] 162it [00:07, 21.95it/s] 165it [00:07, 21.94it/s] 168it [00:08, 21.97it/s] 171it [00:08, 22.04it/s] 174it [00:08, 22.08it/s] 177it [00:08, 22.05it/s] 180it [00:08, 21.69it/s] 183it [00:08, 21.66it/s] 186it [00:08, 20.95it/s] 189it [00:09, 21.14it/s] 192it [00:09, 21.35it/s] 195it [00:09, 20.43it/s] 196it [00:09, 20.79it/s] +2025-05-26 01:03:15,193 - INFO - Epoch: 82, Objective: tensor([1430.6716], device='cuda:0', grad_fn=), Loss: 0.0028925351798534393, KL/n: 22.34264373779297 + 0it [00:00, ?it/s]2025-05-26 01:03:15,743 - INFO - [Epoch 083 | Batch 0000] IWAE-loss 1135.5509 | mean log_px -0.0006 | KL -1093.27 + 1it [00:00, 3.56it/s] 4it [00:00, 11.08it/s] 7it [00:00, 15.10it/s] 10it [00:00, 17.46it/s] 13it [00:00, 18.90it/s] 16it [00:00, 19.94it/s] 19it [00:01, 20.63it/s] 22it [00:01, 21.12it/s] 25it [00:01, 21.30it/s] 28it [00:01, 21.47it/s] 31it [00:01, 21.67it/s] 34it [00:01, 21.72it/s] 37it [00:01, 21.86it/s] 40it [00:02, 21.86it/s] 43it [00:02, 21.88it/s] 46it [00:02, 21.94it/s] 49it [00:02, 22.02it/s]2025-05-26 01:03:18,022 - INFO - [Epoch 083 | Batch 0050] IWAE-loss 2081.0850 | mean log_px -0.0141 | KL -1092.85 + 52it [00:02, 21.94it/s] 55it [00:02, 22.01it/s] 58it [00:02, 22.04it/s] 61it [00:03, 22.01it/s] 64it [00:03, 21.99it/s] 67it [00:03, 22.00it/s] 70it [00:03, 22.05it/s] 73it [00:03, 22.08it/s] 76it [00:03, 22.10it/s] 79it [00:03, 22.11it/s] 82it [00:03, 22.10it/s] 85it [00:04, 22.16it/s] 88it [00:04, 22.10it/s] 91it [00:04, 22.11it/s] 94it [00:04, 22.11it/s] 97it [00:04, 22.08it/s] 100it [00:04, 21.93it/s]2025-05-26 01:03:20,292 - INFO - [Epoch 083 | Batch 0100] IWAE-loss 1284.4880 | mean log_px -0.0028 | KL -1088.75 + 103it [00:04, 21.70it/s] 106it [00:05, 21.80it/s] 109it [00:05, 21.89it/s] 112it [00:05, 21.98it/s] 115it [00:05, 21.64it/s] 118it [00:05, 21.67it/s] 121it [00:05, 21.75it/s] 124it [00:05, 22.03it/s] 127it [00:06, 22.39it/s] 130it [00:06, 22.63it/s] 133it [00:06, 22.76it/s] 136it [00:06, 22.84it/s] 139it [00:06, 23.09it/s] 142it [00:06, 23.17it/s] 145it [00:06, 23.23it/s] 148it [00:06, 23.11it/s]2025-05-26 01:03:22,509 - INFO - [Epoch 083 | Batch 0150] IWAE-loss 1417.4686 | mean log_px -0.0047 | KL -1091.69 + 151it [00:07, 23.07it/s] 154it [00:07, 23.15it/s] 157it [00:07, 23.25it/s] 160it [00:07, 23.23it/s] 163it [00:07, 23.23it/s] 166it [00:07, 23.21it/s] 169it [00:07, 23.29it/s] 172it [00:07, 23.33it/s] 175it [00:08, 23.35it/s] 178it [00:08, 23.38it/s] 181it [00:08, 23.39it/s] 184it [00:08, 23.39it/s] 187it [00:08, 23.14it/s] 190it [00:08, 22.66it/s] 193it [00:08, 22.83it/s] 196it [00:09, 22.00it/s] 196it [00:09, 21.61it/s] +2025-05-26 01:03:24,557 - INFO - Epoch: 83, Objective: tensor([1587.5281], device='cuda:0', grad_fn=), Loss: 0.004302951041609049, KL/n: 22.29305076599121 + 0it [00:00, ?it/s]2025-05-26 01:03:24,975 - INFO - [Epoch 084 | Batch 0000] IWAE-loss 1551.5254 | mean log_px -0.0066 | KL -1091.30 + 1it [00:00, 7.75it/s] 4it [00:00, 16.89it/s] 7it [00:00, 19.76it/s] 10it [00:00, 21.01it/s] 13it [00:00, 21.59it/s] 16it [00:00, 22.10it/s] 19it [00:00, 22.39it/s] 22it [00:01, 22.61it/s] 25it [00:01, 22.77it/s] 28it [00:01, 22.66it/s] 31it [00:01, 22.71it/s] 34it [00:01, 22.82it/s] 37it [00:01, 23.00it/s] 40it [00:01, 22.97it/s] 43it [00:01, 23.05it/s] 46it [00:02, 23.11it/s] 49it [00:02, 23.09it/s]2025-05-26 01:03:27,149 - INFO - [Epoch 084 | Batch 0050] IWAE-loss 1144.9756 | mean log_px -0.0008 | KL -1088.44 + 52it [00:02, 23.01it/s] 55it [00:02, 22.96it/s] 58it [00:02, 23.00it/s] 61it [00:02, 23.01it/s] 64it [00:02, 23.00it/s] 67it [00:02, 23.03it/s] 70it [00:03, 23.06it/s] 73it [00:03, 23.11it/s] 76it [00:03, 23.17it/s] 79it [00:03, 23.20it/s] 82it [00:03, 23.16it/s] 85it [00:03, 23.16it/s] 88it [00:03, 23.14it/s] 91it [00:04, 23.16it/s] 94it [00:04, 23.03it/s] 97it [00:04, 23.07it/s] 100it [00:04, 22.79it/s]2025-05-26 01:03:29,322 - INFO - [Epoch 084 | Batch 0100] IWAE-loss 1653.5281 | mean log_px -0.0081 | KL -1086.56 + 103it [00:04, 22.60it/s] 106it [00:04, 22.52it/s] 109it [00:04, 22.65it/s] 112it [00:04, 22.62it/s] 115it [00:05, 22.68it/s] 118it [00:05, 22.79it/s] 121it [00:05, 22.89it/s] 124it [00:05, 22.97it/s] 127it [00:05, 23.02it/s] 130it [00:05, 23.04it/s] 133it [00:05, 22.97it/s] 136it [00:06, 23.01it/s] 139it [00:06, 23.07it/s] 142it [00:06, 23.10it/s] 145it [00:06, 23.07it/s] 148it [00:06, 22.99it/s]2025-05-26 01:03:31,504 - INFO - [Epoch 084 | Batch 0150] IWAE-loss 1298.2114 | mean log_px -0.0031 | KL -1084.70 + 151it [00:06, 22.99it/s] 154it [00:06, 23.02it/s] 157it [00:06, 22.94it/s] 160it [00:07, 22.77it/s] 163it [00:07, 22.81it/s] 166it [00:07, 22.70it/s] 169it [00:07, 22.72it/s] 172it [00:07, 22.69it/s] 175it [00:07, 22.69it/s] 178it [00:07, 22.83it/s] 181it [00:07, 22.91it/s] 184it [00:08, 22.77it/s] 187it [00:08, 22.63it/s] 190it [00:08, 22.74it/s] 193it [00:08, 22.83it/s] 196it [00:08, 22.12it/s] 196it [00:08, 22.49it/s] +2025-05-26 01:03:33,584 - INFO - Epoch: 84, Objective: tensor([1278.3981], device='cuda:0', grad_fn=), Loss: 0.0019393458496779203, KL/n: 22.202301025390625 + 0it [00:00, ?it/s]2025-05-26 01:03:33,816 - INFO - [Epoch 085 | Batch 0000] IWAE-loss 1297.9139 | mean log_px -0.0030 | KL -1086.36 + 1it [00:00, 7.63it/s] 4it [00:00, 15.98it/s] 7it [00:00, 19.17it/s] 10it [00:00, 20.72it/s] 13it [00:00, 21.61it/s] 16it [00:00, 21.58it/s] 19it [00:00, 22.05it/s] 22it [00:01, 22.42it/s] 25it [00:01, 22.61it/s] 28it [00:01, 22.67it/s] 31it [00:01, 22.28it/s] 34it [00:01, 22.52it/s] 37it [00:01, 22.32it/s] 40it [00:01, 22.34it/s] 43it [00:01, 22.48it/s] 46it [00:02, 22.52it/s] 49it [00:02, 22.32it/s]2025-05-26 01:03:36,047 - INFO - [Epoch 085 | Batch 0050] IWAE-loss 1220.5857 | mean log_px -0.0019 | KL -1084.63 + 52it [00:02, 21.66it/s] 55it [00:02, 21.93it/s] 58it [00:02, 21.86it/s] 61it [00:02, 22.06it/s] 64it [00:02, 22.07it/s] 67it [00:03, 22.04it/s] 70it [00:03, 21.79it/s] 73it [00:03, 21.70it/s] 76it [00:03, 21.79it/s] 79it [00:03, 21.29it/s] 82it [00:03, 21.43it/s] 85it [00:03, 21.44it/s] 88it [00:04, 21.14it/s] 91it [00:04, 20.66it/s] 94it [00:04, 20.44it/s] 97it [00:04, 20.58it/s] 100it [00:04, 20.71it/s]2025-05-26 01:03:38,399 - INFO - [Epoch 085 | Batch 0100] IWAE-loss 1190.2637 | mean log_px -0.0016 | KL -1081.08 + 103it [00:04, 20.85it/s] 106it [00:04, 20.75it/s] 109it [00:05, 20.76it/s] 112it [00:05, 20.43it/s] 115it [00:05, 20.73it/s] 118it [00:05, 21.10it/s] 121it [00:05, 21.42it/s] 124it [00:05, 21.51it/s] 127it [00:05, 21.69it/s] 130it [00:06, 21.55it/s] 133it [00:06, 21.48it/s] 136it [00:06, 21.51it/s] 139it [00:06, 21.67it/s] 142it [00:06, 21.93it/s] 145it [00:06, 21.50it/s] 148it [00:06, 21.42it/s]2025-05-26 01:03:40,739 - INFO - [Epoch 085 | Batch 0150] IWAE-loss 1891.0696 | mean log_px -0.0116 | KL -1079.97 + 151it [00:07, 21.36it/s] 154it [00:07, 21.48it/s] 157it [00:07, 21.63it/s] 160it [00:07, 21.76it/s] 163it [00:07, 21.82it/s] 166it [00:07, 21.67it/s] 169it [00:07, 21.18it/s] 172it [00:08, 21.12it/s] 175it [00:08, 20.99it/s] 178it [00:08, 20.98it/s] 181it [00:08, 20.87it/s] 184it [00:08, 21.13it/s] 187it [00:08, 21.08it/s] 190it [00:08, 21.35it/s] 193it [00:09, 20.93it/s] 196it [00:09, 20.44it/s] 196it [00:09, 21.19it/s] +2025-05-26 01:03:42,957 - INFO - Epoch: 85, Objective: tensor([1864.8672], device='cuda:0', grad_fn=), Loss: 0.013502722606062889, KL/n: 22.042320251464844 + 0it [00:00, ?it/s]2025-05-26 01:03:43,206 - INFO - [Epoch 086 | Batch 0000] IWAE-loss 1319.3251 | mean log_px -0.0034 | KL -1079.25 + 1it [00:00, 6.73it/s] 4it [00:00, 15.31it/s] 7it [00:00, 18.44it/s] 10it [00:00, 19.66it/s] 13it [00:00, 20.48it/s] 16it [00:00, 21.18it/s] 19it [00:00, 21.43it/s] 22it [00:01, 21.62it/s] 25it [00:01, 21.27it/s] 28it [00:01, 21.42it/s] 31it [00:01, 21.51it/s] 34it [00:01, 21.67it/s] 37it [00:01, 21.56it/s] 40it [00:01, 21.65it/s] 43it [00:02, 21.78it/s] 46it [00:02, 21.57it/s] 49it [00:02, 21.53it/s]2025-05-26 01:03:45,511 - INFO - [Epoch 086 | Batch 0050] IWAE-loss 1137.4036 | mean log_px -0.0009 | KL -1074.95 + 52it [00:02, 21.65it/s] 55it [00:02, 21.81it/s] 58it [00:02, 21.70it/s] 61it [00:02, 21.64it/s] 64it [00:03, 21.59it/s] 67it [00:03, 21.77it/s] 70it [00:03, 21.89it/s] 73it [00:03, 21.99it/s] 76it [00:03, 22.04it/s] 79it [00:03, 22.09it/s] 82it [00:03, 22.22it/s] 85it [00:03, 22.35it/s] 88it [00:04, 22.29it/s] 91it [00:04, 22.40it/s] 94it [00:04, 21.80it/s] 97it [00:04, 21.77it/s] 100it [00:04, 21.79it/s]2025-05-26 01:03:47,788 - INFO - [Epoch 086 | Batch 0100] IWAE-loss 1209.6168 | mean log_px -0.0019 | KL -1074.95 + 103it [00:04, 21.80it/s] 106it [00:04, 21.82it/s] 109it [00:05, 21.82it/s] 112it [00:05, 21.48it/s] 115it [00:05, 21.25it/s] 118it [00:05, 20.85it/s] 121it [00:05, 20.85it/s] 124it [00:05, 20.73it/s] 127it [00:05, 20.90it/s] 130it [00:06, 21.01it/s] 133it [00:06, 21.02it/s] 136it [00:06, 21.14it/s] 139it [00:06, 21.37it/s] 142it [00:06, 21.45it/s] 145it [00:06, 21.23it/s] 148it [00:06, 21.43it/s]2025-05-26 01:03:50,145 - INFO - [Epoch 086 | Batch 0150] IWAE-loss 1378.2422 | mean log_px -0.0043 | KL -1074.91 + 151it [00:07, 21.43it/s] 154it [00:07, 21.24it/s] 157it [00:07, 21.51it/s] 160it [00:07, 21.54it/s] 163it [00:07, 21.64it/s] 166it [00:07, 21.75it/s] 169it [00:07, 21.83it/s] 172it [00:08, 21.74it/s] 175it [00:08, 21.38it/s] 178it [00:08, 21.54it/s] 181it [00:08, 21.67it/s] 184it [00:08, 21.39it/s] 187it [00:08, 21.36it/s] 190it [00:08, 21.44it/s] 193it [00:09, 21.51it/s] 196it [00:09, 20.46it/s] 196it [00:09, 21.18it/s] +2025-05-26 01:03:52,339 - INFO - Epoch: 86, Objective: tensor([1278.1052], device='cuda:0', grad_fn=), Loss: 0.002963890554383397, KL/n: 22.012950897216797 + 0it [00:00, ?it/s]2025-05-26 01:03:52,744 - INFO - [Epoch 087 | Batch 0000] IWAE-loss 1573.0793 | mean log_px -0.0071 | KL -1076.80 + 1it [00:00, 7.49it/s] 4it [00:00, 15.53it/s] 7it [00:00, 18.28it/s] 10it [00:00, 19.69it/s] 13it [00:00, 20.39it/s] 16it [00:00, 20.94it/s] 19it [00:00, 20.79it/s] 22it [00:01, 20.90it/s] 25it [00:01, 21.27it/s] 28it [00:01, 21.52it/s] 31it [00:01, 21.80it/s] 34it [00:01, 21.93it/s] 37it [00:01, 21.41it/s] 40it [00:01, 21.91it/s] 43it [00:02, 21.87it/s] 46it [00:02, 22.19it/s] 49it [00:02, 22.36it/s]2025-05-26 01:03:55,042 - INFO - [Epoch 087 | Batch 0050] IWAE-loss 1248.2985 | mean log_px -0.0025 | KL -1075.58 + 52it [00:02, 22.17it/s] 55it [00:02, 22.19it/s] 58it [00:02, 21.98it/s] 61it [00:02, 21.71it/s] 64it [00:03, 21.68it/s] 67it [00:03, 21.75it/s] 70it [00:03, 21.75it/s] 73it [00:03, 21.63it/s] 76it [00:03, 21.62it/s] 79it [00:03, 21.62it/s] 82it [00:03, 21.87it/s] 85it [00:03, 22.19it/s] 88it [00:04, 22.15it/s] 91it [00:04, 22.02it/s] 94it [00:04, 21.58it/s] 97it [00:04, 21.56it/s] 100it [00:04, 21.54it/s]2025-05-26 01:03:57,345 - INFO - [Epoch 087 | Batch 0100] IWAE-loss 1123.3193 | mean log_px -0.0007 | KL -1073.03 + 103it [00:04, 21.57it/s] 106it [00:04, 21.24it/s] 109it [00:05, 21.29it/s] 112it [00:05, 21.40it/s] 115it [00:05, 21.52it/s] 118it [00:05, 21.58it/s] 121it [00:05, 21.69it/s] 124it [00:05, 21.62it/s] 127it [00:05, 21.52it/s] 130it [00:06, 21.62it/s] 133it [00:06, 21.59it/s] 136it [00:06, 21.73it/s] 139it [00:06, 21.70it/s] 142it [00:06, 21.78it/s] 145it [00:06, 21.78it/s] 148it [00:06, 21.84it/s]2025-05-26 01:03:59,656 - INFO - [Epoch 087 | Batch 0150] IWAE-loss 1241.6970 | mean log_px -0.0024 | KL -1076.41 + 151it [00:07, 21.73it/s] 154it [00:07, 21.68it/s] 157it [00:07, 21.67it/s] 160it [00:07, 21.59it/s] 163it [00:07, 21.31it/s] 166it [00:07, 21.53it/s] 169it [00:07, 21.37it/s] 172it [00:08, 21.44it/s] 175it [00:08, 21.76it/s] 178it [00:08, 21.89it/s] 181it [00:08, 22.03it/s] 184it [00:08, 21.91it/s] 187it [00:08, 21.56it/s] 190it [00:08, 20.55it/s] 193it [00:09, 20.06it/s] 196it [00:09, 19.75it/s] 196it [00:09, 21.19it/s] +2025-05-26 01:04:01,888 - INFO - Epoch: 87, Objective: tensor([1877.4033], device='cuda:0', grad_fn=), Loss: 0.00889658648520708, KL/n: 21.967613220214844 + 0it [00:00, ?it/s]2025-05-26 01:04:02,128 - INFO - [Epoch 088 | Batch 0000] IWAE-loss 1148.5999 | mean log_px -0.0010 | KL -1075.44 + 1it [00:00, 7.75it/s] 4it [00:00, 16.50it/s] 7it [00:00, 19.13it/s] 10it [00:00, 20.39it/s] 13it [00:00, 21.14it/s] 16it [00:00, 21.58it/s] 19it [00:00, 21.84it/s] 22it [00:01, 22.00it/s] 25it [00:01, 22.10it/s] 28it [00:01, 22.12it/s] 31it [00:01, 22.18it/s] 34it [00:01, 22.27it/s] 37it [00:01, 22.29it/s] 40it [00:01, 22.23it/s] 43it [00:02, 22.26it/s] 46it [00:02, 22.28it/s] 49it [00:02, 22.29it/s]2025-05-26 01:04:04,371 - INFO - [Epoch 088 | Batch 0050] IWAE-loss 1201.1548 | mean log_px -0.0018 | KL -1075.26 + 52it [00:02, 22.25it/s] 55it [00:02, 22.16it/s] 58it [00:02, 22.25it/s] 61it [00:02, 22.23it/s] 64it [00:02, 22.26it/s] 67it [00:03, 22.28it/s] 70it [00:03, 22.32it/s] 73it [00:03, 22.35it/s] 76it [00:03, 22.06it/s] 79it [00:03, 22.38it/s] 82it [00:03, 22.56it/s] 85it [00:03, 22.58it/s] 88it [00:04, 22.72it/s] 91it [00:04, 22.79it/s] 94it [00:04, 22.84it/s] 97it [00:04, 22.66it/s] 100it [00:04, 22.57it/s]2025-05-26 01:04:06,597 - INFO - [Epoch 088 | Batch 0100] IWAE-loss 1168.8257 | mean log_px -0.0014 | KL -1071.57 + 103it [00:04, 22.47it/s] 106it [00:04, 22.43it/s] 109it [00:04, 22.30it/s] 112it [00:05, 22.26it/s] 115it [00:05, 22.32it/s] 118it [00:05, 22.35it/s] 121it [00:05, 22.34it/s] 124it [00:05, 22.38it/s] 127it [00:05, 22.17it/s] 130it [00:05, 22.16it/s] 133it [00:06, 22.20it/s] 136it [00:06, 22.24it/s] 139it [00:06, 22.28it/s] 142it [00:06, 22.32it/s] 145it [00:06, 22.32it/s] 148it [00:06, 22.32it/s]2025-05-26 01:04:08,845 - INFO - [Epoch 088 | Batch 0150] IWAE-loss 1215.9666 | mean log_px -0.0021 | KL -1072.03 + 151it [00:06, 22.12it/s] 154it [00:06, 22.03it/s] 157it [00:07, 22.01it/s] 160it [00:07, 21.36it/s] 163it [00:07, 20.86it/s] 166it [00:07, 21.03it/s] 169it [00:07, 21.14it/s] 172it [00:07, 21.26it/s] 175it [00:07, 21.35it/s] 178it [00:08, 21.43it/s] 181it [00:08, 21.43it/s] 184it [00:08, 21.46it/s] 187it [00:08, 21.40it/s] 190it [00:08, 21.55it/s] 193it [00:08, 21.74it/s] 196it [00:08, 20.52it/s] 196it [00:09, 21.69it/s] +2025-05-26 01:04:11,061 - INFO - Epoch: 88, Objective: tensor([1197.1827], device='cuda:0', grad_fn=), Loss: 0.0014175840187817812, KL/n: 21.834794998168945 + 0it [00:00, ?it/s]2025-05-26 01:04:11,589 - INFO - [Epoch 089 | Batch 0000] IWAE-loss 1161.0184 | mean log_px -0.0013 | KL -1067.50 + 1it [00:00, 3.83it/s] 4it [00:00, 11.63it/s] 7it [00:00, 15.89it/s] 10it [00:00, 18.47it/s] 13it [00:00, 20.09it/s] 16it [00:00, 21.13it/s] 19it [00:01, 21.71it/s] 22it [00:01, 22.19it/s] 25it [00:01, 22.51it/s] 28it [00:01, 22.73it/s] 31it [00:01, 22.45it/s] 34it [00:01, 22.30it/s] 37it [00:01, 22.17it/s] 40it [00:01, 22.14it/s] 43it [00:02, 22.57it/s] 46it [00:02, 22.75it/s] 49it [00:02, 22.78it/s]2025-05-26 01:04:13,782 - INFO - [Epoch 089 | Batch 0050] IWAE-loss 1237.9883 | mean log_px -0.0025 | KL -1064.17 + 52it [00:02, 22.89it/s] 55it [00:02, 22.97it/s] 58it [00:02, 23.05it/s] 61it [00:02, 23.13it/s] 64it [00:03, 23.19it/s] 67it [00:03, 23.15it/s] 70it [00:03, 23.09it/s] 73it [00:03, 23.18it/s] 76it [00:03, 23.21it/s] 79it [00:03, 23.23it/s] 82it [00:03, 23.24it/s] 85it [00:03, 23.24it/s] 88it [00:04, 23.25it/s] 91it [00:04, 23.24it/s] 94it [00:04, 23.23it/s] 97it [00:04, 23.21it/s] 100it [00:04, 23.08it/s]2025-05-26 01:04:15,938 - INFO - [Epoch 089 | Batch 0100] IWAE-loss 1486.8628 | mean log_px -0.0061 | KL -1063.10 + 103it [00:04, 23.06it/s] 106it [00:04, 23.08it/s] 109it [00:04, 23.16it/s] 112it [00:05, 23.20it/s] 115it [00:05, 23.25it/s] 118it [00:05, 23.25it/s] 121it [00:05, 23.16it/s] 124it [00:05, 23.17it/s] 127it [00:05, 23.21it/s] 130it [00:05, 23.18it/s] 133it [00:05, 23.13it/s] 136it [00:06, 23.17it/s] 139it [00:06, 23.22it/s] 142it [00:06, 23.21it/s] 145it [00:06, 23.20it/s] 148it [00:06, 23.23it/s]2025-05-26 01:04:18,093 - INFO - [Epoch 089 | Batch 0150] IWAE-loss 1530.6752 | mean log_px -0.0067 | KL -1061.20 + 151it [00:06, 23.20it/s] 154it [00:06, 23.20it/s] 157it [00:07, 23.14it/s] 160it [00:07, 23.28it/s] 163it [00:07, 23.33it/s] 166it [00:07, 23.36it/s] 169it [00:07, 23.40it/s] 172it [00:07, 23.43it/s] 175it [00:07, 23.44it/s] 178it [00:07, 23.38it/s] 181it [00:08, 23.36it/s] 184it [00:08, 23.27it/s] 187it [00:08, 23.01it/s] 190it [00:08, 22.96it/s] 193it [00:08, 23.04it/s] 196it [00:08, 21.89it/s] 196it [00:08, 22.30it/s] +2025-05-26 01:04:20,141 - INFO - Epoch: 89, Objective: tensor([1157.2705], device='cuda:0', grad_fn=), Loss: 0.001898336224257946, KL/n: 21.666675567626953 + 0it [00:00, ?it/s]2025-05-26 01:04:20,564 - INFO - [Epoch 090 | Batch 0000] IWAE-loss 1386.0161 | mean log_px -0.0046 | KL -1061.24 + 1it [00:00, 7.62it/s] 4it [00:00, 16.33it/s] 7it [00:00, 19.31it/s] 10it [00:00, 20.85it/s] 13it [00:00, 21.73it/s] 16it [00:00, 22.27it/s] 19it [00:00, 22.52it/s] 22it [00:01, 22.64it/s] 25it [00:01, 22.75it/s] 28it [00:01, 22.85it/s] 31it [00:01, 23.00it/s] 34it [00:01, 23.06it/s] 37it [00:01, 23.03it/s] 40it [00:01, 22.90it/s] 43it [00:01, 23.05it/s] 46it [00:02, 23.13it/s] 49it [00:02, 23.17it/s]2025-05-26 01:04:22,735 - INFO - [Epoch 090 | Batch 0050] IWAE-loss 1180.5347 | mean log_px -0.0017 | KL -1059.12 + 52it [00:02, 23.21it/s] 55it [00:02, 23.24it/s] 58it [00:02, 23.24it/s] 61it [00:02, 23.28it/s] 64it [00:02, 23.26it/s] 67it [00:02, 23.27it/s] 70it [00:03, 23.22it/s] 73it [00:03, 23.24it/s] 76it [00:03, 23.31it/s] 79it [00:03, 23.23it/s] 82it [00:03, 23.19it/s] 85it [00:03, 23.20it/s] 88it [00:03, 23.21it/s] 91it [00:04, 23.25it/s] 94it [00:04, 23.00it/s] 97it [00:04, 23.10it/s] 100it [00:04, 23.14it/s]2025-05-26 01:04:24,890 - INFO - [Epoch 090 | Batch 0100] IWAE-loss 1235.2122 | mean log_px -0.0026 | KL -1055.34 + 103it [00:04, 23.16it/s] 106it [00:04, 23.22it/s] 109it [00:04, 23.28it/s] 112it [00:04, 23.33it/s] 115it [00:05, 23.29it/s] 118it [00:05, 23.34it/s] 121it [00:05, 23.36it/s] 124it [00:05, 23.38it/s] 127it [00:05, 23.38it/s] 130it [00:05, 23.38it/s] 133it [00:05, 23.39it/s] 136it [00:05, 23.35it/s] 139it [00:06, 23.35it/s] 142it [00:06, 23.36it/s] 145it [00:06, 23.37it/s] 148it [00:06, 23.39it/s]2025-05-26 01:04:27,030 - INFO - [Epoch 090 | Batch 0150] IWAE-loss 1277.4537 | mean log_px -0.0032 | KL -1056.80 + 151it [00:06, 23.30it/s] 154it [00:06, 23.29it/s] 157it [00:06, 23.27it/s] 160it [00:06, 23.26it/s] 163it [00:07, 23.33it/s] 166it [00:07, 23.34it/s] 169it [00:07, 23.38it/s] 172it [00:07, 23.37it/s] 175it [00:07, 23.39it/s] 178it [00:07, 23.31it/s] 181it [00:07, 23.30it/s] 184it [00:08, 23.38it/s] 187it [00:08, 23.45it/s] 190it [00:08, 23.49it/s] 193it [00:08, 23.47it/s] 196it [00:08, 22.03it/s] 196it [00:08, 22.76it/s] +2025-05-26 01:04:29,069 - INFO - Epoch: 90, Objective: tensor([1520.1176], device='cuda:0', grad_fn=), Loss: 0.009523079730570316, KL/n: 21.633167266845703 + 0it [00:00, ?it/s]2025-05-26 01:04:29,300 - INFO - [Epoch 091 | Batch 0000] IWAE-loss 1401.9963 | mean log_px -0.0049 | KL -1058.18 + 1it [00:00, 8.02it/s] 4it [00:00, 16.26it/s] 7it [00:00, 18.93it/s] 10it [00:00, 19.98it/s] 13it [00:00, 20.33it/s] 16it [00:00, 20.81it/s] 19it [00:00, 21.17it/s] 22it [00:01, 21.48it/s] 25it [00:01, 21.70it/s] 28it [00:01, 21.72it/s] 31it [00:01, 22.01it/s] 34it [00:01, 21.22it/s] 37it [00:01, 21.01it/s] 40it [00:01, 21.04it/s] 43it [00:02, 21.06it/s] 46it [00:02, 21.07it/s] 49it [00:02, 21.10it/s]2025-05-26 01:04:31,638 - INFO - [Epoch 091 | Batch 0050] IWAE-loss 1179.7617 | mean log_px -0.0017 | KL -1058.91 + 52it [00:02, 21.07it/s] 55it [00:02, 20.99it/s] 58it [00:02, 21.06it/s] 61it [00:02, 21.01it/s] 64it [00:03, 20.91it/s] 67it [00:03, 20.84it/s] 70it [00:03, 20.93it/s] 73it [00:03, 20.98it/s] 76it [00:03, 20.97it/s] 79it [00:03, 21.05it/s] 82it [00:03, 21.07it/s] 85it [00:04, 21.18it/s] 88it [00:04, 21.45it/s] 91it [00:04, 21.37it/s] 94it [00:04, 21.21it/s] 97it [00:04, 21.31it/s] 100it [00:04, 21.49it/s]2025-05-26 01:04:34,000 - INFO - [Epoch 091 | Batch 0100] IWAE-loss 1402.5481 | mean log_px -0.0050 | KL -1053.83 + 103it [00:04, 21.59it/s] 106it [00:05, 21.73it/s] 109it [00:05, 21.73it/s] 112it [00:05, 21.36it/s] 115it [00:05, 21.54it/s] 118it [00:05, 21.68it/s] 121it [00:05, 21.71it/s] 124it [00:05, 21.79it/s] 127it [00:06, 21.89it/s] 130it [00:06, 21.90it/s] 133it [00:06, 21.69it/s] 136it [00:06, 21.80it/s] 139it [00:06, 21.79it/s] 142it [00:06, 21.86it/s] 145it [00:06, 21.90it/s] 148it [00:06, 21.90it/s]2025-05-26 01:04:36,292 - INFO - [Epoch 091 | Batch 0150] IWAE-loss 1406.9880 | mean log_px -0.0051 | KL -1052.66 + 151it [00:07, 21.86it/s] 154it [00:07, 21.91it/s] 157it [00:07, 21.97it/s] 160it [00:07, 21.97it/s] 163it [00:07, 21.98it/s] 166it [00:07, 21.91it/s] 169it [00:07, 21.85it/s] 172it [00:08, 21.78it/s] 175it [00:08, 21.84it/s] 178it [00:08, 21.92it/s] 181it [00:08, 22.00it/s] 184it [00:08, 22.05it/s] 187it [00:08, 22.08it/s] 190it [00:08, 22.08it/s] 193it [00:09, 22.10it/s] 196it [00:09, 21.27it/s] 196it [00:09, 21.21it/s] +2025-05-26 01:04:38,439 - INFO - Epoch: 91, Objective: tensor([1671.4491], device='cuda:0', grad_fn=), Loss: 0.011594868265092373, KL/n: 21.481624603271484 + 0it [00:00, ?it/s]2025-05-26 01:04:38,844 - INFO - [Epoch 092 | Batch 0000] IWAE-loss 1374.3456 | mean log_px -0.0046 | KL -1052.16 + 1it [00:00, 9.36it/s] 4it [00:00, 17.55it/s] 7it [00:00, 19.66it/s] 10it [00:00, 20.63it/s] 13it [00:00, 21.15it/s] 16it [00:00, 21.47it/s] 19it [00:00, 21.67it/s] 22it [00:01, 21.83it/s] 25it [00:01, 21.98it/s] 28it [00:01, 21.98it/s] 31it [00:01, 21.91it/s] 34it [00:01, 21.97it/s] 37it [00:01, 22.01it/s] 40it [00:01, 21.80it/s] 43it [00:02, 21.13it/s] 46it [00:02, 21.22it/s] 49it [00:02, 21.40it/s]2025-05-26 01:04:41,142 - INFO - [Epoch 092 | Batch 0050] IWAE-loss 1157.9886 | mean log_px -0.0014 | KL -1056.68 + 52it [00:02, 21.43it/s] 55it [00:02, 21.53it/s] 58it [00:02, 21.52it/s] 61it [00:02, 21.62it/s] 64it [00:03, 21.69it/s] 67it [00:03, 21.72it/s] 70it [00:03, 21.81it/s] 73it [00:03, 21.77it/s] 76it [00:03, 21.79it/s] 79it [00:03, 21.95it/s] 82it [00:03, 21.66it/s] 85it [00:03, 21.25it/s] 88it [00:04, 20.92it/s] 91it [00:04, 21.26it/s] 94it [00:04, 21.56it/s] 97it [00:04, 21.76it/s] 100it [00:04, 21.85it/s]2025-05-26 01:04:43,450 - INFO - [Epoch 092 | Batch 0100] IWAE-loss 1177.0540 | mean log_px -0.0017 | KL -1057.24 + 103it [00:04, 21.89it/s] 106it [00:04, 21.96it/s] 109it [00:05, 21.97it/s] 112it [00:05, 22.03it/s] 115it [00:05, 22.14it/s] 118it [00:05, 21.91it/s] 121it [00:05, 21.85it/s] 124it [00:05, 21.86it/s] 127it [00:05, 21.89it/s] 130it [00:06, 21.69it/s] 133it [00:06, 21.47it/s] 136it [00:06, 21.50it/s] 139it [00:06, 21.65it/s] 142it [00:06, 21.67it/s] 145it [00:06, 21.72it/s] 148it [00:06, 21.71it/s]2025-05-26 01:04:45,746 - INFO - [Epoch 092 | Batch 0150] IWAE-loss 1291.9728 | mean log_px -0.0033 | KL -1061.68 + 151it [00:07, 21.65it/s] 154it [00:07, 21.76it/s] 157it [00:07, 21.84it/s] 160it [00:07, 21.93it/s] 163it [00:07, 22.07it/s] 166it [00:07, 22.07it/s] 169it [00:07, 22.12it/s] 172it [00:07, 22.16it/s] 175it [00:08, 22.15it/s] 178it [00:08, 22.16it/s] 181it [00:08, 22.19it/s] 184it [00:08, 22.20it/s] 187it [00:08, 22.24it/s] 190it [00:08, 22.20it/s] 193it [00:08, 22.15it/s] 196it [00:09, 21.42it/s] 196it [00:09, 21.49it/s] +2025-05-26 01:04:47,881 - INFO - Epoch: 92, Objective: tensor([1443.8928], device='cuda:0', grad_fn=), Loss: 0.0040267230942845345, KL/n: 21.64792823791504 + 0it [00:00, ?it/s]2025-05-26 01:04:48,117 - INFO - [Epoch 093 | Batch 0000] IWAE-loss 1193.6648 | mean log_px -0.0019 | KL -1061.59 + 1it [00:00, 7.72it/s] 4it [00:00, 16.41it/s] 7it [00:00, 19.11it/s] 10it [00:00, 20.30it/s] 13it [00:00, 20.95it/s] 16it [00:00, 21.36it/s] 19it [00:00, 21.68it/s] 22it [00:01, 21.82it/s] 25it [00:01, 22.02it/s] 28it [00:01, 22.06it/s] 31it [00:01, 22.09it/s] 34it [00:01, 22.15it/s] 37it [00:01, 22.12it/s] 40it [00:01, 22.10it/s] 43it [00:02, 22.14it/s] 46it [00:02, 22.09it/s] 49it [00:02, 21.92it/s]2025-05-26 01:04:50,380 - INFO - [Epoch 093 | Batch 0050] IWAE-loss 2028.1854 | mean log_px -0.0139 | KL -1056.76 + 52it [00:02, 21.94it/s] 55it [00:02, 22.02it/s] 58it [00:02, 21.95it/s] 61it [00:02, 22.00it/s] 64it [00:02, 22.08it/s] 67it [00:03, 21.99it/s] 70it [00:03, 21.92it/s] 73it [00:03, 21.87it/s] 76it [00:03, 21.77it/s] 79it [00:03, 21.89it/s] 82it [00:03, 21.96it/s] 85it [00:03, 22.07it/s] 88it [00:04, 22.15it/s] 91it [00:04, 22.06it/s] 94it [00:04, 22.14it/s] 97it [00:04, 22.19it/s] 100it [00:04, 22.09it/s]2025-05-26 01:04:52,649 - INFO - [Epoch 093 | Batch 0100] IWAE-loss 1531.0540 | mean log_px -0.0068 | KL -1055.18 + 103it [00:04, 22.04it/s] 106it [00:04, 22.03it/s] 109it [00:05, 21.96it/s] 112it [00:05, 21.93it/s] 115it [00:05, 21.97it/s] 118it [00:05, 22.00it/s] 121it [00:05, 21.97it/s] 124it [00:05, 21.95it/s] 127it [00:05, 21.97it/s] 130it [00:05, 21.99it/s] 133it [00:06, 21.95it/s] 136it [00:06, 21.98it/s] 139it [00:06, 21.93it/s] 142it [00:06, 21.90it/s] 145it [00:06, 21.97it/s] 148it [00:06, 21.97it/s]2025-05-26 01:04:54,926 - INFO - [Epoch 093 | Batch 0150] IWAE-loss 1170.8704 | mean log_px -0.0016 | KL -1055.53 + 151it [00:06, 21.90it/s] 154it [00:07, 21.84it/s] 157it [00:07, 21.90it/s] 160it [00:07, 21.92it/s] 163it [00:07, 21.94it/s] 166it [00:07, 21.94it/s] 169it [00:07, 21.91it/s] 172it [00:07, 22.03it/s] 175it [00:08, 22.11it/s] 178it [00:08, 22.19it/s] 181it [00:08, 22.17it/s] 184it [00:08, 21.97it/s] 187it [00:08, 22.05it/s] 190it [00:08, 22.09it/s] 193it [00:08, 22.03it/s] 196it [00:08, 21.35it/s] 196it [00:09, 21.64it/s] +2025-05-26 01:04:57,069 - INFO - Epoch: 93, Objective: tensor([1207.0376], device='cuda:0', grad_fn=), Loss: 0.0009715722408145666, KL/n: 21.600297927856445 + 0it [00:00, ?it/s]2025-05-26 01:04:57,310 - INFO - [Epoch 094 | Batch 0000] IWAE-loss 1199.6726 | mean log_px -0.0020 | KL -1057.00 + 1it [00:00, 7.13it/s] 4it [00:00, 15.64it/s] 7it [00:00, 18.60it/s] 10it [00:00, 19.67it/s] 13it [00:00, 20.49it/s] 16it [00:00, 21.00it/s] 19it [00:00, 20.92it/s] 22it [00:01, 21.33it/s] 25it [00:01, 21.40it/s] 28it [00:01, 21.62it/s] 31it [00:01, 21.78it/s] 34it [00:01, 21.54it/s] 37it [00:01, 21.60it/s] 40it [00:01, 21.66it/s] 43it [00:02, 21.80it/s] 46it [00:02, 21.80it/s] 49it [00:02, 21.58it/s]2025-05-26 01:04:59,620 - INFO - [Epoch 094 | Batch 0050] IWAE-loss 1485.6306 | mean log_px -0.0062 | KL -1054.89 + 52it [00:02, 21.47it/s] 55it [00:02, 21.66it/s] 58it [00:02, 21.80it/s] 61it [00:02, 21.50it/s] 64it [00:03, 21.76it/s] 67it [00:03, 21.79it/s] 70it [00:03, 21.88it/s] 73it [00:03, 21.96it/s] 76it [00:03, 22.01it/s] 79it [00:03, 21.65it/s] 82it [00:03, 21.65it/s] 85it [00:04, 21.84it/s] 88it [00:04, 21.94it/s] 91it [00:04, 21.80it/s] 94it [00:04, 21.67it/s] 97it [00:04, 21.76it/s] 100it [00:04, 21.49it/s]2025-05-26 01:05:01,920 - INFO - [Epoch 094 | Batch 0100] IWAE-loss 1346.5598 | mean log_px -0.0042 | KL -1050.64 + 103it [00:04, 21.69it/s] 106it [00:04, 21.87it/s] 109it [00:05, 21.58it/s] 112it [00:05, 21.55it/s] 115it [00:05, 21.67it/s] 118it [00:05, 21.83it/s] 121it [00:05, 21.75it/s] 124it [00:05, 21.85it/s] 127it [00:05, 21.60it/s] 130it [00:06, 21.67it/s] 133it [00:06, 21.53it/s] 136it [00:06, 21.67it/s] 139it [00:06, 21.49it/s] 142it [00:06, 21.72it/s] 145it [00:06, 21.86it/s] 148it [00:06, 21.96it/s]2025-05-26 01:05:04,214 - INFO - [Epoch 094 | Batch 0150] IWAE-loss 1456.9805 | mean log_px -0.0058 | KL -1048.46 + 151it [00:07, 22.00it/s] 154it [00:07, 22.04it/s] 157it [00:07, 21.96it/s] 160it [00:07, 22.05it/s] 163it [00:07, 22.07it/s] 166it [00:07, 22.12it/s] 169it [00:07, 22.09it/s] 172it [00:07, 22.08it/s] 175it [00:08, 22.07it/s] 178it [00:08, 22.11it/s] 181it [00:08, 22.09it/s] 184it [00:08, 22.10it/s] 187it [00:08, 22.13it/s] 190it [00:08, 21.88it/s] 193it [00:08, 21.88it/s] 196it [00:09, 21.00it/s] 196it [00:09, 21.39it/s] +2025-05-26 01:05:06,362 - INFO - Epoch: 94, Objective: tensor([1213.5227], device='cuda:0', grad_fn=), Loss: 0.0016594186890870333, KL/n: 21.40274429321289 + 0it [00:00, ?it/s]2025-05-26 01:05:06,750 - INFO - [Epoch 095 | Batch 0000] IWAE-loss 1238.5165 | mean log_px -0.0027 | KL -1048.67 + 1it [00:00, 9.30it/s] 4it [00:00, 16.92it/s] 7it [00:00, 18.87it/s] 10it [00:00, 19.70it/s] 13it [00:00, 20.51it/s] 16it [00:00, 21.06it/s] 19it [00:00, 21.40it/s] 22it [00:01, 21.30it/s] 25it [00:01, 21.33it/s] 28it [00:01, 21.52it/s] 31it [00:01, 21.73it/s] 34it [00:01, 21.86it/s] 37it [00:01, 21.82it/s] 40it [00:01, 21.76it/s] 43it [00:02, 21.81it/s] 46it [00:02, 21.88it/s] 49it [00:02, 21.93it/s]2025-05-26 01:05:09,059 - INFO - [Epoch 095 | Batch 0050] IWAE-loss 1194.5355 | mean log_px -0.0021 | KL -1044.37 + 52it [00:02, 21.88it/s] 55it [00:02, 21.92it/s] 58it [00:02, 21.93it/s] 61it [00:02, 21.91it/s] 64it [00:03, 21.80it/s] 67it [00:03, 21.82it/s] 70it [00:03, 21.91it/s] 73it [00:03, 22.00it/s] 76it [00:03, 22.02it/s] 79it [00:03, 21.77it/s] 82it [00:03, 21.74it/s] 85it [00:03, 21.58it/s] 88it [00:04, 21.52it/s] 91it [00:04, 21.66it/s] 94it [00:04, 21.66it/s] 97it [00:04, 21.77it/s] 100it [00:04, 21.89it/s]2025-05-26 01:05:11,354 - INFO - [Epoch 095 | Batch 0100] IWAE-loss 1409.6202 | mean log_px -0.0052 | KL -1043.72 + 103it [00:04, 21.74it/s] 106it [00:04, 21.68it/s] 109it [00:05, 21.83it/s] 112it [00:05, 21.94it/s] 115it [00:05, 21.65it/s] 118it [00:05, 21.42it/s] 121it [00:05, 21.01it/s] 124it [00:05, 21.09it/s] 127it [00:05, 20.95it/s] 130it [00:06, 21.27it/s] 133it [00:06, 21.37it/s] 136it [00:06, 21.34it/s] 139it [00:06, 21.40it/s] 142it [00:06, 20.79it/s] 145it [00:06, 20.59it/s] 148it [00:06, 20.85it/s]2025-05-26 01:05:13,720 - INFO - [Epoch 095 | Batch 0150] IWAE-loss 1235.0898 | mean log_px -0.0027 | KL -1044.54 + 151it [00:07, 20.76it/s] 154it [00:07, 20.79it/s] 157it [00:07, 21.00it/s] 160it [00:07, 21.29it/s] 163it [00:07, 21.53it/s] 166it [00:07, 21.22it/s] 169it [00:07, 21.52it/s] 172it [00:08, 21.32it/s] 175it [00:08, 21.55it/s] 178it [00:08, 21.72it/s] 181it [00:08, 21.75it/s] 184it [00:08, 21.90it/s] 187it [00:08, 21.83it/s] 190it [00:08, 21.96it/s] 193it [00:09, 22.05it/s] 196it [00:09, 21.07it/s] 196it [00:09, 21.24it/s] +2025-05-26 01:05:15,899 - INFO - Epoch: 95, Objective: tensor([1647.0312], device='cuda:0', grad_fn=), Loss: 0.008857104927301407, KL/n: 21.305051803588867 + 0it [00:00, ?it/s]2025-05-26 01:05:16,138 - INFO - [Epoch 096 | Batch 0000] IWAE-loss 1608.9626 | mean log_px -0.0081 | KL -1044.60 + 1it [00:00, 7.46it/s] 4it [00:00, 16.16it/s] 7it [00:00, 18.91it/s] 10it [00:00, 20.22it/s] 13it [00:00, 20.96it/s] 16it [00:00, 21.44it/s] 19it [00:00, 21.73it/s] 22it [00:01, 21.95it/s] 25it [00:01, 22.05it/s] 28it [00:01, 22.14it/s] 31it [00:01, 22.13it/s] 34it [00:01, 22.01it/s] 37it [00:01, 22.08it/s] 40it [00:01, 22.11it/s] 43it [00:02, 22.10it/s] 46it [00:02, 22.17it/s] 49it [00:02, 22.21it/s]2025-05-26 01:05:18,391 - INFO - [Epoch 096 | Batch 0050] IWAE-loss 1205.4226 | mean log_px -0.0024 | KL -1040.42 + 52it [00:02, 22.00it/s] 55it [00:02, 22.03it/s] 58it [00:02, 21.98it/s] 61it [00:02, 22.02it/s] 64it [00:02, 21.95it/s] 67it [00:03, 21.83it/s] 70it [00:03, 21.67it/s] 73it [00:03, 21.73it/s] 76it [00:03, 21.79it/s] 79it [00:03, 21.88it/s] 82it [00:03, 21.99it/s] 85it [00:03, 22.05it/s] 88it [00:04, 22.09it/s] 91it [00:04, 22.04it/s] 94it [00:04, 22.04it/s] 97it [00:04, 22.00it/s] 100it [00:04, 22.02it/s]2025-05-26 01:05:20,672 - INFO - [Epoch 096 | Batch 0100] IWAE-loss 1127.3739 | mean log_px -0.0013 | KL -1038.50 + 103it [00:04, 22.07it/s] 106it [00:04, 22.08it/s] 109it [00:05, 22.13it/s] 112it [00:05, 22.19it/s] 115it [00:05, 22.20it/s] 118it [00:05, 22.14it/s] 121it [00:05, 22.13it/s] 124it [00:05, 22.19it/s] 127it [00:05, 22.16it/s] 130it [00:05, 22.15it/s] 133it [00:06, 22.15it/s] 136it [00:06, 22.10it/s] 139it [00:06, 22.17it/s] 142it [00:06, 22.26it/s] 145it [00:06, 22.19it/s] 148it [00:06, 22.13it/s]2025-05-26 01:05:22,927 - INFO - [Epoch 096 | Batch 0150] IWAE-loss 2036.7104 | mean log_px -0.0143 | KL -1036.73 + 151it [00:06, 22.15it/s] 154it [00:07, 22.23it/s] 157it [00:07, 22.24it/s] 160it [00:07, 22.28it/s] 163it [00:07, 22.34it/s] 166it [00:07, 22.28it/s] 169it [00:07, 22.28it/s] 172it [00:07, 22.35it/s] 175it [00:07, 22.39it/s] 178it [00:08, 22.39it/s] 181it [00:08, 22.41it/s] 184it [00:08, 22.40it/s] 187it [00:08, 22.42it/s] 190it [00:08, 22.38it/s] 193it [00:08, 22.33it/s] 196it [00:08, 21.39it/s] 196it [00:09, 21.75it/s] +2025-05-26 01:05:25,041 - INFO - Epoch: 96, Objective: tensor([2096.0850], device='cuda:0', grad_fn=), Loss: 0.016430232673883438, KL/n: 21.143293380737305 + 0it [00:00, ?it/s]2025-05-26 01:05:25,458 - INFO - [Epoch 097 | Batch 0000] IWAE-loss 1159.8892 | mean log_px -0.0018 | KL -1035.70 + 1it [00:00, 7.51it/s] 4it [00:00, 15.95it/s] 7it [00:00, 18.82it/s] 10it [00:00, 20.18it/s] 13it [00:00, 20.90it/s] 16it [00:00, 21.35it/s] 19it [00:00, 21.61it/s] 22it [00:01, 21.83it/s] 25it [00:01, 21.93it/s] 28it [00:01, 21.99it/s] 31it [00:01, 22.07it/s] 34it [00:01, 22.08it/s] 37it [00:01, 22.03it/s] 40it [00:01, 22.05it/s] 43it [00:02, 22.10it/s] 46it [00:02, 22.15it/s] 49it [00:02, 22.16it/s]2025-05-26 01:05:27,718 - INFO - [Epoch 097 | Batch 0050] IWAE-loss 1306.0013 | mean log_px -0.0039 | KL -1034.87 + 52it [00:02, 22.08it/s] 55it [00:02, 22.15it/s] 58it [00:02, 22.17it/s] 61it [00:02, 22.11it/s] 64it [00:02, 22.00it/s] 67it [00:03, 22.00it/s] 70it [00:03, 22.06it/s] 73it [00:03, 22.07it/s] 76it [00:03, 22.12it/s] 79it [00:03, 22.11it/s] 82it [00:03, 22.12it/s] 85it [00:03, 22.15it/s] 88it [00:04, 22.11it/s] 91it [00:04, 22.12it/s] 94it [00:04, 22.05it/s] 97it [00:04, 22.07it/s] 100it [00:04, 22.09it/s]2025-05-26 01:05:29,983 - INFO - [Epoch 097 | Batch 0100] IWAE-loss 1150.6831 | mean log_px -0.0017 | KL -1031.14 + 103it [00:04, 22.04it/s] 106it [00:04, 22.09it/s] 109it [00:05, 22.10it/s] 112it [00:05, 21.89it/s] 115it [00:05, 21.95it/s] 118it [00:05, 22.01it/s] 121it [00:05, 22.07it/s] 124it [00:05, 22.12it/s] 127it [00:05, 22.16it/s] 130it [00:05, 22.17it/s] 133it [00:06, 22.18it/s] 136it [00:06, 22.20it/s] 139it [00:06, 22.17it/s] 142it [00:06, 22.22it/s] 145it [00:06, 22.20it/s] 148it [00:06, 22.19it/s]2025-05-26 01:05:32,243 - INFO - [Epoch 097 | Batch 0150] IWAE-loss 1599.7991 | mean log_px -0.0081 | KL -1035.43 + 151it [00:06, 22.11it/s] 154it [00:07, 22.13it/s] 157it [00:07, 22.11it/s] 160it [00:07, 22.13it/s] 163it [00:07, 22.13it/s] 166it [00:07, 22.19it/s] 169it [00:07, 22.16it/s] 172it [00:07, 22.12it/s] 175it [00:08, 22.10it/s] 178it [00:08, 22.02it/s] 181it [00:08, 22.00it/s] 184it [00:08, 21.96it/s] 187it [00:08, 21.96it/s] 190it [00:08, 21.99it/s] 193it [00:08, 22.06it/s] 196it [00:08, 21.17it/s] 196it [00:09, 21.68it/s] +2025-05-26 01:05:34,392 - INFO - Epoch: 97, Objective: tensor([1189.8542], device='cuda:0', grad_fn=), Loss: 0.0062665208242833614, KL/n: 21.14239501953125 + 0it [00:00, ?it/s]2025-05-26 01:05:34,640 - INFO - [Epoch 098 | Batch 0000] IWAE-loss 1140.4578 | mean log_px -0.0015 | KL -1034.76 + 1it [00:00, 7.13it/s] 4it [00:00, 15.06it/s] 7it [00:00, 18.06it/s] 10it [00:00, 19.67it/s] 13it [00:00, 20.47it/s] 16it [00:00, 21.08it/s] 19it [00:00, 21.22it/s] 22it [00:01, 21.31it/s] 25it [00:01, 21.50it/s] 28it [00:01, 21.27it/s] 31it [00:01, 21.47it/s] 34it [00:01, 21.26it/s] 37it [00:01, 21.53it/s] 40it [00:01, 21.67it/s] 43it [00:02, 21.81it/s] 46it [00:02, 21.90it/s] 49it [00:02, 21.93it/s]2025-05-26 01:05:36,949 - INFO - [Epoch 098 | Batch 0050] IWAE-loss 1207.7708 | mean log_px -0.0025 | KL -1035.08 + 52it [00:02, 21.83it/s] 55it [00:02, 21.77it/s] 58it [00:02, 21.60it/s] 61it [00:02, 21.60it/s] 64it [00:03, 21.37it/s] 67it [00:03, 21.25it/s] 70it [00:03, 21.10it/s] 73it [00:03, 21.05it/s] 76it [00:03, 20.84it/s] 79it [00:03, 20.84it/s] 82it [00:03, 20.92it/s] 85it [00:04, 21.32it/s] 88it [00:04, 21.55it/s] 91it [00:04, 21.71it/s] 94it [00:04, 21.75it/s] 97it [00:04, 21.30it/s] 100it [00:04, 21.34it/s]2025-05-26 01:05:39,301 - INFO - [Epoch 098 | Batch 0100] IWAE-loss 1454.2094 | mean log_px -0.0060 | KL -1034.53 + 103it [00:04, 21.30it/s] 106it [00:05, 21.20it/s] 109it [00:05, 21.39it/s] 112it [00:05, 21.23it/s] 115it [00:05, 21.46it/s] 118it [00:05, 21.76it/s] 121it [00:05, 21.85it/s] 124it [00:05, 22.02it/s] 127it [00:05, 22.10it/s] 130it [00:06, 22.22it/s] 133it [00:06, 22.21it/s] 136it [00:06, 21.72it/s] 139it [00:06, 21.59it/s] 142it [00:06, 21.71it/s] 145it [00:06, 21.37it/s] 148it [00:06, 21.64it/s]2025-05-26 01:05:41,601 - INFO - [Epoch 098 | Batch 0150] IWAE-loss 1581.1775 | mean log_px -0.0078 | KL -1033.05 + 151it [00:07, 21.65it/s] 154it [00:07, 21.41it/s] 157it [00:07, 21.34it/s] 160it [00:07, 21.64it/s] 163it [00:07, 21.87it/s] 166it [00:07, 21.60it/s] 169it [00:07, 21.65it/s] 172it [00:08, 21.86it/s] 175it [00:08, 21.82it/s] 178it [00:08, 21.43it/s] 181it [00:08, 21.22it/s] 184it [00:08, 21.22it/s] 187it [00:08, 21.45it/s] 190it [00:08, 21.41it/s] 193it [00:09, 20.91it/s] 196it [00:09, 19.94it/s] 196it [00:09, 21.09it/s] +2025-05-26 01:05:43,822 - INFO - Epoch: 98, Objective: tensor([1348.1132], device='cuda:0', grad_fn=), Loss: 0.009120768867433071, KL/n: 21.109325408935547 + 0it [00:00, ?it/s]2025-05-26 01:05:44,371 - INFO - [Epoch 099 | Batch 0000] IWAE-loss 1104.5126 | mean log_px -0.0010 | KL -1033.89 + 1it [00:00, 3.68it/s] 4it [00:00, 11.22it/s] 7it [00:00, 14.82it/s] 10it [00:00, 17.10it/s] 13it [00:00, 19.05it/s] 16it [00:00, 20.33it/s] 19it [00:01, 21.19it/s] 22it [00:01, 21.74it/s] 25it [00:01, 22.19it/s] 28it [00:01, 22.57it/s] 31it [00:01, 22.64it/s] 34it [00:01, 22.81it/s] 37it [00:01, 22.89it/s] 40it [00:01, 23.02it/s] 43it [00:02, 22.96it/s] 46it [00:02, 23.12it/s] 49it [00:02, 23.21it/s]2025-05-26 01:05:46,573 - INFO - [Epoch 099 | Batch 0050] IWAE-loss 1190.6581 | mean log_px -0.0023 | KL -1033.13 + 52it [00:02, 23.11it/s] 55it [00:02, 23.13it/s] 58it [00:02, 23.19it/s] 61it [00:02, 23.22it/s] 64it [00:03, 23.24it/s] 67it [00:03, 23.28it/s] 70it [00:03, 23.25it/s] 73it [00:03, 23.22it/s] 76it [00:03, 23.21it/s] 79it [00:03, 23.19it/s] 82it [00:03, 23.21it/s] 85it [00:03, 23.23it/s] 88it [00:04, 23.19it/s] 91it [00:04, 23.24it/s] 94it [00:04, 23.28it/s] 97it [00:04, 23.27it/s] 100it [00:04, 23.25it/s]2025-05-26 01:05:48,724 - INFO - [Epoch 099 | Batch 0100] IWAE-loss 1522.8735 | mean log_px -0.0070 | KL -1034.59 + 103it [00:04, 23.17it/s] 106it [00:04, 23.20it/s] 109it [00:04, 23.17it/s] 112it [00:05, 23.22it/s] 115it [00:05, 23.28it/s] 118it [00:05, 23.30it/s] 121it [00:05, 23.31it/s] 124it [00:05, 23.34it/s] 127it [00:05, 23.37it/s] 130it [00:05, 23.37it/s] 133it [00:05, 23.36it/s] 136it [00:06, 23.37it/s] 139it [00:06, 23.35it/s] 142it [00:06, 23.37it/s] 145it [00:06, 23.41it/s] 148it [00:06, 23.36it/s]2025-05-26 01:05:50,867 - INFO - [Epoch 099 | Batch 0150] IWAE-loss 1226.3561 | mean log_px -0.0028 | KL -1032.36 + 151it [00:06, 23.32it/s] 154it [00:06, 23.33it/s] 157it [00:07, 23.38it/s] 160it [00:07, 23.40it/s] 163it [00:07, 23.44it/s] 166it [00:07, 23.54it/s] 169it [00:07, 23.49it/s] 172it [00:07, 23.51it/s] 175it [00:07, 23.46it/s] 178it [00:07, 23.39it/s] 181it [00:08, 23.39it/s] 184it [00:08, 23.34it/s] 187it [00:08, 23.39it/s] 190it [00:08, 23.39it/s] 193it [00:08, 23.48it/s] 196it [00:08, 22.01it/s] 196it [00:08, 22.33it/s] +2025-05-26 01:05:52,903 - INFO - Epoch: 99, Objective: tensor([1209.9446], device='cuda:0', grad_fn=), Loss: 0.002673196606338024, KL/n: 21.06758689880371 +2025-05-26 01:05:52,907 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 1it [00:00, 9.30it/s] 4it [00:00, 20.50it/s] 7it [00:00, 24.47it/s] 10it [00:00, 26.46it/s] 13it [00:00, 27.52it/s] 16it [00:00, 28.17it/s] 19it [00:00, 28.60it/s] 22it [00:00, 28.86it/s] 25it [00:00, 29.08it/s] 28it [00:01, 29.27it/s] 31it [00:01, 29.04it/s] 35it [00:01, 29.90it/s] 38it [00:01, 29.26it/s] 42it [00:01, 29.57it/s] 45it [00:01, 29.32it/s] 49it [00:01, 29.55it/s] 52it [00:01, 29.37it/s] 56it [00:01, 30.03it/s] 59it [00:02, 29.57it/s] 62it [00:02, 29.30it/s] 65it [00:02, 29.48it/s] 68it [00:02, 29.27it/s] 72it [00:02, 29.60it/s] 75it [00:02, 29.33it/s] 79it [00:02, 29.90it/s] 82it [00:02, 29.38it/s] 86it [00:02, 29.68it/s] 89it [00:03, 29.45it/s] 93it [00:03, 29.68it/s] 96it [00:03, 29.42it/s] 99it [00:03, 29.44it/s] 103it [00:03, 29.95it/s] 106it [00:03, 29.33it/s] 110it [00:03, 30.02it/s] 113it [00:03, 29.57it/s] 116it [00:04, 29.56it/s] 119it [00:04, 29.60it/s] 122it [00:04, 29.33it/s] 126it [00:04, 29.95it/s] 129it [00:04, 29.28it/s] 133it [00:04, 30.00it/s] 136it [00:04, 29.32it/s] 140it [00:04, 29.99it/s] 143it [00:04, 29.22it/s] 147it [00:05, 29.67it/s] 151it [00:05, 29.75it/s] 154it [00:05, 29.28it/s] 158it [00:05, 29.66it/s] 161it [00:05, 29.37it/s] 165it [00:05, 29.72it/s] 169it [00:05, 29.86it/s] 172it [00:05, 29.29it/s] 176it [00:06, 29.81it/s] 179it [00:06, 29.75it/s] 182it [00:06, 29.04it/s] 186it [00:06, 28.52it/s] 189it [00:06, 28.80it/s] 192it [00:06, 28.66it/s] 195it [00:06, 28.81it/s] 199it [00:06, 29.10it/s] 203it [00:06, 29.58it/s] 206it [00:07, 29.33it/s] 210it [00:07, 29.39it/s] 214it [00:07, 29.77it/s] 217it [00:07, 29.30it/s] 221it [00:07, 29.59it/s] 224it [00:07, 29.29it/s] 227it [00:07, 29.40it/s] 230it [00:07, 29.34it/s] 233it [00:07, 28.68it/s] 237it [00:08, 29.24it/s] 241it [00:08, 29.49it/s] 244it [00:08, 29.22it/s] 247it [00:08, 29.12it/s] 250it [00:08, 29.01it/s] 253it [00:08, 28.49it/s] 256it [00:08, 28.61it/s] 260it [00:08, 29.34it/s] 263it [00:09, 29.12it/s] 266it [00:09, 29.35it/s] 270it [00:09, 29.79it/s] 273it [00:09, 28.95it/s] 277it [00:09, 29.83it/s] 280it [00:09, 27.91it/s] 280it [00:09, 28.93it/s] +2025-05-26 01:06:02,931 - INFO - Epoch: 0, Objective: 0.01669873297214508, Loss: 0.008642598986625671, KL/n: 0.008056134916841984 + 0%| | 0/84 [00:00), Loss: 0.11140021681785583, KL/n: 71.59821319580078 + 0it [00:00, ?it/s]2025-05-26 01:18:27,610 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 11894.2480 | mean log_px -0.1369 | KL -3499.28 + 1it [00:00, 3.18it/s] 2it [00:00, 3.60it/s] 3it [00:00, 3.66it/s] 4it [00:01, 3.82it/s] 5it [00:01, 3.93it/s] 6it [00:01, 4.11it/s] 7it [00:01, 4.10it/s] 8it [00:02, 4.18it/s] 9it [00:02, 4.16it/s] 10it [00:02, 4.14it/s] 11it [00:02, 3.98it/s] 12it [00:03, 4.03it/s] 13it [00:03, 4.11it/s] 14it [00:03, 4.21it/s] 15it [00:03, 4.17it/s] 16it [00:03, 4.22it/s] 17it [00:04, 4.22it/s] 18it [00:04, 4.33it/s] 19it [00:04, 4.41it/s] 20it [00:04, 4.42it/s] 21it [00:05, 4.37it/s] 22it [00:05, 4.42it/s] 23it [00:05, 4.36it/s] 24it [00:05, 4.44it/s] 25it [00:05, 4.40it/s] 26it [00:06, 4.10it/s] 27it [00:06, 4.17it/s] 28it [00:06, 4.14it/s] 29it [00:06, 4.23it/s] 30it [00:07, 4.24it/s] 31it [00:07, 4.21it/s] 32it [00:07, 4.31it/s] 33it [00:07, 4.07it/s] 34it [00:08, 4.20it/s] 35it [00:08, 4.21it/s] 36it [00:08, 4.24it/s] 37it [00:08, 4.19it/s] 38it [00:09, 4.14it/s] 39it [00:09, 4.12it/s] 40it [00:09, 4.15it/s] 41it [00:09, 4.24it/s] 42it [00:10, 4.34it/s] 43it [00:10, 4.42it/s] 44it [00:10, 4.47it/s] 45it [00:10, 4.49it/s] 46it [00:10, 4.50it/s] 47it [00:11, 4.46it/s] 48it [00:11, 4.50it/s] 49it [00:11, 4.34it/s] 50it [00:11, 4.43it/s]2025-05-26 01:18:39,386 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 11227.0039 | mean log_px -0.1305 | KL -3490.07 + 51it [00:12, 4.25it/s] 52it [00:12, 4.20it/s] 53it [00:12, 4.30it/s] 54it [00:12, 4.23it/s] 55it [00:13, 4.19it/s] 56it [00:13, 4.17it/s] 57it [00:13, 4.27it/s] 58it [00:13, 4.26it/s] 59it [00:13, 4.23it/s] 60it [00:14, 4.23it/s] 61it [00:14, 4.22it/s] 62it [00:14, 4.31it/s] 63it [00:14, 4.24it/s] 64it [00:15, 4.24it/s] 65it [00:15, 4.28it/s] 66it [00:15, 4.36it/s] 67it [00:15, 4.40it/s] 68it [00:16, 4.34it/s] 69it [00:16, 4.37it/s] 70it [00:16, 4.43it/s] 71it [00:16, 4.38it/s] 72it [00:16, 4.30it/s] 73it [00:17, 4.23it/s] 74it [00:17, 4.18it/s] 75it [00:17, 4.19it/s] 76it [00:17, 4.28it/s] 77it [00:18, 4.38it/s] 78it [00:18, 4.38it/s] 79it [00:18, 4.28it/s] 80it [00:18, 4.31it/s] 81it [00:19, 4.19it/s] 82it [00:19, 4.12it/s] 83it [00:19, 4.16it/s] 84it [00:19, 4.13it/s] 85it [00:20, 4.13it/s] 86it [00:20, 4.14it/s] 87it [00:20, 4.17it/s] 88it [00:20, 4.01it/s] 89it [00:21, 4.03it/s] 90it [00:21, 4.00it/s] 91it [00:21, 4.06it/s] 92it [00:21, 3.89it/s] 93it [00:22, 3.99it/s] 94it [00:22, 4.01it/s] 95it [00:22, 4.12it/s] 96it [00:22, 4.03it/s] 97it [00:23, 4.04it/s] 98it [00:23, 4.04it/s] 99it [00:23, 4.09it/s] 100it [00:23, 4.21it/s]2025-05-26 01:18:51,292 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 8575.6543 | mean log_px -0.0730 | KL -3466.15 + 101it [00:23, 4.31it/s] 102it [00:24, 4.26it/s] 103it [00:24, 4.33it/s] 104it [00:24, 4.17it/s] 105it [00:24, 4.28it/s] 106it [00:25, 4.22it/s] 107it [00:25, 4.16it/s] 108it [00:25, 4.16it/s] 109it [00:25, 4.03it/s] 110it [00:26, 4.09it/s] 111it [00:26, 4.06it/s] 112it [00:26, 4.05it/s] 113it [00:26, 4.05it/s] 114it [00:27, 4.13it/s] 115it [00:27, 4.14it/s] 116it [00:27, 4.14it/s] 117it [00:27, 4.24it/s] 118it [00:28, 4.19it/s] 119it [00:28, 4.31it/s] 120it [00:28, 4.31it/s] 121it [00:28, 4.39it/s] 122it [00:28, 4.36it/s] 123it [00:29, 4.42it/s] 124it [00:29, 4.32it/s] 125it [00:29, 4.30it/s] 126it [00:29, 4.37it/s] 127it [00:30, 4.29it/s] 128it [00:30, 4.24it/s] 129it [00:30, 4.18it/s] 130it [00:30, 4.13it/s] 131it [00:31, 4.13it/s] 132it [00:31, 4.10it/s] 133it [00:31, 4.24it/s] 134it [00:31, 4.27it/s] 135it [00:32, 4.16it/s] 136it [00:32, 4.24it/s] 137it [00:32, 4.10it/s] 138it [00:32, 4.07it/s] 139it [00:33, 4.23it/s] 140it [00:33, 4.34it/s] 141it [00:33, 4.29it/s] 142it [00:33, 4.25it/s] 143it [00:33, 4.20it/s] 144it [00:34, 4.20it/s] 145it [00:34, 4.14it/s] 146it [00:34, 4.14it/s] 147it [00:34, 4.27it/s] 148it [00:35, 4.17it/s] 149it [00:35, 4.16it/s] 150it [00:35, 4.14it/s]2025-05-26 01:19:03,204 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 10918.8730 | mean log_px -0.1088 | KL -3451.89 + 151it [00:35, 4.04it/s] 152it [00:36, 4.11it/s] 153it [00:36, 4.14it/s] 154it [00:36, 4.14it/s] 155it [00:36, 4.14it/s] 156it [00:37, 4.17it/s] 157it [00:37, 4.21it/s] 158it [00:37, 4.19it/s] 159it [00:37, 4.31it/s] 160it [00:38, 4.41it/s] 161it [00:38, 4.22it/s] 162it [00:38, 4.26it/s] 163it [00:38, 4.21it/s] 164it [00:38, 4.29it/s] 165it [00:39, 4.37it/s] 166it [00:39, 4.28it/s] 167it [00:39, 4.25it/s] 168it [00:39, 4.12it/s] 169it [00:40, 4.23it/s] 170it [00:40, 4.30it/s] 171it [00:40, 4.30it/s] 172it [00:40, 4.17it/s] 173it [00:41, 4.29it/s] 174it [00:41, 4.31it/s] 175it [00:41, 4.29it/s] 176it [00:41, 4.23it/s] 177it [00:42, 4.22it/s] 178it [00:42, 4.13it/s] 179it [00:42, 4.16it/s] 180it [00:42, 4.21it/s] 181it [00:43, 4.08it/s] 182it [00:43, 4.17it/s] 183it [00:43, 4.13it/s] 184it [00:43, 4.13it/s] 185it [00:43, 4.12it/s] 186it [00:44, 4.10it/s] 187it [00:44, 4.07it/s] 188it [00:44, 4.19it/s] 189it [00:44, 4.29it/s] 190it [00:45, 4.21it/s] 191it [00:45, 4.22it/s] 192it [00:45, 4.17it/s] 193it [00:45, 4.15it/s] 194it [00:46, 4.18it/s] 195it [00:46, 4.09it/s] 196it [00:46, 4.22it/s] 196it [00:46, 4.20it/s] +2025-05-26 01:19:14,025 - INFO - Epoch: 1, Objective: tensor([9172.7520], device='cuda:0', grad_fn=), Loss: 0.07874009013175964, KL/n: 70.15756225585938 + 0it [00:00, ?it/s]2025-05-26 01:19:14,580 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 7225.7852 | mean log_px -0.0616 | KL -3439.12 + 1it [00:00, 2.96it/s] 2it [00:00, 3.72it/s] 3it [00:00, 4.04it/s] 4it [00:01, 4.22it/s] 5it [00:01, 4.29it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.45it/s] 8it [00:01, 4.50it/s] 9it [00:02, 4.38it/s] 10it [00:02, 4.44it/s] 11it [00:02, 4.49it/s] 12it [00:02, 4.50it/s] 13it [00:02, 4.55it/s] 14it [00:03, 4.55it/s] 15it [00:03, 4.55it/s] 16it [00:03, 4.51it/s] 17it [00:03, 4.46it/s] 18it [00:04, 4.36it/s] 19it [00:04, 4.44it/s] 20it [00:04, 4.48it/s] 21it [00:04, 4.51it/s] 22it [00:05, 4.52it/s] 23it [00:05, 4.43it/s] 24it [00:05, 4.46it/s] 25it [00:05, 4.42it/s] 26it [00:05, 4.44it/s] 27it [00:06, 4.38it/s] 28it [00:06, 4.40it/s] 29it [00:06, 4.43it/s] 30it [00:06, 4.44it/s] 31it [00:07, 4.49it/s] 32it [00:07, 4.34it/s] 33it [00:07, 4.42it/s] 34it [00:07, 4.45it/s] 35it [00:07, 4.48it/s] 36it [00:08, 4.50it/s] 37it [00:08, 4.54it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.56it/s] 40it [00:09, 4.52it/s] 41it [00:09, 4.53it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.54it/s] 44it [00:09, 4.53it/s] 45it [00:10, 4.37it/s] 46it [00:10, 4.41it/s] 47it [00:10, 4.47it/s] 48it [00:10, 4.50it/s] 49it [00:11, 4.46it/s] 50it [00:11, 4.49it/s]2025-05-26 01:19:25,765 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 7740.6035 | mean log_px -0.0618 | KL -3413.71 + 51it [00:11, 4.52it/s] 52it [00:11, 4.49it/s] 53it [00:11, 4.52it/s] 54it [00:12, 4.52it/s] 55it [00:12, 4.54it/s] 56it [00:12, 4.52it/s] 57it [00:12, 4.40it/s] 58it [00:13, 4.45it/s] 59it [00:13, 4.49it/s] 60it [00:13, 4.51it/s] 61it [00:13, 4.49it/s] 62it [00:13, 4.50it/s] 63it [00:14, 4.51it/s] 64it [00:14, 4.52it/s] 65it [00:14, 4.52it/s] 66it [00:14, 4.53it/s] 67it [00:15, 4.54it/s] 68it [00:15, 4.40it/s] 69it [00:15, 4.47it/s] 70it [00:15, 4.47it/s] 71it [00:15, 4.51it/s] 72it [00:16, 4.41it/s] 73it [00:16, 4.47it/s] 74it [00:16, 4.51it/s] 75it [00:16, 4.54it/s] 76it [00:17, 4.50it/s] 77it [00:17, 4.46it/s] 78it [00:17, 4.40it/s] 79it [00:17, 4.42it/s] 80it [00:17, 4.44it/s] 81it [00:18, 4.45it/s] 82it [00:18, 4.46it/s] 83it [00:18, 4.49it/s] 84it [00:18, 4.34it/s] 85it [00:19, 4.41it/s] 86it [00:19, 4.46it/s] 87it [00:19, 4.49it/s] 88it [00:19, 4.51it/s] 89it [00:19, 4.53it/s] 90it [00:20, 4.49it/s] 91it [00:20, 4.49it/s] 92it [00:20, 4.49it/s] 93it [00:20, 4.51it/s] 94it [00:21, 4.52it/s] 95it [00:21, 4.41it/s] 96it [00:21, 4.45it/s] 97it [00:21, 4.49it/s] 98it [00:21, 4.51it/s] 99it [00:22, 4.52it/s] 100it [00:22, 4.52it/s]2025-05-26 01:19:36,916 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 10890.5635 | mean log_px -0.1134 | KL -3399.14 + 101it [00:22, 4.54it/s] 102it [00:22, 4.52it/s] 103it [00:23, 4.55it/s] 104it [00:23, 4.56it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.56it/s] 107it [00:23, 4.43it/s] 108it [00:24, 4.48it/s] 109it [00:24, 4.53it/s] 110it [00:24, 4.50it/s] 111it [00:24, 4.50it/s] 112it [00:25, 4.52it/s] 113it [00:25, 4.53it/s] 114it [00:25, 4.55it/s] 115it [00:25, 4.48it/s] 116it [00:25, 4.35it/s] 117it [00:26, 4.43it/s] 118it [00:26, 4.47it/s] 119it [00:26, 4.49it/s] 120it [00:26, 4.50it/s] 121it [00:27, 4.39it/s] 122it [00:27, 4.44it/s] 123it [00:27, 4.49it/s] 124it [00:27, 4.49it/s] 125it [00:27, 4.52it/s] 126it [00:28, 4.49it/s] 127it [00:28, 4.52it/s] 128it [00:28, 4.40it/s] 129it [00:28, 4.46it/s] 130it [00:29, 4.50it/s] 131it [00:29, 4.53it/s] 132it [00:29, 4.54it/s] 133it [00:29, 4.55it/s] 134it [00:29, 4.56it/s] 135it [00:30, 4.42it/s] 136it [00:30, 4.45it/s] 137it [00:30, 4.46it/s] 138it [00:30, 4.49it/s] 139it [00:31, 4.52it/s] 140it [00:31, 4.53it/s] 141it [00:31, 4.55it/s] 142it [00:31, 4.38it/s] 143it [00:32, 4.45it/s] 144it [00:32, 4.47it/s] 145it [00:32, 4.48it/s] 146it [00:32, 4.51it/s] 147it [00:32, 4.51it/s] 148it [00:33, 4.48it/s] 149it [00:33, 4.39it/s] 150it [00:33, 4.45it/s]2025-05-26 01:19:48,066 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 6388.3467 | mean log_px -0.0455 | KL -3380.82 + 151it [00:33, 4.50it/s] 152it [00:34, 4.48it/s] 153it [00:34, 4.49it/s] 154it [00:34, 4.53it/s] 155it [00:34, 4.41it/s] 156it [00:34, 4.47it/s] 157it [00:35, 4.51it/s] 158it [00:35, 4.54it/s] 159it [00:35, 4.55it/s] 160it [00:35, 4.54it/s] 161it [00:36, 4.54it/s] 162it [00:36, 4.41it/s] 163it [00:36, 4.48it/s] 164it [00:36, 4.50it/s] 165it [00:36, 4.41it/s] 166it [00:37, 4.44it/s] 167it [00:37, 4.34it/s] 168it [00:37, 4.43it/s] 169it [00:37, 4.40it/s] 170it [00:38, 4.46it/s] 171it [00:38, 4.44it/s] 172it [00:38, 4.47it/s] 173it [00:38, 4.47it/s] 174it [00:38, 4.36it/s] 175it [00:39, 4.44it/s] 176it [00:39, 4.49it/s] 177it [00:39, 4.52it/s] 178it [00:39, 4.53it/s] 179it [00:40, 4.57it/s] 180it [00:40, 4.58it/s] 181it [00:40, 4.44it/s] 182it [00:40, 4.48it/s] 183it [00:40, 4.52it/s] 184it [00:41, 4.53it/s] 185it [00:41, 4.41it/s] 186it [00:41, 4.47it/s] 187it [00:41, 4.45it/s] 188it [00:42, 4.42it/s] 189it [00:42, 4.47it/s] 190it [00:42, 4.45it/s] 191it [00:42, 4.49it/s] 192it [00:42, 4.38it/s] 193it [00:43, 4.44it/s] 194it [00:43, 4.48it/s] 195it [00:43, 4.34it/s] 196it [00:43, 4.36it/s] 196it [00:43, 4.46it/s] +2025-05-26 01:19:58,278 - INFO - Epoch: 2, Objective: tensor([7126.1548], device='cuda:0', grad_fn=), Loss: 0.05375305190682411, KL/n: 68.71427154541016 + 0it [00:00, ?it/s]2025-05-26 01:19:58,659 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 6548.8511 | mean log_px -0.0590 | KL -3364.44 + 1it [00:00, 3.23it/s] 2it [00:00, 3.88it/s] 3it [00:00, 4.20it/s] 4it [00:00, 4.33it/s] 5it [00:01, 4.43it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.50it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.36it/s] 10it [00:02, 4.29it/s] 11it [00:02, 4.22it/s] 12it [00:02, 4.19it/s] 13it [00:03, 4.28it/s] 14it [00:03, 4.35it/s] 15it [00:03, 4.38it/s] 16it [00:03, 4.27it/s] 17it [00:03, 4.36it/s] 18it [00:04, 4.42it/s] 19it [00:04, 4.34it/s] 20it [00:04, 4.42it/s] 21it [00:04, 4.44it/s] 22it [00:05, 4.45it/s] 23it [00:05, 4.31it/s] 24it [00:05, 4.39it/s] 25it [00:05, 4.43it/s] 26it [00:05, 4.46it/s] 27it [00:06, 4.47it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.44it/s] 30it [00:06, 4.33it/s] 31it [00:07, 4.40it/s] 32it [00:07, 4.37it/s] 33it [00:07, 4.23it/s] 34it [00:07, 4.29it/s] 35it [00:08, 4.33it/s] 36it [00:08, 4.37it/s] 37it [00:08, 4.45it/s] 38it [00:08, 4.46it/s] 39it [00:08, 4.46it/s] 40it [00:09, 4.35it/s] 41it [00:09, 4.41it/s] 42it [00:09, 4.46it/s] 43it [00:09, 4.42it/s] 44it [00:10, 4.26it/s] 45it [00:10, 4.34it/s] 46it [00:10, 4.42it/s] 47it [00:10, 4.33it/s] 48it [00:11, 4.19it/s] 49it [00:11, 4.30it/s] 50it [00:11, 4.38it/s]2025-05-26 01:20:10,081 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 6395.8638 | mean log_px -0.0435 | KL -3348.27 + 51it [00:11, 4.26it/s] 52it [00:11, 4.33it/s] 53it [00:12, 4.36it/s] 54it [00:12, 4.42it/s] 55it [00:12, 4.33it/s] 56it [00:12, 4.36it/s] 57it [00:13, 4.43it/s] 58it [00:13, 4.45it/s] 59it [00:13, 4.50it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.42it/s] 62it [00:14, 4.44it/s] 63it [00:14, 4.49it/s] 64it [00:14, 4.36it/s] 65it [00:15, 3.40it/s] 66it [00:15, 3.67it/s] 67it [00:15, 3.88it/s] 68it [00:15, 4.07it/s] 69it [00:15, 4.17it/s] 70it [00:16, 4.23it/s] 71it [00:16, 4.33it/s] 72it [00:16, 4.38it/s] 73it [00:16, 4.37it/s] 74it [00:17, 4.29it/s] 75it [00:17, 4.36it/s] 76it [00:17, 4.43it/s] 77it [00:17, 4.48it/s] 78it [00:18, 4.50it/s] 79it [00:18, 4.54it/s] 80it [00:18, 4.39it/s] 81it [00:18, 4.44it/s] 82it [00:18, 4.34it/s] 83it [00:19, 4.43it/s] 84it [00:19, 4.48it/s] 85it [00:19, 4.50it/s] 86it [00:19, 4.36it/s] 87it [00:20, 4.42it/s] 88it [00:20, 4.41it/s] 89it [00:20, 4.42it/s] 90it [00:20, 4.44it/s] 91it [00:20, 4.34it/s] 92it [00:21, 4.25it/s] 93it [00:21, 4.33it/s] 94it [00:21, 4.40it/s] 95it [00:21, 4.42it/s] 96it [00:22, 4.40it/s] 97it [00:22, 4.32it/s] 98it [00:22, 4.38it/s] 99it [00:22, 4.30it/s] 100it [00:23, 4.33it/s]2025-05-26 01:20:21,620 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 6408.8643 | mean log_px -0.0460 | KL -3327.64 + 101it [00:23, 4.36it/s] 102it [00:23, 4.40it/s] 103it [00:23, 4.46it/s] 104it [00:23, 4.43it/s] 105it [00:24, 4.32it/s] 106it [00:24, 4.21it/s] 107it [00:24, 4.18it/s] 108it [00:24, 4.28it/s] 109it [00:25, 4.37it/s] 110it [00:25, 4.44it/s] 111it [00:25, 4.40it/s] 112it [00:25, 4.27it/s] 113it [00:26, 4.22it/s] 114it [00:26, 4.31it/s] 115it [00:26, 4.26it/s] 116it [00:26, 4.35it/s] 117it [00:26, 4.25it/s] 118it [00:27, 4.34it/s] 119it [00:27, 4.40it/s] 120it [00:27, 4.47it/s] 121it [00:27, 4.52it/s] 122it [00:28, 4.53it/s] 123it [00:28, 4.56it/s] 124it [00:28, 4.57it/s] 125it [00:28, 4.57it/s] 126it [00:28, 4.56it/s] 127it [00:29, 4.57it/s] 128it [00:29, 4.26it/s] 129it [00:29, 4.35it/s] 130it [00:29, 4.40it/s] 131it [00:30, 4.31it/s] 132it [00:30, 4.37it/s] 133it [00:30, 4.43it/s] 134it [00:30, 4.30it/s] 135it [00:31, 4.38it/s] 136it [00:31, 4.29it/s] 137it [00:31, 4.24it/s] 138it [00:31, 4.18it/s] 139it [00:32, 4.17it/s] 140it [00:32, 4.27it/s] 141it [00:32, 4.36it/s] 142it [00:32, 4.41it/s] 143it [00:32, 4.44it/s] 144it [00:33, 4.47it/s] 145it [00:33, 4.36it/s] 146it [00:33, 4.44it/s] 147it [00:33, 4.38it/s] 148it [00:34, 4.43it/s] 149it [00:34, 4.48it/s] 150it [00:34, 4.41it/s]2025-05-26 01:20:33,041 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 6867.9688 | mean log_px -0.0538 | KL -3303.91 + 151it [00:34, 4.44it/s] 152it [00:34, 4.35it/s] 153it [00:35, 4.42it/s] 154it [00:35, 4.47it/s] 155it [00:35, 4.46it/s] 156it [00:35, 4.50it/s] 157it [00:36, 4.53it/s] 158it [00:36, 4.21it/s] 159it [00:36, 4.12it/s] 160it [00:36, 4.06it/s] 161it [00:37, 4.10it/s] 162it [00:37, 4.22it/s] 163it [00:37, 4.32it/s] 164it [00:37, 4.38it/s] 165it [00:37, 4.43it/s] 166it [00:38, 4.42it/s] 167it [00:38, 4.45it/s] 168it [00:38, 4.48it/s] 169it [00:38, 4.48it/s] 170it [00:39, 4.52it/s] 171it [00:39, 4.53it/s] 172it [00:39, 4.54it/s] 173it [00:39, 4.56it/s] 174it [00:39, 4.38it/s] 175it [00:40, 4.43it/s] 176it [00:40, 4.47it/s] 177it [00:40, 4.45it/s] 178it [00:40, 4.36it/s] 179it [00:41, 4.28it/s] 180it [00:41, 4.36it/s] 181it [00:41, 4.42it/s] 182it [00:41, 4.45it/s] 183it [00:41, 4.49it/s] 184it [00:42, 4.37it/s] 185it [00:42, 4.26it/s] 186it [00:42, 4.34it/s] 187it [00:42, 4.42it/s] 188it [00:43, 4.44it/s] 189it [00:43, 4.46it/s] 190it [00:43, 4.51it/s] 191it [00:43, 4.53it/s] 192it [00:44, 4.43it/s] 193it [00:44, 4.48it/s] 194it [00:44, 4.31it/s] 195it [00:44, 4.28it/s] 196it [00:44, 4.24it/s] 196it [00:45, 4.35it/s] +2025-05-26 01:20:43,448 - INFO - Epoch: 3, Objective: tensor([5746.6787], device='cuda:0', grad_fn=), Loss: 0.046654097735881805, KL/n: 67.17630004882812 + 0it [00:00, ?it/s]2025-05-26 01:20:43,853 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 5883.0645 | mean log_px -0.0408 | KL -3290.14 + 1it [00:00, 2.97it/s] 2it [00:00, 3.63it/s] 3it [00:00, 4.01it/s] 4it [00:01, 4.05it/s] 5it [00:01, 4.19it/s] 6it [00:01, 4.32it/s] 7it [00:01, 4.29it/s] 8it [00:01, 4.40it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.64it/s] 14it [00:03, 4.65it/s] 15it [00:03, 4.67it/s] 16it [00:03, 4.67it/s] 17it [00:03, 4.68it/s] 18it [00:04, 4.68it/s] 19it [00:04, 4.69it/s] 20it [00:04, 4.69it/s] 21it [00:04, 4.69it/s] 22it [00:04, 4.68it/s] 23it [00:05, 4.68it/s] 24it [00:05, 4.68it/s] 25it [00:05, 4.69it/s] 26it [00:05, 4.53it/s] 27it [00:06, 4.59it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.64it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.67it/s] 32it [00:07, 4.67it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.68it/s] 35it [00:07, 4.52it/s] 36it [00:07, 4.56it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.63it/s] 39it [00:08, 4.64it/s] 40it [00:08, 4.65it/s] 41it [00:09, 4.66it/s] 42it [00:09, 4.67it/s] 43it [00:09, 4.67it/s] 44it [00:09, 4.67it/s] 45it [00:09, 4.68it/s] 46it [00:10, 4.52it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.48it/s] 49it [00:10, 4.48it/s] 50it [00:10, 4.54it/s]2025-05-26 01:20:54,728 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 4895.3418 | mean log_px -0.0286 | KL -3262.91 + 51it [00:11, 4.59it/s] 52it [00:11, 4.62it/s] 53it [00:11, 4.51it/s] 54it [00:11, 4.57it/s] 55it [00:12, 4.59it/s] 56it [00:12, 4.61it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.66it/s] 59it [00:12, 4.67it/s] 60it [00:13, 4.68it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.58it/s] 63it [00:13, 4.60it/s] 64it [00:14, 4.62it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.65it/s] 68it [00:14, 4.66it/s] 69it [00:15, 4.67it/s] 70it [00:15, 4.67it/s] 71it [00:15, 4.68it/s] 72it [00:15, 4.52it/s] 73it [00:15, 4.59it/s] 74it [00:16, 4.56it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.62it/s] 77it [00:16, 4.65it/s] 78it [00:17, 4.65it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.67it/s] 81it [00:17, 4.68it/s] 82it [00:17, 4.68it/s] 83it [00:18, 4.67it/s] 84it [00:18, 4.68it/s] 85it [00:18, 4.68it/s] 86it [00:18, 4.69it/s] 87it [00:18, 4.66it/s] 88it [00:19, 4.67it/s] 89it [00:19, 4.65it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.68it/s] 92it [00:20, 4.69it/s] 93it [00:20, 4.69it/s] 94it [00:20, 4.69it/s] 95it [00:20, 4.70it/s] 96it [00:20, 4.69it/s] 97it [00:21, 4.69it/s] 98it [00:21, 4.52it/s] 99it [00:21, 4.58it/s] 100it [00:21, 4.60it/s]2025-05-26 01:21:05,507 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 5435.9736 | mean log_px -0.0313 | KL -3245.03 + 101it [00:21, 4.62it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.65it/s] 104it [00:22, 4.65it/s] 105it [00:22, 4.51it/s] 106it [00:23, 4.57it/s] 107it [00:23, 4.61it/s] 108it [00:23, 4.64it/s] 109it [00:23, 4.58it/s] 110it [00:23, 4.60it/s] 111it [00:24, 4.63it/s] 112it [00:24, 4.65it/s] 113it [00:24, 4.67it/s] 114it [00:24, 4.67it/s] 115it [00:25, 4.68it/s] 116it [00:25, 4.69it/s] 117it [00:25, 4.70it/s] 118it [00:25, 4.69it/s] 119it [00:25, 4.70it/s] 120it [00:26, 4.70it/s] 121it [00:26, 4.70it/s] 122it [00:26, 4.70it/s] 123it [00:26, 4.70it/s] 124it [00:26, 4.56it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.64it/s] 127it [00:27, 4.53it/s] 128it [00:27, 4.59it/s] 129it [00:28, 4.63it/s] 130it [00:28, 4.64it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.67it/s] 133it [00:28, 4.53it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.63it/s] 137it [00:29, 4.65it/s] 138it [00:29, 4.66it/s] 139it [00:30, 4.50it/s] 140it [00:30, 4.57it/s] 141it [00:30, 4.59it/s] 142it [00:30, 4.61it/s] 143it [00:31, 4.64it/s] 144it [00:31, 4.65it/s] 145it [00:31, 4.67it/s] 146it [00:31, 4.51it/s] 147it [00:31, 4.58it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.64it/s] 150it [00:32, 4.65it/s]2025-05-26 01:21:16,309 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 4805.7720 | mean log_px -0.0276 | KL -3228.11 + 151it [00:32, 4.67it/s] 152it [00:32, 4.68it/s] 153it [00:33, 4.68it/s] 154it [00:33, 4.68it/s] 155it [00:33, 4.69it/s] 156it [00:33, 4.68it/s] 157it [00:34, 4.69it/s] 158it [00:34, 4.69it/s] 159it [00:34, 4.69it/s] 160it [00:34, 4.69it/s] 161it [00:34, 4.69it/s] 162it [00:35, 4.41it/s] 163it [00:35, 4.51it/s] 164it [00:35, 4.56it/s] 165it [00:35, 4.60it/s] 166it [00:36, 4.63it/s] 167it [00:36, 4.65it/s] 168it [00:36, 4.66it/s] 169it [00:36, 4.64it/s] 170it [00:36, 4.66it/s] 171it [00:37, 4.68it/s] 172it [00:37, 4.68it/s] 173it [00:37, 4.68it/s] 174it [00:37, 4.49it/s] 175it [00:37, 4.56it/s] 176it [00:38, 4.57it/s] 177it [00:38, 4.62it/s] 178it [00:38, 4.64it/s] 179it [00:38, 4.65it/s] 180it [00:39, 4.66it/s] 181it [00:39, 4.54it/s] 182it [00:39, 4.60it/s] 183it [00:39, 4.63it/s] 184it [00:39, 4.64it/s] 185it [00:40, 4.66it/s] 186it [00:40, 4.67it/s] 187it [00:40, 4.68it/s] 188it [00:40, 4.54it/s] 189it [00:41, 4.57it/s] 190it [00:41, 4.56it/s] 191it [00:41, 4.58it/s] 192it [00:41, 4.58it/s] 193it [00:41, 4.36it/s] 194it [00:42, 4.41it/s] 195it [00:42, 4.32it/s] 196it [00:42, 4.39it/s] 196it [00:42, 4.59it/s] +2025-05-26 01:21:26,254 - INFO - Epoch: 4, Objective: tensor([5635.8784], device='cuda:0', grad_fn=), Loss: 0.03690037503838539, KL/n: 65.52703094482422 + 0it [00:00, ?it/s]2025-05-26 01:21:26,814 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 6954.7480 | mean log_px -0.0605 | KL -3211.71 + 1it [00:00, 3.28it/s] 2it [00:00, 3.94it/s] 3it [00:00, 4.06it/s] 4it [00:00, 4.27it/s] 5it [00:01, 4.30it/s] 6it [00:01, 4.40it/s] 7it [00:01, 4.46it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.55it/s] 10it [00:02, 4.44it/s] 11it [00:02, 4.52it/s] 12it [00:02, 4.56it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.63it/s] 15it [00:03, 4.49it/s] 16it [00:03, 4.51it/s] 17it [00:03, 4.56it/s] 18it [00:04, 4.59it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.51it/s] 22it [00:04, 4.57it/s] 23it [00:05, 4.46it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.59it/s] 26it [00:05, 4.61it/s] 27it [00:06, 4.63it/s] 28it [00:06, 4.65it/s] 29it [00:06, 4.51it/s] 30it [00:06, 4.57it/s] 31it [00:06, 4.60it/s] 32it [00:07, 4.62it/s] 33it [00:07, 4.64it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.52it/s] 36it [00:07, 4.58it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.65it/s] 40it [00:08, 4.65it/s] 41it [00:09, 4.52it/s] 42it [00:09, 4.58it/s] 43it [00:09, 4.61it/s] 44it [00:09, 4.62it/s] 45it [00:09, 4.64it/s] 46it [00:10, 4.66it/s] 47it [00:10, 4.52it/s] 48it [00:10, 4.58it/s] 49it [00:10, 4.62it/s] 50it [00:11, 4.62it/s]2025-05-26 01:21:37,739 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 6567.6064 | mean log_px -0.0585 | KL -3187.38 + 51it [00:11, 4.64it/s] 52it [00:11, 4.50it/s] 53it [00:11, 4.57it/s] 54it [00:11, 4.60it/s] 55it [00:12, 4.63it/s] 56it [00:12, 4.65it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.67it/s] 59it [00:12, 4.68it/s] 60it [00:13, 4.53it/s] 61it [00:13, 4.59it/s] 62it [00:13, 4.62it/s] 63it [00:13, 4.65it/s] 64it [00:14, 4.64it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.65it/s] 68it [00:14, 4.54it/s] 69it [00:15, 4.61it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.65it/s] 72it [00:15, 4.66it/s] 73it [00:15, 4.66it/s] 74it [00:16, 4.66it/s] 75it [00:16, 4.67it/s] 76it [00:16, 4.44it/s] 77it [00:16, 4.51it/s] 78it [00:17, 4.51it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.61it/s] 81it [00:17, 4.63it/s] 82it [00:17, 4.63it/s] 83it [00:18, 4.66it/s] 84it [00:18, 4.67it/s] 85it [00:18, 4.68it/s] 86it [00:18, 4.68it/s] 87it [00:19, 4.53it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.64it/s] 91it [00:19, 4.66it/s] 92it [00:20, 4.66it/s] 93it [00:20, 4.52it/s] 94it [00:20, 4.58it/s] 95it [00:20, 4.62it/s] 96it [00:20, 4.63it/s] 97it [00:21, 4.65it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.68it/s] 100it [00:21, 4.68it/s]2025-05-26 01:21:48,559 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 5110.2051 | mean log_px -0.0323 | KL -3168.64 + 101it [00:22, 4.68it/s] 102it [00:22, 4.68it/s] 103it [00:22, 4.69it/s] 104it [00:22, 4.65it/s] 105it [00:22, 4.49it/s] 106it [00:23, 4.55it/s] 107it [00:23, 4.59it/s] 108it [00:23, 4.63it/s] 109it [00:23, 4.65it/s] 110it [00:23, 4.65it/s] 111it [00:24, 4.68it/s] 112it [00:24, 4.68it/s] 113it [00:24, 4.69it/s] 114it [00:24, 4.54it/s] 115it [00:25, 4.60it/s] 116it [00:25, 4.62it/s] 117it [00:25, 4.65it/s] 118it [00:25, 4.65it/s] 119it [00:25, 4.66it/s] 120it [00:26, 4.68it/s] 121it [00:26, 4.49it/s] 122it [00:26, 4.56it/s] 123it [00:26, 4.61it/s] 124it [00:27, 4.64it/s] 125it [00:27, 4.66it/s] 126it [00:27, 4.68it/s] 127it [00:27, 4.69it/s] 128it [00:27, 4.69it/s] 129it [00:28, 4.70it/s] 130it [00:28, 4.69it/s] 131it [00:28, 4.70it/s] 132it [00:28, 4.70it/s] 133it [00:28, 4.70it/s] 134it [00:29, 4.54it/s] 135it [00:29, 4.60it/s] 136it [00:29, 4.61it/s] 137it [00:29, 4.64it/s] 138it [00:30, 4.64it/s] 139it [00:30, 4.52it/s] 140it [00:30, 4.54it/s] 141it [00:30, 4.58it/s] 142it [00:30, 4.60it/s] 143it [00:31, 4.62it/s] 144it [00:31, 4.61it/s] 145it [00:31, 4.64it/s] 146it [00:31, 4.65it/s] 147it [00:31, 4.67it/s] 148it [00:32, 4.67it/s] 149it [00:32, 4.68it/s] 150it [00:32, 4.68it/s]2025-05-26 01:21:59,351 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 3932.0217 | mean log_px -0.0119 | KL -3150.20 + 151it [00:32, 4.68it/s] 152it [00:33, 4.68it/s] 153it [00:33, 4.68it/s] 154it [00:33, 4.68it/s] 155it [00:33, 4.69it/s] 156it [00:33, 4.68it/s] 157it [00:34, 4.69it/s] 158it [00:34, 4.69it/s] 159it [00:34, 4.54it/s] 160it [00:34, 4.60it/s] 161it [00:34, 4.63it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.65it/s] 164it [00:35, 4.66it/s] 165it [00:35, 4.67it/s] 166it [00:36, 4.67it/s] 167it [00:36, 4.68it/s] 168it [00:36, 4.68it/s] 169it [00:36, 4.69it/s] 170it [00:36, 4.68it/s] 171it [00:37, 4.53it/s] 172it [00:37, 4.59it/s] 173it [00:37, 4.62it/s] 174it [00:37, 4.61it/s] 175it [00:38, 4.64it/s] 176it [00:38, 4.64it/s] 177it [00:38, 4.66it/s] 178it [00:38, 4.66it/s] 179it [00:38, 4.68it/s] 180it [00:39, 4.53it/s] 181it [00:39, 4.59it/s] 182it [00:39, 4.61it/s] 183it [00:39, 4.63it/s] 184it [00:39, 4.65it/s] 185it [00:40, 4.50it/s] 186it [00:40, 4.43it/s] 187it [00:40, 4.38it/s] 188it [00:40, 4.47it/s] 189it [00:41, 4.54it/s] 190it [00:41, 4.57it/s] 191it [00:41, 4.51it/s] 192it [00:41, 4.58it/s] 193it [00:41, 4.62it/s] 194it [00:42, 4.64it/s] 195it [00:42, 4.37it/s] 196it [00:42, 4.34it/s] 196it [00:42, 4.59it/s] +2025-05-26 01:22:09,305 - INFO - Epoch: 5, Objective: tensor([4262.7358], device='cuda:0', grad_fn=), Loss: 0.01855652406811714, KL/n: 64.05235290527344 + 0it [00:00, ?it/s]2025-05-26 01:22:09,685 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 4869.3335 | mean log_px -0.0318 | KL -3135.65 + 1it [00:00, 3.01it/s] 2it [00:00, 3.80it/s] 3it [00:00, 4.16it/s] 4it [00:00, 4.34it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.57it/s] 8it [00:01, 4.59it/s] 9it [00:02, 4.63it/s] 10it [00:02, 4.48it/s] 11it [00:02, 4.56it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.64it/s] 15it [00:03, 4.63it/s] 16it [00:03, 4.50it/s] 17it [00:03, 4.57it/s] 18it [00:04, 4.60it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.66it/s] 22it [00:04, 4.67it/s] 23it [00:05, 4.68it/s] 24it [00:05, 4.51it/s] 25it [00:05, 4.58it/s] 26it [00:05, 3.67it/s] 27it [00:06, 3.93it/s] 28it [00:06, 4.12it/s] 29it [00:06, 4.28it/s] 30it [00:06, 4.40it/s] 31it [00:07, 4.49it/s] 32it [00:07, 4.55it/s] 33it [00:07, 4.60it/s] 34it [00:07, 4.62it/s] 35it [00:07, 4.65it/s] 36it [00:08, 4.66it/s] 37it [00:08, 4.68it/s] 38it [00:08, 4.68it/s] 39it [00:08, 4.69it/s] 40it [00:08, 4.69it/s] 41it [00:09, 4.70it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.63it/s] 45it [00:10, 4.65it/s] 46it [00:10, 4.66it/s] 47it [00:10, 4.68it/s] 48it [00:10, 4.68it/s] 49it [00:10, 4.69it/s] 50it [00:11, 4.69it/s]2025-05-26 01:22:20,658 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 7057.3750 | mean log_px -0.0627 | KL -3113.32 + 51it [00:11, 4.69it/s] 52it [00:11, 4.67it/s] 53it [00:11, 4.70it/s] 54it [00:11, 4.70it/s] 55it [00:12, 4.71it/s] 56it [00:12, 4.69it/s] 57it [00:12, 4.66it/s] 58it [00:12, 4.56it/s] 59it [00:13, 4.63it/s] 60it [00:13, 4.64it/s] 61it [00:13, 4.66it/s] 62it [00:13, 4.67it/s] 63it [00:13, 4.68it/s] 64it [00:14, 4.69it/s] 65it [00:14, 4.70it/s] 66it [00:14, 4.70it/s] 67it [00:14, 4.54it/s] 68it [00:14, 4.60it/s] 69it [00:15, 4.63it/s] 70it [00:15, 4.65it/s] 71it [00:15, 4.67it/s] 72it [00:15, 4.68it/s] 73it [00:15, 4.69it/s] 74it [00:16, 4.55it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.62it/s] 77it [00:16, 4.63it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.66it/s] 80it [00:17, 4.67it/s] 81it [00:17, 4.48it/s] 82it [00:17, 4.55it/s] 83it [00:18, 4.60it/s] 84it [00:18, 4.62it/s] 85it [00:18, 4.65it/s] 86it [00:18, 4.57it/s] 87it [00:19, 4.60it/s] 88it [00:19, 4.45it/s] 89it [00:19, 4.54it/s] 90it [00:19, 4.58it/s] 91it [00:19, 4.61it/s] 92it [00:20, 4.64it/s] 93it [00:20, 4.66it/s] 94it [00:20, 4.67it/s] 95it [00:20, 4.68it/s] 96it [00:21, 4.52it/s] 97it [00:21, 4.59it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.65it/s] 100it [00:21, 4.66it/s]2025-05-26 01:22:31,461 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 6381.2471 | mean log_px -0.0664 | KL -3103.59 + 101it [00:22, 4.67it/s] 102it [00:22, 4.68it/s] 103it [00:22, 4.69it/s] 104it [00:22, 4.69it/s] 105it [00:22, 4.53it/s] 106it [00:23, 4.59it/s] 107it [00:23, 4.63it/s] 108it [00:23, 4.65it/s] 109it [00:23, 4.67it/s] 110it [00:24, 4.67it/s] 111it [00:24, 4.69it/s] 112it [00:24, 4.69it/s] 113it [00:24, 4.70it/s] 114it [00:24, 4.53it/s] 115it [00:25, 4.59it/s] 116it [00:25, 4.61it/s] 117it [00:25, 4.65it/s] 118it [00:25, 4.66it/s] 119it [00:25, 4.68it/s] 120it [00:26, 4.52it/s] 121it [00:26, 4.59it/s] 122it [00:26, 4.61it/s] 123it [00:26, 4.64it/s] 124it [00:27, 4.65it/s] 125it [00:27, 4.67it/s] 126it [00:27, 4.67it/s] 127it [00:27, 4.52it/s] 128it [00:27, 4.57it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.67it/s] 133it [00:29, 4.49it/s] 134it [00:29, 4.56it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.63it/s] 137it [00:29, 4.65it/s] 138it [00:30, 4.66it/s] 139it [00:30, 4.52it/s] 140it [00:30, 4.58it/s] 141it [00:30, 4.62it/s] 142it [00:30, 4.63it/s] 143it [00:31, 4.65it/s] 144it [00:31, 4.65it/s] 145it [00:31, 4.68it/s] 146it [00:31, 4.68it/s] 147it [00:32, 4.69it/s] 148it [00:32, 4.69it/s] 149it [00:32, 4.70it/s] 150it [00:32, 4.70it/s]2025-05-26 01:22:42,251 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 4548.9775 | mean log_px -0.0281 | KL -3080.35 + 151it [00:32, 4.52it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.63it/s] 154it [00:33, 4.64it/s] 155it [00:33, 4.66it/s] 156it [00:33, 4.66it/s] 157it [00:34, 4.52it/s] 158it [00:34, 4.56it/s] 159it [00:34, 4.62it/s] 160it [00:34, 4.64it/s] 161it [00:35, 4.67it/s] 162it [00:35, 4.67it/s] 163it [00:35, 4.51it/s] 164it [00:35, 4.58it/s] 165it [00:35, 4.60it/s] 166it [00:36, 4.64it/s] 167it [00:36, 4.66it/s] 168it [00:36, 4.68it/s] 169it [00:36, 4.69it/s] 170it [00:37, 4.53it/s] 171it [00:37, 4.60it/s] 172it [00:37, 4.61it/s] 173it [00:37, 4.66it/s] 174it [00:37, 4.67it/s] 175it [00:38, 4.68it/s] 176it [00:38, 4.68it/s] 177it [00:38, 4.69it/s] 178it [00:38, 4.70it/s] 179it [00:38, 4.71it/s] 180it [00:39, 4.71it/s] 181it [00:39, 4.55it/s] 182it [00:39, 4.60it/s] 183it [00:39, 4.64it/s] 184it [00:40, 4.65it/s] 185it [00:40, 4.67it/s] 186it [00:40, 4.65it/s] 187it [00:40, 4.51it/s] 188it [00:40, 4.57it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.63it/s] 191it [00:41, 4.66it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.50it/s] 194it [00:42, 4.57it/s] 195it [00:42, 4.35it/s] 196it [00:42, 4.44it/s] 196it [00:42, 4.59it/s] +2025-05-26 01:22:52,174 - INFO - Epoch: 6, Objective: tensor([7316.6924], device='cuda:0', grad_fn=), Loss: 0.06832034140825272, KL/n: 62.47688674926758 + 0it [00:00, ?it/s]2025-05-26 01:22:52,594 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 5764.2217 | mean log_px -0.0439 | KL -3059.68 + 1it [00:00, 2.90it/s] 2it [00:00, 3.74it/s] 3it [00:00, 3.94it/s] 4it [00:01, 4.18it/s] 5it [00:01, 4.35it/s] 6it [00:01, 4.46it/s] 7it [00:01, 4.55it/s] 8it [00:01, 4.57it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.64it/s] 15it [00:03, 4.67it/s] 16it [00:03, 4.53it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.62it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.66it/s] 21it [00:04, 4.68it/s] 22it [00:04, 4.68it/s] 23it [00:05, 4.69it/s] 24it [00:05, 4.69it/s] 25it [00:05, 4.70it/s] 26it [00:05, 4.70it/s] 27it [00:05, 4.70it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.70it/s] 30it [00:06, 4.55it/s] 31it [00:06, 4.61it/s] 32it [00:07, 4.62it/s] 33it [00:07, 4.49it/s] 34it [00:07, 4.52it/s] 35it [00:07, 4.55it/s] 36it [00:07, 4.56it/s] 37it [00:08, 4.58it/s] 38it [00:08, 4.58it/s] 39it [00:08, 4.45it/s] 40it [00:08, 4.47it/s] 41it [00:09, 4.55it/s] 42it [00:09, 4.58it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.61it/s] 45it [00:09, 4.65it/s] 46it [00:10, 4.50it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.63it/s] 50it [00:10, 4.64it/s]2025-05-26 01:23:03,453 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 4438.1538 | mean log_px -0.0305 | KL -3042.06 + 51it [00:11, 4.59it/s] 52it [00:11, 4.44it/s] 53it [00:11, 4.36it/s] 54it [00:11, 4.47it/s] 55it [00:12, 4.54it/s] 56it [00:12, 4.52it/s] 57it [00:12, 4.57it/s] 58it [00:12, 4.60it/s] 59it [00:12, 4.50it/s] 60it [00:13, 4.55it/s] 61it [00:13, 4.61it/s] 62it [00:13, 4.61it/s] 63it [00:13, 4.64it/s] 64it [00:14, 4.65it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.67it/s] 67it [00:14, 4.67it/s] 68it [00:14, 4.50it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.60it/s] 71it [00:15, 4.63it/s] 72it [00:15, 4.65it/s] 73it [00:16, 4.50it/s] 74it [00:16, 4.56it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.63it/s] 77it [00:16, 4.65it/s] 78it [00:17, 4.66it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.67it/s] 81it [00:17, 4.67it/s] 82it [00:17, 4.69it/s] 83it [00:18, 4.52it/s] 84it [00:18, 4.58it/s] 85it [00:18, 4.61it/s] 86it [00:18, 4.63it/s] 87it [00:19, 4.53it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.59it/s] 90it [00:19, 4.61it/s] 91it [00:19, 4.62it/s] 92it [00:20, 4.46it/s] 93it [00:20, 4.51it/s] 94it [00:20, 4.52it/s] 95it [00:20, 4.56it/s] 96it [00:21, 4.58it/s] 97it [00:21, 4.55it/s] 98it [00:21, 4.58it/s] 99it [00:21, 4.59it/s] 100it [00:21, 4.62it/s]2025-05-26 01:23:14,370 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 3706.3210 | mean log_px -0.0132 | KL -3016.29 + 101it [00:22, 4.62it/s] 102it [00:22, 4.48it/s] 103it [00:22, 4.55it/s] 104it [00:22, 4.57it/s] 105it [00:23, 4.59it/s] 106it [00:23, 4.61it/s] 107it [00:23, 4.62it/s] 108it [00:23, 4.63it/s] 109it [00:23, 4.65it/s] 110it [00:24, 4.65it/s] 111it [00:24, 4.65it/s] 112it [00:24, 4.64it/s] 113it [00:24, 4.64it/s] 114it [00:24, 4.64it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.63it/s] 117it [00:25, 4.64it/s] 118it [00:25, 4.63it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.63it/s] 121it [00:26, 4.64it/s] 122it [00:26, 4.62it/s] 123it [00:26, 4.63it/s] 124it [00:27, 4.64it/s] 125it [00:27, 4.63it/s] 126it [00:27, 4.62it/s] 127it [00:27, 4.64it/s] 128it [00:27, 4.48it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.56it/s] 131it [00:28, 4.59it/s] 132it [00:28, 4.49it/s] 133it [00:29, 4.54it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.56it/s] 136it [00:29, 4.57it/s] 137it [00:29, 4.62it/s] 138it [00:30, 4.63it/s] 139it [00:30, 4.49it/s] 140it [00:30, 4.54it/s] 141it [00:30, 4.59it/s] 142it [00:31, 4.60it/s] 143it [00:31, 4.62it/s] 144it [00:31, 4.62it/s] 145it [00:31, 4.46it/s] 146it [00:31, 4.52it/s] 147it [00:32, 4.56it/s] 148it [00:32, 4.58it/s] 149it [00:32, 4.61it/s] 150it [00:32, 4.62it/s]2025-05-26 01:23:25,253 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 6590.7559 | mean log_px -0.0561 | KL -2995.29 + 151it [00:33, 4.48it/s] 152it [00:33, 4.53it/s] 153it [00:33, 4.56it/s] 154it [00:33, 4.57it/s] 155it [00:33, 4.60it/s] 156it [00:34, 4.61it/s] 157it [00:34, 4.63it/s] 158it [00:34, 4.63it/s] 159it [00:34, 4.64it/s] 160it [00:34, 4.64it/s] 161it [00:35, 4.62it/s] 162it [00:35, 4.54it/s] 163it [00:35, 4.57it/s] 164it [00:35, 4.55it/s] 165it [00:36, 4.59it/s] 166it [00:36, 4.63it/s] 167it [00:36, 4.63it/s] 168it [00:36, 4.64it/s] 169it [00:36, 4.64it/s] 170it [00:37, 4.63it/s] 171it [00:37, 4.61it/s] 172it [00:37, 4.62it/s] 173it [00:37, 4.63it/s] 174it [00:38, 4.62it/s] 175it [00:38, 4.64it/s] 176it [00:38, 4.60it/s] 177it [00:38, 4.55it/s] 178it [00:38, 4.57it/s] 179it [00:39, 4.61it/s] 180it [00:39, 4.63it/s] 181it [00:39, 4.64it/s] 182it [00:39, 4.65it/s] 183it [00:39, 4.64it/s] 184it [00:40, 4.54it/s] 185it [00:40, 4.59it/s] 186it [00:40, 4.61it/s] 187it [00:40, 4.63it/s] 188it [00:41, 4.63it/s] 189it [00:41, 4.63it/s] 190it [00:41, 4.61it/s] 191it [00:41, 4.50it/s] 192it [00:41, 4.57it/s] 193it [00:42, 4.60it/s] 194it [00:42, 4.63it/s] 195it [00:42, 4.33it/s] 196it [00:42, 4.31it/s] 196it [00:42, 4.57it/s] +2025-05-26 01:23:35,233 - INFO - Epoch: 7, Objective: tensor([5831.9897], device='cuda:0', grad_fn=), Loss: 0.03322037681937218, KL/n: 60.5771369934082 + 0it [00:00, ?it/s]2025-05-26 01:23:35,823 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 3881.9414 | mean log_px -0.0130 | KL -2970.20 + 1it [00:00, 2.80it/s] 2it [00:00, 3.65it/s] 3it [00:00, 4.04it/s] 4it [00:01, 4.26it/s] 5it [00:01, 4.38it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.55it/s] 8it [00:01, 4.59it/s] 9it [00:02, 4.62it/s] 10it [00:02, 4.63it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.32it/s] 13it [00:02, 4.41it/s] 14it [00:03, 4.47it/s] 15it [00:03, 4.51it/s] 16it [00:03, 4.40it/s] 17it [00:03, 4.45it/s] 18it [00:04, 4.51it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.56it/s] 21it [00:04, 4.43it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.29it/s] 24it [00:05, 4.39it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.52it/s] 27it [00:06, 4.56it/s] 28it [00:06, 4.42it/s] 29it [00:06, 4.35it/s] 30it [00:06, 4.30it/s] 31it [00:07, 4.40it/s] 32it [00:07, 4.46it/s] 33it [00:07, 4.30it/s] 34it [00:07, 4.13it/s] 35it [00:07, 4.25it/s] 36it [00:08, 4.34it/s] 37it [00:08, 4.40it/s] 38it [00:08, 4.48it/s] 39it [00:08, 4.54it/s] 40it [00:09, 4.57it/s] 41it [00:09, 4.44it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.47it/s] 44it [00:09, 4.46it/s] 45it [00:10, 4.50it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.43it/s] 48it [00:10, 4.35it/s] 49it [00:11, 4.40it/s] 50it [00:11, 4.18it/s]2025-05-26 01:23:47,090 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 4140.3315 | mean log_px -0.0194 | KL -2946.16 + 51it [00:11, 4.32it/s] 52it [00:11, 4.21it/s] 53it [00:12, 4.32it/s] 54it [00:12, 4.40it/s] 55it [00:12, 4.45it/s] 56it [00:12, 4.36it/s] 57it [00:12, 4.44it/s] 58it [00:13, 4.48it/s] 59it [00:13, 4.50it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.36it/s] 62it [00:14, 4.45it/s] 63it [00:14, 4.22it/s] 64it [00:14, 4.21it/s] 65it [00:14, 4.34it/s] 66it [00:15, 4.28it/s] 67it [00:15, 4.34it/s] 68it [00:15, 4.35it/s] 69it [00:15, 4.31it/s] 70it [00:16, 4.09it/s] 71it [00:16, 4.13it/s] 72it [00:16, 4.25it/s] 73it [00:16, 4.32it/s] 74it [00:16, 4.40it/s] 75it [00:17, 4.45it/s] 76it [00:17, 4.45it/s] 77it [00:17, 4.36it/s] 78it [00:17, 4.44it/s] 79it [00:18, 4.48it/s] 80it [00:18, 4.51it/s] 81it [00:18, 4.39it/s] 82it [00:18, 4.27it/s] 83it [00:18, 4.29it/s] 84it [00:19, 4.34it/s] 85it [00:19, 4.13it/s] 86it [00:19, 4.26it/s] 87it [00:19, 4.21it/s] 88it [00:20, 4.31it/s] 89it [00:20, 4.41it/s] 90it [00:20, 4.18it/s] 91it [00:20, 4.30it/s] 92it [00:21, 4.38it/s] 93it [00:21, 4.45it/s] 94it [00:21, 4.49it/s] 95it [00:21, 4.52it/s] 96it [00:21, 4.53it/s] 97it [00:22, 4.43it/s] 98it [00:22, 4.49it/s] 99it [00:22, 4.33it/s] 100it [00:22, 4.24it/s]2025-05-26 01:23:58,575 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 3203.0884 | mean log_px -0.0045 | KL -2923.38 + 101it [00:23, 4.34it/s] 102it [00:23, 4.41it/s] 103it [00:23, 4.32it/s] 104it [00:23, 4.41it/s] 105it [00:23, 4.46it/s] 106it [00:24, 4.49it/s] 107it [00:24, 4.52it/s] 108it [00:24, 4.55it/s] 109it [00:24, 4.56it/s] 110it [00:25, 4.22it/s] 111it [00:25, 4.31it/s] 112it [00:25, 4.23it/s] 113it [00:25, 4.21it/s] 114it [00:26, 4.32it/s] 115it [00:26, 4.38it/s] 116it [00:26, 4.44it/s] 117it [00:26, 4.37it/s] 118it [00:26, 4.43it/s] 119it [00:27, 4.30it/s] 120it [00:27, 4.27it/s] 121it [00:27, 4.17it/s] 122it [00:27, 4.08it/s] 123it [00:28, 4.09it/s] 124it [00:28, 4.23it/s] 125it [00:28, 4.22it/s] 126it [00:28, 4.34it/s] 127it [00:29, 4.42it/s] 128it [00:29, 4.48it/s] 129it [00:29, 4.54it/s] 130it [00:29, 4.40it/s] 131it [00:29, 4.37it/s] 132it [00:30, 4.46it/s] 133it [00:30, 4.53it/s] 134it [00:30, 4.55it/s] 135it [00:30, 4.58it/s] 136it [00:31, 4.28it/s] 137it [00:31, 4.21it/s] 138it [00:31, 4.21it/s] 139it [00:31, 4.19it/s] 140it [00:32, 4.30it/s] 141it [00:32, 4.26it/s] 142it [00:32, 4.21it/s] 143it [00:32, 4.07it/s] 144it [00:33, 4.08it/s] 145it [00:33, 4.22it/s] 146it [00:33, 4.33it/s] 147it [00:33, 4.41it/s] 148it [00:33, 4.43it/s] 149it [00:34, 4.37it/s] 150it [00:34, 4.44it/s]2025-05-26 01:24:10,080 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 3672.0759 | mean log_px -0.0163 | KL -2904.56 + 151it [00:34, 4.51it/s] 152it [00:34, 4.53it/s] 153it [00:35, 4.58it/s] 154it [00:35, 4.59it/s] 155it [00:35, 4.53it/s] 156it [00:35, 4.37it/s] 157it [00:35, 4.43it/s] 158it [00:36, 4.51it/s] 159it [00:36, 4.55it/s] 160it [00:36, 4.58it/s] 161it [00:36, 4.52it/s] 162it [00:37, 4.33it/s] 163it [00:37, 4.43it/s] 164it [00:37, 4.48it/s] 165it [00:37, 4.50it/s] 166it [00:37, 4.49it/s] 167it [00:38, 4.53it/s] 168it [00:38, 4.56it/s] 169it [00:38, 4.59it/s] 170it [00:38, 4.44it/s] 171it [00:39, 4.51it/s] 172it [00:39, 4.54it/s] 173it [00:39, 4.57it/s] 174it [00:39, 4.54it/s] 175it [00:39, 4.58it/s] 176it [00:40, 4.41it/s] 177it [00:40, 4.47it/s] 178it [00:40, 4.20it/s] 179it [00:40, 4.32it/s] 180it [00:41, 4.43it/s] 181it [00:41, 4.34it/s] 182it [00:41, 4.27it/s] 183it [00:41, 4.37it/s] 184it [00:41, 4.45it/s] 185it [00:42, 4.52it/s] 186it [00:42, 4.39it/s] 187it [00:42, 4.46it/s] 188it [00:42, 4.39it/s] 189it [00:43, 4.47it/s] 190it [00:43, 4.53it/s] 191it [00:43, 4.58it/s] 192it [00:43, 4.60it/s] 193it [00:43, 4.48it/s] 194it [00:44, 4.33it/s] 195it [00:44, 4.30it/s] 196it [00:44, 4.30it/s] 196it [00:44, 4.38it/s] +2025-05-26 01:24:20,329 - INFO - Epoch: 8, Objective: tensor([4215.5410], device='cuda:0', grad_fn=), Loss: 0.014363881200551987, KL/n: 58.71515655517578 + 0it [00:00, ?it/s]2025-05-26 01:24:20,686 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 3831.5950 | mean log_px -0.0261 | KL -2873.97 + 1it [00:00, 3.49it/s] 2it [00:00, 4.07it/s] 3it [00:00, 4.08it/s] 4it [00:00, 4.31it/s] 5it [00:01, 4.44it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.57it/s] 8it [00:01, 4.60it/s] 9it [00:02, 4.48it/s] 10it [00:02, 4.51it/s] 11it [00:02, 4.55it/s] 12it [00:02, 3.61it/s] 13it [00:03, 3.87it/s] 14it [00:03, 4.07it/s] 15it [00:03, 4.10it/s] 16it [00:03, 4.22it/s] 17it [00:04, 4.33it/s] 18it [00:04, 4.44it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.57it/s] 21it [00:04, 4.62it/s] 22it [00:05, 4.63it/s] 23it [00:05, 4.65it/s] 24it [00:05, 4.66it/s] 25it [00:05, 4.51it/s] 26it [00:05, 4.59it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.67it/s] 30it [00:06, 4.68it/s] 31it [00:06, 4.70it/s] 32it [00:07, 4.70it/s] 33it [00:07, 4.70it/s] 34it [00:07, 4.70it/s] 35it [00:07, 4.71it/s] 36it [00:08, 4.70it/s] 37it [00:08, 4.71it/s] 38it [00:08, 4.71it/s] 39it [00:08, 4.71it/s] 40it [00:08, 4.71it/s] 41it [00:09, 4.71it/s] 42it [00:09, 4.71it/s] 43it [00:09, 4.71it/s] 44it [00:09, 4.71it/s] 45it [00:09, 4.71it/s] 46it [00:10, 4.69it/s] 47it [00:10, 4.70it/s] 48it [00:10, 4.52it/s] 49it [00:10, 4.58it/s] 50it [00:11, 4.61it/s]2025-05-26 01:24:31,684 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 3554.7034 | mean log_px -0.0139 | KL -2847.36 + 51it [00:11, 4.64it/s] 52it [00:11, 4.65it/s] 53it [00:11, 4.49it/s] 54it [00:11, 4.57it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.67it/s] 59it [00:13, 4.68it/s] 60it [00:13, 4.46it/s] 61it [00:13, 4.54it/s] 62it [00:13, 4.55it/s] 63it [00:13, 4.60it/s] 64it [00:14, 4.62it/s] 65it [00:14, 4.48it/s] 66it [00:14, 4.56it/s] 67it [00:14, 4.61it/s] 68it [00:14, 4.63it/s] 69it [00:15, 4.65it/s] 70it [00:15, 4.50it/s] 71it [00:15, 4.58it/s] 72it [00:15, 4.60it/s] 73it [00:16, 4.63it/s] 74it [00:16, 4.65it/s] 75it [00:16, 4.67it/s] 76it [00:16, 4.68it/s] 77it [00:16, 4.69it/s] 78it [00:17, 4.70it/s] 79it [00:17, 4.71it/s] 80it [00:17, 4.71it/s] 81it [00:17, 4.72it/s] 82it [00:17, 4.71it/s] 83it [00:18, 4.71it/s] 84it [00:18, 4.71it/s] 85it [00:18, 4.73it/s] 86it [00:18, 4.72it/s] 87it [00:19, 4.73it/s] 88it [00:19, 4.72it/s] 89it [00:19, 4.73it/s] 90it [00:19, 4.73it/s] 91it [00:19, 4.55it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.64it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.55it/s] 96it [00:20, 4.61it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.69it/s] 100it [00:21, 4.56it/s]2025-05-26 01:24:42,478 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 3406.7056 | mean log_px -0.0110 | KL -2821.77 + 101it [00:22, 4.62it/s] 102it [00:22, 4.64it/s] 103it [00:22, 4.67it/s] 104it [00:22, 4.68it/s] 105it [00:22, 4.54it/s] 106it [00:23, 4.56it/s] 107it [00:23, 4.60it/s] 108it [00:23, 4.63it/s] 109it [00:23, 4.67it/s] 110it [00:24, 4.52it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.61it/s] 113it [00:24, 4.64it/s] 114it [00:24, 4.67it/s] 115it [00:25, 4.52it/s] 116it [00:25, 4.59it/s] 117it [00:25, 4.62it/s] 118it [00:25, 4.66it/s] 119it [00:25, 4.66it/s] 120it [00:26, 4.67it/s] 121it [00:26, 4.69it/s] 122it [00:26, 4.70it/s] 123it [00:26, 4.71it/s] 124it [00:27, 4.71it/s] 125it [00:27, 4.58it/s] 126it [00:27, 4.64it/s] 127it [00:27, 4.67it/s] 128it [00:27, 4.68it/s] 129it [00:28, 4.69it/s] 130it [00:28, 4.52it/s] 131it [00:28, 4.59it/s] 132it [00:28, 4.63it/s] 133it [00:28, 4.65it/s] 134it [00:29, 4.67it/s] 135it [00:29, 4.69it/s] 136it [00:29, 4.67it/s] 137it [00:29, 4.69it/s] 138it [00:30, 4.52it/s] 139it [00:30, 4.60it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.66it/s] 142it [00:30, 4.67it/s] 143it [00:31, 4.53it/s] 144it [00:31, 4.59it/s] 145it [00:31, 4.63it/s] 146it [00:31, 4.66it/s] 147it [00:31, 4.68it/s] 148it [00:32, 4.69it/s] 149it [00:32, 4.71it/s] 150it [00:32, 4.70it/s]2025-05-26 01:24:53,251 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 5147.5215 | mean log_px -0.0361 | KL -2803.57 + 151it [00:32, 4.54it/s] 152it [00:33, 4.61it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.66it/s] 155it [00:33, 4.68it/s] 156it [00:33, 4.69it/s] 157it [00:34, 4.70it/s] 158it [00:34, 4.67it/s] 159it [00:34, 4.70it/s] 160it [00:34, 4.70it/s] 161it [00:34, 4.72it/s] 162it [00:35, 4.71it/s] 163it [00:35, 4.72it/s] 164it [00:35, 4.72it/s] 165it [00:35, 4.72it/s] 166it [00:36, 4.55it/s] 167it [00:36, 4.62it/s] 168it [00:36, 4.64it/s] 169it [00:36, 4.66it/s] 170it [00:36, 4.68it/s] 171it [00:37, 4.70it/s] 172it [00:37, 4.54it/s] 173it [00:37, 4.61it/s] 174it [00:37, 4.63it/s] 175it [00:38, 4.66it/s] 176it [00:38, 4.68it/s] 177it [00:38, 4.69it/s] 178it [00:38, 4.57it/s] 179it [00:38, 4.63it/s] 180it [00:39, 4.65it/s] 181it [00:39, 4.67it/s] 182it [00:39, 4.69it/s] 183it [00:39, 4.70it/s] 184it [00:39, 4.55it/s] 185it [00:40, 4.61it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.66it/s] 188it [00:40, 4.68it/s] 189it [00:41, 4.68it/s] 190it [00:41, 4.64it/s] 191it [00:41, 4.68it/s] 192it [00:41, 4.56it/s] 193it [00:41, 4.57it/s] 194it [00:42, 4.60it/s] 195it [00:42, 4.43it/s] 196it [00:42, 4.36it/s] 196it [00:42, 4.59it/s] +2025-05-26 01:25:03,123 - INFO - Epoch: 9, Objective: tensor([4143.1064], device='cuda:0', grad_fn=), Loss: 0.02341052144765854, KL/n: 56.89252471923828 + 0it [00:00, ?it/s]2025-05-26 01:25:03,515 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 3292.7747 | mean log_px -0.0090 | KL -2785.48 + 1it [00:00, 2.94it/s] 2it [00:00, 3.76it/s] 3it [00:00, 4.15it/s] 4it [00:00, 4.36it/s] 5it [00:01, 4.48it/s] 6it [00:01, 4.55it/s] 7it [00:01, 4.61it/s] 8it [00:01, 4.39it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.58it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.48it/s] 15it [00:03, 4.52it/s] 16it [00:03, 4.54it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.62it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.67it/s] 21it [00:04, 4.68it/s] 22it [00:04, 4.70it/s] 23it [00:05, 4.71it/s] 24it [00:05, 4.71it/s] 25it [00:05, 4.72it/s] 26it [00:05, 4.71it/s] 27it [00:05, 4.71it/s] 28it [00:06, 4.71it/s] 29it [00:06, 4.71it/s] 30it [00:06, 4.68it/s] 31it [00:06, 4.71it/s] 32it [00:07, 4.70it/s] 33it [00:07, 4.62it/s] 34it [00:07, 4.67it/s] 35it [00:07, 4.68it/s] 36it [00:07, 4.68it/s] 37it [00:08, 4.68it/s] 38it [00:08, 4.69it/s] 39it [00:08, 4.53it/s] 40it [00:08, 4.60it/s] 41it [00:08, 4.64it/s] 42it [00:09, 4.66it/s] 43it [00:09, 4.68it/s] 44it [00:09, 4.52it/s] 45it [00:09, 4.60it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.66it/s] 48it [00:10, 4.67it/s] 49it [00:10, 4.68it/s] 50it [00:10, 4.69it/s]2025-05-26 01:25:14,299 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 3255.0281 | mean log_px -0.0100 | KL -2764.80 + 51it [00:11, 4.53it/s] 52it [00:11, 4.59it/s] 53it [00:11, 4.63it/s] 54it [00:11, 4.66it/s] 55it [00:11, 4.68it/s] 56it [00:12, 4.68it/s] 57it [00:12, 4.52it/s] 58it [00:12, 4.59it/s] 59it [00:12, 4.63it/s] 60it [00:13, 4.64it/s] 61it [00:13, 4.67it/s] 62it [00:13, 4.68it/s] 63it [00:13, 4.69it/s] 64it [00:13, 4.69it/s] 65it [00:14, 4.70it/s] 66it [00:14, 4.70it/s] 67it [00:14, 4.54it/s] 68it [00:14, 4.55it/s] 69it [00:14, 4.60it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.65it/s] 72it [00:15, 4.51it/s] 73it [00:15, 4.59it/s] 74it [00:16, 4.62it/s] 75it [00:16, 4.64it/s] 76it [00:16, 4.66it/s] 77it [00:16, 4.67it/s] 78it [00:16, 4.68it/s] 79it [00:17, 4.69it/s] 80it [00:17, 4.70it/s] 81it [00:17, 4.71it/s] 82it [00:17, 4.70it/s] 83it [00:17, 4.71it/s] 84it [00:18, 4.54it/s] 85it [00:18, 4.61it/s] 86it [00:18, 4.63it/s] 87it [00:18, 4.65it/s] 88it [00:19, 4.66it/s] 89it [00:19, 4.68it/s] 90it [00:19, 4.68it/s] 91it [00:19, 4.53it/s] 92it [00:19, 4.59it/s] 93it [00:20, 4.62it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.67it/s] 96it [00:20, 4.67it/s] 97it [00:21, 4.51it/s] 98it [00:21, 4.59it/s] 99it [00:21, 4.62it/s] 100it [00:21, 4.65it/s]2025-05-26 01:25:25,096 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 3816.2234 | mean log_px -0.0176 | KL -2740.36 + 101it [00:21, 4.66it/s] 102it [00:22, 4.67it/s] 103it [00:22, 4.69it/s] 104it [00:22, 4.52it/s] 105it [00:22, 4.59it/s] 106it [00:22, 4.62it/s] 107it [00:23, 4.65it/s] 108it [00:23, 4.66it/s] 109it [00:23, 4.68it/s] 110it [00:23, 4.69it/s] 111it [00:24, 4.71it/s] 112it [00:24, 4.71it/s] 113it [00:24, 4.71it/s] 114it [00:24, 4.71it/s] 115it [00:24, 4.72it/s] 116it [00:25, 4.71it/s] 117it [00:25, 4.71it/s] 118it [00:25, 4.53it/s] 119it [00:25, 4.59it/s] 120it [00:25, 4.60it/s] 121it [00:26, 4.57it/s] 122it [00:26, 4.56it/s] 123it [00:26, 4.59it/s] 124it [00:26, 4.60it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.62it/s] 127it [00:27, 4.62it/s] 128it [00:27, 4.63it/s] 129it [00:27, 4.63it/s] 130it [00:28, 4.48it/s] 131it [00:28, 4.55it/s] 132it [00:28, 4.57it/s] 133it [00:28, 4.59it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.62it/s] 137it [00:29, 4.63it/s] 138it [00:29, 4.63it/s] 139it [00:30, 4.63it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.48it/s] 142it [00:30, 4.54it/s] 143it [00:30, 4.57it/s] 144it [00:31, 4.57it/s] 145it [00:31, 4.55it/s] 146it [00:31, 4.39it/s] 147it [00:31, 4.47it/s] 148it [00:32, 4.51it/s] 149it [00:32, 4.55it/s] 150it [00:32, 4.55it/s]2025-05-26 01:25:35,968 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 4118.2427 | mean log_px -0.0299 | KL -2717.40 + 151it [00:32, 4.55it/s] 152it [00:32, 4.54it/s] 153it [00:33, 4.46it/s] 154it [00:33, 4.36it/s] 155it [00:33, 4.43it/s] 156it [00:33, 4.47it/s] 157it [00:34, 4.52it/s] 158it [00:34, 4.53it/s] 159it [00:34, 4.55it/s] 160it [00:34, 4.53it/s] 161it [00:34, 4.55it/s] 162it [00:35, 4.47it/s] 163it [00:35, 4.48it/s] 164it [00:35, 4.53it/s] 165it [00:35, 4.54it/s] 166it [00:36, 4.53it/s] 167it [00:36, 4.52it/s] 168it [00:36, 4.53it/s] 169it [00:36, 4.55it/s] 170it [00:36, 4.55it/s] 171it [00:37, 4.41it/s] 172it [00:37, 4.46it/s] 173it [00:37, 4.49it/s] 174it [00:37, 4.51it/s] 175it [00:38, 4.49it/s] 176it [00:38, 4.46it/s] 177it [00:38, 4.49it/s] 178it [00:38, 4.51it/s] 179it [00:38, 4.53it/s] 180it [00:39, 4.54it/s] 181it [00:39, 4.55it/s] 182it [00:39, 4.56it/s] 183it [00:39, 4.41it/s] 184it [00:40, 4.46it/s] 185it [00:40, 4.50it/s] 186it [00:40, 4.53it/s] 187it [00:40, 4.51it/s] 188it [00:41, 4.34it/s] 189it [00:41, 4.38it/s] 190it [00:41, 4.43it/s] 191it [00:41, 4.48it/s] 192it [00:41, 4.51it/s] 193it [00:42, 4.54it/s] 194it [00:42, 4.55it/s] 195it [00:42, 4.19it/s] 196it [00:42, 4.22it/s] 196it [00:42, 4.57it/s] +2025-05-26 01:25:46,183 - INFO - Epoch: 10, Objective: tensor([2976.3257], device='cuda:0', grad_fn=), Loss: 0.00489531084895134, KL/n: 55.191680908203125 + 0it [00:00, ?it/s]2025-05-26 01:25:46,767 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 3065.4336 | mean log_px -0.0064 | KL -2701.94 + 1it [00:00, 2.95it/s] 2it [00:00, 3.71it/s] 3it [00:00, 4.01it/s] 4it [00:01, 4.09it/s] 5it [00:01, 4.28it/s] 6it [00:01, 4.37it/s] 7it [00:01, 4.45it/s] 8it [00:01, 4.48it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.38it/s] 12it [00:02, 4.43it/s] 13it [00:03, 4.47it/s] 14it [00:03, 4.49it/s] 15it [00:03, 4.51it/s] 16it [00:03, 4.52it/s] 17it [00:03, 4.48it/s] 18it [00:04, 4.48it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.52it/s] 21it [00:04, 4.53it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.45it/s] 24it [00:05, 4.49it/s] 25it [00:05, 4.51it/s] 26it [00:05, 4.52it/s] 27it [00:06, 4.54it/s] 28it [00:06, 4.52it/s] 29it [00:06, 4.55it/s] 30it [00:06, 4.55it/s] 31it [00:06, 4.57it/s] 32it [00:07, 4.56it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.54it/s] 36it [00:08, 4.56it/s] 37it [00:08, 4.42it/s] 38it [00:08, 4.47it/s] 39it [00:08, 4.51it/s] 40it [00:08, 4.51it/s] 41it [00:09, 4.38it/s] 42it [00:09, 4.44it/s] 43it [00:09, 4.45it/s] 44it [00:09, 4.48it/s] 45it [00:10, 4.50it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.53it/s] 48it [00:10, 4.55it/s] 49it [00:11, 4.42it/s] 50it [00:11, 4.46it/s]2025-05-26 01:25:57,892 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 3133.4580 | mean log_px -0.0073 | KL -2682.37 + 51it [00:11, 4.45it/s] 52it [00:11, 4.46it/s] 53it [00:11, 4.50it/s] 54it [00:12, 4.49it/s] 55it [00:12, 4.49it/s] 56it [00:12, 4.51it/s] 57it [00:12, 4.53it/s] 58it [00:13, 4.41it/s] 59it [00:13, 4.46it/s] 60it [00:13, 4.50it/s] 61it [00:13, 4.54it/s] 62it [00:13, 4.56it/s] 63it [00:14, 4.58it/s] 64it [00:14, 4.57it/s] 65it [00:14, 4.60it/s] 66it [00:14, 4.60it/s] 67it [00:15, 4.46it/s] 68it [00:15, 4.51it/s] 69it [00:15, 4.55it/s] 70it [00:15, 4.56it/s] 71it [00:15, 4.59it/s] 72it [00:16, 4.60it/s] 73it [00:16, 4.60it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.63it/s] 77it [00:17, 4.61it/s] 78it [00:17, 4.43it/s] 79it [00:17, 4.50it/s] 80it [00:17, 4.52it/s] 81it [00:18, 4.55it/s] 82it [00:18, 4.55it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.58it/s] 85it [00:18, 4.59it/s] 86it [00:19, 4.60it/s] 87it [00:19, 4.48it/s] 88it [00:19, 4.51it/s] 89it [00:19, 4.51it/s] 90it [00:20, 4.56it/s] 91it [00:20, 4.57it/s] 92it [00:20, 4.58it/s] 93it [00:20, 4.45it/s] 94it [00:20, 4.48it/s] 95it [00:21, 4.54it/s] 96it [00:21, 4.45it/s] 97it [00:21, 4.47it/s] 98it [00:21, 4.51it/s] 99it [00:22, 4.55it/s] 100it [00:22, 4.57it/s]2025-05-26 01:26:08,903 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 4312.6279 | mean log_px -0.0334 | KL -2658.71 + 101it [00:22, 4.58it/s] 102it [00:22, 4.59it/s] 103it [00:22, 4.55it/s] 104it [00:23, 4.59it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.58it/s] 107it [00:23, 4.59it/s] 108it [00:24, 4.47it/s] 109it [00:24, 4.51it/s] 110it [00:24, 4.55it/s] 111it [00:24, 4.51it/s] 112it [00:24, 4.50it/s] 113it [00:25, 4.52it/s] 114it [00:25, 4.52it/s] 115it [00:25, 4.55it/s] 116it [00:25, 4.58it/s] 117it [00:25, 4.54it/s] 118it [00:26, 4.54it/s] 119it [00:26, 4.55it/s] 120it [00:26, 4.42it/s] 121it [00:26, 4.48it/s] 122it [00:27, 4.52it/s] 123it [00:27, 4.55it/s] 124it [00:27, 4.57it/s] 125it [00:27, 4.59it/s] 126it [00:27, 4.57it/s] 127it [00:28, 4.58it/s] 128it [00:28, 4.59it/s] 129it [00:28, 4.58it/s] 130it [00:28, 4.59it/s] 131it [00:29, 4.45it/s] 132it [00:29, 4.51it/s] 133it [00:29, 4.54it/s] 134it [00:29, 4.56it/s] 135it [00:29, 4.59it/s] 136it [00:30, 4.59it/s] 137it [00:30, 4.60it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.60it/s] 140it [00:31, 4.60it/s] 141it [00:31, 4.61it/s] 142it [00:31, 4.58it/s] 143it [00:31, 4.59it/s] 144it [00:31, 4.59it/s] 145it [00:32, 4.57it/s] 146it [00:32, 4.46it/s] 147it [00:32, 4.53it/s] 148it [00:32, 4.54it/s] 149it [00:33, 4.55it/s] 150it [00:33, 4.56it/s]2025-05-26 01:26:19,891 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 3104.3960 | mean log_px -0.0096 | KL -2631.08 + 151it [00:33, 4.56it/s] 152it [00:33, 4.55it/s] 153it [00:33, 4.58it/s] 154it [00:34, 4.60it/s] 155it [00:34, 4.61it/s] 156it [00:34, 4.61it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.61it/s] 159it [00:35, 4.62it/s] 160it [00:35, 4.61it/s] 161it [00:35, 4.60it/s] 162it [00:35, 4.61it/s] 163it [00:36, 4.62it/s] 164it [00:36, 4.62it/s] 165it [00:36, 4.62it/s] 166it [00:36, 4.62it/s] 167it [00:36, 4.62it/s] 168it [00:37, 4.61it/s] 169it [00:37, 4.60it/s] 170it [00:37, 4.59it/s] 171it [00:37, 4.46it/s] 172it [00:38, 4.49it/s] 173it [00:38, 4.50it/s] 174it [00:38, 4.54it/s] 175it [00:38, 4.50it/s] 176it [00:38, 4.52it/s] 177it [00:39, 4.53it/s] 178it [00:39, 4.41it/s] 179it [00:39, 4.47it/s] 180it [00:39, 4.47it/s] 181it [00:40, 4.48it/s] 182it [00:40, 4.51it/s] 183it [00:40, 4.52it/s] 184it [00:40, 4.54it/s] 185it [00:40, 4.50it/s] 186it [00:41, 4.53it/s] 187it [00:41, 4.53it/s] 188it [00:41, 4.48it/s] 189it [00:41, 4.52it/s] 190it [00:42, 4.54it/s] 191it [00:42, 4.54it/s] 192it [00:42, 4.54it/s] 193it [00:42, 4.57it/s] 194it [00:42, 4.57it/s] 195it [00:43, 4.30it/s] 196it [00:43, 4.13it/s] 196it [00:43, 4.50it/s] +2025-05-26 01:26:30,003 - INFO - Epoch: 11, Objective: tensor([4247.3716], device='cuda:0', grad_fn=), Loss: 0.031174693256616592, KL/n: 53.34761047363281 + 0it [00:00, ?it/s]2025-05-26 01:26:30,412 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 3012.1206 | mean log_px -0.0057 | KL -2611.20 + 1it [00:00, 3.12it/s] 2it [00:00, 3.88it/s] 3it [00:00, 4.18it/s] 4it [00:00, 4.38it/s] 5it [00:01, 4.19it/s] 6it [00:01, 4.33it/s] 7it [00:01, 4.45it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.57it/s] 10it [00:02, 4.60it/s] 11it [00:02, 4.65it/s] 12it [00:02, 3.69it/s] 13it [00:03, 3.95it/s] 14it [00:03, 4.13it/s] 15it [00:03, 4.31it/s] 16it [00:03, 4.41it/s] 17it [00:03, 4.42it/s] 18it [00:04, 4.46it/s] 19it [00:04, 4.46it/s] 20it [00:04, 4.49it/s] 21it [00:04, 4.52it/s] 22it [00:05, 4.41it/s] 23it [00:05, 4.52it/s] 24it [00:05, 4.57it/s] 25it [00:05, 4.63it/s] 26it [00:05, 4.65it/s] 27it [00:06, 4.68it/s] 28it [00:06, 4.69it/s] 29it [00:06, 4.71it/s] 30it [00:06, 4.71it/s] 31it [00:06, 4.72it/s] 32it [00:07, 4.72it/s] 33it [00:07, 4.72it/s] 34it [00:07, 4.52it/s] 35it [00:07, 4.59it/s] 36it [00:08, 4.63it/s] 37it [00:08, 4.66it/s] 38it [00:08, 4.67it/s] 39it [00:08, 4.70it/s] 40it [00:08, 4.69it/s] 41it [00:09, 4.45it/s] 42it [00:09, 4.51it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.60it/s] 45it [00:10, 4.63it/s] 46it [00:10, 4.64it/s] 47it [00:10, 4.65it/s] 48it [00:10, 4.67it/s] 49it [00:10, 4.69it/s] 50it [00:11, 4.68it/s]2025-05-26 01:26:41,410 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 3992.2141 | mean log_px -0.0251 | KL -2592.65 + 51it [00:11, 4.71it/s] 52it [00:11, 4.54it/s] 53it [00:11, 4.60it/s] 54it [00:11, 4.61it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.66it/s] 57it [00:12, 4.68it/s] 58it [00:12, 4.64it/s] 59it [00:13, 4.68it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.60it/s] 62it [00:13, 4.64it/s] 63it [00:13, 4.67it/s] 64it [00:14, 4.68it/s] 65it [00:14, 4.70it/s] 66it [00:14, 4.68it/s] 67it [00:14, 4.71it/s] 68it [00:14, 4.72it/s] 69it [00:15, 4.72it/s] 70it [00:15, 4.71it/s] 71it [00:15, 4.55it/s] 72it [00:15, 4.62it/s] 73it [00:16, 4.65it/s] 74it [00:16, 4.63it/s] 75it [00:16, 4.68it/s] 76it [00:16, 4.69it/s] 77it [00:16, 4.71it/s] 78it [00:17, 4.70it/s] 79it [00:17, 4.71it/s] 80it [00:17, 4.71it/s] 81it [00:17, 4.72it/s] 82it [00:17, 4.72it/s] 83it [00:18, 4.73it/s] 84it [00:18, 4.72it/s] 85it [00:18, 4.72it/s] 86it [00:18, 4.71it/s] 87it [00:19, 4.69it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.58it/s] 90it [00:19, 4.63it/s] 91it [00:19, 4.66it/s] 92it [00:20, 4.66it/s] 93it [00:20, 4.51it/s] 94it [00:20, 4.58it/s] 95it [00:20, 4.60it/s] 96it [00:20, 4.65it/s] 97it [00:21, 4.68it/s] 98it [00:21, 4.69it/s] 99it [00:21, 4.70it/s] 100it [00:21, 4.70it/s]2025-05-26 01:26:52,141 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 7227.1890 | mean log_px -0.0753 | KL -2570.68 + 101it [00:22, 4.71it/s] 102it [00:22, 4.71it/s] 103it [00:22, 4.71it/s] 104it [00:22, 4.71it/s] 105it [00:22, 4.71it/s] 106it [00:23, 4.71it/s] 107it [00:23, 4.72it/s] 108it [00:23, 4.72it/s] 109it [00:23, 4.73it/s] 110it [00:23, 4.73it/s] 111it [00:24, 4.73it/s] 112it [00:24, 4.59it/s] 113it [00:24, 4.65it/s] 114it [00:24, 4.67it/s] 115it [00:25, 4.69it/s] 116it [00:25, 4.70it/s] 117it [00:25, 4.54it/s] 118it [00:25, 4.60it/s] 119it [00:25, 4.63it/s] 120it [00:26, 4.65it/s] 121it [00:26, 4.67it/s] 122it [00:26, 4.69it/s] 123it [00:26, 4.70it/s] 124it [00:26, 4.70it/s] 125it [00:27, 4.71it/s] 126it [00:27, 4.71it/s] 127it [00:27, 4.51it/s] 128it [00:27, 4.58it/s] 129it [00:28, 4.63it/s] 130it [00:28, 4.65it/s] 131it [00:28, 4.67it/s] 132it [00:28, 4.64it/s] 133it [00:28, 4.64it/s] 134it [00:29, 4.46it/s] 135it [00:29, 4.55it/s] 136it [00:29, 4.59it/s] 137it [00:29, 4.63it/s] 138it [00:30, 4.65it/s] 139it [00:30, 4.65it/s] 140it [00:30, 4.66it/s] 141it [00:30, 4.69it/s] 142it [00:30, 4.70it/s] 143it [00:31, 4.54it/s] 144it [00:31, 4.61it/s] 145it [00:31, 4.62it/s] 146it [00:31, 4.65it/s] 147it [00:31, 4.67it/s] 148it [00:32, 4.68it/s] 149it [00:32, 4.70it/s] 150it [00:32, 4.53it/s]2025-05-26 01:27:02,905 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 3201.9055 | mean log_px -0.0163 | KL -2551.84 + 151it [00:32, 4.60it/s] 152it [00:33, 4.63it/s] 153it [00:33, 4.67it/s] 154it [00:33, 4.69it/s] 155it [00:33, 4.54it/s] 156it [00:33, 4.60it/s] 157it [00:34, 4.64it/s] 158it [00:34, 4.66it/s] 159it [00:34, 4.68it/s] 160it [00:34, 4.68it/s] 161it [00:34, 4.69it/s] 162it [00:35, 4.70it/s] 163it [00:35, 4.71it/s] 164it [00:35, 4.57it/s] 165it [00:35, 4.64it/s] 166it [00:36, 4.66it/s] 167it [00:36, 4.52it/s] 168it [00:36, 4.59it/s] 169it [00:36, 4.63it/s] 170it [00:36, 4.65it/s] 171it [00:37, 4.68it/s] 172it [00:37, 4.68it/s] 173it [00:37, 4.70it/s] 174it [00:37, 4.70it/s] 175it [00:37, 4.72it/s] 176it [00:38, 4.55it/s] 177it [00:38, 4.62it/s] 178it [00:38, 4.65it/s] 179it [00:38, 4.67it/s] 180it [00:39, 4.69it/s] 181it [00:39, 4.70it/s] 182it [00:39, 4.54it/s] 183it [00:39, 4.61it/s] 184it [00:39, 4.64it/s] 185it [00:40, 4.67it/s] 186it [00:40, 4.54it/s] 187it [00:40, 4.51it/s] 188it [00:40, 4.55it/s] 189it [00:41, 4.59it/s] 190it [00:41, 4.62it/s] 191it [00:41, 4.64it/s] 192it [00:41, 4.49it/s] 193it [00:41, 4.57it/s] 194it [00:42, 4.59it/s] 195it [00:42, 4.40it/s] 196it [00:42, 4.46it/s] 196it [00:42, 4.60it/s] +2025-05-26 01:27:12,797 - INFO - Epoch: 12, Objective: tensor([2863.8979], device='cuda:0', grad_fn=), Loss: 0.006043643224984407, KL/n: 51.6978874206543 + 0it [00:00, ?it/s]2025-05-26 01:27:13,205 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 2755.2402 | mean log_px -0.0041 | KL -2532.30 + 1it [00:00, 2.79it/s] 2it [00:00, 3.65it/s] 3it [00:00, 4.07it/s] 4it [00:00, 4.31it/s] 5it [00:01, 4.46it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.28it/s] 8it [00:01, 4.42it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.39it/s] 11it [00:02, 4.33it/s] 12it [00:02, 4.27it/s] 13it [00:03, 4.40it/s] 14it [00:03, 4.49it/s] 15it [00:03, 4.35it/s] 16it [00:03, 4.40it/s] 17it [00:03, 4.42it/s] 18it [00:04, 4.47it/s] 19it [00:04, 4.55it/s] 20it [00:04, 4.58it/s] 21it [00:04, 4.46it/s] 22it [00:05, 4.37it/s] 23it [00:05, 4.41it/s] 24it [00:05, 4.40it/s] 25it [00:05, 4.50it/s] 26it [00:05, 4.56it/s] 27it [00:06, 4.28it/s] 28it [00:06, 4.24it/s] 29it [00:06, 4.40it/s] 30it [00:06, 4.49it/s] 31it [00:07, 4.40it/s] 32it [00:07, 4.38it/s] 33it [00:07, 4.30it/s] 34it [00:07, 4.43it/s] 35it [00:08, 4.49it/s] 36it [00:08, 4.55it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.31it/s] 39it [00:08, 4.44it/s] 40it [00:09, 4.50it/s] 41it [00:09, 4.57it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.47it/s] 45it [00:10, 4.57it/s] 46it [00:10, 4.60it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.47it/s] 49it [00:11, 4.31it/s] 50it [00:11, 4.42it/s]2025-05-26 01:27:24,428 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 2921.4778 | mean log_px -0.0094 | KL -2503.91 + 51it [00:11, 4.48it/s] 52it [00:11, 4.43it/s] 53it [00:12, 4.34it/s] 54it [00:12, 4.45it/s] 55it [00:12, 4.36it/s] 56it [00:12, 4.30it/s] 57it [00:12, 4.27it/s] 58it [00:13, 4.26it/s] 59it [00:13, 4.31it/s] 60it [00:13, 4.27it/s] 61it [00:13, 4.20it/s] 62it [00:14, 4.20it/s] 63it [00:14, 4.20it/s] 64it [00:14, 4.26it/s] 65it [00:14, 4.37it/s] 66it [00:15, 4.48it/s] 67it [00:15, 4.55it/s] 68it [00:15, 4.44it/s] 69it [00:15, 4.51it/s] 70it [00:15, 4.42it/s] 71it [00:16, 4.45it/s] 72it [00:16, 4.53it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.58it/s] 75it [00:17, 4.51it/s] 76it [00:17, 4.59it/s] 77it [00:17, 4.63it/s] 78it [00:17, 4.65it/s] 79it [00:17, 4.67it/s] 80it [00:18, 4.69it/s] 81it [00:18, 4.70it/s] 82it [00:18, 4.70it/s] 83it [00:18, 4.72it/s] 84it [00:18, 4.72it/s] 85it [00:19, 4.72it/s] 86it [00:19, 4.55it/s] 87it [00:19, 4.62it/s] 88it [00:19, 4.65it/s] 89it [00:20, 4.67it/s] 90it [00:20, 4.68it/s] 91it [00:20, 4.54it/s] 92it [00:20, 4.59it/s] 93it [00:20, 4.46it/s] 94it [00:21, 4.36it/s] 95it [00:21, 4.22it/s] 96it [00:21, 4.38it/s] 97it [00:21, 4.31it/s] 98it [00:22, 4.39it/s] 99it [00:22, 4.45it/s] 100it [00:22, 4.36it/s]2025-05-26 01:27:35,651 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 3051.0591 | mean log_px -0.0105 | KL -2480.72 + 101it [00:22, 4.30it/s] 102it [00:22, 4.39it/s] 103it [00:23, 4.48it/s] 104it [00:23, 4.53it/s] 105it [00:23, 4.58it/s] 106it [00:23, 4.62it/s] 107it [00:24, 4.48it/s] 108it [00:24, 4.35it/s] 109it [00:24, 4.32it/s] 110it [00:24, 4.18it/s] 111it [00:25, 4.32it/s] 112it [00:25, 4.27it/s] 113it [00:25, 4.28it/s] 114it [00:25, 4.25it/s] 115it [00:25, 4.38it/s] 116it [00:26, 4.31it/s] 117it [00:26, 4.27it/s] 118it [00:26, 4.37it/s] 119it [00:26, 4.15it/s] 120it [00:27, 4.18it/s] 121it [00:27, 4.26it/s] 122it [00:27, 4.23it/s] 123it [00:27, 4.29it/s] 124it [00:28, 4.10it/s] 125it [00:28, 4.21it/s] 126it [00:28, 4.33it/s] 127it [00:28, 4.31it/s] 128it [00:29, 4.28it/s] 129it [00:29, 4.22it/s] 130it [00:29, 4.18it/s] 131it [00:29, 4.33it/s] 132it [00:29, 4.28it/s] 133it [00:30, 4.37it/s] 134it [00:30, 4.44it/s] 135it [00:30, 4.53it/s] 136it [00:30, 4.51it/s] 137it [00:31, 4.57it/s] 138it [00:31, 4.61it/s] 139it [00:31, 4.48it/s] 140it [00:31, 4.56it/s] 141it [00:31, 4.61it/s] 142it [00:32, 4.64it/s] 143it [00:32, 4.67it/s] 144it [00:32, 4.68it/s] 145it [00:32, 4.64it/s] 146it [00:33, 4.51it/s] 147it [00:33, 4.39it/s] 148it [00:33, 4.32it/s] 149it [00:33, 4.45it/s] 150it [00:33, 4.52it/s]2025-05-26 01:27:47,032 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 2694.3430 | mean log_px -0.0060 | KL -2454.87 + 151it [00:34, 4.42it/s] 152it [00:34, 4.33it/s] 153it [00:34, 4.20it/s] 154it [00:34, 4.24it/s] 155it [00:35, 4.39it/s] 156it [00:35, 4.36it/s] 157it [00:35, 4.48it/s] 158it [00:35, 4.39it/s] 159it [00:36, 4.38it/s] 160it [00:36, 4.35it/s] 161it [00:36, 4.37it/s] 162it [00:36, 4.38it/s] 163it [00:36, 4.46it/s] 164it [00:37, 4.40it/s] 165it [00:37, 4.20it/s] 166it [00:37, 4.26it/s] 167it [00:37, 4.31it/s] 168it [00:38, 4.34it/s] 169it [00:38, 4.33it/s] 170it [00:38, 4.43it/s] 171it [00:38, 4.39it/s] 172it [00:38, 4.40it/s] 173it [00:39, 4.38it/s] 174it [00:39, 4.18it/s] 175it [00:39, 4.23it/s] 176it [00:39, 4.35it/s] 177it [00:40, 4.45it/s] 178it [00:40, 4.52it/s] 179it [00:40, 4.42it/s] 180it [00:40, 4.22it/s] 181it [00:41, 4.31it/s] 182it [00:41, 4.31it/s] 183it [00:41, 4.22it/s] 184it [00:41, 4.20it/s] 185it [00:42, 4.31it/s] 186it [00:42, 4.39it/s] 187it [00:42, 4.33it/s] 188it [00:42, 4.21it/s] 189it [00:42, 4.36it/s] 190it [00:43, 4.46it/s] 191it [00:43, 4.40it/s] 192it [00:43, 4.32it/s] 193it [00:43, 4.18it/s] 194it [00:44, 4.21it/s] 195it [00:44, 4.28it/s] 196it [00:44, 4.28it/s] 196it [00:44, 4.39it/s] +2025-05-26 01:27:57,574 - INFO - Epoch: 13, Objective: tensor([4922.8945], device='cuda:0', grad_fn=), Loss: 0.041003212332725525, KL/n: 49.89161682128906 + 0it [00:00, ?it/s]2025-05-26 01:27:58,149 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 2859.6846 | mean log_px -0.0121 | KL -2441.73 + 1it [00:00, 3.10it/s] 2it [00:00, 3.85it/s] 3it [00:00, 4.02it/s] 4it [00:00, 4.25it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.51it/s] 8it [00:01, 4.54it/s] 9it [00:02, 4.43it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.58it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.63it/s] 15it [00:03, 4.49it/s] 16it [00:03, 4.54it/s] 17it [00:03, 4.42it/s] 18it [00:04, 4.49it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.59it/s] 22it [00:04, 4.58it/s] 23it [00:05, 4.43it/s] 24it [00:05, 4.48it/s] 25it [00:05, 4.50it/s] 26it [00:05, 4.40it/s] 27it [00:06, 4.46it/s] 28it [00:06, 4.51it/s] 29it [00:06, 4.53it/s] 30it [00:06, 4.53it/s] 31it [00:06, 4.54it/s] 32it [00:07, 4.54it/s] 33it [00:07, 4.43it/s] 34it [00:07, 4.50it/s] 35it [00:07, 4.40it/s] 36it [00:08, 4.47it/s] 37it [00:08, 4.52it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.59it/s] 40it [00:08, 4.59it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.44it/s] 43it [00:09, 4.51it/s] 44it [00:09, 4.54it/s] 45it [00:10, 4.57it/s] 46it [00:10, 4.59it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.48it/s] 50it [00:11, 4.53it/s]2025-05-26 01:28:09,185 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 3013.0603 | mean log_px -0.0122 | KL -2423.46 + 51it [00:11, 4.55it/s] 52it [00:11, 4.56it/s] 53it [00:11, 4.59it/s] 54it [00:12, 4.60it/s] 55it [00:12, 4.47it/s] 56it [00:12, 4.51it/s] 57it [00:12, 4.54it/s] 58it [00:12, 4.56it/s] 59it [00:13, 4.44it/s] 60it [00:13, 4.47it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.55it/s] 63it [00:14, 4.58it/s] 64it [00:14, 4.59it/s] 65it [00:14, 4.50it/s] 66it [00:14, 4.55it/s] 67it [00:14, 4.56it/s] 68it [00:15, 4.44it/s] 69it [00:15, 4.51it/s] 70it [00:15, 4.46it/s] 71it [00:15, 4.46it/s] 72it [00:16, 4.51it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.55it/s] 75it [00:16, 4.43it/s] 76it [00:16, 4.49it/s] 77it [00:17, 4.53it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.60it/s] 81it [00:17, 4.61it/s] 82it [00:18, 4.60it/s] 83it [00:18, 4.61it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.60it/s] 86it [00:19, 4.61it/s] 87it [00:19, 4.48it/s] 88it [00:19, 4.53it/s] 89it [00:19, 4.56it/s] 90it [00:19, 4.57it/s] 91it [00:20, 4.59it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.46it/s] 94it [00:20, 4.51it/s] 95it [00:21, 4.52it/s] 96it [00:21, 4.54it/s] 97it [00:21, 4.58it/s] 98it [00:21, 4.58it/s] 99it [00:21, 4.58it/s] 100it [00:22, 4.45it/s]2025-05-26 01:28:20,213 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 3804.5000 | mean log_px -0.0205 | KL -2399.92 + 101it [00:22, 4.50it/s] 102it [00:22, 4.52it/s] 103it [00:22, 4.52it/s] 104it [00:23, 4.36it/s] 105it [00:23, 4.46it/s] 106it [00:23, 4.50it/s] 107it [00:23, 4.54it/s] 108it [00:23, 4.55it/s] 109it [00:24, 4.56it/s] 110it [00:24, 4.45it/s] 111it [00:24, 4.52it/s] 112it [00:24, 4.55it/s] 113it [00:25, 4.54it/s] 114it [00:25, 4.57it/s] 115it [00:25, 4.58it/s] 116it [00:25, 4.45it/s] 117it [00:25, 4.51it/s] 118it [00:26, 4.56it/s] 119it [00:26, 4.58it/s] 120it [00:26, 4.59it/s] 121it [00:26, 4.62it/s] 122it [00:27, 4.48it/s] 123it [00:27, 4.53it/s] 124it [00:27, 4.50it/s] 125it [00:27, 4.55it/s] 126it [00:27, 4.44it/s] 127it [00:28, 4.49it/s] 128it [00:28, 4.52it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.55it/s] 131it [00:29, 4.55it/s] 132it [00:29, 4.55it/s] 133it [00:29, 4.57it/s] 134it [00:29, 4.57it/s] 135it [00:29, 4.58it/s] 136it [00:30, 4.59it/s] 137it [00:30, 4.56it/s] 138it [00:30, 4.42it/s] 139it [00:30, 4.49it/s] 140it [00:30, 4.52it/s] 141it [00:31, 4.55it/s] 142it [00:31, 4.56it/s] 143it [00:31, 4.54it/s] 144it [00:31, 4.58it/s] 145it [00:32, 4.58it/s] 146it [00:32, 4.57it/s] 147it [00:32, 4.44it/s] 148it [00:32, 4.48it/s] 149it [00:32, 4.52it/s] 150it [00:33, 4.53it/s]2025-05-26 01:28:31,249 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 3109.0154 | mean log_px -0.0184 | KL -2386.44 + 151it [00:33, 4.54it/s] 152it [00:33, 4.56it/s] 153it [00:33, 4.56it/s] 154it [00:34, 4.40it/s] 155it [00:34, 4.42it/s] 156it [00:34, 4.46it/s] 157it [00:34, 4.51it/s] 158it [00:34, 4.47it/s] 159it [00:35, 4.52it/s] 160it [00:35, 4.55it/s] 161it [00:35, 4.57it/s] 162it [00:35, 4.58it/s] 163it [00:36, 4.59it/s] 164it [00:36, 4.60it/s] 165it [00:36, 4.62it/s] 166it [00:36, 4.59it/s] 167it [00:36, 4.44it/s] 168it [00:37, 4.46it/s] 169it [00:37, 4.46it/s] 170it [00:37, 4.47it/s] 171it [00:37, 4.52it/s] 172it [00:38, 4.54it/s] 173it [00:38, 4.55it/s] 174it [00:38, 4.56it/s] 175it [00:38, 4.56it/s] 176it [00:38, 4.59it/s] 177it [00:39, 4.61it/s] 178it [00:39, 4.56it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.58it/s] 181it [00:40, 4.60it/s] 182it [00:40, 4.57it/s] 183it [00:40, 4.59it/s] 184it [00:40, 4.57it/s] 185it [00:40, 4.60it/s] 186it [00:41, 4.59it/s] 187it [00:41, 4.60it/s] 188it [00:41, 4.60it/s] 189it [00:41, 4.62it/s] 190it [00:41, 4.61it/s] 191it [00:42, 4.63it/s] 192it [00:42, 4.64it/s] 193it [00:42, 4.64it/s] 194it [00:42, 4.63it/s] 195it [00:43, 4.42it/s] 196it [00:43, 4.51it/s] 196it [00:43, 4.52it/s] +2025-05-26 01:28:41,271 - INFO - Epoch: 14, Objective: tensor([2733.1536], device='cuda:0', grad_fn=), Loss: 0.013086755760014057, KL/n: 48.29157638549805 + 0it [00:00, ?it/s]2025-05-26 01:28:41,680 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 3566.3582 | mean log_px -0.0216 | KL -2368.83 + 1it [00:00, 2.94it/s] 2it [00:00, 3.69it/s] 3it [00:00, 4.05it/s] 4it [00:01, 4.23it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.34it/s] 8it [00:02, 3.51it/s] 9it [00:02, 3.80it/s] 10it [00:02, 4.03it/s] 11it [00:02, 4.20it/s] 12it [00:02, 4.32it/s] 13it [00:03, 4.42it/s] 14it [00:03, 4.37it/s] 15it [00:03, 4.38it/s] 16it [00:03, 4.48it/s] 17it [00:04, 4.54it/s] 18it [00:04, 4.57it/s] 19it [00:04, 4.61it/s] 20it [00:04, 4.46it/s] 21it [00:04, 4.53it/s] 22it [00:05, 4.52it/s] 23it [00:05, 4.56it/s] 24it [00:05, 4.58it/s] 25it [00:05, 4.61it/s] 26it [00:06, 4.47it/s] 27it [00:06, 4.54it/s] 28it [00:06, 4.57it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.61it/s] 31it [00:07, 4.62it/s] 32it [00:07, 4.63it/s] 33it [00:07, 4.64it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.65it/s] 36it [00:08, 4.63it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.44it/s] 39it [00:08, 4.51it/s] 40it [00:09, 4.49it/s] 41it [00:09, 4.40it/s] 42it [00:09, 4.49it/s] 43it [00:09, 4.55it/s] 44it [00:09, 4.42it/s] 45it [00:10, 4.51it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.63it/s] 49it [00:11, 4.64it/s] 50it [00:11, 4.64it/s]2025-05-26 01:28:52,829 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 2586.0901 | mean log_px -0.0101 | KL -2342.14 + 51it [00:11, 4.63it/s] 52it [00:11, 4.62it/s] 53it [00:11, 4.49it/s] 54it [00:12, 4.54it/s] 55it [00:12, 4.57it/s] 56it [00:12, 4.59it/s] 57it [00:12, 4.62it/s] 58it [00:13, 4.63it/s] 59it [00:13, 4.49it/s] 60it [00:13, 4.48it/s] 61it [00:13, 4.50it/s] 62it [00:13, 4.53it/s] 63it [00:14, 4.55it/s] 64it [00:14, 4.56it/s] 65it [00:14, 4.58it/s] 66it [00:14, 4.58it/s] 67it [00:15, 4.48it/s] 68it [00:15, 4.52it/s] 69it [00:15, 4.42it/s] 70it [00:15, 4.50it/s] 71it [00:15, 4.54it/s] 72it [00:16, 4.58it/s] 73it [00:16, 4.60it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.63it/s] 76it [00:16, 4.64it/s] 77it [00:17, 4.49it/s] 78it [00:17, 4.52it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.58it/s] 81it [00:18, 4.60it/s] 82it [00:18, 4.61it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.49it/s] 86it [00:19, 4.55it/s] 87it [00:19, 4.57it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.60it/s] 90it [00:20, 4.60it/s] 91it [00:20, 4.62it/s] 92it [00:20, 4.62it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.64it/s] 95it [00:21, 4.49it/s] 96it [00:21, 4.54it/s] 97it [00:21, 4.57it/s] 98it [00:21, 4.59it/s] 99it [00:21, 4.61it/s] 100it [00:22, 4.61it/s]2025-05-26 01:29:03,777 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 2982.4482 | mean log_px -0.0107 | KL -2318.40 + 101it [00:22, 4.62it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.62it/s] 104it [00:23, 4.62it/s] 105it [00:23, 4.48it/s] 106it [00:23, 4.55it/s] 107it [00:23, 4.59it/s] 108it [00:23, 4.62it/s] 109it [00:24, 4.63it/s] 110it [00:24, 4.51it/s] 111it [00:24, 4.55it/s] 112it [00:24, 4.59it/s] 113it [00:25, 4.55it/s] 114it [00:25, 4.60it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.64it/s] 117it [00:25, 4.66it/s] 118it [00:26, 4.67it/s] 119it [00:26, 4.68it/s] 120it [00:26, 4.69it/s] 121it [00:26, 4.69it/s] 122it [00:27, 4.53it/s] 123it [00:27, 4.60it/s] 124it [00:27, 4.62it/s] 125it [00:27, 4.65it/s] 126it [00:27, 4.66it/s] 127it [00:28, 4.68it/s] 128it [00:28, 4.68it/s] 129it [00:28, 4.69it/s] 130it [00:28, 4.69it/s] 131it [00:28, 4.69it/s] 132it [00:29, 4.69it/s] 133it [00:29, 4.52it/s] 134it [00:29, 4.54it/s] 135it [00:29, 4.59it/s] 136it [00:30, 4.60it/s] 137it [00:30, 4.62it/s] 138it [00:30, 4.63it/s] 139it [00:30, 4.63it/s] 140it [00:30, 4.49it/s] 141it [00:31, 4.55it/s] 142it [00:31, 4.56it/s] 143it [00:31, 4.57it/s] 144it [00:31, 4.56it/s] 145it [00:31, 4.59it/s] 146it [00:32, 4.62it/s] 147it [00:32, 4.48it/s] 148it [00:32, 4.52it/s] 149it [00:32, 4.57it/s] 150it [00:33, 4.61it/s]2025-05-26 01:29:14,641 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 3421.2581 | mean log_px -0.0186 | KL -2299.48 + 151it [00:33, 4.63it/s] 152it [00:33, 4.65it/s] 153it [00:33, 4.67it/s] 154it [00:33, 4.67it/s] 155it [00:34, 4.68it/s] 156it [00:34, 4.68it/s] 157it [00:34, 4.69it/s] 158it [00:34, 4.69it/s] 159it [00:35, 4.46it/s] 160it [00:35, 4.53it/s] 161it [00:35, 4.58it/s] 162it [00:35, 4.61it/s] 163it [00:35, 4.65it/s] 164it [00:36, 4.65it/s] 165it [00:36, 4.67it/s] 166it [00:36, 4.61it/s] 167it [00:36, 4.64it/s] 168it [00:36, 4.51it/s] 169it [00:37, 4.58it/s] 170it [00:37, 4.62it/s] 171it [00:37, 4.65it/s] 172it [00:37, 4.66it/s] 173it [00:38, 4.67it/s] 174it [00:38, 4.64it/s] 175it [00:38, 4.66it/s] 176it [00:38, 4.67it/s] 177it [00:38, 4.68it/s] 178it [00:39, 4.68it/s] 179it [00:39, 4.69it/s] 180it [00:39, 4.49it/s] 181it [00:39, 4.49it/s] 182it [00:40, 4.38it/s] 183it [00:40, 4.43it/s] 184it [00:40, 4.46it/s] 185it [00:40, 4.49it/s] 186it [00:40, 4.55it/s] 187it [00:41, 4.59it/s] 188it [00:41, 4.61it/s] 189it [00:41, 4.64it/s] 190it [00:41, 4.48it/s] 191it [00:42, 4.51it/s] 192it [00:42, 4.55it/s] 193it [00:42, 4.59it/s] 194it [00:42, 4.60it/s] 195it [00:42, 4.49it/s] 196it [00:43, 4.37it/s] 196it [00:43, 4.54it/s] +2025-05-26 01:29:24,600 - INFO - Epoch: 15, Objective: tensor([2673.8301], device='cuda:0', grad_fn=), Loss: 0.006941231433302164, KL/n: 46.54920196533203 + 0it [00:00, ?it/s]2025-05-26 01:29:25,038 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 2568.5730 | mean log_px -0.0058 | KL -2277.45 + 1it [00:00, 2.80it/s] 2it [00:00, 3.66it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.22it/s] 5it [00:01, 4.21it/s] 6it [00:01, 4.34it/s] 7it [00:01, 4.43it/s] 8it [00:01, 4.48it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.59it/s] 15it [00:03, 4.58it/s] 16it [00:03, 4.46it/s] 17it [00:03, 4.51it/s] 18it [00:04, 4.53it/s] 19it [00:04, 4.57it/s] 20it [00:04, 4.45it/s] 21it [00:04, 4.48it/s] 22it [00:04, 4.50it/s] 23it [00:05, 4.40it/s] 24it [00:05, 4.46it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.53it/s] 27it [00:06, 4.59it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.67it/s] 32it [00:07, 4.67it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.53it/s] 35it [00:07, 4.59it/s] 36it [00:08, 4.61it/s] 37it [00:08, 4.65it/s] 38it [00:08, 4.66it/s] 39it [00:08, 4.67it/s] 40it [00:08, 4.49it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.58it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.60it/s] 45it [00:09, 4.64it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.61it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.64it/s] 50it [00:11, 4.66it/s]2025-05-26 01:29:35,961 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 2469.5354 | mean log_px -0.0050 | KL -2246.70 + 51it [00:11, 4.51it/s] 52it [00:11, 4.57it/s] 53it [00:11, 4.61it/s] 54it [00:11, 4.62it/s] 55it [00:12, 4.65it/s] 56it [00:12, 4.64it/s] 57it [00:12, 4.66it/s] 58it [00:12, 4.63it/s] 59it [00:13, 4.60it/s] 60it [00:13, 4.63it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.50it/s] 63it [00:13, 4.55it/s] 64it [00:14, 4.57it/s] 65it [00:14, 4.58it/s] 66it [00:14, 4.58it/s] 67it [00:14, 4.51it/s] 68it [00:15, 4.55it/s] 69it [00:15, 4.55it/s] 70it [00:15, 4.55it/s] 71it [00:15, 4.40it/s] 72it [00:15, 4.43it/s] 73it [00:16, 4.50it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.63it/s] 77it [00:16, 4.66it/s] 78it [00:17, 4.50it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.62it/s] 81it [00:17, 4.65it/s] 82it [00:18, 4.66it/s] 83it [00:18, 4.68it/s] 84it [00:18, 4.68it/s] 85it [00:18, 4.70it/s] 86it [00:18, 4.71it/s] 87it [00:19, 4.54it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.63it/s] 92it [00:20, 4.65it/s] 93it [00:20, 4.67it/s] 94it [00:20, 4.68it/s] 95it [00:20, 4.52it/s] 96it [00:21, 4.58it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.64it/s] 99it [00:21, 4.66it/s] 100it [00:21, 4.68it/s]2025-05-26 01:29:46,830 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 2823.7253 | mean log_px -0.0109 | KL -2227.54 + 101it [00:22, 4.53it/s] 102it [00:22, 4.59it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.64it/s] 105it [00:23, 4.59it/s] 106it [00:23, 4.53it/s] 107it [00:23, 4.44it/s] 108it [00:23, 4.52it/s] 109it [00:23, 4.57it/s] 110it [00:24, 4.63it/s] 111it [00:24, 4.63it/s] 112it [00:24, 4.67it/s] 113it [00:24, 4.69it/s] 114it [00:24, 4.69it/s] 115it [00:25, 4.71it/s] 116it [00:25, 4.71it/s] 117it [00:25, 4.53it/s] 118it [00:25, 4.59it/s] 119it [00:26, 4.48it/s] 120it [00:26, 4.55it/s] 121it [00:26, 4.61it/s] 122it [00:26, 4.62it/s] 123it [00:26, 4.67it/s] 124it [00:27, 4.69it/s] 125it [00:27, 4.55it/s] 126it [00:27, 4.59it/s] 127it [00:27, 4.47it/s] 128it [00:28, 4.56it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.64it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.67it/s] 133it [00:29, 4.66it/s] 134it [00:29, 4.67it/s] 135it [00:29, 4.68it/s] 136it [00:29, 4.52it/s] 137it [00:29, 4.59it/s] 138it [00:30, 4.61it/s] 139it [00:30, 4.63it/s] 140it [00:30, 4.58it/s] 141it [00:30, 4.60it/s] 142it [00:31, 4.47it/s] 143it [00:31, 4.51it/s] 144it [00:31, 4.53it/s] 145it [00:31, 4.56it/s] 146it [00:31, 4.59it/s] 147it [00:32, 4.46it/s] 148it [00:32, 4.53it/s] 149it [00:32, 4.56it/s] 150it [00:32, 4.58it/s]2025-05-26 01:29:57,732 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 2373.7930 | mean log_px -0.0035 | KL -2207.88 + 151it [00:33, 4.58it/s] 152it [00:33, 4.62it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.50it/s] 155it [00:33, 4.55it/s] 156it [00:34, 4.57it/s] 157it [00:34, 4.60it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.64it/s] 160it [00:34, 4.65it/s] 161it [00:35, 4.66it/s] 162it [00:35, 4.51it/s] 163it [00:35, 4.57it/s] 164it [00:35, 4.59it/s] 165it [00:36, 4.61it/s] 166it [00:36, 4.63it/s] 167it [00:36, 4.61it/s] 168it [00:36, 4.53it/s] 169it [00:36, 4.43it/s] 170it [00:37, 4.51it/s] 171it [00:37, 4.48it/s] 172it [00:37, 4.52it/s] 173it [00:37, 4.56it/s] 174it [00:38, 4.57it/s] 175it [00:38, 4.43it/s] 176it [00:38, 4.45it/s] 177it [00:38, 4.46it/s] 178it [00:38, 4.51it/s] 179it [00:39, 4.55it/s] 180it [00:39, 4.56it/s] 181it [00:39, 4.60it/s] 182it [00:39, 4.45it/s] 183it [00:40, 4.52it/s] 184it [00:40, 4.54it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.60it/s] 187it [00:40, 4.62it/s] 188it [00:41, 4.47it/s] 189it [00:41, 4.54it/s] 190it [00:41, 4.55it/s] 191it [00:41, 4.59it/s] 192it [00:42, 4.60it/s] 193it [00:42, 4.61it/s] 194it [00:42, 4.47it/s] 195it [00:42, 4.42it/s] 196it [00:42, 4.43it/s] 196it [00:43, 4.56it/s] +2025-05-26 01:30:07,756 - INFO - Epoch: 16, Objective: tensor([2848.4922], device='cuda:0', grad_fn=), Loss: 0.02026955410838127, KL/n: 44.883338928222656 + 0it [00:00, ?it/s]2025-05-26 01:30:08,312 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 2439.9866 | mean log_px -0.0047 | KL -2197.12 + 1it [00:00, 3.34it/s] 2it [00:00, 4.02it/s] 3it [00:00, 4.30it/s] 4it [00:00, 4.43it/s] 5it [00:01, 4.51it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.43it/s] 8it [00:01, 4.49it/s] 9it [00:02, 4.55it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.61it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.47it/s] 14it [00:03, 4.52it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.46it/s] 18it [00:04, 4.51it/s] 19it [00:04, 4.57it/s] 20it [00:04, 4.59it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.64it/s] 23it [00:05, 4.50it/s] 24it [00:05, 4.55it/s] 25it [00:05, 4.59it/s] 26it [00:05, 4.61it/s] 27it [00:05, 4.63it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.51it/s] 30it [00:06, 4.55it/s] 31it [00:06, 4.55it/s] 32it [00:07, 4.58it/s] 33it [00:07, 4.62it/s] 34it [00:07, 4.47it/s] 35it [00:07, 4.54it/s] 36it [00:07, 4.57it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.63it/s] 39it [00:08, 4.64it/s] 40it [00:08, 4.49it/s] 41it [00:09, 4.53it/s] 42it [00:09, 4.57it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.61it/s] 45it [00:09, 4.62it/s] 46it [00:10, 4.49it/s] 47it [00:10, 4.55it/s] 48it [00:10, 4.57it/s] 49it [00:10, 4.61it/s] 50it [00:11, 4.46it/s]2025-05-26 01:30:19,268 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 3817.5354 | mean log_px -0.0287 | KL -2182.09 + 51it [00:11, 4.44it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.56it/s] 54it [00:11, 4.59it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.52it/s] 57it [00:12, 4.56it/s] 58it [00:12, 4.59it/s] 59it [00:12, 4.60it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.57it/s] 63it [00:13, 4.60it/s] 64it [00:14, 4.62it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.48it/s] 68it [00:14, 4.53it/s] 69it [00:15, 4.58it/s] 70it [00:15, 4.60it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.61it/s] 73it [00:16, 4.47it/s] 74it [00:16, 4.53it/s] 75it [00:16, 4.56it/s] 76it [00:16, 4.58it/s] 77it [00:16, 4.58it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.59it/s] 80it [00:17, 4.44it/s] 81it [00:17, 4.50it/s] 82it [00:18, 4.55it/s] 83it [00:18, 4.55it/s] 84it [00:18, 4.58it/s] 85it [00:18, 4.60it/s] 86it [00:18, 4.61it/s] 87it [00:19, 4.49it/s] 88it [00:19, 4.54it/s] 89it [00:19, 4.57it/s] 90it [00:19, 4.59it/s] 91it [00:19, 4.63it/s] 92it [00:20, 4.61it/s] 93it [00:20, 4.52it/s] 94it [00:20, 4.57it/s] 95it [00:20, 4.59it/s] 96it [00:21, 4.60it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.48it/s] 99it [00:21, 4.54it/s] 100it [00:21, 4.58it/s]2025-05-26 01:30:30,196 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 2449.2668 | mean log_px -0.0059 | KL -2174.15 + 101it [00:22, 4.59it/s] 102it [00:22, 4.62it/s] 103it [00:22, 4.49it/s] 104it [00:22, 4.54it/s] 105it [00:23, 4.58it/s] 106it [00:23, 4.58it/s] 107it [00:23, 4.60it/s] 108it [00:23, 4.49it/s] 109it [00:23, 4.54it/s] 110it [00:24, 4.56it/s] 111it [00:24, 4.60it/s] 112it [00:24, 4.61it/s] 113it [00:24, 4.62it/s] 114it [00:25, 4.48it/s] 115it [00:25, 4.54it/s] 116it [00:25, 4.57it/s] 117it [00:25, 4.60it/s] 118it [00:25, 4.62it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.53it/s] 121it [00:26, 4.53it/s] 122it [00:26, 4.56it/s] 123it [00:27, 4.60it/s] 124it [00:27, 4.62it/s] 125it [00:27, 4.50it/s] 126it [00:27, 4.54it/s] 127it [00:27, 4.57it/s] 128it [00:28, 4.59it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.62it/s] 131it [00:28, 4.49it/s] 132it [00:28, 4.53it/s] 133it [00:29, 4.58it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.63it/s] 136it [00:29, 4.60it/s] 137it [00:30, 4.47it/s] 138it [00:30, 4.52it/s] 139it [00:30, 4.57it/s] 140it [00:30, 4.58it/s] 141it [00:30, 4.61it/s] 142it [00:31, 4.63it/s] 143it [00:31, 4.49it/s] 144it [00:31, 4.55it/s] 145it [00:31, 4.57it/s] 146it [00:32, 4.59it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.47it/s] 150it [00:32, 4.53it/s]2025-05-26 01:30:41,151 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 2379.8494 | mean log_px -0.0040 | KL -2152.76 + 151it [00:33, 4.55it/s] 152it [00:33, 4.57it/s] 153it [00:33, 4.61it/s] 154it [00:33, 4.60it/s] 155it [00:34, 4.61it/s] 156it [00:34, 4.47it/s] 157it [00:34, 4.52it/s] 158it [00:34, 4.53it/s] 159it [00:34, 4.58it/s] 160it [00:35, 4.61it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.50it/s] 163it [00:35, 4.57it/s] 164it [00:35, 4.60it/s] 165it [00:36, 4.62it/s] 166it [00:36, 4.65it/s] 167it [00:36, 4.66it/s] 168it [00:36, 4.67it/s] 169it [00:37, 4.68it/s] 170it [00:37, 4.68it/s] 171it [00:37, 4.52it/s] 172it [00:37, 4.58it/s] 173it [00:37, 4.61it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.65it/s] 176it [00:38, 4.65it/s] 177it [00:38, 4.67it/s] 178it [00:38, 4.67it/s] 179it [00:39, 4.68it/s] 180it [00:39, 4.53it/s] 181it [00:39, 4.59it/s] 182it [00:39, 4.62it/s] 183it [00:40, 4.65it/s] 184it [00:40, 4.66it/s] 185it [00:40, 4.66it/s] 186it [00:40, 4.50it/s] 187it [00:40, 4.56it/s] 188it [00:41, 4.45it/s] 189it [00:41, 4.52it/s] 190it [00:41, 4.54it/s] 191it [00:41, 4.56it/s] 192it [00:42, 4.59it/s] 193it [00:42, 4.61it/s] 194it [00:42, 4.40it/s] 195it [00:42, 4.08it/s] 196it [00:43, 4.22it/s] 196it [00:43, 4.55it/s] +2025-05-26 01:30:51,179 - INFO - Epoch: 17, Objective: tensor([2270.9153], device='cuda:0', grad_fn=), Loss: 0.004182320553809404, KL/n: 43.6452751159668 + 0it [00:00, ?it/s]2025-05-26 01:30:51,585 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 2706.3704 | mean log_px -0.0173 | KL -2135.82 + 1it [00:00, 2.98it/s] 2it [00:00, 3.72it/s] 3it [00:00, 4.05it/s] 4it [00:01, 4.21it/s] 5it [00:01, 4.29it/s] 6it [00:01, 4.23it/s] 7it [00:01, 4.39it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.58it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.63it/s] 14it [00:03, 4.57it/s] 15it [00:03, 4.42it/s] 16it [00:03, 4.46it/s] 17it [00:03, 4.52it/s] 18it [00:04, 4.48it/s] 19it [00:04, 4.53it/s] 20it [00:04, 4.49it/s] 21it [00:04, 4.47it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.36it/s] 24it [00:05, 4.43it/s] 25it [00:05, 4.44it/s] 26it [00:05, 4.47it/s] 27it [00:06, 4.49it/s] 28it [00:06, 4.53it/s] 29it [00:06, 4.35it/s] 30it [00:06, 4.43it/s] 31it [00:07, 4.50it/s] 32it [00:07, 4.53it/s] 33it [00:07, 4.57it/s] 34it [00:07, 4.58it/s] 35it [00:07, 4.59it/s] 36it [00:08, 4.58it/s] 37it [00:08, 4.54it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.42it/s] 40it [00:09, 4.43it/s] 41it [00:09, 4.50it/s] 42it [00:09, 4.42it/s] 43it [00:09, 4.48it/s] 44it [00:09, 4.45it/s] 45it [00:10, 4.30it/s] 46it [00:10, 4.41it/s] 47it [00:10, 4.43it/s] 48it [00:10, 4.48it/s] 49it [00:11, 4.54it/s] 50it [00:11, 4.55it/s]2025-05-26 01:31:02,718 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 2571.1865 | mean log_px -0.0093 | KL -2121.10 + 51it [00:11, 4.43it/s] 52it [00:11, 4.43it/s] 53it [00:11, 4.50it/s] 54it [00:12, 4.54it/s] 55it [00:12, 4.55it/s] 56it [00:12, 4.57it/s] 57it [00:12, 4.31it/s] 58it [00:13, 4.36it/s] 59it [00:13, 4.38it/s] 60it [00:13, 4.41it/s] 61it [00:13, 4.48it/s] 62it [00:13, 4.53it/s] 63it [00:14, 4.43it/s] 64it [00:14, 4.50it/s] 65it [00:14, 4.54it/s] 66it [00:14, 4.56it/s] 67it [00:15, 4.58it/s] 68it [00:15, 4.59it/s] 69it [00:15, 4.53it/s] 70it [00:15, 4.40it/s] 71it [00:15, 4.48it/s] 72it [00:16, 4.51it/s] 73it [00:16, 4.51it/s] 74it [00:16, 4.54it/s] 75it [00:16, 4.58it/s] 76it [00:17, 4.53it/s] 77it [00:17, 4.36it/s] 78it [00:17, 3.55it/s] 79it [00:17, 3.82it/s] 80it [00:18, 4.05it/s] 81it [00:18, 4.20it/s] 82it [00:18, 4.33it/s] 83it [00:18, 4.37it/s] 84it [00:19, 4.28it/s] 85it [00:19, 4.33it/s] 86it [00:19, 4.41it/s] 87it [00:19, 4.47it/s] 88it [00:19, 4.51it/s] 89it [00:20, 4.55it/s] 90it [00:20, 4.53it/s] 91it [00:20, 4.50it/s] 92it [00:20, 4.32it/s] 93it [00:21, 4.41it/s] 94it [00:21, 4.48it/s] 95it [00:21, 4.43it/s] 96it [00:21, 4.49it/s] 97it [00:21, 4.52it/s] 98it [00:22, 4.55it/s] 99it [00:22, 4.38it/s] 100it [00:22, 4.47it/s]2025-05-26 01:31:14,056 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 2327.6116 | mean log_px -0.0041 | KL -2106.47 + 101it [00:22, 4.53it/s] 102it [00:23, 4.55it/s] 103it [00:23, 4.59it/s] 104it [00:23, 4.60it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.44it/s] 107it [00:24, 4.52it/s] 108it [00:24, 4.56it/s] 109it [00:24, 4.55it/s] 110it [00:24, 4.55it/s] 111it [00:24, 4.57it/s] 112it [00:25, 4.60it/s] 113it [00:25, 4.48it/s] 114it [00:25, 4.53it/s] 115it [00:25, 4.57it/s] 116it [00:26, 4.60it/s] 117it [00:26, 4.62it/s] 118it [00:26, 4.63it/s] 119it [00:26, 4.65it/s] 120it [00:26, 4.50it/s] 121it [00:27, 4.55it/s] 122it [00:27, 4.51it/s] 123it [00:27, 4.57it/s] 124it [00:27, 4.56it/s] 125it [00:28, 4.54it/s] 126it [00:28, 4.59it/s] 127it [00:28, 4.46it/s] 128it [00:28, 4.52it/s] 129it [00:28, 4.56it/s] 130it [00:29, 4.58it/s] 131it [00:29, 4.47it/s] 132it [00:29, 4.47it/s] 133it [00:29, 4.53it/s] 134it [00:30, 4.42it/s] 135it [00:30, 4.50it/s] 136it [00:30, 4.51it/s] 137it [00:30, 4.46it/s] 138it [00:30, 4.44it/s] 139it [00:31, 4.49it/s] 140it [00:31, 4.39it/s] 141it [00:31, 4.43it/s] 142it [00:31, 4.48it/s] 143it [00:32, 4.51it/s] 144it [00:32, 4.46it/s] 145it [00:32, 4.54it/s] 146it [00:32, 4.52it/s] 147it [00:32, 4.47it/s] 148it [00:33, 4.38it/s] 149it [00:33, 4.42it/s] 150it [00:33, 4.43it/s]2025-05-26 01:31:25,128 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 3520.7913 | mean log_px -0.0254 | KL -2092.53 + 151it [00:33, 4.47it/s] 152it [00:34, 4.49it/s] 153it [00:34, 4.54it/s] 154it [00:34, 4.55it/s] 155it [00:34, 4.59it/s] 156it [00:34, 4.60it/s] 157it [00:35, 4.46it/s] 158it [00:35, 4.50it/s] 159it [00:35, 4.55it/s] 160it [00:35, 4.59it/s] 161it [00:36, 4.61it/s] 162it [00:36, 4.62it/s] 163it [00:36, 4.66it/s] 164it [00:36, 4.67it/s] 165it [00:36, 4.61it/s] 166it [00:37, 4.62it/s] 167it [00:37, 4.64it/s] 168it [00:37, 4.66it/s] 169it [00:37, 4.66it/s] 170it [00:37, 4.63it/s] 171it [00:38, 4.64it/s] 172it [00:38, 4.65it/s] 173it [00:38, 4.65it/s] 174it [00:38, 4.67it/s] 175it [00:39, 4.60it/s] 176it [00:39, 4.61it/s] 177it [00:39, 4.64it/s] 178it [00:39, 4.60it/s] 179it [00:39, 4.61it/s] 180it [00:40, 4.56it/s] 181it [00:40, 4.57it/s] 182it [00:40, 4.54it/s] 183it [00:40, 4.51it/s] 184it [00:41, 4.56it/s] 185it [00:41, 4.55it/s] 186it [00:41, 4.58it/s] 187it [00:41, 4.62it/s] 188it [00:41, 4.64it/s] 189it [00:42, 4.64it/s] 190it [00:42, 4.60it/s] 191it [00:42, 4.55it/s] 192it [00:42, 4.59it/s] 193it [00:43, 4.56it/s] 194it [00:43, 4.60it/s] 195it [00:43, 4.48it/s] 196it [00:43, 4.26it/s] 196it [00:43, 4.48it/s] +2025-05-26 01:31:35,111 - INFO - Epoch: 18, Objective: tensor([2600.6919], device='cuda:0', grad_fn=), Loss: 0.01254788413643837, KL/n: 42.441864013671875 + 0it [00:00, ?it/s]2025-05-26 01:31:35,492 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 2569.3970 | mean log_px -0.0069 | KL -2083.59 + 1it [00:00, 3.27it/s] 2it [00:00, 3.97it/s] 3it [00:00, 4.23it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.32it/s] 6it [00:01, 4.28it/s] 7it [00:01, 4.27it/s] 8it [00:01, 4.23it/s] 9it [00:02, 4.38it/s] 10it [00:02, 4.28it/s] 11it [00:02, 4.25it/s] 12it [00:02, 4.22it/s] 13it [00:03, 4.24it/s] 14it [00:03, 4.36it/s] 15it [00:03, 4.44it/s] 16it [00:03, 4.39it/s] 17it [00:03, 4.35it/s] 18it [00:04, 4.45it/s] 19it [00:04, 4.47it/s] 20it [00:04, 4.38it/s] 21it [00:04, 4.32it/s] 22it [00:05, 4.42it/s] 23it [00:05, 4.27it/s] 24it [00:05, 4.33it/s] 25it [00:05, 4.41it/s] 26it [00:06, 4.49it/s] 27it [00:06, 4.55it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.41it/s] 30it [00:06, 4.48it/s] 31it [00:07, 4.55it/s] 32it [00:07, 4.58it/s] 33it [00:07, 4.62it/s] 34it [00:07, 4.35it/s] 35it [00:08, 4.45it/s] 36it [00:08, 4.50it/s] 37it [00:08, 4.48it/s] 38it [00:08, 4.41it/s] 39it [00:08, 4.48it/s] 40it [00:09, 4.37it/s] 41it [00:09, 4.31it/s] 42it [00:09, 4.39it/s] 43it [00:09, 4.48it/s] 44it [00:10, 4.38it/s] 45it [00:10, 4.46it/s] 46it [00:10, 4.31it/s] 47it [00:10, 4.44it/s] 48it [00:10, 4.51it/s] 49it [00:11, 4.38it/s] 50it [00:11, 4.30it/s]2025-05-26 01:31:46,847 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 2562.2981 | mean log_px -0.0159 | KL -2057.50 + 51it [00:11, 4.28it/s] 52it [00:11, 4.26it/s] 53it [00:12, 4.39it/s] 54it [00:12, 4.47it/s] 55it [00:12, 4.46it/s] 56it [00:12, 4.35it/s] 57it [00:13, 4.46it/s] 58it [00:13, 4.38it/s] 59it [00:13, 4.31it/s] 60it [00:13, 4.39it/s] 61it [00:13, 4.35it/s] 62it [00:14, 4.47it/s] 63it [00:14, 4.54it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.51it/s] 66it [00:15, 4.40it/s] 67it [00:15, 4.38it/s] 68it [00:15, 4.31it/s] 69it [00:15, 4.28it/s] 70it [00:15, 4.39it/s] 71it [00:16, 4.49it/s] 72it [00:16, 4.55it/s] 73it [00:16, 4.57it/s] 74it [00:16, 4.48it/s] 75it [00:17, 4.39it/s] 76it [00:17, 4.48it/s] 77it [00:17, 4.54it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.46it/s] 80it [00:18, 4.49it/s] 81it [00:18, 4.40it/s] 82it [00:18, 4.47it/s] 83it [00:18, 4.35it/s] 84it [00:19, 4.44it/s] 85it [00:19, 4.33it/s] 86it [00:19, 4.24it/s] 87it [00:19, 4.39it/s] 88it [00:20, 4.17it/s] 89it [00:20, 4.27it/s] 90it [00:20, 4.38it/s] 91it [00:20, 4.47it/s] 92it [00:20, 4.47it/s] 93it [00:21, 4.50it/s] 94it [00:21, 4.53it/s] 95it [00:21, 4.37it/s] 96it [00:21, 4.47it/s] 97it [00:22, 4.53it/s] 98it [00:22, 4.48it/s] 99it [00:22, 4.44it/s] 100it [00:22, 4.52it/s]2025-05-26 01:31:58,120 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 2413.2510 | mean log_px -0.0084 | KL -2045.86 + 101it [00:22, 4.48it/s] 102it [00:23, 4.50it/s] 103it [00:23, 4.57it/s] 104it [00:23, 4.58it/s] 105it [00:23, 4.64it/s] 106it [00:24, 4.44it/s] 107it [00:24, 4.39it/s] 108it [00:24, 4.44it/s] 109it [00:24, 4.45it/s] 110it [00:24, 4.28it/s] 111it [00:25, 4.31it/s] 112it [00:25, 4.40it/s] 113it [00:25, 4.49it/s] 114it [00:25, 4.55it/s] 115it [00:26, 4.60it/s] 116it [00:26, 4.54it/s] 117it [00:26, 4.49it/s] 118it [00:26, 4.39it/s] 119it [00:26, 4.32it/s] 120it [00:27, 4.27it/s] 121it [00:27, 4.39it/s] 122it [00:27, 4.42it/s] 123it [00:27, 4.50it/s] 124it [00:28, 4.45it/s] 125it [00:28, 4.53it/s] 126it [00:28, 4.56it/s] 127it [00:28, 4.62it/s] 128it [00:28, 4.53it/s] 129it [00:29, 4.56it/s] 130it [00:29, 4.46it/s] 131it [00:29, 4.54it/s] 132it [00:29, 4.52it/s] 133it [00:30, 4.56it/s] 134it [00:30, 4.61it/s] 135it [00:30, 4.40it/s] 136it [00:30, 4.25it/s] 137it [00:31, 4.32it/s] 138it [00:31, 4.39it/s] 139it [00:31, 4.44it/s] 140it [00:31, 4.21it/s] 141it [00:31, 4.22it/s] 142it [00:32, 4.22it/s] 143it [00:32, 4.20it/s] 144it [00:32, 4.26it/s] 145it [00:32, 4.23it/s] 146it [00:33, 4.25it/s] 147it [00:33, 4.22it/s] 148it [00:33, 4.26it/s] 149it [00:33, 4.22it/s] 150it [00:34, 4.20it/s]2025-05-26 01:32:09,494 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 2499.8535 | mean log_px -0.0090 | KL -2029.06 + 151it [00:34, 4.14it/s] 152it [00:34, 4.27it/s] 153it [00:34, 4.24it/s] 154it [00:35, 4.29it/s] 155it [00:35, 4.29it/s] 156it [00:35, 4.34it/s] 157it [00:35, 4.32it/s] 158it [00:35, 4.25it/s] 159it [00:36, 4.36it/s] 160it [00:36, 4.36it/s] 161it [00:36, 4.37it/s] 162it [00:36, 4.38it/s] 163it [00:37, 4.46it/s] 164it [00:37, 4.54it/s] 165it [00:37, 4.57it/s] 166it [00:37, 4.47it/s] 167it [00:37, 4.42it/s] 168it [00:38, 4.50it/s] 169it [00:38, 4.56it/s] 170it [00:38, 4.60it/s] 171it [00:38, 4.40it/s] 172it [00:39, 4.51it/s] 173it [00:39, 4.42it/s] 174it [00:39, 4.43it/s] 175it [00:39, 4.52it/s] 176it [00:39, 4.42it/s] 177it [00:40, 4.37it/s] 178it [00:40, 4.36it/s] 179it [00:40, 4.36it/s] 180it [00:40, 4.46it/s] 181it [00:41, 4.54it/s] 182it [00:41, 4.44it/s] 183it [00:41, 4.54it/s] 184it [00:41, 4.45it/s] 185it [00:41, 4.43it/s] 186it [00:42, 4.49it/s] 187it [00:42, 4.42it/s] 188it [00:42, 4.36it/s] 189it [00:42, 4.22it/s] 190it [00:43, 4.22it/s] 191it [00:43, 4.24it/s] 192it [00:43, 4.32it/s] 193it [00:43, 4.30it/s] 194it [00:44, 4.11it/s] 195it [00:44, 4.09it/s] 196it [00:44, 4.16it/s] 196it [00:44, 4.39it/s] +2025-05-26 01:32:19,924 - INFO - Epoch: 19, Objective: tensor([2346.0564], device='cuda:0', grad_fn=), Loss: 0.010250546969473362, KL/n: 41.190834045410156 + 0it [00:00, ?it/s]2025-05-26 01:32:20,528 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 2297.0408 | mean log_px -0.0067 | KL -2018.12 + 1it [00:00, 2.88it/s] 2it [00:00, 3.52it/s] 3it [00:00, 4.00it/s] 4it [00:01, 4.24it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.57it/s] 8it [00:01, 4.48it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.56it/s] 11it [00:02, 4.62it/s] 12it [00:02, 4.65it/s] 13it [00:02, 4.68it/s] 14it [00:03, 4.69it/s] 15it [00:03, 4.71it/s] 16it [00:03, 4.71it/s] 17it [00:03, 4.72it/s] 18it [00:03, 4.72it/s] 19it [00:04, 4.72it/s] 20it [00:04, 4.68it/s] 21it [00:04, 4.42it/s] 22it [00:04, 4.52it/s] 23it [00:05, 4.49it/s] 24it [00:05, 4.57it/s] 25it [00:05, 4.61it/s] 26it [00:05, 4.58it/s] 27it [00:05, 4.53it/s] 28it [00:06, 4.41it/s] 29it [00:06, 4.50it/s] 30it [00:06, 4.56it/s] 31it [00:06, 4.60it/s] 32it [00:07, 4.61it/s] 33it [00:07, 4.64it/s] 34it [00:07, 4.49it/s] 35it [00:07, 4.57it/s] 36it [00:07, 4.60it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.63it/s] 39it [00:08, 4.48it/s] 40it [00:08, 4.30it/s] 41it [00:09, 4.43it/s] 42it [00:09, 4.47it/s] 43it [00:09, 4.43it/s] 44it [00:09, 4.49it/s] 45it [00:09, 4.42it/s] 46it [00:10, 4.37it/s] 47it [00:10, 4.38it/s] 48it [00:10, 4.34it/s] 49it [00:10, 4.37it/s] 50it [00:11, 4.44it/s]2025-05-26 01:32:31,529 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 2567.9041 | mean log_px -0.0136 | KL -1997.04 + 51it [00:11, 4.51it/s] 52it [00:11, 4.56it/s] 53it [00:11, 4.33it/s] 54it [00:12, 4.45it/s] 55it [00:12, 4.39it/s] 56it [00:12, 4.36it/s] 57it [00:12, 4.26it/s] 58it [00:12, 4.39it/s] 59it [00:13, 4.40it/s] 60it [00:13, 4.47it/s] 61it [00:13, 4.37it/s] 62it [00:13, 4.49it/s] 63it [00:14, 4.32it/s] 64it [00:14, 4.31it/s] 65it [00:14, 4.32it/s] 66it [00:14, 4.30it/s] 67it [00:15, 4.32it/s] 68it [00:15, 4.43it/s] 69it [00:15, 4.33it/s] 70it [00:15, 4.35it/s] 71it [00:15, 4.33it/s] 72it [00:16, 4.31it/s] 73it [00:16, 4.31it/s] 74it [00:16, 4.44it/s] 75it [00:16, 4.43it/s] 76it [00:17, 4.43it/s] 77it [00:17, 4.40it/s] 78it [00:17, 4.48it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.60it/s] 81it [00:18, 4.48it/s] 82it [00:18, 4.53it/s] 83it [00:18, 4.50it/s] 84it [00:18, 4.40it/s] 85it [00:19, 4.35it/s] 86it [00:19, 4.42it/s] 87it [00:19, 4.48it/s] 88it [00:19, 4.55it/s] 89it [00:19, 4.44it/s] 90it [00:20, 4.36it/s] 91it [00:20, 4.32it/s] 92it [00:20, 4.40it/s] 93it [00:20, 4.49it/s] 94it [00:21, 4.54it/s] 95it [00:21, 4.44it/s] 96it [00:21, 4.53it/s] 97it [00:21, 4.59it/s] 98it [00:21, 4.51it/s] 99it [00:22, 4.51it/s] 100it [00:22, 4.54it/s]2025-05-26 01:32:42,825 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 3235.3687 | mean log_px -0.0223 | KL -1973.44 + 101it [00:22, 4.37it/s] 102it [00:22, 4.47it/s] 103it [00:23, 4.41it/s] 104it [00:23, 4.42it/s] 105it [00:23, 4.44it/s] 106it [00:23, 4.42it/s] 107it [00:24, 4.29it/s] 108it [00:24, 4.33it/s] 109it [00:24, 4.31it/s] 110it [00:24, 4.39it/s] 111it [00:24, 4.44it/s] 112it [00:25, 4.44it/s] 113it [00:25, 4.24it/s] 114it [00:25, 4.33it/s] 115it [00:25, 4.36it/s] 116it [00:26, 4.48it/s] 117it [00:26, 4.56it/s] 118it [00:26, 4.54it/s] 119it [00:26, 4.55it/s] 120it [00:26, 4.45it/s] 121it [00:27, 4.54it/s] 122it [00:27, 4.59it/s] 123it [00:27, 4.63it/s] 124it [00:27, 4.66it/s] 125it [00:28, 4.64it/s] 126it [00:28, 4.57it/s] 127it [00:28, 4.55it/s] 128it [00:28, 4.39it/s] 129it [00:28, 4.42it/s] 130it [00:29, 4.43it/s] 131it [00:29, 4.46it/s] 132it [00:29, 4.41it/s] 133it [00:29, 4.44it/s] 134it [00:30, 4.35it/s] 135it [00:30, 4.46it/s] 136it [00:30, 4.41it/s] 137it [00:30, 4.53it/s] 138it [00:30, 4.52it/s] 139it [00:31, 4.52it/s] 140it [00:31, 4.55it/s] 141it [00:31, 4.56it/s] 142it [00:31, 4.61it/s] 143it [00:32, 4.39it/s] 144it [00:32, 4.42it/s] 145it [00:32, 4.45it/s] 146it [00:32, 4.53it/s] 147it [00:32, 4.52it/s] 148it [00:33, 4.56it/s] 149it [00:33, 4.56it/s] 150it [00:33, 4.60it/s]2025-05-26 01:32:54,001 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 2351.8418 | mean log_px -0.0055 | KL -1967.71 + 151it [00:33, 4.47it/s] 152it [00:34, 4.43it/s] 153it [00:34, 4.54it/s] 154it [00:34, 4.55it/s] 155it [00:34, 4.61it/s] 156it [00:34, 4.59it/s] 157it [00:35, 4.53it/s] 158it [00:35, 4.53it/s] 159it [00:35, 4.39it/s] 160it [00:35, 4.41it/s] 161it [00:36, 4.35it/s] 162it [00:36, 4.29it/s] 163it [00:36, 4.37it/s] 164it [00:36, 4.31it/s] 165it [00:37, 4.32it/s] 166it [00:37, 4.27it/s] 167it [00:37, 4.30it/s] 168it [00:37, 4.27it/s] 169it [00:37, 4.34it/s] 170it [00:38, 4.13it/s] 171it [00:38, 4.06it/s] 172it [00:38, 4.12it/s] 173it [00:38, 4.15it/s] 174it [00:39, 4.16it/s] 175it [00:39, 4.30it/s] 176it [00:39, 4.40it/s] 177it [00:39, 4.50it/s] 178it [00:40, 4.56it/s] 179it [00:40, 4.37it/s] 180it [00:40, 4.37it/s] 181it [00:40, 4.47it/s] 182it [00:40, 4.48it/s] 183it [00:41, 4.55it/s] 184it [00:41, 4.41it/s] 185it [00:41, 4.40it/s] 186it [00:41, 4.49it/s] 187it [00:42, 4.56it/s] 188it [00:42, 4.53it/s] 189it [00:42, 4.57it/s] 190it [00:42, 4.48it/s] 191it [00:42, 4.54it/s] 192it [00:43, 4.58it/s] 193it [00:43, 4.29it/s] 194it [00:43, 4.38it/s] 195it [00:43, 4.28it/s] 196it [00:44, 4.26it/s] 196it [00:44, 4.44it/s] +2025-05-26 01:33:04,437 - INFO - Epoch: 20, Objective: tensor([2321.2383], device='cuda:0', grad_fn=), Loss: 0.013511824421584606, KL/n: 39.98223876953125 + 0it [00:00, ?it/s]2025-05-26 01:33:04,814 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 2518.2864 | mean log_px -0.0100 | KL -1959.45 + 1it [00:00, 3.35it/s] 2it [00:00, 3.79it/s] 3it [00:00, 3.87it/s] 4it [00:00, 4.18it/s] 5it [00:01, 4.34it/s] 6it [00:01, 4.23it/s] 7it [00:01, 4.09it/s] 8it [00:01, 4.25it/s] 9it [00:02, 4.30it/s] 10it [00:02, 4.27it/s] 11it [00:02, 4.29it/s] 12it [00:02, 4.40it/s] 13it [00:03, 4.17it/s] 14it [00:03, 4.25it/s] 15it [00:03, 4.36it/s] 16it [00:03, 4.31it/s] 17it [00:04, 4.42it/s] 18it [00:04, 4.35it/s] 19it [00:04, 4.45it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.45it/s] 22it [00:05, 4.37it/s] 23it [00:05, 4.33it/s] 24it [00:05, 4.39it/s] 25it [00:05, 4.35it/s] 26it [00:06, 4.39it/s] 27it [00:06, 4.21it/s] 28it [00:06, 4.20it/s] 29it [00:06, 4.22it/s] 30it [00:07, 4.22it/s] 31it [00:07, 4.34it/s] 32it [00:07, 4.29it/s] 33it [00:07, 4.40it/s] 34it [00:07, 4.35it/s] 35it [00:08, 4.35it/s] 36it [00:08, 4.35it/s] 37it [00:08, 4.30it/s] 38it [00:08, 4.18it/s] 39it [00:09, 3.48it/s] 40it [00:09, 3.78it/s] 41it [00:09, 3.98it/s] 42it [00:09, 4.03it/s] 43it [00:10, 3.99it/s] 44it [00:10, 4.13it/s] 45it [00:10, 4.25it/s] 46it [00:10, 4.25it/s] 47it [00:11, 4.27it/s] 48it [00:11, 4.33it/s] 49it [00:11, 4.15it/s] 50it [00:11, 4.18it/s]2025-05-26 01:33:16,596 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 2608.6096 | mean log_px -0.0148 | KL -1939.67 + 51it [00:12, 4.20it/s] 52it [00:12, 4.34it/s] 53it [00:12, 4.36it/s] 54it [00:12, 4.33it/s] 55it [00:13, 4.13it/s] 56it [00:13, 4.16it/s] 57it [00:13, 4.21it/s] 58it [00:13, 4.24it/s] 59it [00:13, 4.34it/s] 60it [00:14, 4.32it/s] 61it [00:14, 4.32it/s] 62it [00:14, 4.38it/s] 63it [00:14, 4.32it/s] 64it [00:15, 4.33it/s] 65it [00:15, 4.32it/s] 66it [00:15, 4.33it/s] 67it [00:15, 4.34it/s] 68it [00:16, 4.31it/s] 69it [00:16, 4.31it/s] 70it [00:16, 4.31it/s] 71it [00:16, 4.34it/s] 72it [00:16, 4.32it/s] 73it [00:17, 4.34it/s] 74it [00:17, 4.38it/s] 75it [00:17, 4.39it/s] 76it [00:17, 4.48it/s] 77it [00:18, 4.54it/s] 78it [00:18, 4.40it/s] 79it [00:18, 4.35it/s] 80it [00:18, 4.44it/s] 81it [00:18, 4.41it/s] 82it [00:19, 4.37it/s] 83it [00:19, 4.36it/s] 84it [00:19, 4.30it/s] 85it [00:19, 4.29it/s] 86it [00:20, 4.27it/s] 87it [00:20, 4.29it/s] 88it [00:20, 4.29it/s] 89it [00:20, 4.26it/s] 90it [00:21, 4.28it/s] 91it [00:21, 4.27it/s] 92it [00:21, 4.30it/s] 93it [00:21, 4.31it/s] 94it [00:22, 4.31it/s] 95it [00:22, 4.26it/s] 96it [00:22, 4.22it/s] 97it [00:22, 4.33it/s] 98it [00:22, 4.33it/s] 99it [00:23, 4.08it/s] 100it [00:23, 4.14it/s]2025-05-26 01:33:28,206 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 2265.2100 | mean log_px -0.0051 | KL -1927.49 + 101it [00:23, 4.17it/s] 102it [00:23, 4.17it/s] 103it [00:24, 4.20it/s] 104it [00:24, 4.19it/s] 105it [00:24, 4.07it/s] 106it [00:24, 4.12it/s] 107it [00:25, 4.16it/s] 108it [00:25, 4.22it/s] 109it [00:25, 4.26it/s] 110it [00:25, 4.22it/s] 111it [00:26, 4.11it/s] 112it [00:26, 4.11it/s] 113it [00:26, 4.17it/s] 114it [00:26, 4.11it/s] 115it [00:27, 4.14it/s] 116it [00:27, 4.06it/s] 117it [00:27, 4.11it/s] 118it [00:27, 4.18it/s] 119it [00:28, 4.18it/s] 120it [00:28, 4.20it/s] 121it [00:28, 4.32it/s] 122it [00:28, 4.41it/s] 123it [00:28, 4.31it/s] 124it [00:29, 4.29it/s] 125it [00:29, 4.26it/s] 126it [00:29, 4.29it/s] 127it [00:29, 4.30it/s] 128it [00:30, 4.22it/s] 129it [00:30, 4.21it/s] 130it [00:30, 4.24it/s] 131it [00:30, 4.25it/s] 132it [00:31, 4.27it/s] 133it [00:31, 4.33it/s] 134it [00:31, 4.16it/s] 135it [00:31, 4.18it/s] 136it [00:32, 4.24it/s] 137it [00:32, 4.32it/s] 138it [00:32, 4.25it/s] 139it [00:32, 4.25it/s] 140it [00:32, 4.11it/s] 141it [00:33, 4.19it/s] 142it [00:33, 4.21it/s] 143it [00:33, 4.21it/s] 144it [00:33, 4.22it/s] 145it [00:34, 4.22it/s] 146it [00:34, 4.11it/s] 147it [00:34, 4.15it/s] 148it [00:34, 4.28it/s] 149it [00:35, 4.37it/s] 150it [00:35, 4.32it/s]2025-05-26 01:33:40,049 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 2249.6196 | mean log_px -0.0076 | KL -1918.02 + 151it [00:35, 4.33it/s] 152it [00:35, 4.43it/s] 153it [00:35, 4.31it/s] 154it [00:36, 4.29it/s] 155it [00:36, 4.27it/s] 156it [00:36, 4.25it/s] 157it [00:36, 4.21it/s] 158it [00:37, 4.19it/s] 159it [00:37, 4.19it/s] 160it [00:37, 4.32it/s] 161it [00:37, 4.29it/s] 162it [00:38, 4.40it/s] 163it [00:38, 4.41it/s] 164it [00:38, 4.45it/s] 165it [00:38, 4.37it/s] 166it [00:39, 4.32it/s] 167it [00:39, 4.29it/s] 168it [00:39, 4.30it/s] 169it [00:39, 4.30it/s] 170it [00:39, 4.29it/s] 171it [00:40, 4.32it/s] 172it [00:40, 4.29it/s] 173it [00:40, 4.39it/s] 174it [00:40, 4.40it/s] 175it [00:41, 4.34it/s] 176it [00:41, 4.30it/s] 177it [00:41, 4.30it/s] 178it [00:41, 4.32it/s] 179it [00:42, 4.40it/s] 180it [00:42, 4.32it/s] 181it [00:42, 4.29it/s] 182it [00:42, 4.27it/s] 183it [00:42, 4.31it/s] 184it [00:43, 4.28it/s] 185it [00:43, 4.29it/s] 186it [00:43, 4.41it/s] 187it [00:43, 4.38it/s] 188it [00:44, 4.30it/s] 189it [00:44, 4.30it/s] 190it [00:44, 4.42it/s] 191it [00:44, 4.35it/s] 192it [00:45, 4.30it/s] 193it [00:45, 4.29it/s] 194it [00:45, 4.41it/s] 195it [00:45, 4.33it/s] 196it [00:45, 4.31it/s] 196it [00:46, 4.26it/s] +2025-05-26 01:33:50,600 - INFO - Epoch: 21, Objective: tensor([2395.0178], device='cuda:0', grad_fn=), Loss: 0.009308933280408382, KL/n: 39.00183868408203 + 0it [00:00, ?it/s]2025-05-26 01:33:51,017 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 2293.9033 | mean log_px -0.0119 | KL -1907.14 + 1it [00:00, 2.93it/s] 2it [00:00, 3.74it/s] 3it [00:00, 3.90it/s] 4it [00:01, 4.14it/s] 5it [00:01, 4.12it/s] 6it [00:01, 4.11it/s] 7it [00:01, 4.15it/s] 8it [00:01, 4.15it/s] 9it [00:02, 4.19it/s] 10it [00:02, 4.06it/s] 11it [00:02, 4.12it/s] 12it [00:02, 4.17it/s] 13it [00:03, 4.20it/s] 14it [00:03, 4.26it/s] 15it [00:03, 4.28it/s] 16it [00:03, 4.22it/s] 17it [00:04, 4.26it/s] 18it [00:04, 4.24it/s] 19it [00:04, 4.09it/s] 20it [00:04, 4.11it/s] 21it [00:05, 4.17it/s] 22it [00:05, 4.30it/s] 23it [00:05, 4.26it/s] 24it [00:05, 4.31it/s] 25it [00:06, 4.32it/s] 26it [00:06, 4.36it/s] 27it [00:06, 4.44it/s] 28it [00:06, 4.43it/s] 29it [00:06, 4.34it/s] 30it [00:07, 4.30it/s] 31it [00:07, 4.28it/s] 32it [00:07, 4.18it/s] 33it [00:07, 4.19it/s] 34it [00:08, 4.24it/s] 35it [00:08, 4.23it/s] 36it [00:08, 4.14it/s] 37it [00:08, 4.20it/s] 38it [00:09, 4.22it/s] 39it [00:09, 4.34it/s] 40it [00:09, 4.16it/s] 41it [00:09, 4.08it/s] 42it [00:10, 4.14it/s] 43it [00:10, 4.28it/s] 44it [00:10, 4.38it/s] 45it [00:10, 4.46it/s] 46it [00:10, 4.49it/s] 47it [00:11, 4.54it/s] 48it [00:11, 4.40it/s] 49it [00:11, 4.36it/s] 50it [00:11, 4.45it/s]2025-05-26 01:34:02,691 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 2142.6248 | mean log_px -0.0071 | KL -1895.51 + 51it [00:12, 4.52it/s] 52it [00:12, 4.53it/s] 53it [00:12, 4.43it/s] 54it [00:12, 4.37it/s] 55it [00:12, 4.37it/s] 56it [00:13, 4.37it/s] 57it [00:13, 4.46it/s] 58it [00:13, 4.36it/s] 59it [00:13, 4.18it/s] 60it [00:14, 4.20it/s] 61it [00:14, 4.22it/s] 62it [00:14, 4.26it/s] 63it [00:14, 4.29it/s] 64it [00:15, 4.28it/s] 65it [00:15, 4.29it/s] 66it [00:15, 4.31it/s] 67it [00:15, 4.31it/s] 68it [00:15, 4.43it/s] 69it [00:16, 4.20it/s] 70it [00:16, 4.25it/s] 71it [00:16, 4.31it/s] 72it [00:16, 4.41it/s] 73it [00:17, 4.36it/s] 74it [00:17, 4.32it/s] 75it [00:17, 4.31it/s] 76it [00:17, 4.32it/s] 77it [00:18, 4.42it/s] 78it [00:18, 4.36it/s] 79it [00:18, 4.39it/s] 80it [00:18, 4.32it/s] 81it [00:18, 4.18it/s] 82it [00:19, 4.22it/s] 83it [00:19, 4.26it/s] 84it [00:19, 4.24it/s] 85it [00:19, 4.25it/s] 86it [00:20, 4.35it/s] 87it [00:20, 4.47it/s] 88it [00:20, 4.38it/s] 89it [00:20, 4.47it/s] 90it [00:21, 4.38it/s] 91it [00:21, 4.34it/s] 92it [00:21, 4.36it/s] 93it [00:21, 4.38it/s] 94it [00:21, 4.46it/s] 95it [00:22, 4.33it/s] 96it [00:22, 4.29it/s] 97it [00:22, 4.36it/s] 98it [00:22, 4.28it/s] 99it [00:23, 4.30it/s] 100it [00:23, 4.33it/s]2025-05-26 01:34:14,239 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 2433.9939 | mean log_px -0.0126 | KL -1877.79 + 101it [00:23, 4.44it/s] 102it [00:23, 4.39it/s] 103it [00:24, 4.33it/s] 104it [00:24, 4.34it/s] 105it [00:24, 4.35it/s] 106it [00:24, 4.34it/s] 107it [00:24, 4.37it/s] 108it [00:25, 4.37it/s] 109it [00:25, 4.37it/s] 110it [00:25, 4.40it/s] 111it [00:25, 4.37it/s] 112it [00:26, 4.33it/s] 113it [00:26, 4.30it/s] 114it [00:26, 4.39it/s] 115it [00:26, 4.30it/s] 116it [00:27, 4.33it/s] 117it [00:27, 4.21it/s] 118it [00:27, 4.21it/s] 119it [00:27, 4.26it/s] 120it [00:27, 4.36it/s] 121it [00:28, 4.33it/s] 122it [00:28, 4.35it/s] 123it [00:28, 4.37it/s] 124it [00:28, 4.47it/s] 125it [00:29, 4.36it/s] 126it [00:29, 4.32it/s] 127it [00:29, 4.29it/s] 128it [00:29, 4.27it/s] 129it [00:30, 4.37it/s] 130it [00:30, 4.46it/s] 131it [00:30, 4.51it/s] 132it [00:30, 4.54it/s] 133it [00:30, 4.47it/s] 134it [00:31, 4.41it/s] 135it [00:31, 4.50it/s] 136it [00:31, 4.53it/s] 137it [00:31, 4.46it/s] 138it [00:32, 4.40it/s] 139it [00:32, 4.36it/s] 140it [00:32, 4.31it/s] 141it [00:32, 4.30it/s] 142it [00:32, 4.42it/s] 143it [00:33, 4.35it/s] 144it [00:33, 4.34it/s] 145it [00:33, 4.35it/s] 146it [00:33, 4.32it/s] 147it [00:34, 4.30it/s] 148it [00:34, 4.28it/s] 149it [00:34, 4.33it/s] 150it [00:34, 4.37it/s]2025-05-26 01:34:25,698 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 2279.8452 | mean log_px -0.0095 | KL -1866.57 + 151it [00:35, 4.44it/s] 152it [00:35, 4.40it/s] 153it [00:35, 4.46it/s] 154it [00:35, 4.48it/s] 155it [00:35, 4.55it/s] 156it [00:36, 4.45it/s] 157it [00:36, 4.52it/s] 158it [00:36, 4.45it/s] 159it [00:36, 4.40it/s] 160it [00:37, 4.36it/s] 161it [00:37, 4.33it/s] 162it [00:37, 4.43it/s] 163it [00:37, 4.41it/s] 164it [00:37, 4.37it/s] 165it [00:38, 4.41it/s] 166it [00:38, 4.48it/s] 167it [00:38, 4.55it/s] 168it [00:38, 4.54it/s] 169it [00:39, 4.54it/s] 170it [00:39, 4.58it/s] 171it [00:39, 4.63it/s] 172it [00:39, 4.44it/s] 173it [00:39, 4.44it/s] 174it [00:40, 4.41it/s] 175it [00:40, 4.49it/s] 176it [00:40, 4.36it/s] 177it [00:40, 4.34it/s] 178it [00:41, 4.43it/s] 179it [00:41, 4.50it/s] 180it [00:41, 4.46it/s] 181it [00:41, 4.51it/s] 182it [00:41, 4.47it/s] 183it [00:42, 4.39it/s] 184it [00:42, 4.34it/s] 185it [00:42, 4.29it/s] 186it [00:42, 4.26it/s] 187it [00:43, 4.25it/s] 188it [00:43, 4.24it/s] 189it [00:43, 4.30it/s] 190it [00:43, 4.40it/s] 191it [00:44, 4.33it/s] 192it [00:44, 4.39it/s] 193it [00:44, 4.46it/s] 194it [00:44, 4.37it/s] 195it [00:45, 4.24it/s] 196it [00:45, 4.29it/s] 196it [00:45, 4.33it/s] +2025-05-26 01:34:36,043 - INFO - Epoch: 22, Objective: tensor([2321.2053], device='cuda:0', grad_fn=), Loss: 0.0126264663413167, KL/n: 37.90328598022461 + 0it [00:00, ?it/s]2025-05-26 01:34:36,626 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 2031.7919 | mean log_px -0.0048 | KL -1857.27 + 1it [00:00, 3.00it/s] 2it [00:00, 3.65it/s] 3it [00:00, 3.93it/s] 4it [00:01, 4.07it/s] 5it [00:01, 4.22it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.49it/s] 9it [00:02, 4.44it/s] 10it [00:02, 4.44it/s] 11it [00:02, 4.41it/s] 12it [00:02, 4.43it/s] 13it [00:03, 4.39it/s] 14it [00:03, 4.41it/s] 15it [00:03, 4.36it/s] 16it [00:03, 4.31it/s] 17it [00:03, 4.36it/s] 18it [00:04, 4.38it/s] 19it [00:04, 4.42it/s] 20it [00:04, 4.47it/s] 21it [00:04, 4.50it/s] 22it [00:05, 4.41it/s] 23it [00:05, 4.50it/s] 24it [00:05, 4.49it/s] 25it [00:05, 4.43it/s] 26it [00:05, 4.48it/s] 27it [00:06, 4.56it/s] 28it [00:06, 4.46it/s] 29it [00:06, 4.50it/s] 30it [00:06, 4.41it/s] 31it [00:07, 4.50it/s] 32it [00:07, 4.49it/s] 33it [00:07, 4.45it/s] 34it [00:07, 4.49it/s] 35it [00:07, 4.55it/s] 36it [00:08, 4.52it/s] 37it [00:08, 4.50it/s] 38it [00:08, 4.44it/s] 39it [00:08, 4.40it/s] 40it [00:09, 4.40it/s] 41it [00:09, 4.37it/s] 42it [00:09, 4.43it/s] 43it [00:09, 4.37it/s] 44it [00:10, 4.45it/s] 45it [00:10, 4.44it/s] 46it [00:10, 4.52it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.44it/s] 49it [00:11, 4.39it/s] 50it [00:11, 4.40it/s]2025-05-26 01:34:47,872 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 2093.6794 | mean log_px -0.0058 | KL -1840.02 + 51it [00:11, 4.50it/s] 52it [00:11, 4.50it/s] 53it [00:12, 4.41it/s] 54it [00:12, 4.37it/s] 55it [00:12, 4.16it/s] 56it [00:12, 4.19it/s] 57it [00:12, 4.26it/s] 58it [00:13, 4.35it/s] 59it [00:13, 4.34it/s] 60it [00:13, 4.41it/s] 61it [00:13, 4.37it/s] 62it [00:14, 4.33it/s] 63it [00:14, 4.32it/s] 64it [00:14, 4.40it/s] 65it [00:14, 4.31it/s] 66it [00:15, 4.29it/s] 67it [00:15, 4.37it/s] 68it [00:15, 4.45it/s] 69it [00:15, 4.45it/s] 70it [00:15, 4.50it/s] 71it [00:16, 4.51it/s] 72it [00:16, 4.42it/s] 73it [00:16, 4.48it/s] 74it [00:16, 4.55it/s] 75it [00:17, 4.46it/s] 76it [00:17, 4.29it/s] 77it [00:17, 4.25it/s] 78it [00:17, 4.36it/s] 79it [00:17, 4.37it/s] 80it [00:18, 4.30it/s] 81it [00:18, 4.28it/s] 82it [00:18, 4.34it/s] 83it [00:18, 4.31it/s] 84it [00:19, 4.36it/s] 85it [00:19, 4.19it/s] 86it [00:19, 4.24it/s] 87it [00:19, 4.33it/s] 88it [00:20, 4.40it/s] 89it [00:20, 4.40it/s] 90it [00:20, 4.46it/s] 91it [00:20, 4.40it/s] 92it [00:20, 4.34it/s] 93it [00:21, 4.34it/s] 94it [00:21, 4.28it/s] 95it [00:21, 4.30it/s] 96it [00:21, 4.38it/s] 97it [00:22, 4.35it/s] 98it [00:22, 4.22it/s] 99it [00:22, 4.34it/s] 100it [00:22, 4.40it/s]2025-05-26 01:34:59,356 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 2605.1060 | mean log_px -0.0202 | KL -1829.09 + 101it [00:23, 4.40it/s] 102it [00:23, 4.36it/s] 103it [00:23, 4.43it/s] 104it [00:23, 4.49it/s] 105it [00:23, 4.38it/s] 106it [00:24, 4.45it/s] 107it [00:24, 4.52it/s] 108it [00:24, 4.38it/s] 109it [00:24, 4.38it/s] 110it [00:25, 4.26it/s] 111it [00:25, 4.09it/s] 112it [00:25, 4.02it/s] 113it [00:25, 4.07it/s] 114it [00:26, 4.13it/s] 115it [00:26, 4.17it/s] 116it [00:26, 4.29it/s] 117it [00:26, 4.39it/s] 118it [00:27, 4.46it/s] 119it [00:27, 4.38it/s] 120it [00:27, 4.30it/s] 121it [00:27, 4.31it/s] 122it [00:27, 4.31it/s] 123it [00:28, 4.29it/s] 124it [00:28, 4.38it/s] 125it [00:28, 4.46it/s] 126it [00:28, 4.52it/s] 127it [00:29, 4.56it/s] 128it [00:29, 4.45it/s] 129it [00:29, 4.36it/s] 130it [00:29, 4.34it/s] 131it [00:29, 4.43it/s] 132it [00:30, 4.48it/s] 133it [00:30, 4.39it/s] 134it [00:30, 4.41it/s] 135it [00:30, 4.38it/s] 136it [00:31, 4.34it/s] 137it [00:31, 4.43it/s] 138it [00:31, 4.47it/s] 139it [00:31, 4.38it/s] 140it [00:32, 4.34it/s] 141it [00:32, 4.40it/s] 142it [00:32, 4.38it/s] 143it [00:32, 4.34it/s] 144it [00:32, 4.31it/s] 145it [00:33, 4.39it/s] 146it [00:33, 4.29it/s] 147it [00:33, 4.41it/s] 148it [00:33, 4.44it/s] 149it [00:34, 4.46it/s] 150it [00:34, 4.51it/s]2025-05-26 01:35:10,806 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 2053.4185 | mean log_px -0.0083 | KL -1817.16 + 151it [00:34, 4.47it/s] 152it [00:34, 4.37it/s] 153it [00:34, 4.44it/s] 154it [00:35, 4.18it/s] 155it [00:35, 4.23it/s] 156it [00:35, 4.32it/s] 157it [00:35, 4.40it/s] 158it [00:36, 4.47it/s] 159it [00:36, 4.49it/s] 160it [00:36, 4.44it/s] 161it [00:36, 4.42it/s] 162it [00:37, 4.34it/s] 163it [00:37, 4.37it/s] 164it [00:37, 4.28it/s] 165it [00:37, 4.32it/s] 166it [00:37, 4.21it/s] 167it [00:38, 4.35it/s] 168it [00:38, 4.33it/s] 169it [00:38, 4.43it/s] 170it [00:38, 4.48it/s] 171it [00:39, 4.51it/s] 172it [00:39, 4.43it/s] 173it [00:39, 4.50it/s] 174it [00:39, 4.40it/s] 175it [00:40, 4.25it/s] 176it [00:40, 4.29it/s] 177it [00:40, 4.28it/s] 178it [00:40, 4.29it/s] 179it [00:40, 4.28it/s] 180it [00:41, 4.24it/s] 181it [00:41, 4.24it/s] 182it [00:41, 4.26it/s] 183it [00:41, 4.31it/s] 184it [00:42, 4.28it/s] 185it [00:42, 4.29it/s] 186it [00:42, 4.32it/s] 187it [00:42, 4.34it/s] 188it [00:43, 4.23it/s] 189it [00:43, 4.26it/s] 190it [00:43, 4.29it/s] 191it [00:43, 4.32it/s] 192it [00:43, 4.32it/s] 193it [00:44, 4.20it/s] 194it [00:44, 4.34it/s] 195it [00:44, 4.33it/s] 196it [00:44, 4.45it/s] 196it [00:44, 4.36it/s] +2025-05-26 01:35:21,329 - INFO - Epoch: 23, Objective: tensor([2333.9048], device='cuda:0', grad_fn=), Loss: 0.009835069067776203, KL/n: 36.8824462890625 + 0it [00:00, ?it/s]2025-05-26 01:35:21,740 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 2042.8802 | mean log_px -0.0088 | KL -1806.51 + 1it [00:00, 2.96it/s] 2it [00:00, 3.41it/s] 3it [00:00, 3.91it/s] 4it [00:01, 4.18it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.37it/s] 7it [00:01, 4.35it/s] 8it [00:01, 4.42it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.39it/s] 11it [00:02, 4.35it/s] 12it [00:02, 4.21it/s] 13it [00:03, 4.23it/s] 14it [00:03, 3.44it/s] 15it [00:03, 3.71it/s] 16it [00:03, 3.93it/s] 17it [00:04, 3.93it/s] 18it [00:04, 4.07it/s] 19it [00:04, 4.25it/s] 20it [00:04, 4.34it/s] 21it [00:05, 4.42it/s] 22it [00:05, 4.49it/s] 23it [00:05, 4.56it/s] 24it [00:05, 4.60it/s] 25it [00:05, 4.63it/s] 26it [00:06, 4.64it/s] 27it [00:06, 4.60it/s] 28it [00:06, 4.46it/s] 29it [00:06, 4.55it/s] 30it [00:07, 4.57it/s] 31it [00:07, 4.61it/s] 32it [00:07, 4.54it/s] 33it [00:07, 4.60it/s] 34it [00:07, 4.55it/s] 35it [00:08, 4.55it/s] 36it [00:08, 4.52it/s] 37it [00:08, 4.55it/s] 38it [00:08, 4.50it/s] 39it [00:09, 4.53it/s] 40it [00:09, 4.58it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.59it/s] 44it [00:10, 4.61it/s] 45it [00:10, 4.50it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.57it/s] 49it [00:11, 4.59it/s] 50it [00:11, 4.62it/s]2025-05-26 01:35:33,045 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 1896.7238 | mean log_px -0.0014 | KL -1796.85 + 51it [00:11, 4.50it/s] 52it [00:11, 4.31it/s] 53it [00:12, 4.36it/s] 54it [00:12, 4.36it/s] 55it [00:12, 4.42it/s] 56it [00:12, 4.40it/s] 57it [00:13, 4.41it/s] 58it [00:13, 4.48it/s] 59it [00:13, 4.51it/s] 60it [00:13, 4.55it/s] 61it [00:13, 4.51it/s] 62it [00:14, 4.35it/s] 63it [00:14, 4.43it/s] 64it [00:14, 4.47it/s] 65it [00:14, 4.38it/s] 66it [00:15, 4.24it/s] 67it [00:15, 4.27it/s] 68it [00:15, 4.33it/s] 69it [00:15, 4.31it/s] 70it [00:15, 4.33it/s] 71it [00:16, 4.29it/s] 72it [00:16, 4.38it/s] 73it [00:16, 4.42it/s] 74it [00:16, 4.34it/s] 75it [00:17, 4.40it/s] 76it [00:17, 4.45it/s] 77it [00:17, 4.37it/s] 78it [00:17, 4.45it/s] 79it [00:18, 4.49it/s] 80it [00:18, 4.45it/s] 81it [00:18, 4.40it/s] 82it [00:18, 4.37it/s] 83it [00:18, 4.31it/s] 84it [00:19, 4.27it/s] 85it [00:19, 4.28it/s] 86it [00:19, 4.25it/s] 87it [00:19, 4.28it/s] 88it [00:20, 4.37it/s] 89it [00:20, 4.17it/s] 90it [00:20, 4.20it/s] 91it [00:20, 4.23it/s] 92it [00:21, 4.23it/s] 93it [00:21, 4.26it/s] 94it [00:21, 4.21it/s] 95it [00:21, 4.09it/s] 96it [00:22, 4.13it/s] 97it [00:22, 4.21it/s] 98it [00:22, 4.23it/s] 99it [00:22, 4.23it/s] 100it [00:22, 4.19it/s]2025-05-26 01:35:44,631 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 2474.6335 | mean log_px -0.0208 | KL -1782.80 + 101it [00:23, 4.09it/s] 102it [00:23, 4.20it/s] 103it [00:23, 4.32it/s] 104it [00:23, 4.42it/s] 105it [00:24, 4.50it/s] 106it [00:24, 4.21it/s] 107it [00:24, 4.27it/s] 108it [00:24, 4.26it/s] 109it [00:25, 4.26it/s] 110it [00:25, 4.27it/s] 111it [00:25, 4.25it/s] 112it [00:25, 4.24it/s] 113it [00:26, 4.30it/s] 114it [00:26, 4.26it/s] 115it [00:26, 4.30it/s] 116it [00:26, 4.29it/s] 117it [00:26, 4.31it/s] 118it [00:27, 4.32it/s] 119it [00:27, 4.33it/s] 120it [00:27, 4.42it/s] 121it [00:27, 4.34it/s] 122it [00:28, 4.35it/s] 123it [00:28, 4.39it/s] 124it [00:28, 4.37it/s] 125it [00:28, 4.36it/s] 126it [00:29, 4.37it/s] 127it [00:29, 4.43it/s] 128it [00:29, 4.49it/s] 129it [00:29, 4.49it/s] 130it [00:29, 4.42it/s] 131it [00:30, 4.38it/s] 132it [00:30, 4.32it/s] 133it [00:30, 4.28it/s] 134it [00:30, 4.23it/s] 135it [00:31, 4.23it/s] 136it [00:31, 4.34it/s] 137it [00:31, 4.28it/s] 138it [00:31, 4.09it/s] 139it [00:32, 4.12it/s] 140it [00:32, 4.17it/s] 141it [00:32, 4.19it/s] 142it [00:32, 4.25it/s] 143it [00:32, 4.28it/s] 144it [00:33, 4.32it/s] 145it [00:33, 4.15it/s] 146it [00:33, 4.17it/s] 147it [00:33, 4.20it/s] 148it [00:34, 4.19it/s] 149it [00:34, 4.20it/s] 150it [00:34, 4.22it/s]2025-05-26 01:35:56,299 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 2033.4376 | mean log_px -0.0059 | KL -1774.52 + 151it [00:34, 4.08it/s] 152it [00:35, 4.11it/s] 153it [00:35, 4.25it/s] 154it [00:35, 4.20it/s] 155it [00:35, 4.19it/s] 156it [00:36, 4.20it/s] 157it [00:36, 4.11it/s] 158it [00:36, 4.17it/s] 159it [00:36, 4.20it/s] 160it [00:37, 4.25it/s] 161it [00:37, 4.36it/s] 162it [00:37, 4.41it/s] 163it [00:37, 4.32it/s] 164it [00:37, 4.39it/s] 165it [00:38, 4.24it/s] 166it [00:38, 4.27it/s] 167it [00:38, 4.22it/s] 168it [00:38, 4.23it/s] 169it [00:39, 4.24it/s] 170it [00:39, 4.21it/s] 171it [00:39, 4.33it/s] 172it [00:39, 4.39it/s] 173it [00:40, 4.47it/s] 174it [00:40, 4.45it/s] 175it [00:40, 4.32it/s] 176it [00:40, 4.25it/s] 177it [00:40, 4.37it/s] 178it [00:41, 4.42it/s] 179it [00:41, 4.34it/s] 180it [00:41, 4.28it/s] 181it [00:41, 4.37it/s] 182it [00:42, 4.39it/s] 183it [00:42, 4.20it/s] 184it [00:42, 4.24it/s] 185it [00:42, 4.22it/s] 186it [00:43, 4.21it/s] 187it [00:43, 4.14it/s] 188it [00:43, 4.14it/s] 189it [00:43, 4.13it/s] 190it [00:44, 4.13it/s] 191it [00:44, 4.21it/s] 192it [00:44, 4.19it/s] 193it [00:44, 4.18it/s] 194it [00:44, 4.22it/s] 195it [00:45, 4.14it/s] 196it [00:45, 4.26it/s] 196it [00:45, 4.31it/s] +2025-05-26 01:36:06,993 - INFO - Epoch: 24, Objective: tensor([2720.5593], device='cuda:0', grad_fn=), Loss: 0.01608070731163025, KL/n: 36.15454864501953 +2025-05-26 01:36:06,999 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 2it [00:00, 15.06it/s] 5it [00:00, 21.37it/s] 9it [00:00, 24.88it/s] 13it [00:00, 26.66it/s] 16it [00:00, 27.09it/s] 19it [00:00, 27.87it/s] 22it [00:00, 28.40it/s] 25it [00:00, 27.89it/s] 29it [00:01, 28.69it/s] 32it [00:01, 28.78it/s] 35it [00:01, 28.23it/s] 39it [00:01, 29.07it/s] 42it [00:01, 28.20it/s] 45it [00:01, 28.41it/s] 48it [00:01, 28.19it/s] 51it [00:01, 28.14it/s] 54it [00:01, 27.78it/s] 57it [00:02, 28.25it/s] 60it [00:02, 28.37it/s] 63it [00:02, 28.05it/s] 66it [00:02, 28.58it/s] 69it [00:02, 28.57it/s] 72it [00:02, 27.88it/s] 75it [00:02, 28.24it/s] 78it [00:02, 28.03it/s] 81it [00:02, 27.17it/s] 84it [00:03, 26.82it/s] 87it [00:03, 27.48it/s] 90it [00:03, 27.06it/s] 93it [00:03, 27.78it/s] 96it [00:03, 27.75it/s] 99it [00:03, 27.72it/s] 102it [00:03, 28.23it/s] 105it [00:03, 28.19it/s] 108it [00:03, 28.25it/s] 111it [00:04, 28.46it/s] 114it [00:04, 28.89it/s] 117it [00:04, 28.92it/s] 120it [00:04, 28.67it/s] 123it [00:04, 29.03it/s] 126it [00:04, 28.61it/s] 129it [00:04, 28.94it/s] 132it [00:04, 28.69it/s] 135it [00:04, 28.91it/s] 139it [00:04, 28.98it/s] 142it [00:05, 28.78it/s] 145it [00:05, 29.09it/s] 148it [00:05, 28.77it/s] 151it [00:05, 29.07it/s] 154it [00:05, 28.73it/s] 157it [00:05, 29.07it/s] 160it [00:05, 28.81it/s] 164it [00:05, 28.64it/s] 168it [00:05, 29.06it/s] 172it [00:06, 29.32it/s] 175it [00:06, 28.71it/s] 178it [00:06, 28.82it/s] 181it [00:06, 29.03it/s] 184it [00:06, 29.24it/s] 187it [00:06, 28.39it/s] 191it [00:06, 28.77it/s] 194it [00:06, 28.93it/s] 197it [00:06, 28.26it/s] 201it [00:07, 28.81it/s] 204it [00:07, 28.69it/s] 207it [00:07, 28.68it/s] 211it [00:07, 28.95it/s] 215it [00:07, 28.48it/s] 219it [00:07, 28.76it/s] 222it [00:07, 28.78it/s] 225it [00:07, 27.90it/s] 228it [00:08, 28.21it/s] 231it [00:08, 27.76it/s] 235it [00:08, 28.44it/s] 239it [00:08, 28.74it/s] 243it [00:08, 29.15it/s] 246it [00:08, 29.12it/s] 250it [00:08, 29.03it/s] 253it [00:08, 29.20it/s] 256it [00:09, 28.98it/s] 259it [00:09, 29.20it/s] 262it [00:09, 29.05it/s] 265it [00:09, 29.05it/s] 269it [00:09, 29.36it/s] 273it [00:09, 29.22it/s] 276it [00:09, 29.05it/s] 279it [00:09, 27.00it/s] 280it [00:09, 28.18it/s] +2025-05-26 01:36:17,101 - INFO - Epoch: 0, Objective: 0.018377337604761124, Loss: 0.010894941166043282, KL/n: 0.0074823955073952675 + 0%| | 0/84 [00:00), Loss: 0.11140021681785583, KL/n: 71.59821319580078 + 0it [00:00, ?it/s]2025-05-26 01:48:39,245 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 11894.2480 | mean log_px -0.1369 | KL -3499.28 + 1it [00:00, 3.15it/s] 2it [00:00, 3.90it/s] 3it [00:00, 4.24it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.50it/s] 6it [00:01, 4.54it/s] 7it [00:01, 4.59it/s] 8it [00:01, 4.41it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.54it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.62it/s] 15it [00:03, 4.46it/s] 16it [00:03, 4.53it/s] 17it [00:03, 4.57it/s] 18it [00:04, 4.57it/s] 19it [00:04, 4.59it/s] 20it [00:04, 4.61it/s] 21it [00:04, 4.61it/s] 22it [00:04, 4.65it/s] 23it [00:05, 4.65it/s] 24it [00:05, 4.66it/s] 25it [00:05, 4.65it/s] 26it [00:05, 4.50it/s] 27it [00:05, 4.56it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.61it/s] 30it [00:06, 4.63it/s] 31it [00:06, 4.63it/s] 32it [00:07, 4.64it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.66it/s] 36it [00:07, 4.66it/s] 37it [00:08, 4.48it/s] 38it [00:08, 4.54it/s] 39it [00:08, 4.58it/s] 40it [00:08, 4.60it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.47it/s] 44it [00:09, 4.53it/s] 45it [00:09, 4.50it/s] 46it [00:10, 4.50it/s] 47it [00:10, 4.53it/s] 48it [00:10, 4.56it/s] 49it [00:10, 4.59it/s] 50it [00:10, 4.61it/s]2025-05-26 01:48:50,165 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 11227.0039 | mean log_px -0.1305 | KL -3490.07 + 51it [00:11, 4.62it/s] 52it [00:11, 4.46it/s] 53it [00:11, 4.53it/s] 54it [00:11, 4.56it/s] 55it [00:12, 4.59it/s] 56it [00:12, 4.39it/s] 57it [00:12, 4.43it/s] 58it [00:12, 4.50it/s] 59it [00:12, 4.55it/s] 60it [00:13, 4.58it/s] 61it [00:13, 4.45it/s] 62it [00:13, 4.51it/s] 63it [00:13, 4.54it/s] 64it [00:14, 4.58it/s] 65it [00:14, 4.60it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.63it/s] 68it [00:14, 4.63it/s] 69it [00:15, 4.65it/s] 70it [00:15, 4.45it/s] 71it [00:15, 4.52it/s] 72it [00:15, 4.52it/s] 73it [00:16, 4.56it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.61it/s] 77it [00:16, 4.46it/s] 78it [00:17, 4.42it/s] 79it [00:17, 4.50it/s] 80it [00:17, 4.56it/s] 81it [00:17, 4.55it/s] 82it [00:18, 4.61it/s] 83it [00:18, 4.64it/s] 84it [00:18, 4.66it/s] 85it [00:18, 4.52it/s] 86it [00:18, 4.59it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.65it/s] 89it [00:19, 4.66it/s] 90it [00:19, 4.68it/s] 91it [00:19, 4.68it/s] 92it [00:20, 4.71it/s] 93it [00:20, 4.71it/s] 94it [00:20, 4.72it/s] 95it [00:20, 4.71it/s] 96it [00:21, 4.71it/s] 97it [00:21, 4.71it/s] 98it [00:21, 4.71it/s] 99it [00:21, 4.72it/s] 100it [00:21, 4.55it/s]2025-05-26 01:49:01,072 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 8575.6543 | mean log_px -0.0730 | KL -3466.15 + 101it [00:22, 4.61it/s] 102it [00:22, 4.64it/s] 103it [00:22, 4.66it/s] 104it [00:22, 4.68it/s] 105it [00:22, 4.69it/s] 106it [00:23, 4.53it/s] 107it [00:23, 4.59it/s] 108it [00:23, 4.62it/s] 109it [00:23, 4.65it/s] 110it [00:24, 4.66it/s] 111it [00:24, 4.68it/s] 112it [00:24, 4.52it/s] 113it [00:24, 4.59it/s] 114it [00:24, 4.63it/s] 115it [00:25, 4.66it/s] 116it [00:25, 4.68it/s] 117it [00:25, 4.52it/s] 118it [00:25, 4.57it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.65it/s] 121it [00:26, 4.67it/s] 122it [00:26, 4.68it/s] 123it [00:26, 4.66it/s] 124it [00:27, 4.68it/s] 125it [00:27, 4.70it/s] 126it [00:27, 4.54it/s] 127it [00:27, 4.60it/s] 128it [00:27, 4.62it/s] 129it [00:28, 4.66it/s] 130it [00:28, 4.68it/s] 131it [00:28, 4.69it/s] 132it [00:28, 4.69it/s] 133it [00:29, 4.54it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.46it/s] 137it [00:29, 4.52it/s] 138it [00:30, 4.58it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.59it/s] 141it [00:30, 4.55it/s] 142it [00:30, 4.60it/s] 143it [00:31, 4.64it/s] 144it [00:31, 4.67it/s] 145it [00:31, 4.52it/s] 146it [00:31, 4.57it/s] 147it [00:32, 4.62it/s] 148it [00:32, 4.64it/s] 149it [00:32, 4.66it/s] 150it [00:32, 4.68it/s]2025-05-26 01:49:11,882 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 10918.8730 | mean log_px -0.1088 | KL -3451.89 + 151it [00:32, 4.53it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.63it/s] 154it [00:33, 4.64it/s] 155it [00:33, 4.66it/s] 156it [00:34, 4.67it/s] 157it [00:34, 4.53it/s] 158it [00:34, 4.59it/s] 159it [00:34, 4.64it/s] 160it [00:34, 4.66it/s] 161it [00:35, 4.67it/s] 162it [00:35, 4.70it/s] 163it [00:35, 4.54it/s] 164it [00:35, 4.60it/s] 165it [00:35, 4.64it/s] 166it [00:36, 4.66it/s] 167it [00:36, 4.69it/s] 168it [00:36, 4.53it/s] 169it [00:36, 4.60it/s] 170it [00:37, 4.63it/s] 171it [00:37, 4.66it/s] 172it [00:37, 4.67it/s] 173it [00:37, 4.69it/s] 174it [00:37, 4.70it/s] 175it [00:38, 4.53it/s] 176it [00:38, 4.57it/s] 177it [00:38, 4.59it/s] 178it [00:38, 4.62it/s] 179it [00:38, 4.65it/s] 180it [00:39, 4.66it/s] 181it [00:39, 4.52it/s] 182it [00:39, 4.59it/s] 183it [00:39, 4.63it/s] 184it [00:40, 4.64it/s] 185it [00:40, 4.66it/s] 186it [00:40, 4.68it/s] 187it [00:40, 4.48it/s] 188it [00:40, 4.56it/s] 189it [00:41, 4.60it/s] 190it [00:41, 4.62it/s] 191it [00:41, 4.65it/s] 192it [00:41, 4.65it/s] 193it [00:42, 4.51it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.42it/s] 196it [00:42, 4.50it/s] 196it [00:42, 4.58it/s] +2025-05-26 01:49:21,792 - INFO - Epoch: 1, Objective: tensor([9172.7520], device='cuda:0', grad_fn=), Loss: 0.07874009013175964, KL/n: 70.15756225585938 + 0it [00:00, ?it/s]2025-05-26 01:49:22,359 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 7225.7852 | mean log_px -0.0616 | KL -3439.12 + 1it [00:00, 3.09it/s] 2it [00:00, 3.67it/s] 3it [00:00, 3.72it/s] 4it [00:01, 3.89it/s] 5it [00:01, 4.03it/s] 6it [00:01, 4.07it/s] 7it [00:01, 4.23it/s] 8it [00:01, 4.21it/s] 9it [00:02, 4.06it/s] 10it [00:02, 4.24it/s] 11it [00:02, 4.38it/s] 12it [00:02, 4.45it/s] 13it [00:03, 4.53it/s] 14it [00:03, 4.55it/s] 15it [00:03, 4.62it/s] 16it [00:03, 4.52it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.62it/s] 19it [00:04, 4.46it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.41it/s] 22it [00:05, 4.44it/s] 23it [00:05, 4.47it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.60it/s] 26it [00:05, 4.60it/s] 27it [00:06, 4.64it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.49it/s] 30it [00:06, 4.41it/s] 31it [00:07, 4.20it/s] 32it [00:07, 4.33it/s] 33it [00:07, 4.28it/s] 34it [00:07, 4.26it/s] 35it [00:08, 4.38it/s] 36it [00:08, 4.32it/s] 37it [00:08, 4.42it/s] 38it [00:08, 4.35it/s] 39it [00:08, 4.31it/s] 40it [00:09, 4.40it/s] 41it [00:09, 4.49it/s] 42it [00:09, 4.39it/s] 43it [00:09, 4.33it/s] 44it [00:10, 4.42it/s] 45it [00:10, 4.20it/s] 46it [00:10, 4.34it/s] 47it [00:10, 4.42it/s] 48it [00:11, 4.50it/s] 49it [00:11, 4.56it/s] 50it [00:11, 4.60it/s]2025-05-26 01:49:33,676 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 7740.6035 | mean log_px -0.0618 | KL -3413.71 + 51it [00:11, 4.64it/s] 52it [00:11, 4.59it/s] 53it [00:12, 4.61it/s] 54it [00:12, 4.64it/s] 55it [00:12, 4.66it/s] 56it [00:12, 4.67it/s] 57it [00:12, 4.69it/s] 58it [00:13, 4.51it/s] 59it [00:13, 4.42it/s] 60it [00:13, 4.48it/s] 61it [00:13, 4.55it/s] 62it [00:14, 4.43it/s] 63it [00:14, 4.38it/s] 64it [00:14, 4.30it/s] 65it [00:14, 4.42it/s] 66it [00:14, 4.50it/s] 67it [00:15, 4.56it/s] 68it [00:15, 4.43it/s] 69it [00:15, 4.37it/s] 70it [00:15, 4.45it/s] 71it [00:16, 4.41it/s] 72it [00:16, 4.26it/s] 73it [00:16, 4.01it/s] 74it [00:16, 4.16it/s] 75it [00:17, 4.28it/s] 76it [00:17, 4.38it/s] 77it [00:17, 4.45it/s] 78it [00:17, 4.52it/s] 79it [00:17, 4.55it/s] 80it [00:18, 4.60it/s] 81it [00:18, 4.52it/s] 82it [00:18, 4.46it/s] 83it [00:18, 4.49it/s] 84it [00:19, 4.46it/s] 85it [00:19, 4.52it/s] 86it [00:19, 4.55it/s] 87it [00:19, 4.45it/s] 88it [00:19, 4.34it/s] 89it [00:20, 4.42it/s] 90it [00:20, 4.49it/s] 91it [00:20, 4.49it/s] 92it [00:20, 4.54it/s] 93it [00:21, 4.59it/s] 94it [00:21, 4.55it/s] 95it [00:21, 4.57it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.65it/s] 98it [00:22, 4.66it/s] 99it [00:22, 4.63it/s] 100it [00:22, 4.49it/s]2025-05-26 01:49:44,865 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 10890.5635 | mean log_px -0.1134 | KL -3399.14 + 101it [00:22, 4.39it/s] 102it [00:23, 4.46it/s] 103it [00:23, 4.53it/s] 104it [00:23, 4.40it/s] 105it [00:23, 4.48it/s] 106it [00:23, 4.55it/s] 107it [00:24, 4.43it/s] 108it [00:24, 4.52it/s] 109it [00:24, 4.58it/s] 110it [00:24, 4.62it/s] 111it [00:25, 4.66it/s] 112it [00:25, 4.67it/s] 113it [00:25, 4.69it/s] 114it [00:25, 4.69it/s] 115it [00:25, 4.70it/s] 116it [00:26, 4.70it/s] 117it [00:26, 4.71it/s] 118it [00:26, 4.54it/s] 119it [00:26, 4.61it/s] 120it [00:26, 4.45it/s] 121it [00:27, 4.37it/s] 122it [00:27, 4.45it/s] 123it [00:27, 4.53it/s] 124it [00:27, 4.57it/s] 125it [00:28, 4.61it/s] 126it [00:28, 4.45it/s] 127it [00:28, 4.36it/s] 128it [00:28, 4.47it/s] 129it [00:28, 4.54it/s] 130it [00:29, 4.59it/s] 131it [00:29, 4.58it/s] 132it [00:29, 4.61it/s] 133it [00:29, 4.64it/s] 134it [00:30, 4.63it/s] 135it [00:30, 4.50it/s] 136it [00:30, 4.57it/s] 137it [00:30, 4.44it/s] 138it [00:30, 4.51it/s] 139it [00:31, 4.57it/s] 140it [00:31, 4.42it/s] 141it [00:31, 4.42it/s] 142it [00:31, 4.35it/s] 143it [00:32, 4.31it/s] 144it [00:32, 4.40it/s] 145it [00:32, 4.48it/s] 146it [00:32, 4.39it/s] 147it [00:32, 4.46it/s] 148it [00:33, 4.53it/s] 149it [00:33, 4.59it/s] 150it [00:33, 4.43it/s]2025-05-26 01:49:55,931 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 6388.3467 | mean log_px -0.0455 | KL -3380.82 + 151it [00:33, 4.36it/s] 152it [00:34, 4.45it/s] 153it [00:34, 4.52it/s] 154it [00:34, 4.28it/s] 155it [00:34, 4.39it/s] 156it [00:35, 4.48it/s] 157it [00:35, 4.54it/s] 158it [00:35, 4.53it/s] 159it [00:35, 4.45it/s] 160it [00:35, 4.54it/s] 161it [00:36, 4.58it/s] 162it [00:36, 4.59it/s] 163it [00:36, 4.63it/s] 164it [00:36, 4.65it/s] 165it [00:36, 4.67it/s] 166it [00:37, 4.69it/s] 167it [00:37, 4.69it/s] 168it [00:37, 4.70it/s] 169it [00:37, 4.69it/s] 170it [00:38, 4.70it/s] 171it [00:38, 4.51it/s] 172it [00:38, 4.26it/s] 173it [00:38, 4.24it/s] 174it [00:39, 4.21it/s] 175it [00:39, 4.31it/s] 176it [00:39, 4.38it/s] 177it [00:39, 4.45it/s] 178it [00:39, 4.52it/s] 179it [00:40, 4.36it/s] 180it [00:40, 4.15it/s] 181it [00:40, 4.23it/s] 182it [00:40, 4.37it/s] 183it [00:41, 4.47it/s] 184it [00:41, 4.52it/s] 185it [00:41, 4.58it/s] 186it [00:41, 4.62it/s] 187it [00:41, 4.45it/s] 188it [00:42, 4.39it/s] 189it [00:42, 4.49it/s] 190it [00:42, 4.25it/s] 191it [00:42, 4.23it/s] 192it [00:43, 4.28it/s] 193it [00:43, 4.36it/s] 194it [00:43, 4.44it/s] 195it [00:43, 4.44it/s] 196it [00:43, 4.50it/s] 196it [00:44, 4.45it/s] +2025-05-26 01:50:06,141 - INFO - Epoch: 2, Objective: tensor([7126.1548], device='cuda:0', grad_fn=), Loss: 0.05375305190682411, KL/n: 68.71427154541016 + 0it [00:00, ?it/s]2025-05-26 01:50:06,530 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 6548.8511 | mean log_px -0.0590 | KL -3364.44 + 1it [00:00, 2.90it/s] 2it [00:00, 3.75it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.08it/s] 5it [00:01, 4.10it/s] 6it [00:01, 4.12it/s] 7it [00:01, 4.29it/s] 8it [00:01, 4.41it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.23it/s] 11it [00:02, 4.37it/s] 12it [00:02, 4.31it/s] 13it [00:03, 4.41it/s] 14it [00:03, 4.33it/s] 15it [00:03, 4.24it/s] 16it [00:03, 4.24it/s] 17it [00:04, 4.21it/s] 18it [00:04, 4.33it/s] 19it [00:04, 4.26it/s] 20it [00:04, 4.37it/s] 21it [00:04, 4.44it/s] 22it [00:05, 4.51it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.62it/s] 25it [00:05, 4.48it/s] 26it [00:06, 4.54it/s] 27it [00:06, 4.44it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.53it/s] 30it [00:06, 4.58it/s] 31it [00:07, 4.46it/s] 32it [00:07, 4.53it/s] 33it [00:07, 4.42it/s] 34it [00:07, 4.43it/s] 35it [00:08, 4.47it/s] 36it [00:08, 4.50it/s] 37it [00:08, 4.38it/s] 38it [00:08, 4.45it/s] 39it [00:08, 4.51it/s] 40it [00:09, 4.54it/s] 41it [00:09, 4.57it/s] 42it [00:09, 4.59it/s] 43it [00:09, 4.62it/s] 44it [00:10, 4.45it/s] 45it [00:10, 4.29it/s] 46it [00:10, 4.39it/s] 47it [00:10, 4.30it/s] 48it [00:10, 4.24it/s] 49it [00:11, 4.31it/s] 50it [00:11, 4.40it/s]2025-05-26 01:50:17,883 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 6395.8638 | mean log_px -0.0435 | KL -3348.27 + 51it [00:11, 4.31it/s] 52it [00:11, 4.13it/s] 53it [00:12, 4.28it/s] 54it [00:12, 4.38it/s] 55it [00:12, 4.44it/s] 56it [00:12, 4.51it/s] 57it [00:13, 4.56it/s] 58it [00:13, 4.44it/s] 59it [00:13, 4.44it/s] 60it [00:13, 4.49it/s] 61it [00:13, 4.44it/s] 62it [00:14, 4.52it/s] 63it [00:14, 4.50it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.55it/s] 66it [00:15, 4.60it/s] 67it [00:15, 4.39it/s] 68it [00:15, 4.49it/s] 69it [00:15, 4.54it/s] 70it [00:15, 4.58it/s] 71it [00:16, 4.61it/s] 72it [00:16, 4.63it/s] 73it [00:16, 4.45it/s] 74it [00:16, 4.35it/s] 75it [00:17, 4.44it/s] 76it [00:17, 4.50it/s] 77it [00:17, 4.53it/s] 78it [00:17, 3.57it/s] 79it [00:18, 3.84it/s] 80it [00:18, 4.07it/s] 81it [00:18, 4.23it/s] 82it [00:18, 4.36it/s] 83it [00:18, 4.45it/s] 84it [00:19, 4.35it/s] 85it [00:19, 4.45it/s] 86it [00:19, 4.47it/s] 87it [00:19, 4.53it/s] 88it [00:20, 4.35it/s] 89it [00:20, 4.44it/s] 90it [00:20, 4.51it/s] 91it [00:20, 4.39it/s] 92it [00:20, 4.46it/s] 93it [00:21, 4.53it/s] 94it [00:21, 4.57it/s] 95it [00:21, 4.47it/s] 96it [00:21, 4.53it/s] 97it [00:22, 4.42it/s] 98it [00:22, 4.34it/s] 99it [00:22, 4.42it/s] 100it [00:22, 4.34it/s]2025-05-26 01:50:29,216 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 6408.8643 | mean log_px -0.0460 | KL -3327.64 + 101it [00:23, 4.42it/s] 102it [00:23, 4.49it/s] 103it [00:23, 4.54it/s] 104it [00:23, 4.57it/s] 105it [00:23, 4.61it/s] 106it [00:24, 4.45it/s] 107it [00:24, 4.53it/s] 108it [00:24, 4.57it/s] 109it [00:24, 4.61it/s] 110it [00:24, 4.63it/s] 111it [00:25, 4.63it/s] 112it [00:25, 4.59it/s] 113it [00:25, 4.59it/s] 114it [00:25, 4.61it/s] 115it [00:26, 4.62it/s] 116it [00:26, 4.63it/s] 117it [00:26, 4.65it/s] 118it [00:26, 4.65it/s] 119it [00:26, 4.66it/s] 120it [00:27, 4.67it/s] 121it [00:27, 4.67it/s] 122it [00:27, 4.52it/s] 123it [00:27, 4.58it/s] 124it [00:27, 4.60it/s] 125it [00:28, 4.63it/s] 126it [00:28, 4.62it/s] 127it [00:28, 4.63it/s] 128it [00:28, 4.48it/s] 129it [00:29, 4.55it/s] 130it [00:29, 4.50it/s] 131it [00:29, 4.49it/s] 132it [00:29, 4.53it/s] 133it [00:29, 4.57it/s] 134it [00:30, 4.44it/s] 135it [00:30, 4.51it/s] 136it [00:30, 4.56it/s] 137it [00:30, 4.49it/s] 138it [00:31, 4.48it/s] 139it [00:31, 4.54it/s] 140it [00:31, 4.57it/s] 141it [00:31, 4.60it/s] 142it [00:31, 4.47it/s] 143it [00:32, 4.53it/s] 144it [00:32, 4.56it/s] 145it [00:32, 4.58it/s] 146it [00:32, 4.61it/s] 147it [00:33, 4.63it/s] 148it [00:33, 4.65it/s] 149it [00:33, 4.66it/s] 150it [00:33, 4.66it/s]2025-05-26 01:50:40,141 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 6867.9688 | mean log_px -0.0538 | KL -3303.91 + 151it [00:33, 4.35it/s] 152it [00:34, 4.43it/s] 153it [00:34, 4.51it/s] 154it [00:34, 4.54it/s] 155it [00:34, 4.57it/s] 156it [00:35, 4.60it/s] 157it [00:35, 4.52it/s] 158it [00:35, 4.57it/s] 159it [00:35, 4.26it/s] 160it [00:35, 4.24it/s] 161it [00:36, 4.20it/s] 162it [00:36, 4.32it/s] 163it [00:36, 4.12it/s] 164it [00:36, 4.21it/s] 165it [00:37, 4.32it/s] 166it [00:37, 4.25it/s] 167it [00:37, 4.12it/s] 168it [00:37, 4.06it/s] 169it [00:38, 4.09it/s] 170it [00:38, 4.25it/s] 171it [00:38, 4.35it/s] 172it [00:38, 4.41it/s] 173it [00:39, 4.32it/s] 174it [00:39, 4.20it/s] 175it [00:39, 4.33it/s] 176it [00:39, 4.42it/s] 177it [00:39, 4.31it/s] 178it [00:40, 4.41it/s] 179it [00:40, 4.49it/s] 180it [00:40, 4.35it/s] 181it [00:40, 4.42it/s] 182it [00:41, 4.48it/s] 183it [00:41, 4.38it/s] 184it [00:41, 4.45it/s] 185it [00:41, 4.52it/s] 186it [00:41, 4.50it/s] 187it [00:42, 4.48it/s] 188it [00:42, 4.49it/s] 189it [00:42, 4.51it/s] 190it [00:42, 4.55it/s] 191it [00:43, 4.59it/s] 192it [00:43, 4.60it/s] 193it [00:43, 4.62it/s] 194it [00:43, 4.43it/s] 195it [00:44, 4.25it/s] 196it [00:44, 4.40it/s] 196it [00:44, 4.43it/s] +2025-05-26 01:50:50,544 - INFO - Epoch: 3, Objective: tensor([5746.6787], device='cuda:0', grad_fn=), Loss: 0.046654097735881805, KL/n: 67.17630004882812 + 0it [00:00, ?it/s]2025-05-26 01:50:50,958 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 5883.0645 | mean log_px -0.0408 | KL -3290.14 + 1it [00:00, 2.94it/s] 2it [00:00, 3.59it/s] 3it [00:00, 4.03it/s] 4it [00:01, 4.21it/s] 5it [00:01, 4.23it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.28it/s] 8it [00:01, 4.28it/s] 9it [00:02, 4.26it/s] 10it [00:02, 4.24it/s] 11it [00:02, 4.26it/s] 12it [00:02, 4.12it/s] 13it [00:03, 4.14it/s] 14it [00:03, 4.18it/s] 15it [00:03, 4.21it/s] 16it [00:03, 4.34it/s] 17it [00:04, 4.43it/s] 18it [00:04, 4.36it/s] 19it [00:04, 4.48it/s] 20it [00:04, 4.43it/s] 21it [00:04, 4.40it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.38it/s] 24it [00:05, 4.45it/s] 25it [00:05, 4.23it/s] 26it [00:06, 4.30it/s] 27it [00:06, 4.39it/s] 28it [00:06, 4.33it/s] 29it [00:06, 4.36it/s] 30it [00:07, 4.45it/s] 31it [00:07, 4.28it/s] 32it [00:07, 4.28it/s] 33it [00:07, 4.31it/s] 34it [00:07, 4.28it/s] 35it [00:08, 4.32it/s] 36it [00:08, 4.31it/s] 37it [00:08, 4.22it/s] 38it [00:08, 4.31it/s] 39it [00:09, 4.30it/s] 40it [00:09, 4.32it/s] 41it [00:09, 4.34it/s] 42it [00:09, 4.44it/s] 43it [00:10, 4.52it/s] 44it [00:10, 4.56it/s] 45it [00:10, 4.61it/s] 46it [00:10, 4.57it/s] 47it [00:10, 4.53it/s] 48it [00:11, 4.37it/s] 49it [00:11, 4.47it/s] 50it [00:11, 4.50it/s]2025-05-26 01:51:02,399 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 4895.3418 | mean log_px -0.0286 | KL -3262.91 + 51it [00:11, 4.49it/s] 52it [00:12, 4.46it/s] 53it [00:12, 4.47it/s] 54it [00:12, 4.40it/s] 55it [00:12, 4.51it/s] 56it [00:12, 4.43it/s] 57it [00:13, 4.53it/s] 58it [00:13, 4.42it/s] 59it [00:13, 4.24it/s] 60it [00:13, 4.25it/s] 61it [00:14, 4.30it/s] 62it [00:14, 4.30it/s] 63it [00:14, 4.32it/s] 64it [00:14, 4.37it/s] 65it [00:14, 4.40it/s] 66it [00:15, 4.42it/s] 67it [00:15, 4.41it/s] 68it [00:15, 4.41it/s] 69it [00:15, 4.41it/s] 70it [00:16, 4.47it/s] 71it [00:16, 4.35it/s] 72it [00:16, 4.42it/s] 73it [00:16, 4.50it/s] 74it [00:17, 4.39it/s] 75it [00:17, 4.39it/s] 76it [00:17, 4.42it/s] 77it [00:17, 4.39it/s] 78it [00:17, 4.35it/s] 79it [00:18, 4.37it/s] 80it [00:18, 4.38it/s] 81it [00:18, 4.42it/s] 82it [00:18, 4.42it/s] 83it [00:19, 4.51it/s] 84it [00:19, 4.42it/s] 85it [00:19, 4.47it/s] 86it [00:19, 4.54it/s] 87it [00:19, 4.58it/s] 88it [00:20, 4.52it/s] 89it [00:20, 4.58it/s] 90it [00:20, 4.54it/s] 91it [00:20, 4.60it/s] 92it [00:21, 4.58it/s] 93it [00:21, 4.62it/s] 94it [00:21, 4.50it/s] 95it [00:21, 4.49it/s] 96it [00:21, 4.52it/s] 97it [00:22, 4.55it/s] 98it [00:22, 4.53it/s] 99it [00:22, 4.51it/s] 100it [00:22, 4.38it/s]2025-05-26 01:51:13,668 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 5435.9736 | mean log_px -0.0313 | KL -3245.03 + 101it [00:23, 4.41it/s] 102it [00:23, 4.48it/s] 103it [00:23, 4.49it/s] 104it [00:23, 4.53it/s] 105it [00:23, 4.50it/s] 106it [00:24, 4.57it/s] 107it [00:24, 4.54it/s] 108it [00:24, 4.30it/s] 109it [00:24, 4.40it/s] 110it [00:25, 4.45it/s] 111it [00:25, 4.53it/s] 112it [00:25, 4.51it/s] 113it [00:25, 4.57it/s] 114it [00:25, 4.56it/s] 115it [00:26, 4.50it/s] 116it [00:26, 4.56it/s] 117it [00:26, 4.56it/s] 118it [00:26, 4.47it/s] 119it [00:27, 4.49it/s] 120it [00:27, 4.52it/s] 121it [00:27, 4.37it/s] 122it [00:27, 4.44it/s] 123it [00:27, 4.52it/s] 124it [00:28, 4.48it/s] 125it [00:28, 4.50it/s] 126it [00:28, 4.52it/s] 127it [00:28, 4.51it/s] 128it [00:29, 4.54it/s] 129it [00:29, 4.51it/s] 130it [00:29, 4.56it/s] 131it [00:29, 4.42it/s] 132it [00:29, 4.51it/s] 133it [00:30, 4.57it/s] 134it [00:30, 4.56it/s] 135it [00:30, 4.56it/s] 136it [00:30, 4.48it/s] 137it [00:31, 4.49it/s] 138it [00:31, 4.47it/s] 139it [00:31, 4.53it/s] 140it [00:31, 4.56it/s] 141it [00:31, 4.38it/s] 142it [00:32, 4.47it/s] 143it [00:32, 4.48it/s] 144it [00:32, 4.48it/s] 145it [00:32, 4.51it/s] 146it [00:33, 4.51it/s] 147it [00:33, 4.56it/s] 148it [00:33, 4.55it/s] 149it [00:33, 4.43it/s] 150it [00:33, 4.42it/s]2025-05-26 01:51:24,799 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 4805.7720 | mean log_px -0.0276 | KL -3228.11 + 151it [00:34, 4.34it/s] 152it [00:34, 4.45it/s] 153it [00:34, 4.44it/s] 154it [00:34, 4.44it/s] 155it [00:35, 4.41it/s] 156it [00:35, 4.40it/s] 157it [00:35, 4.36it/s] 158it [00:35, 4.25it/s] 159it [00:36, 4.31it/s] 160it [00:36, 4.32it/s] 161it [00:36, 4.36it/s] 162it [00:36, 4.40it/s] 163it [00:36, 4.47it/s] 164it [00:37, 4.53it/s] 165it [00:37, 4.58it/s] 166it [00:37, 4.39it/s] 167it [00:37, 4.49it/s] 168it [00:38, 4.48it/s] 169it [00:38, 4.46it/s] 170it [00:38, 4.52it/s] 171it [00:38, 4.45it/s] 172it [00:38, 4.45it/s] 173it [00:39, 4.43it/s] 174it [00:39, 4.41it/s] 175it [00:39, 4.37it/s] 176it [00:39, 4.39it/s] 177it [00:40, 4.44it/s] 178it [00:40, 4.42it/s] 179it [00:40, 4.31it/s] 180it [00:40, 4.37it/s] 181it [00:40, 4.47it/s] 182it [00:41, 4.51it/s] 183it [00:41, 4.49it/s] 184it [00:41, 4.42it/s] 185it [00:41, 4.51it/s] 186it [00:42, 4.49it/s] 187it [00:42, 4.46it/s] 188it [00:42, 4.48it/s] 189it [00:42, 4.46it/s] 190it [00:42, 4.50it/s] 191it [00:43, 4.48it/s] 192it [00:43, 4.44it/s] 193it [00:43, 4.40it/s] 194it [00:43, 4.49it/s] 195it [00:44, 4.39it/s] 196it [00:44, 4.38it/s] 196it [00:44, 4.42it/s] +2025-05-26 01:51:35,066 - INFO - Epoch: 4, Objective: tensor([5635.8784], device='cuda:0', grad_fn=), Loss: 0.03690037503838539, KL/n: 65.52703094482422 + 0it [00:00, ?it/s]2025-05-26 01:51:35,627 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 6954.7480 | mean log_px -0.0605 | KL -3211.71 + 1it [00:00, 2.99it/s] 2it [00:00, 3.67it/s] 3it [00:00, 4.08it/s] 4it [00:00, 4.27it/s] 5it [00:01, 4.43it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.58it/s] 8it [00:01, 4.47it/s] 9it [00:02, 4.56it/s] 10it [00:02, 4.59it/s] 11it [00:02, 4.62it/s] 12it [00:02, 4.64it/s] 13it [00:02, 4.50it/s] 14it [00:03, 4.56it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.61it/s] 17it [00:03, 4.62it/s] 18it [00:04, 4.64it/s] 19it [00:04, 4.65it/s] 20it [00:04, 4.49it/s] 21it [00:04, 4.57it/s] 22it [00:04, 4.59it/s] 23it [00:05, 4.63it/s] 24it [00:05, 4.64it/s] 25it [00:05, 4.65it/s] 26it [00:05, 4.66it/s] 27it [00:05, 4.67it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.52it/s] 30it [00:06, 4.58it/s] 31it [00:06, 4.61it/s] 32it [00:07, 4.63it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.68it/s] 36it [00:07, 4.67it/s] 37it [00:08, 4.51it/s] 38it [00:08, 4.58it/s] 39it [00:08, 4.61it/s] 40it [00:08, 4.63it/s] 41it [00:09, 4.66it/s] 42it [00:09, 4.66it/s] 43it [00:09, 4.51it/s] 44it [00:09, 4.57it/s] 45it [00:09, 4.61it/s] 46it [00:10, 4.60it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.65it/s] 49it [00:10, 4.67it/s] 50it [00:10, 4.53it/s]2025-05-26 01:51:46,517 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 6567.6064 | mean log_px -0.0585 | KL -3187.38 + 51it [00:11, 4.46it/s] 52it [00:11, 4.47it/s] 53it [00:11, 4.53it/s] 54it [00:11, 4.54it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.43it/s] 57it [00:12, 4.51it/s] 58it [00:12, 4.56it/s] 59it [00:12, 4.60it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.65it/s] 63it [00:13, 4.50it/s] 64it [00:14, 4.56it/s] 65it [00:14, 4.58it/s] 66it [00:14, 4.59it/s] 67it [00:14, 4.62it/s] 68it [00:14, 4.64it/s] 69it [00:15, 4.66it/s] 70it [00:15, 4.67it/s] 71it [00:15, 4.68it/s] 72it [00:15, 4.67it/s] 73it [00:15, 4.68it/s] 74it [00:16, 4.52it/s] 75it [00:16, 4.58it/s] 76it [00:16, 4.60it/s] 77it [00:16, 4.62it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.49it/s] 80it [00:17, 4.56it/s] 81it [00:17, 4.59it/s] 82it [00:17, 4.61it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.64it/s] 86it [00:18, 4.49it/s] 87it [00:19, 4.54it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.64it/s] 91it [00:19, 4.65it/s] 92it [00:20, 4.66it/s] 93it [00:20, 4.52it/s] 94it [00:20, 4.58it/s] 95it [00:20, 4.61it/s] 96it [00:20, 4.63it/s] 97it [00:21, 4.64it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.63it/s] 100it [00:21, 4.65it/s]2025-05-26 01:51:57,383 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 5110.2051 | mean log_px -0.0323 | KL -3168.64 + 101it [00:22, 4.66it/s] 102it [00:22, 4.66it/s] 103it [00:22, 4.68it/s] 104it [00:22, 4.68it/s] 105it [00:22, 4.52it/s] 106it [00:23, 4.57it/s] 107it [00:23, 4.61it/s] 108it [00:23, 4.63it/s] 109it [00:23, 4.65it/s] 110it [00:24, 4.67it/s] 111it [00:24, 4.67it/s] 112it [00:24, 4.51it/s] 113it [00:24, 4.57it/s] 114it [00:24, 4.60it/s] 115it [00:25, 4.63it/s] 116it [00:25, 4.64it/s] 117it [00:25, 4.65it/s] 118it [00:25, 4.66it/s] 119it [00:25, 4.67it/s] 120it [00:26, 4.67it/s] 121it [00:26, 4.51it/s] 122it [00:26, 4.57it/s] 123it [00:26, 4.60it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.64it/s] 126it [00:27, 4.65it/s] 127it [00:27, 4.66it/s] 128it [00:27, 4.67it/s] 129it [00:28, 4.52it/s] 130it [00:28, 4.57it/s] 131it [00:28, 4.60it/s] 132it [00:28, 4.62it/s] 133it [00:28, 4.64it/s] 134it [00:29, 4.65it/s] 135it [00:29, 4.66it/s] 136it [00:29, 4.66it/s] 137it [00:29, 4.67it/s] 138it [00:30, 4.67it/s] 139it [00:30, 4.68it/s] 140it [00:30, 4.68it/s] 141it [00:30, 4.69it/s] 142it [00:30, 4.51it/s] 143it [00:31, 4.56it/s] 144it [00:31, 4.59it/s] 145it [00:31, 4.61it/s] 146it [00:31, 4.63it/s] 147it [00:32, 4.66it/s] 148it [00:32, 4.66it/s] 149it [00:32, 4.50it/s] 150it [00:32, 4.56it/s]2025-05-26 01:52:08,217 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 3932.0217 | mean log_px -0.0119 | KL -3150.20 + 151it [00:32, 4.55it/s] 152it [00:33, 4.56it/s] 153it [00:33, 4.60it/s] 154it [00:33, 4.61it/s] 155it [00:33, 4.63it/s] 156it [00:33, 4.49it/s] 157it [00:34, 4.57it/s] 158it [00:34, 4.59it/s] 159it [00:34, 4.63it/s] 160it [00:34, 4.65it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.50it/s] 163it [00:35, 4.57it/s] 164it [00:35, 4.60it/s] 165it [00:35, 4.63it/s] 166it [00:36, 4.64it/s] 167it [00:36, 4.65it/s] 168it [00:36, 4.50it/s] 169it [00:36, 4.56it/s] 170it [00:37, 4.58it/s] 171it [00:37, 4.61it/s] 172it [00:37, 4.63it/s] 173it [00:37, 4.64it/s] 174it [00:37, 4.62it/s] 175it [00:38, 4.46it/s] 176it [00:38, 4.53it/s] 177it [00:38, 4.58it/s] 178it [00:38, 4.61it/s] 179it [00:38, 4.62it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.65it/s] 182it [00:39, 4.66it/s] 183it [00:39, 4.67it/s] 184it [00:40, 4.67it/s] 185it [00:40, 4.67it/s] 186it [00:40, 4.52it/s] 187it [00:40, 4.57it/s] 188it [00:40, 4.59it/s] 189it [00:41, 4.62it/s] 190it [00:41, 4.64it/s] 191it [00:41, 4.65it/s] 192it [00:41, 4.66it/s] 193it [00:42, 4.67it/s] 194it [00:42, 4.67it/s] 195it [00:42, 4.43it/s] 196it [00:42, 4.40it/s] 196it [00:42, 4.58it/s] +2025-05-26 01:52:18,161 - INFO - Epoch: 5, Objective: tensor([4262.7358], device='cuda:0', grad_fn=), Loss: 0.01855652406811714, KL/n: 64.05235290527344 + 0it [00:00, ?it/s]2025-05-26 01:52:18,564 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 4869.3335 | mean log_px -0.0318 | KL -3135.65 + 1it [00:00, 3.01it/s] 2it [00:00, 3.74it/s] 3it [00:00, 4.03it/s] 4it [00:00, 4.28it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.30it/s] 7it [00:01, 4.43it/s] 8it [00:01, 4.50it/s] 9it [00:02, 4.54it/s] 10it [00:02, 4.59it/s] 11it [00:02, 4.63it/s] 12it [00:02, 4.63it/s] 13it [00:02, 4.66it/s] 14it [00:03, 4.66it/s] 15it [00:03, 4.67it/s] 16it [00:03, 4.64it/s] 17it [00:03, 4.63it/s] 18it [00:04, 4.63it/s] 19it [00:04, 4.64it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.63it/s] 23it [00:05, 4.63it/s] 24it [00:05, 4.61it/s] 25it [00:05, 4.47it/s] 26it [00:05, 4.52it/s] 27it [00:05, 4.55it/s] 28it [00:06, 4.55it/s] 29it [00:06, 4.59it/s] 30it [00:06, 4.57it/s] 31it [00:06, 4.44it/s] 32it [00:07, 4.46it/s] 33it [00:07, 4.51it/s] 34it [00:07, 4.54it/s] 35it [00:07, 4.56it/s] 36it [00:07, 4.58it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.63it/s] 39it [00:08, 4.64it/s] 40it [00:09, 3.71it/s] 41it [00:09, 3.96it/s] 42it [00:09, 4.03it/s] 43it [00:09, 4.23it/s] 44it [00:09, 4.36it/s] 45it [00:10, 4.46it/s] 46it [00:10, 4.50it/s] 47it [00:10, 4.56it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.63it/s] 50it [00:11, 4.65it/s]2025-05-26 01:52:29,618 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 7057.3750 | mean log_px -0.0627 | KL -3113.32 + 51it [00:11, 4.66it/s] 52it [00:11, 4.67it/s] 53it [00:11, 4.68it/s] 54it [00:12, 4.67it/s] 55it [00:12, 4.68it/s] 56it [00:12, 4.68it/s] 57it [00:12, 4.68it/s] 58it [00:12, 4.50it/s] 59it [00:13, 4.55it/s] 60it [00:13, 4.59it/s] 61it [00:13, 4.51it/s] 62it [00:13, 4.40it/s] 63it [00:14, 4.48it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.58it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.63it/s] 68it [00:15, 4.65it/s] 69it [00:15, 4.66it/s] 70it [00:15, 4.51it/s] 71it [00:15, 4.53it/s] 72it [00:15, 4.54it/s] 73it [00:16, 4.57it/s] 74it [00:16, 4.58it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.60it/s] 77it [00:17, 4.61it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.59it/s] 81it [00:17, 4.60it/s] 82it [00:18, 4.60it/s] 83it [00:18, 4.47it/s] 84it [00:18, 4.52it/s] 85it [00:18, 4.56it/s] 86it [00:19, 4.58it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.58it/s] 90it [00:19, 4.58it/s] 91it [00:20, 4.60it/s] 92it [00:20, 4.59it/s] 93it [00:20, 4.60it/s] 94it [00:20, 4.60it/s] 95it [00:20, 4.61it/s] 96it [00:21, 4.59it/s] 97it [00:21, 4.60it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.61it/s] 100it [00:22, 4.61it/s]2025-05-26 01:52:40,522 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 6381.2471 | mean log_px -0.0664 | KL -3103.59 + 101it [00:22, 4.61it/s] 102it [00:22, 4.45it/s] 103it [00:22, 4.50it/s] 104it [00:22, 4.52it/s] 105it [00:23, 4.53it/s] 106it [00:23, 4.55it/s] 107it [00:23, 4.55it/s] 108it [00:23, 4.58it/s] 109it [00:24, 4.59it/s] 110it [00:24, 4.57it/s] 111it [00:24, 4.43it/s] 112it [00:24, 4.51it/s] 113it [00:24, 4.55it/s] 114it [00:25, 4.45it/s] 115it [00:25, 4.50it/s] 116it [00:25, 4.53it/s] 117it [00:25, 4.55it/s] 118it [00:26, 4.56it/s] 119it [00:26, 4.57it/s] 120it [00:26, 4.54it/s] 121it [00:26, 4.56it/s] 122it [00:26, 4.57it/s] 123it [00:27, 4.57it/s] 124it [00:27, 4.56it/s] 125it [00:27, 4.49it/s] 126it [00:27, 4.48it/s] 127it [00:28, 4.48it/s] 128it [00:28, 4.49it/s] 129it [00:28, 4.52it/s] 130it [00:28, 4.38it/s] 131it [00:28, 4.46it/s] 132it [00:29, 4.50it/s] 133it [00:29, 4.39it/s] 134it [00:29, 4.45it/s] 135it [00:29, 4.49it/s] 136it [00:30, 4.51it/s] 137it [00:30, 4.52it/s] 138it [00:30, 4.48it/s] 139it [00:30, 4.49it/s] 140it [00:30, 4.29it/s] 141it [00:31, 4.25it/s] 142it [00:31, 4.31it/s] 143it [00:31, 4.36it/s] 144it [00:31, 4.39it/s] 145it [00:32, 4.43it/s] 146it [00:32, 4.45it/s] 147it [00:32, 4.49it/s] 148it [00:32, 4.49it/s] 149it [00:33, 4.30it/s] 150it [00:33, 4.29it/s]2025-05-26 01:52:51,725 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 4548.9775 | mean log_px -0.0281 | KL -3080.35 + 151it [00:33, 4.35it/s] 152it [00:33, 4.33it/s] 153it [00:33, 4.36it/s] 154it [00:34, 4.42it/s] 155it [00:34, 4.47it/s] 156it [00:34, 4.36it/s] 157it [00:34, 4.40it/s] 158it [00:35, 4.43it/s] 159it [00:35, 4.39it/s] 160it [00:35, 4.38it/s] 161it [00:35, 4.40it/s] 162it [00:35, 4.37it/s] 163it [00:36, 4.36it/s] 164it [00:36, 4.46it/s] 165it [00:36, 4.52it/s] 166it [00:36, 4.54it/s] 167it [00:37, 4.56it/s] 168it [00:37, 4.55it/s] 169it [00:37, 4.56it/s] 170it [00:37, 4.59it/s] 171it [00:37, 4.54it/s] 172it [00:38, 4.54it/s] 173it [00:38, 4.42it/s] 174it [00:38, 4.46it/s] 175it [00:38, 4.46it/s] 176it [00:39, 4.52it/s] 177it [00:39, 4.56it/s] 178it [00:39, 4.58it/s] 179it [00:39, 4.61it/s] 180it [00:39, 4.62it/s] 181it [00:40, 4.47it/s] 182it [00:40, 4.54it/s] 183it [00:40, 4.58it/s] 184it [00:40, 4.60it/s] 185it [00:41, 4.62it/s] 186it [00:41, 4.63it/s] 187it [00:41, 4.64it/s] 188it [00:41, 4.48it/s] 189it [00:41, 4.55it/s] 190it [00:42, 4.57it/s] 191it [00:42, 4.60it/s] 192it [00:42, 4.60it/s] 193it [00:42, 4.62it/s] 194it [00:43, 4.48it/s] 195it [00:43, 4.34it/s] 196it [00:43, 4.39it/s] 196it [00:43, 4.50it/s] +2025-05-26 01:53:01,857 - INFO - Epoch: 6, Objective: tensor([7316.6924], device='cuda:0', grad_fn=), Loss: 0.06832034140825272, KL/n: 62.47688674926758 + 0it [00:00, ?it/s]2025-05-26 01:53:02,278 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 5764.2217 | mean log_px -0.0439 | KL -3059.68 + 1it [00:00, 2.91it/s] 2it [00:00, 3.72it/s] 3it [00:00, 3.90it/s] 4it [00:01, 4.16it/s] 5it [00:01, 4.31it/s] 6it [00:01, 4.18it/s] 7it [00:01, 4.24it/s] 8it [00:01, 4.26it/s] 9it [00:02, 4.33it/s] 10it [00:02, 4.39it/s] 11it [00:02, 4.50it/s] 12it [00:02, 4.50it/s] 13it [00:03, 4.57it/s] 14it [00:03, 4.60it/s] 15it [00:03, 4.62it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.59it/s] 18it [00:04, 4.61it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.49it/s] 22it [00:05, 4.53it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.59it/s] 25it [00:05, 4.61it/s] 26it [00:05, 4.62it/s] 27it [00:06, 4.64it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.50it/s] 31it [00:06, 4.55it/s] 32it [00:07, 4.57it/s] 33it [00:07, 4.58it/s] 34it [00:07, 4.60it/s] 35it [00:07, 4.62it/s] 36it [00:08, 4.48it/s] 37it [00:08, 4.55it/s] 38it [00:08, 4.58it/s] 39it [00:08, 4.61it/s] 40it [00:08, 4.47it/s] 41it [00:09, 4.56it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.63it/s] 44it [00:09, 4.65it/s] 45it [00:09, 4.67it/s] 46it [00:10, 4.52it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.65it/s] 50it [00:11, 4.67it/s]2025-05-26 01:53:13,238 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 4438.1538 | mean log_px -0.0305 | KL -3042.06 + 51it [00:11, 4.68it/s] 52it [00:11, 4.66it/s] 53it [00:11, 4.68it/s] 54it [00:11, 4.70it/s] 55it [00:12, 4.71it/s] 56it [00:12, 4.53it/s] 57it [00:12, 4.60it/s] 58it [00:12, 4.63it/s] 59it [00:13, 4.66it/s] 60it [00:13, 4.67it/s] 61it [00:13, 4.69it/s] 62it [00:13, 4.52it/s] 63it [00:13, 4.60it/s] 64it [00:14, 4.63it/s] 65it [00:14, 4.66it/s] 66it [00:14, 4.67it/s] 67it [00:14, 4.66it/s] 68it [00:14, 4.66it/s] 69it [00:15, 4.68it/s] 70it [00:15, 4.68it/s] 71it [00:15, 4.52it/s] 72it [00:15, 4.58it/s] 73it [00:16, 4.63it/s] 74it [00:16, 4.65it/s] 75it [00:16, 4.67it/s] 76it [00:16, 4.69it/s] 77it [00:16, 4.70it/s] 78it [00:17, 4.70it/s] 79it [00:17, 4.71it/s] 80it [00:17, 4.71it/s] 81it [00:17, 4.72it/s] 82it [00:17, 4.71it/s] 83it [00:18, 4.71it/s] 84it [00:18, 4.71it/s] 85it [00:18, 4.70it/s] 86it [00:18, 4.47it/s] 87it [00:19, 4.53it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.61it/s] 90it [00:19, 4.63it/s] 91it [00:19, 4.64it/s] 92it [00:20, 4.66it/s] 93it [00:20, 4.51it/s] 94it [00:20, 4.59it/s] 95it [00:20, 4.63it/s] 96it [00:20, 4.65it/s] 97it [00:21, 4.68it/s] 98it [00:21, 4.51it/s] 99it [00:21, 4.59it/s] 100it [00:21, 4.63it/s]2025-05-26 01:53:24,020 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 3706.3210 | mean log_px -0.0132 | KL -3016.29 + 101it [00:22, 4.66it/s] 102it [00:22, 4.66it/s] 103it [00:22, 4.69it/s] 104it [00:22, 4.53it/s] 105it [00:22, 4.60it/s] 106it [00:23, 4.63it/s] 107it [00:23, 4.64it/s] 108it [00:23, 4.66it/s] 109it [00:23, 4.68it/s] 110it [00:24, 4.51it/s] 111it [00:24, 4.56it/s] 112it [00:24, 4.60it/s] 113it [00:24, 4.64it/s] 114it [00:24, 4.66it/s] 115it [00:25, 4.67it/s] 116it [00:25, 4.53it/s] 117it [00:25, 4.60it/s] 118it [00:25, 4.58it/s] 119it [00:25, 4.62it/s] 120it [00:26, 4.61it/s] 121it [00:26, 4.50it/s] 122it [00:26, 4.59it/s] 123it [00:26, 4.63it/s] 124it [00:27, 4.65it/s] 125it [00:27, 4.68it/s] 126it [00:27, 4.53it/s] 127it [00:27, 4.54it/s] 128it [00:27, 4.58it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.65it/s] 131it [00:28, 4.67it/s] 132it [00:28, 4.52it/s] 133it [00:29, 4.60it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.64it/s] 136it [00:29, 4.67it/s] 137it [00:29, 4.68it/s] 138it [00:30, 4.52it/s] 139it [00:30, 4.58it/s] 140it [00:30, 4.61it/s] 141it [00:30, 4.63it/s] 142it [00:30, 4.66it/s] 143it [00:31, 4.68it/s] 144it [00:31, 4.69it/s] 145it [00:31, 4.70it/s] 146it [00:31, 4.71it/s] 147it [00:32, 4.55it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.52it/s] 150it [00:32, 4.56it/s]2025-05-26 01:53:34,864 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 6590.7559 | mean log_px -0.0561 | KL -2995.29 + 151it [00:32, 4.60it/s] 152it [00:33, 4.62it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.54it/s] 155it [00:33, 4.58it/s] 156it [00:34, 4.60it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.63it/s] 159it [00:34, 4.64it/s] 160it [00:34, 4.62it/s] 161it [00:35, 4.64it/s] 162it [00:35, 4.54it/s] 163it [00:35, 4.57it/s] 164it [00:35, 4.56it/s] 165it [00:35, 4.60it/s] 166it [00:36, 4.63it/s] 167it [00:36, 4.57it/s] 168it [00:36, 4.59it/s] 169it [00:36, 4.62it/s] 170it [00:37, 4.64it/s] 171it [00:37, 4.50it/s] 172it [00:37, 4.54it/s] 173it [00:37, 4.55it/s] 174it [00:37, 4.58it/s] 175it [00:38, 4.60it/s] 176it [00:38, 4.61it/s] 177it [00:38, 4.63it/s] 178it [00:38, 4.65it/s] 179it [00:39, 4.62it/s] 180it [00:39, 4.63it/s] 181it [00:39, 4.65it/s] 182it [00:39, 4.64it/s] 183it [00:39, 4.65it/s] 184it [00:40, 4.63it/s] 185it [00:40, 4.65it/s] 186it [00:40, 4.50it/s] 187it [00:40, 4.55it/s] 188it [00:40, 4.58it/s] 189it [00:41, 4.59it/s] 190it [00:41, 4.60it/s] 191it [00:41, 4.62it/s] 192it [00:41, 4.47it/s] 193it [00:42, 4.53it/s] 194it [00:42, 4.57it/s] 195it [00:42, 4.34it/s] 196it [00:42, 4.41it/s] 196it [00:42, 4.58it/s] +2025-05-26 01:53:44,829 - INFO - Epoch: 7, Objective: tensor([5831.9897], device='cuda:0', grad_fn=), Loss: 0.03322037681937218, KL/n: 60.5771369934082 + 0it [00:00, ?it/s]2025-05-26 01:53:45,410 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 3881.9414 | mean log_px -0.0130 | KL -2970.20 + 1it [00:00, 3.05it/s] 2it [00:00, 3.64it/s] 3it [00:00, 4.09it/s] 4it [00:00, 4.31it/s] 5it [00:01, 4.46it/s] 6it [00:01, 4.54it/s] 7it [00:01, 4.61it/s] 8it [00:01, 4.64it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.59it/s] 11it [00:02, 4.63it/s] 12it [00:02, 4.66it/s] 13it [00:02, 4.68it/s] 14it [00:03, 4.52it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.66it/s] 18it [00:03, 4.68it/s] 19it [00:04, 4.53it/s] 20it [00:04, 4.60it/s] 21it [00:04, 4.65it/s] 22it [00:04, 4.67it/s] 23it [00:05, 4.69it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.62it/s] 26it [00:05, 4.64it/s] 27it [00:05, 4.64it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.50it/s] 30it [00:06, 4.58it/s] 31it [00:06, 4.61it/s] 32it [00:07, 4.57it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.47it/s] 35it [00:07, 4.49it/s] 36it [00:07, 4.50it/s] 37it [00:08, 4.34it/s] 38it [00:08, 4.38it/s] 39it [00:08, 4.43it/s] 40it [00:08, 4.46it/s] 41it [00:09, 4.50it/s] 42it [00:09, 4.55it/s] 43it [00:09, 4.41it/s] 44it [00:09, 4.50it/s] 45it [00:09, 4.56it/s] 46it [00:10, 4.59it/s] 47it [00:10, 4.64it/s] 48it [00:10, 4.65it/s] 49it [00:10, 4.67it/s] 50it [00:11, 4.68it/s]2025-05-26 01:53:56,320 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 4140.3315 | mean log_px -0.0194 | KL -2946.16 + 51it [00:11, 4.54it/s] 52it [00:11, 4.52it/s] 53it [00:11, 4.55it/s] 54it [00:11, 4.56it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.57it/s] 57it [00:12, 4.58it/s] 58it [00:12, 4.60it/s] 59it [00:13, 4.59it/s] 60it [00:13, 4.44it/s] 61it [00:13, 4.51it/s] 62it [00:13, 4.54it/s] 63it [00:13, 4.53it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.59it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.52it/s] 68it [00:14, 4.58it/s] 69it [00:15, 4.62it/s] 70it [00:15, 4.64it/s] 71it [00:15, 4.66it/s] 72it [00:15, 4.67it/s] 73it [00:16, 4.67it/s] 74it [00:16, 4.68it/s] 75it [00:16, 4.69it/s] 76it [00:16, 4.52it/s] 77it [00:16, 4.59it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.64it/s] 80it [00:17, 4.66it/s] 81it [00:17, 4.68it/s] 82it [00:17, 4.69it/s] 83it [00:18, 4.69it/s] 84it [00:18, 4.69it/s] 85it [00:18, 4.53it/s] 86it [00:18, 4.59it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.65it/s] 89it [00:19, 4.67it/s] 90it [00:19, 4.68it/s] 91it [00:19, 4.70it/s] 92it [00:20, 4.70it/s] 93it [00:20, 4.71it/s] 94it [00:20, 4.70it/s] 95it [00:20, 4.56it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.63it/s] 98it [00:21, 4.65it/s] 99it [00:21, 4.67it/s] 100it [00:21, 4.68it/s]2025-05-26 01:54:07,161 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 3203.0884 | mean log_px -0.0045 | KL -2923.38 + 101it [00:22, 4.68it/s] 102it [00:22, 4.69it/s] 103it [00:22, 4.69it/s] 104it [00:22, 4.54it/s] 105it [00:22, 4.61it/s] 106it [00:23, 4.63it/s] 107it [00:23, 4.65it/s] 108it [00:23, 4.65it/s] 109it [00:23, 4.66it/s] 110it [00:24, 4.67it/s] 111it [00:24, 4.68it/s] 112it [00:24, 4.68it/s] 113it [00:24, 4.69it/s] 114it [00:24, 4.69it/s] 115it [00:25, 4.70it/s] 116it [00:25, 4.70it/s] 117it [00:25, 4.54it/s] 118it [00:25, 4.60it/s] 119it [00:25, 4.63it/s] 120it [00:26, 4.63it/s] 121it [00:26, 4.67it/s] 122it [00:26, 4.50it/s] 123it [00:26, 4.58it/s] 124it [00:27, 4.61it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.65it/s] 128it [00:27, 4.65it/s] 129it [00:28, 4.67it/s] 130it [00:28, 4.52it/s] 131it [00:28, 4.59it/s] 132it [00:28, 4.60it/s] 133it [00:28, 4.63it/s] 134it [00:29, 4.65it/s] 135it [00:29, 4.67it/s] 136it [00:29, 4.67it/s] 137it [00:29, 4.68it/s] 138it [00:30, 4.68it/s] 139it [00:30, 4.69it/s] 140it [00:30, 4.69it/s] 141it [00:30, 4.70it/s] 142it [00:30, 4.69it/s] 143it [00:31, 4.70it/s] 144it [00:31, 4.69it/s] 145it [00:31, 4.69it/s] 146it [00:31, 4.69it/s] 147it [00:31, 4.69it/s] 148it [00:32, 4.69it/s] 149it [00:32, 4.51it/s] 150it [00:32, 4.57it/s]2025-05-26 01:54:17,934 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 3672.0759 | mean log_px -0.0163 | KL -2904.56 + 151it [00:32, 4.62it/s] 152it [00:33, 4.64it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.65it/s] 155it [00:33, 4.67it/s] 156it [00:33, 4.67it/s] 157it [00:34, 4.53it/s] 158it [00:34, 4.59it/s] 159it [00:34, 4.59it/s] 160it [00:34, 4.63it/s] 161it [00:35, 4.65it/s] 162it [00:35, 4.66it/s] 163it [00:35, 4.68it/s] 164it [00:35, 4.66it/s] 165it [00:35, 4.69it/s] 166it [00:36, 4.69it/s] 167it [00:36, 4.69it/s] 168it [00:36, 4.70it/s] 169it [00:36, 4.71it/s] 170it [00:36, 4.70it/s] 171it [00:37, 4.70it/s] 172it [00:37, 4.70it/s] 173it [00:37, 4.70it/s] 174it [00:37, 4.70it/s] 175it [00:37, 4.70it/s] 176it [00:38, 4.68it/s] 177it [00:38, 4.47it/s] 178it [00:38, 4.46it/s] 179it [00:38, 4.51it/s] 180it [00:39, 4.55it/s] 181it [00:39, 4.60it/s] 182it [00:39, 4.62it/s] 183it [00:39, 4.63it/s] 184it [00:39, 4.62it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.59it/s] 187it [00:40, 4.47it/s] 188it [00:40, 4.55it/s] 189it [00:41, 4.59it/s] 190it [00:41, 4.61it/s] 191it [00:41, 4.64it/s] 192it [00:41, 4.65it/s] 193it [00:41, 4.67it/s] 194it [00:42, 4.67it/s] 195it [00:42, 4.53it/s] 196it [00:42, 4.31it/s] 196it [00:42, 4.59it/s] +2025-05-26 01:54:27,845 - INFO - Epoch: 8, Objective: tensor([4215.5410], device='cuda:0', grad_fn=), Loss: 0.014363881200551987, KL/n: 58.71515655517578 + 0it [00:00, ?it/s]2025-05-26 01:54:28,274 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 3831.5950 | mean log_px -0.0261 | KL -2873.97 + 1it [00:00, 2.87it/s] 2it [00:00, 3.74it/s] 3it [00:00, 4.13it/s] 4it [00:00, 4.33it/s] 5it [00:01, 4.46it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.59it/s] 8it [00:01, 4.61it/s] 9it [00:02, 4.65it/s] 10it [00:02, 4.63it/s] 11it [00:02, 4.65it/s] 12it [00:02, 4.65it/s] 13it [00:02, 4.65it/s] 14it [00:03, 3.64it/s] 15it [00:03, 3.92it/s] 16it [00:03, 4.10it/s] 17it [00:03, 4.26it/s] 18it [00:04, 4.37it/s] 19it [00:04, 4.47it/s] 20it [00:04, 4.37it/s] 21it [00:04, 4.48it/s] 22it [00:05, 4.53it/s] 23it [00:05, 4.58it/s] 24it [00:05, 4.46it/s] 25it [00:05, 4.55it/s] 26it [00:05, 4.58it/s] 27it [00:06, 4.62it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.50it/s] 31it [00:07, 4.57it/s] 32it [00:07, 4.60it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.64it/s] 35it [00:07, 4.67it/s] 36it [00:08, 4.67it/s] 37it [00:08, 4.68it/s] 38it [00:08, 4.52it/s] 39it [00:08, 4.54it/s] 40it [00:08, 4.58it/s] 41it [00:09, 4.62it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.66it/s] 44it [00:09, 4.64it/s] 45it [00:10, 4.67it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.63it/s] 50it [00:11, 4.63it/s]2025-05-26 01:54:39,275 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 3554.7034 | mean log_px -0.0139 | KL -2847.36 + 51it [00:11, 4.65it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.58it/s] 54it [00:12, 4.61it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.64it/s] 57it [00:12, 4.66it/s] 58it [00:12, 4.67it/s] 59it [00:13, 4.65it/s] 60it [00:13, 4.47it/s] 61it [00:13, 4.50it/s] 62it [00:13, 4.55it/s] 63it [00:13, 4.60it/s] 64it [00:14, 4.62it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.66it/s] 67it [00:14, 4.67it/s] 68it [00:15, 4.67it/s] 69it [00:15, 4.68it/s] 70it [00:15, 4.68it/s] 71it [00:15, 4.53it/s] 72it [00:15, 4.59it/s] 73it [00:16, 4.63it/s] 74it [00:16, 4.64it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.60it/s] 77it [00:17, 4.47it/s] 78it [00:17, 4.54it/s] 79it [00:17, 4.59it/s] 80it [00:17, 4.62it/s] 81it [00:17, 4.64it/s] 82it [00:18, 4.64it/s] 83it [00:18, 4.64it/s] 84it [00:18, 4.66it/s] 85it [00:18, 4.51it/s] 86it [00:18, 4.57it/s] 87it [00:19, 4.61it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.64it/s] 91it [00:20, 4.67it/s] 92it [00:20, 4.64it/s] 93it [00:20, 4.66it/s] 94it [00:20, 4.66it/s] 95it [00:20, 4.67it/s] 96it [00:21, 4.68it/s] 97it [00:21, 4.69it/s] 98it [00:21, 4.68it/s] 99it [00:21, 4.69it/s] 100it [00:21, 4.69it/s]2025-05-26 01:54:50,088 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 3406.7056 | mean log_px -0.0110 | KL -2821.77 + 101it [00:22, 4.69it/s] 102it [00:22, 4.69it/s] 103it [00:22, 4.69it/s] 104it [00:22, 4.69it/s] 105it [00:23, 4.70it/s] 106it [00:23, 4.69it/s] 107it [00:23, 4.69it/s] 108it [00:23, 4.67it/s] 109it [00:23, 4.70it/s] 110it [00:24, 4.70it/s] 111it [00:24, 4.69it/s] 112it [00:24, 4.69it/s] 113it [00:24, 4.70it/s] 114it [00:24, 4.69it/s] 115it [00:25, 4.70it/s] 116it [00:25, 4.67it/s] 117it [00:25, 4.67it/s] 118it [00:25, 4.67it/s] 119it [00:25, 4.67it/s] 120it [00:26, 4.67it/s] 121it [00:26, 4.68it/s] 122it [00:26, 4.68it/s] 123it [00:26, 4.68it/s] 124it [00:27, 4.44it/s] 125it [00:27, 4.46it/s] 126it [00:27, 4.50it/s] 127it [00:27, 4.54it/s] 128it [00:27, 4.57it/s] 129it [00:28, 4.58it/s] 130it [00:28, 4.30it/s] 131it [00:28, 4.42it/s] 132it [00:28, 4.49it/s] 133it [00:29, 4.56it/s] 134it [00:29, 4.60it/s] 135it [00:29, 4.63it/s] 136it [00:29, 4.64it/s] 137it [00:29, 4.66it/s] 138it [00:30, 4.67it/s] 139it [00:30, 4.68it/s] 140it [00:30, 4.68it/s] 141it [00:30, 4.69it/s] 142it [00:31, 4.69it/s] 143it [00:31, 4.70it/s] 144it [00:31, 4.69it/s] 145it [00:31, 4.67it/s] 146it [00:31, 4.67it/s] 147it [00:32, 4.53it/s] 148it [00:32, 4.58it/s] 149it [00:32, 4.62it/s] 150it [00:32, 4.64it/s]2025-05-26 01:55:00,888 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 5147.5215 | mean log_px -0.0361 | KL -2803.57 + 151it [00:32, 4.66it/s] 152it [00:33, 4.66it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.46it/s] 155it [00:33, 4.54it/s] 156it [00:34, 4.58it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.46it/s] 159it [00:34, 4.51it/s] 160it [00:34, 4.57it/s] 161it [00:35, 4.61it/s] 162it [00:35, 4.60it/s] 163it [00:35, 4.49it/s] 164it [00:35, 4.55it/s] 165it [00:36, 4.56it/s] 166it [00:36, 4.59it/s] 167it [00:36, 4.63it/s] 168it [00:36, 4.51it/s] 169it [00:36, 4.58it/s] 170it [00:37, 4.60it/s] 171it [00:37, 4.63it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.56it/s] 174it [00:37, 4.61it/s] 175it [00:38, 4.63it/s] 176it [00:38, 4.64it/s] 177it [00:38, 4.65it/s] 178it [00:38, 4.53it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.62it/s] 182it [00:39, 4.63it/s] 183it [00:39, 4.49it/s] 184it [00:40, 4.55it/s] 185it [00:40, 4.57it/s] 186it [00:40, 4.59it/s] 187it [00:40, 4.62it/s] 188it [00:41, 4.63it/s] 189it [00:41, 4.46it/s] 190it [00:41, 4.53it/s] 191it [00:41, 4.55it/s] 192it [00:41, 4.58it/s] 193it [00:42, 4.61it/s] 194it [00:42, 4.62it/s] 195it [00:42, 4.38it/s] 196it [00:42, 4.49it/s] 196it [00:42, 4.57it/s] +2025-05-26 01:55:10,882 - INFO - Epoch: 9, Objective: tensor([4143.1064], device='cuda:0', grad_fn=), Loss: 0.02341052144765854, KL/n: 56.89252471923828 + 0it [00:00, ?it/s]2025-05-26 01:55:11,260 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 3292.7747 | mean log_px -0.0090 | KL -2785.48 + 1it [00:00, 3.30it/s] 2it [00:00, 3.85it/s] 3it [00:00, 4.06it/s] 4it [00:00, 4.14it/s] 5it [00:01, 4.21it/s] 6it [00:01, 4.24it/s] 7it [00:01, 4.39it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.53it/s] 10it [00:02, 4.58it/s] 11it [00:02, 4.62it/s] 12it [00:02, 4.64it/s] 13it [00:02, 4.66it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.59it/s] 16it [00:03, 4.62it/s] 17it [00:03, 4.64it/s] 18it [00:04, 4.65it/s] 19it [00:04, 4.66it/s] 20it [00:04, 4.50it/s] 21it [00:04, 4.58it/s] 22it [00:04, 4.61it/s] 23it [00:05, 4.64it/s] 24it [00:05, 4.65it/s] 25it [00:05, 4.66it/s] 26it [00:05, 4.67it/s] 27it [00:05, 4.68it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.53it/s] 30it [00:06, 4.59it/s] 31it [00:06, 4.62it/s] 32it [00:07, 4.64it/s] 33it [00:07, 4.66it/s] 34it [00:07, 4.67it/s] 35it [00:07, 4.51it/s] 36it [00:07, 4.58it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.67it/s] 41it [00:09, 4.68it/s] 42it [00:09, 4.68it/s] 43it [00:09, 4.55it/s] 44it [00:09, 4.58it/s] 45it [00:09, 4.63it/s] 46it [00:10, 4.65it/s] 47it [00:10, 4.66it/s] 48it [00:10, 4.65it/s] 49it [00:10, 4.65it/s] 50it [00:10, 4.67it/s]2025-05-26 01:55:22,122 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 3255.0281 | mean log_px -0.0100 | KL -2764.80 + 51it [00:11, 4.67it/s] 52it [00:11, 4.47it/s] 53it [00:11, 4.54it/s] 54it [00:11, 4.59it/s] 55it [00:12, 4.62it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.64it/s] 58it [00:12, 4.49it/s] 59it [00:12, 4.56it/s] 60it [00:13, 4.59it/s] 61it [00:13, 4.63it/s] 62it [00:13, 4.64it/s] 63it [00:13, 4.66it/s] 64it [00:13, 4.67it/s] 65it [00:14, 4.47it/s] 66it [00:14, 4.47it/s] 67it [00:14, 4.52it/s] 68it [00:14, 4.55it/s] 69it [00:15, 4.58it/s] 70it [00:15, 4.44it/s] 71it [00:15, 4.51it/s] 72it [00:15, 4.44it/s] 73it [00:16, 4.50it/s] 74it [00:16, 4.56it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.63it/s] 77it [00:16, 4.66it/s] 78it [00:17, 4.65it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.68it/s] 81it [00:17, 4.69it/s] 82it [00:17, 4.69it/s] 83it [00:18, 4.69it/s] 84it [00:18, 4.53it/s] 85it [00:18, 4.59it/s] 86it [00:18, 4.62it/s] 87it [00:19, 4.64it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.66it/s] 90it [00:19, 4.67it/s] 91it [00:19, 4.69it/s] 92it [00:20, 4.69it/s] 93it [00:20, 4.53it/s] 94it [00:20, 4.58it/s] 95it [00:20, 4.60it/s] 96it [00:20, 4.63it/s] 97it [00:21, 4.66it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.67it/s] 100it [00:21, 4.68it/s]2025-05-26 01:55:32,986 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 3816.2234 | mean log_px -0.0176 | KL -2740.36 + 101it [00:22, 4.68it/s] 102it [00:22, 4.68it/s] 103it [00:22, 4.55it/s] 104it [00:22, 4.55it/s] 105it [00:22, 4.60it/s] 106it [00:23, 4.63it/s] 107it [00:23, 4.64it/s] 108it [00:23, 4.45it/s] 109it [00:23, 4.54it/s] 110it [00:24, 4.58it/s] 111it [00:24, 4.62it/s] 112it [00:24, 4.64it/s] 113it [00:24, 4.66it/s] 114it [00:24, 4.68it/s] 115it [00:25, 4.50it/s] 116it [00:25, 4.55it/s] 117it [00:25, 4.57it/s] 118it [00:25, 4.59it/s] 119it [00:25, 4.60it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.60it/s] 122it [00:26, 4.60it/s] 123it [00:26, 4.61it/s] 124it [00:27, 4.61it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.61it/s] 128it [00:27, 4.50it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.45it/s] 131it [00:28, 4.49it/s] 132it [00:28, 4.50it/s] 133it [00:29, 4.53it/s] 134it [00:29, 4.53it/s] 135it [00:29, 4.54it/s] 136it [00:29, 4.54it/s] 137it [00:29, 4.42it/s] 138it [00:30, 4.47it/s] 139it [00:30, 4.45it/s] 140it [00:30, 4.49it/s] 141it [00:30, 4.53it/s] 142it [00:31, 4.55it/s] 143it [00:31, 4.58it/s] 144it [00:31, 4.45it/s] 145it [00:31, 4.51it/s] 146it [00:31, 4.53it/s] 147it [00:32, 4.56it/s] 148it [00:32, 4.58it/s] 149it [00:32, 4.58it/s] 150it [00:32, 4.59it/s]2025-05-26 01:55:43,960 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 4118.2427 | mean log_px -0.0299 | KL -2717.40 + 151it [00:33, 4.60it/s] 152it [00:33, 4.60it/s] 153it [00:33, 4.61it/s] 154it [00:33, 4.61it/s] 155it [00:33, 4.61it/s] 156it [00:34, 4.46it/s] 157it [00:34, 4.52it/s] 158it [00:34, 4.55it/s] 159it [00:34, 4.57it/s] 160it [00:34, 4.58it/s] 161it [00:35, 4.60it/s] 162it [00:35, 4.59it/s] 163it [00:35, 4.59it/s] 164it [00:35, 4.62it/s] 165it [00:36, 4.63it/s] 166it [00:36, 4.62it/s] 167it [00:36, 4.61it/s] 168it [00:36, 4.61it/s] 169it [00:36, 4.62it/s] 170it [00:37, 4.62it/s] 171it [00:37, 4.61it/s] 172it [00:37, 4.60it/s] 173it [00:37, 4.32it/s] 174it [00:38, 4.40it/s] 175it [00:38, 4.46it/s] 176it [00:38, 4.50it/s] 177it [00:38, 4.52it/s] 178it [00:38, 4.54it/s] 179it [00:39, 4.42it/s] 180it [00:39, 4.48it/s] 181it [00:39, 4.51it/s] 182it [00:39, 4.56it/s] 183it [00:40, 4.61it/s] 184it [00:40, 4.64it/s] 185it [00:40, 4.68it/s] 186it [00:40, 4.54it/s] 187it [00:40, 4.62it/s] 188it [00:41, 4.64it/s] 189it [00:41, 4.67it/s] 190it [00:41, 4.68it/s] 191it [00:41, 4.70it/s] 192it [00:41, 4.52it/s] 193it [00:42, 4.60it/s] 194it [00:42, 4.62it/s] 195it [00:42, 4.52it/s] 196it [00:42, 4.59it/s] 196it [00:42, 4.57it/s] +2025-05-26 01:55:53,925 - INFO - Epoch: 10, Objective: tensor([2976.3257], device='cuda:0', grad_fn=), Loss: 0.00489531084895134, KL/n: 55.191680908203125 + 0it [00:00, ?it/s]2025-05-26 01:55:54,478 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 3065.4336 | mean log_px -0.0064 | KL -2701.94 + 1it [00:00, 3.41it/s] 2it [00:00, 4.04it/s] 3it [00:00, 4.32it/s] 4it [00:00, 4.42it/s] 5it [00:01, 4.32it/s] 6it [00:01, 4.41it/s] 7it [00:01, 4.38it/s] 8it [00:01, 4.47it/s] 9it [00:02, 4.56it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.62it/s] 12it [00:02, 4.46it/s] 13it [00:02, 4.56it/s] 14it [00:03, 4.60it/s] 15it [00:03, 4.65it/s] 16it [00:03, 4.66it/s] 17it [00:03, 4.63it/s] 18it [00:04, 4.59it/s] 19it [00:04, 4.45it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.56it/s] 22it [00:04, 4.58it/s] 23it [00:05, 4.60it/s] 24it [00:05, 4.64it/s] 25it [00:05, 4.63it/s] 26it [00:05, 4.66it/s] 27it [00:05, 4.52it/s] 28it [00:06, 4.60it/s] 29it [00:06, 4.64it/s] 30it [00:06, 4.66it/s] 31it [00:06, 4.69it/s] 32it [00:07, 4.69it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.60it/s] 35it [00:07, 4.64it/s] 36it [00:07, 4.66it/s] 37it [00:08, 4.68it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.63it/s] 40it [00:08, 4.65it/s] 41it [00:08, 4.67it/s] 42it [00:09, 4.67it/s] 43it [00:09, 4.70it/s] 44it [00:09, 4.55it/s] 45it [00:09, 4.62it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.66it/s] 48it [00:10, 4.68it/s] 49it [00:10, 4.69it/s] 50it [00:10, 4.53it/s]2025-05-26 01:56:05,342 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 3133.4580 | mean log_px -0.0073 | KL -2682.37 + 51it [00:11, 4.60it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.66it/s] 54it [00:11, 4.68it/s] 55it [00:12, 4.70it/s] 56it [00:12, 4.70it/s] 57it [00:12, 4.71it/s] 58it [00:12, 4.71it/s] 59it [00:12, 4.72it/s] 60it [00:13, 4.71it/s] 61it [00:13, 4.72it/s] 62it [00:13, 4.69it/s] 63it [00:13, 4.56it/s] 64it [00:13, 4.62it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.68it/s] 68it [00:14, 4.68it/s] 69it [00:14, 4.69it/s] 70it [00:15, 4.70it/s] 71it [00:15, 4.54it/s] 72it [00:15, 4.61it/s] 73it [00:15, 4.65it/s] 74it [00:16, 4.66it/s] 75it [00:16, 4.68it/s] 76it [00:16, 4.68it/s] 77it [00:16, 4.70it/s] 78it [00:16, 4.70it/s] 79it [00:17, 4.70it/s] 80it [00:17, 4.72it/s] 81it [00:17, 4.72it/s] 82it [00:17, 4.55it/s] 83it [00:18, 4.62it/s] 84it [00:18, 4.64it/s] 85it [00:18, 4.66it/s] 86it [00:18, 4.67it/s] 87it [00:18, 4.69it/s] 88it [00:19, 4.70it/s] 89it [00:19, 4.71it/s] 90it [00:19, 4.54it/s] 91it [00:19, 4.61it/s] 92it [00:19, 4.64it/s] 93it [00:20, 4.67it/s] 94it [00:20, 4.67it/s] 95it [00:20, 4.69it/s] 96it [00:20, 4.70it/s] 97it [00:21, 4.71it/s] 98it [00:21, 4.71it/s] 99it [00:21, 4.72it/s] 100it [00:21, 4.72it/s]2025-05-26 01:56:16,034 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 4312.6279 | mean log_px -0.0334 | KL -2658.71 + 101it [00:21, 4.55it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.64it/s] 104it [00:22, 4.66it/s] 105it [00:22, 4.68it/s] 106it [00:22, 4.68it/s] 107it [00:23, 4.69it/s] 108it [00:23, 4.69it/s] 109it [00:23, 4.71it/s] 110it [00:23, 4.54it/s] 111it [00:24, 4.61it/s] 112it [00:24, 4.55it/s] 113it [00:24, 4.61it/s] 114it [00:24, 4.64it/s] 115it [00:24, 4.66it/s] 116it [00:25, 4.66it/s] 117it [00:25, 4.68it/s] 118it [00:25, 4.69it/s] 119it [00:25, 4.71it/s] 120it [00:25, 4.71it/s] 121it [00:26, 4.55it/s] 122it [00:26, 4.61it/s] 123it [00:26, 4.64it/s] 124it [00:26, 4.66it/s] 125it [00:27, 4.68it/s] 126it [00:27, 4.70it/s] 127it [00:27, 4.71it/s] 128it [00:27, 4.71it/s] 129it [00:27, 4.73it/s] 130it [00:28, 4.52it/s] 131it [00:28, 4.60it/s] 132it [00:28, 4.63it/s] 133it [00:28, 4.66it/s] 134it [00:28, 4.65it/s] 135it [00:29, 4.69it/s] 136it [00:29, 4.52it/s] 137it [00:29, 4.57it/s] 138it [00:29, 4.62it/s] 139it [00:30, 4.65it/s] 140it [00:30, 4.66it/s] 141it [00:30, 4.62it/s] 142it [00:30, 4.62it/s] 143it [00:30, 4.67it/s] 144it [00:31, 4.69it/s] 145it [00:31, 4.70it/s] 146it [00:31, 4.54it/s] 147it [00:31, 4.62it/s] 148it [00:31, 4.64it/s] 149it [00:32, 4.66it/s] 150it [00:32, 4.66it/s]2025-05-26 01:56:26,807 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 3104.3960 | mean log_px -0.0096 | KL -2631.08 + 151it [00:32, 4.52it/s] 152it [00:32, 4.60it/s] 153it [00:33, 4.63it/s] 154it [00:33, 4.65it/s] 155it [00:33, 4.67it/s] 156it [00:33, 4.67it/s] 157it [00:33, 4.69it/s] 158it [00:34, 4.70it/s] 159it [00:34, 4.70it/s] 160it [00:34, 4.54it/s] 161it [00:34, 4.61it/s] 162it [00:35, 4.64it/s] 163it [00:35, 4.65it/s] 164it [00:35, 4.56it/s] 165it [00:35, 4.61it/s] 166it [00:35, 4.64it/s] 167it [00:36, 4.67it/s] 168it [00:36, 4.68it/s] 169it [00:36, 4.50it/s] 170it [00:36, 4.59it/s] 171it [00:36, 4.61it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.67it/s] 174it [00:37, 4.68it/s] 175it [00:37, 4.70it/s] 176it [00:38, 4.53it/s] 177it [00:38, 4.60it/s] 178it [00:38, 4.63it/s] 179it [00:38, 4.66it/s] 180it [00:38, 4.68it/s] 181it [00:39, 4.69it/s] 182it [00:39, 4.69it/s] 183it [00:39, 4.71it/s] 184it [00:39, 4.56it/s] 185it [00:39, 4.63it/s] 186it [00:40, 4.65it/s] 187it [00:40, 4.68it/s] 188it [00:40, 4.68it/s] 189it [00:40, 4.69it/s] 190it [00:41, 4.52it/s] 191it [00:41, 4.59it/s] 192it [00:41, 4.63it/s] 193it [00:41, 4.65it/s] 194it [00:41, 4.67it/s] 195it [00:42, 4.58it/s] 196it [00:42, 4.64it/s] 196it [00:42, 4.62it/s] +2025-05-26 01:56:36,639 - INFO - Epoch: 11, Objective: tensor([4247.3716], device='cuda:0', grad_fn=), Loss: 0.031174693256616592, KL/n: 53.34761047363281 + 0it [00:00, ?it/s]2025-05-26 01:56:37,055 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 3012.1206 | mean log_px -0.0057 | KL -2611.20 + 1it [00:00, 2.77it/s] 2it [00:00, 3.52it/s] 3it [00:00, 3.79it/s] 4it [00:01, 4.06it/s] 5it [00:01, 4.12it/s] 6it [00:01, 4.26it/s] 7it [00:01, 4.27it/s] 8it [00:01, 4.40it/s] 9it [00:02, 4.21it/s] 10it [00:02, 4.19it/s] 11it [00:02, 3.43it/s] 12it [00:03, 3.70it/s] 13it [00:03, 3.92it/s] 14it [00:03, 4.11it/s] 15it [00:03, 4.15it/s] 16it [00:03, 4.28it/s] 17it [00:04, 4.37it/s] 18it [00:04, 4.30it/s] 19it [00:04, 4.41it/s] 20it [00:04, 4.33it/s] 21it [00:05, 4.32it/s] 22it [00:05, 4.32it/s] 23it [00:05, 4.16it/s] 24it [00:05, 4.21it/s] 25it [00:06, 4.33it/s] 26it [00:06, 4.28it/s] 27it [00:06, 4.32it/s] 28it [00:06, 4.37it/s] 29it [00:06, 4.44it/s] 30it [00:07, 4.49it/s] 31it [00:07, 4.39it/s] 32it [00:07, 4.33it/s] 33it [00:07, 4.32it/s] 34it [00:08, 4.29it/s] 35it [00:08, 4.27it/s] 36it [00:08, 4.30it/s] 37it [00:08, 4.29it/s] 38it [00:09, 4.36it/s] 39it [00:09, 4.31it/s] 40it [00:09, 4.38it/s] 41it [00:09, 4.33it/s] 42it [00:09, 4.29it/s] 43it [00:10, 4.37it/s] 44it [00:10, 4.39it/s] 45it [00:10, 4.34it/s] 46it [00:10, 4.40it/s] 47it [00:11, 4.33it/s] 48it [00:11, 4.37it/s] 49it [00:11, 4.44it/s] 50it [00:11, 4.50it/s]2025-05-26 01:56:48,720 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 3992.2141 | mean log_px -0.0251 | KL -2592.65 + 51it [00:11, 4.55it/s] 52it [00:12, 4.53it/s] 53it [00:12, 4.40it/s] 54it [00:12, 4.38it/s] 55it [00:12, 4.34it/s] 56it [00:13, 4.36it/s] 57it [00:13, 4.47it/s] 58it [00:13, 4.34it/s] 59it [00:13, 4.31it/s] 60it [00:14, 4.18it/s] 61it [00:14, 4.19it/s] 62it [00:14, 4.22it/s] 63it [00:14, 4.32it/s] 64it [00:15, 4.42it/s] 65it [00:15, 4.48it/s] 66it [00:15, 4.51it/s] 67it [00:15, 4.55it/s] 68it [00:15, 4.56it/s] 69it [00:16, 4.45it/s] 70it [00:16, 4.43it/s] 71it [00:16, 4.48it/s] 72it [00:16, 4.35it/s] 73it [00:17, 4.44it/s] 74it [00:17, 4.38it/s] 75it [00:17, 4.41it/s] 76it [00:17, 4.37it/s] 77it [00:17, 4.45it/s] 78it [00:18, 4.37it/s] 79it [00:18, 4.31it/s] 80it [00:18, 4.27it/s] 81it [00:18, 4.32it/s] 82it [00:19, 4.24it/s] 83it [00:19, 4.35it/s] 84it [00:19, 4.27it/s] 85it [00:19, 4.26it/s] 86it [00:20, 4.27it/s] 87it [00:20, 4.24it/s] 88it [00:20, 4.08it/s] 89it [00:20, 4.13it/s] 90it [00:21, 4.13it/s] 91it [00:21, 4.16it/s] 92it [00:21, 4.18it/s] 93it [00:21, 4.31it/s] 94it [00:21, 4.23it/s] 95it [00:22, 4.23it/s] 96it [00:22, 4.19it/s] 97it [00:22, 4.20it/s] 98it [00:22, 4.21it/s] 99it [00:23, 4.33it/s] 100it [00:23, 4.40it/s]2025-05-26 01:57:00,286 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 7227.1890 | mean log_px -0.0753 | KL -2570.68 + 101it [00:23, 4.42it/s] 102it [00:23, 4.39it/s] 103it [00:24, 4.21it/s] 104it [00:24, 4.06it/s] 105it [00:24, 4.10it/s] 106it [00:24, 4.24it/s] 107it [00:25, 4.22it/s] 108it [00:25, 4.31it/s] 109it [00:25, 4.40it/s] 110it [00:25, 4.17it/s] 111it [00:25, 4.32it/s] 112it [00:26, 4.32it/s] 113it [00:26, 4.30it/s] 114it [00:26, 4.17it/s] 115it [00:26, 4.24it/s] 116it [00:27, 4.27it/s] 117it [00:27, 4.25it/s] 118it [00:27, 4.24it/s] 119it [00:27, 4.28it/s] 120it [00:28, 4.11it/s] 121it [00:28, 4.13it/s] 122it [00:28, 4.21it/s] 123it [00:28, 4.33it/s] 124it [00:28, 4.36it/s] 125it [00:29, 4.44it/s] 126it [00:29, 4.32it/s] 127it [00:29, 4.31it/s] 128it [00:29, 4.33it/s] 129it [00:30, 4.31it/s] 130it [00:30, 4.33it/s] 131it [00:30, 4.42it/s] 132it [00:30, 4.47it/s] 133it [00:31, 4.42it/s] 134it [00:31, 4.35it/s] 135it [00:31, 4.37it/s] 136it [00:31, 4.31it/s] 137it [00:31, 4.28it/s] 138it [00:32, 4.24it/s] 139it [00:32, 4.37it/s] 140it [00:32, 4.28it/s] 141it [00:32, 4.27it/s] 142it [00:33, 4.26it/s] 143it [00:33, 4.26it/s] 144it [00:33, 4.27it/s] 145it [00:33, 4.28it/s] 146it [00:34, 4.13it/s] 147it [00:34, 4.28it/s] 148it [00:34, 4.30it/s] 149it [00:34, 4.36it/s] 150it [00:35, 4.36it/s]2025-05-26 01:57:11,960 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 3201.9055 | mean log_px -0.0163 | KL -2551.84 + 151it [00:35, 4.40it/s] 152it [00:35, 4.48it/s] 153it [00:35, 4.44it/s] 154it [00:35, 4.47it/s] 155it [00:36, 4.29it/s] 156it [00:36, 4.26it/s] 157it [00:36, 4.27it/s] 158it [00:36, 4.25it/s] 159it [00:37, 4.36it/s] 160it [00:37, 4.31it/s] 161it [00:37, 4.24it/s] 162it [00:37, 4.36it/s] 163it [00:37, 4.45it/s] 164it [00:38, 4.38it/s] 165it [00:38, 4.44it/s] 166it [00:38, 4.34it/s] 167it [00:38, 4.32it/s] 168it [00:39, 4.32it/s] 169it [00:39, 4.28it/s] 170it [00:39, 4.27it/s] 171it [00:39, 4.32it/s] 172it [00:40, 4.44it/s] 173it [00:40, 4.44it/s] 174it [00:40, 4.37it/s] 175it [00:40, 4.43it/s] 176it [00:40, 4.45it/s] 177it [00:41, 4.51it/s] 178it [00:41, 4.56it/s] 179it [00:41, 4.49it/s] 180it [00:41, 4.39it/s] 181it [00:42, 4.21it/s] 182it [00:42, 4.27it/s] 183it [00:42, 4.26it/s] 184it [00:42, 4.26it/s] 185it [00:43, 4.34it/s] 186it [00:43, 4.43it/s] 187it [00:43, 4.37it/s] 188it [00:43, 4.42it/s] 189it [00:43, 4.33it/s] 190it [00:44, 4.14it/s] 191it [00:44, 4.23it/s] 192it [00:44, 4.22it/s] 193it [00:44, 4.35it/s] 194it [00:45, 4.44it/s] 195it [00:45, 4.40it/s] 196it [00:45, 4.50it/s] 196it [00:45, 4.30it/s] +2025-05-26 01:57:22,414 - INFO - Epoch: 12, Objective: tensor([2863.8979], device='cuda:0', grad_fn=), Loss: 0.006043643224984407, KL/n: 51.6978874206543 + 0it [00:00, ?it/s]2025-05-26 01:57:22,793 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 2755.2402 | mean log_px -0.0041 | KL -2532.30 + 1it [00:00, 3.10it/s] 2it [00:00, 3.91it/s] 3it [00:00, 4.24it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.51it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.63it/s] 8it [00:01, 4.64it/s] 9it [00:02, 4.65it/s] 10it [00:02, 4.65it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.59it/s] 14it [00:03, 4.64it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.64it/s] 17it [00:03, 4.66it/s] 18it [00:03, 4.67it/s] 19it [00:04, 4.69it/s] 20it [00:04, 4.69it/s] 21it [00:04, 4.69it/s] 22it [00:04, 4.69it/s] 23it [00:05, 4.70it/s] 24it [00:05, 4.70it/s] 25it [00:05, 4.70it/s] 26it [00:05, 4.67it/s] 27it [00:05, 4.68it/s] 28it [00:06, 4.69it/s] 29it [00:06, 4.69it/s] 30it [00:06, 4.69it/s] 31it [00:06, 4.69it/s] 32it [00:06, 4.68it/s] 33it [00:07, 4.69it/s] 34it [00:07, 4.68it/s] 35it [00:07, 4.69it/s] 36it [00:07, 4.69it/s] 37it [00:08, 4.69it/s] 38it [00:08, 4.68it/s] 39it [00:08, 4.69it/s] 40it [00:08, 4.69it/s] 41it [00:08, 4.70it/s] 42it [00:09, 4.70it/s] 43it [00:09, 4.70it/s] 44it [00:09, 4.70it/s] 45it [00:09, 4.49it/s] 46it [00:09, 4.53it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.61it/s] 49it [00:10, 4.64it/s] 50it [00:10, 4.66it/s]2025-05-26 01:57:33,528 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 2921.4778 | mean log_px -0.0094 | KL -2503.91 + 51it [00:11, 4.67it/s] 52it [00:11, 4.68it/s] 53it [00:11, 4.69it/s] 54it [00:11, 4.69it/s] 55it [00:11, 4.53it/s] 56it [00:12, 4.58it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.61it/s] 59it [00:12, 4.64it/s] 60it [00:12, 4.51it/s] 61it [00:13, 4.58it/s] 62it [00:13, 4.62it/s] 63it [00:13, 4.65it/s] 64it [00:13, 4.66it/s] 65it [00:14, 4.68it/s] 66it [00:14, 4.51it/s] 67it [00:14, 4.58it/s] 68it [00:14, 4.61it/s] 69it [00:14, 4.65it/s] 70it [00:15, 4.66it/s] 71it [00:15, 4.68it/s] 72it [00:15, 4.68it/s] 73it [00:15, 4.68it/s] 74it [00:15, 4.68it/s] 75it [00:16, 4.69it/s] 76it [00:16, 4.69it/s] 77it [00:16, 4.69it/s] 78it [00:16, 4.66it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.65it/s] 81it [00:17, 4.68it/s] 82it [00:17, 4.68it/s] 83it [00:17, 4.69it/s] 84it [00:18, 4.69it/s] 85it [00:18, 4.53it/s] 86it [00:18, 4.59it/s] 87it [00:18, 4.63it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.67it/s] 90it [00:19, 4.68it/s] 91it [00:19, 4.67it/s] 92it [00:19, 4.57it/s] 93it [00:20, 4.63it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.67it/s] 96it [00:20, 4.52it/s] 97it [00:20, 4.59it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.62it/s] 100it [00:21, 4.64it/s]2025-05-26 01:57:44,313 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 3051.0591 | mean log_px -0.0105 | KL -2480.72 + 101it [00:21, 4.66it/s] 102it [00:22, 4.63it/s] 103it [00:22, 4.65it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.68it/s] 106it [00:22, 4.52it/s] 107it [00:23, 4.58it/s] 108it [00:23, 4.61it/s] 109it [00:23, 4.65it/s] 110it [00:23, 4.66it/s] 111it [00:23, 4.68it/s] 112it [00:24, 4.69it/s] 113it [00:24, 4.69it/s] 114it [00:24, 4.69it/s] 115it [00:24, 4.55it/s] 116it [00:25, 4.61it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.65it/s] 119it [00:25, 4.67it/s] 120it [00:25, 4.53it/s] 121it [00:26, 4.60it/s] 122it [00:26, 4.63it/s] 123it [00:26, 4.66it/s] 124it [00:26, 4.67it/s] 125it [00:26, 4.68it/s] 126it [00:27, 4.68it/s] 127it [00:27, 4.69it/s] 128it [00:27, 4.69it/s] 129it [00:27, 4.54it/s] 130it [00:28, 4.60it/s] 131it [00:28, 4.63it/s] 132it [00:28, 4.60it/s] 133it [00:28, 4.64it/s] 134it [00:28, 4.65it/s] 135it [00:29, 4.67it/s] 136it [00:29, 4.68it/s] 137it [00:29, 4.69it/s] 138it [00:29, 4.55it/s] 139it [00:30, 4.60it/s] 140it [00:30, 4.62it/s] 141it [00:30, 4.65it/s] 142it [00:30, 4.67it/s] 143it [00:30, 4.50it/s] 144it [00:31, 4.46it/s] 145it [00:31, 4.55it/s] 146it [00:31, 4.57it/s] 147it [00:31, 4.62it/s] 148it [00:31, 4.64it/s] 149it [00:32, 4.50it/s] 150it [00:32, 4.57it/s]2025-05-26 01:57:55,137 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 2694.3430 | mean log_px -0.0060 | KL -2454.87 + 151it [00:32, 4.61it/s] 152it [00:32, 4.63it/s] 153it [00:33, 4.65it/s] 154it [00:33, 4.67it/s] 155it [00:33, 4.68it/s] 156it [00:33, 4.68it/s] 157it [00:33, 4.54it/s] 158it [00:34, 4.60it/s] 159it [00:34, 4.63it/s] 160it [00:34, 4.65it/s] 161it [00:34, 4.67it/s] 162it [00:35, 4.68it/s] 163it [00:35, 4.68it/s] 164it [00:35, 4.67it/s] 165it [00:35, 4.64it/s] 166it [00:35, 4.46it/s] 167it [00:36, 4.55it/s] 168it [00:36, 4.59it/s] 169it [00:36, 4.62it/s] 170it [00:36, 4.65it/s] 171it [00:36, 4.67it/s] 172it [00:37, 4.67it/s] 173it [00:37, 4.68it/s] 174it [00:37, 4.69it/s] 175it [00:37, 4.54it/s] 176it [00:38, 4.60it/s] 177it [00:38, 4.63it/s] 178it [00:38, 4.65it/s] 179it [00:38, 4.67it/s] 180it [00:38, 4.67it/s] 181it [00:39, 4.53it/s] 182it [00:39, 4.58it/s] 183it [00:39, 4.62it/s] 184it [00:39, 4.64it/s] 185it [00:39, 4.62it/s] 186it [00:40, 4.62it/s] 187it [00:40, 4.48it/s] 188it [00:40, 4.55it/s] 189it [00:40, 4.60it/s] 190it [00:41, 4.55it/s] 191it [00:41, 4.49it/s] 192it [00:41, 4.54it/s] 193it [00:41, 4.42it/s] 194it [00:41, 4.50it/s] 195it [00:42, 4.43it/s] 196it [00:42, 4.40it/s] 196it [00:42, 4.61it/s] +2025-05-26 01:58:05,072 - INFO - Epoch: 13, Objective: tensor([4922.8945], device='cuda:0', grad_fn=), Loss: 0.041003212332725525, KL/n: 49.89161682128906 + 0it [00:00, ?it/s]2025-05-26 01:58:05,609 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 2859.6846 | mean log_px -0.0121 | KL -2441.73 + 1it [00:00, 3.53it/s] 2it [00:00, 4.14it/s] 3it [00:00, 4.39it/s] 4it [00:00, 4.51it/s] 5it [00:01, 4.43it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.60it/s] 8it [00:01, 4.63it/s] 9it [00:02, 4.65it/s] 10it [00:02, 4.65it/s] 11it [00:02, 4.68it/s] 12it [00:02, 4.69it/s] 13it [00:02, 4.70it/s] 14it [00:03, 4.54it/s] 15it [00:03, 4.61it/s] 16it [00:03, 4.64it/s] 17it [00:03, 4.66it/s] 18it [00:03, 4.67it/s] 19it [00:04, 4.70it/s] 20it [00:04, 4.55it/s] 21it [00:04, 4.61it/s] 22it [00:04, 4.63it/s] 23it [00:05, 4.64it/s] 24it [00:05, 4.67it/s] 25it [00:05, 4.68it/s] 26it [00:05, 4.68it/s] 27it [00:05, 4.69it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.69it/s] 30it [00:06, 4.69it/s] 31it [00:06, 4.70it/s] 32it [00:06, 4.55it/s] 33it [00:07, 4.61it/s] 34it [00:07, 4.64it/s] 35it [00:07, 4.65it/s] 36it [00:07, 4.67it/s] 37it [00:08, 4.53it/s] 38it [00:08, 4.60it/s] 39it [00:08, 4.60it/s] 40it [00:08, 4.62it/s] 41it [00:08, 4.63it/s] 42it [00:09, 4.53it/s] 43it [00:09, 4.61it/s] 44it [00:09, 4.63it/s] 45it [00:09, 4.66it/s] 46it [00:09, 4.67it/s] 47it [00:10, 4.69it/s] 48it [00:10, 4.70it/s] 49it [00:10, 4.70it/s] 50it [00:10, 4.54it/s]2025-05-26 01:58:16,384 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 3013.0603 | mean log_px -0.0122 | KL -2423.46 + 51it [00:11, 4.60it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.66it/s] 54it [00:11, 4.67it/s] 55it [00:11, 4.52it/s] 56it [00:12, 4.59it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.64it/s] 59it [00:12, 4.67it/s] 60it [00:13, 4.45it/s] 61it [00:13, 4.38it/s] 62it [00:13, 4.33it/s] 63it [00:13, 4.37it/s] 64it [00:13, 4.43it/s] 65it [00:14, 4.48it/s] 66it [00:14, 4.51it/s] 67it [00:14, 4.54it/s] 68it [00:14, 4.41it/s] 69it [00:15, 4.51it/s] 70it [00:15, 4.55it/s] 71it [00:15, 4.55it/s] 72it [00:15, 4.57it/s] 73it [00:15, 4.57it/s] 74it [00:16, 4.58it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.59it/s] 77it [00:16, 4.60it/s] 78it [00:17, 4.47it/s] 79it [00:17, 4.44it/s] 80it [00:17, 4.49it/s] 81it [00:17, 4.53it/s] 82it [00:17, 4.54it/s] 83it [00:18, 4.56it/s] 84it [00:18, 4.46it/s] 85it [00:18, 4.50it/s] 86it [00:18, 4.51it/s] 87it [00:19, 4.53it/s] 88it [00:19, 4.54it/s] 89it [00:19, 4.56it/s] 90it [00:19, 4.43it/s] 91it [00:19, 4.49it/s] 92it [00:20, 4.50it/s] 93it [00:20, 4.55it/s] 94it [00:20, 4.55it/s] 95it [00:20, 4.56it/s] 96it [00:21, 4.57it/s] 97it [00:21, 4.59it/s] 98it [00:21, 4.58it/s] 99it [00:21, 4.60it/s] 100it [00:21, 4.60it/s]2025-05-26 01:58:27,411 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 3804.5000 | mean log_px -0.0205 | KL -2399.92 + 101it [00:22, 4.60it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.60it/s] 104it [00:22, 4.60it/s] 105it [00:22, 4.46it/s] 106it [00:23, 4.52it/s] 107it [00:23, 4.54it/s] 108it [00:23, 4.55it/s] 109it [00:23, 4.58it/s] 110it [00:24, 4.58it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.57it/s] 113it [00:24, 4.58it/s] 114it [00:24, 4.58it/s] 115it [00:25, 4.42it/s] 116it [00:25, 4.48it/s] 117it [00:25, 4.53it/s] 118it [00:25, 4.55it/s] 119it [00:26, 4.57it/s] 120it [00:26, 4.56it/s] 121it [00:26, 4.57it/s] 122it [00:26, 4.55it/s] 123it [00:26, 4.57it/s] 124it [00:27, 4.54it/s] 125it [00:27, 4.57it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.59it/s] 128it [00:28, 4.59it/s] 129it [00:28, 4.45it/s] 130it [00:28, 4.50it/s] 131it [00:28, 4.53it/s] 132it [00:28, 4.55it/s] 133it [00:29, 4.60it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.47it/s] 136it [00:29, 4.39it/s] 137it [00:30, 4.47it/s] 138it [00:30, 4.52it/s] 139it [00:30, 4.56it/s] 140it [00:30, 4.58it/s] 141it [00:30, 4.59it/s] 142it [00:31, 4.60it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.56it/s] 145it [00:31, 4.58it/s] 146it [00:31, 4.58it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.47it/s] 150it [00:32, 4.52it/s]2025-05-26 01:58:38,409 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 3109.0154 | mean log_px -0.0184 | KL -2386.44 + 151it [00:33, 4.54it/s] 152it [00:33, 4.42it/s] 153it [00:33, 4.50it/s] 154it [00:33, 4.52it/s] 155it [00:33, 4.56it/s] 156it [00:34, 4.57it/s] 157it [00:34, 4.59it/s] 158it [00:34, 4.51it/s] 159it [00:34, 4.55it/s] 160it [00:35, 4.58it/s] 161it [00:35, 4.59it/s] 162it [00:35, 4.60it/s] 163it [00:35, 4.60it/s] 164it [00:35, 4.61it/s] 165it [00:36, 4.61it/s] 166it [00:36, 4.61it/s] 167it [00:36, 4.62it/s] 168it [00:36, 4.61it/s] 169it [00:37, 4.60it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.58it/s] 172it [00:37, 4.59it/s] 173it [00:37, 4.61it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.65it/s] 176it [00:38, 4.62it/s] 177it [00:38, 4.64it/s] 178it [00:38, 4.66it/s] 179it [00:39, 4.65it/s] 180it [00:39, 4.66it/s] 181it [00:39, 4.51it/s] 182it [00:39, 4.56it/s] 183it [00:40, 4.57it/s] 184it [00:40, 4.59it/s] 185it [00:40, 4.56it/s] 186it [00:40, 4.56it/s] 187it [00:40, 4.62it/s] 188it [00:41, 4.61it/s] 189it [00:41, 4.62it/s] 190it [00:41, 4.47it/s] 191it [00:41, 4.49it/s] 192it [00:42, 4.53it/s] 193it [00:42, 4.55it/s] 194it [00:42, 4.56it/s] 195it [00:42, 4.46it/s] 196it [00:42, 4.50it/s] 196it [00:42, 4.56it/s] +2025-05-26 01:58:48,379 - INFO - Epoch: 14, Objective: tensor([2733.1536], device='cuda:0', grad_fn=), Loss: 0.013086755760014057, KL/n: 48.29157638549805 + 0it [00:00, ?it/s]2025-05-26 01:58:48,766 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 3566.3582 | mean log_px -0.0216 | KL -2368.83 + 1it [00:00, 2.95it/s] 2it [00:00, 3.66it/s] 3it [00:00, 4.02it/s] 4it [00:01, 4.19it/s] 5it [00:01, 4.34it/s] 6it [00:01, 4.37it/s] 7it [00:01, 4.23it/s] 8it [00:02, 3.48it/s] 9it [00:02, 3.77it/s] 10it [00:02, 3.99it/s] 11it [00:02, 4.17it/s] 12it [00:02, 4.29it/s] 13it [00:03, 4.39it/s] 14it [00:03, 4.30it/s] 15it [00:03, 4.40it/s] 16it [00:03, 4.46it/s] 17it [00:04, 4.52it/s] 18it [00:04, 4.55it/s] 19it [00:04, 4.54it/s] 20it [00:04, 4.41it/s] 21it [00:04, 4.40it/s] 22it [00:05, 4.47it/s] 23it [00:05, 4.51it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.55it/s] 26it [00:06, 4.55it/s] 27it [00:06, 4.42it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.51it/s] 30it [00:06, 4.54it/s] 31it [00:07, 4.57it/s] 32it [00:07, 4.54it/s] 33it [00:07, 4.42it/s] 34it [00:07, 4.48it/s] 35it [00:08, 4.53it/s] 36it [00:08, 4.56it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.59it/s] 39it [00:08, 4.44it/s] 40it [00:09, 4.49it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.56it/s] 43it [00:09, 4.57it/s] 44it [00:10, 4.57it/s] 45it [00:10, 4.60it/s] 46it [00:10, 4.59it/s] 47it [00:10, 4.45it/s] 48it [00:10, 4.51it/s] 49it [00:11, 4.51it/s] 50it [00:11, 4.56it/s]2025-05-26 01:59:00,043 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 2586.0901 | mean log_px -0.0101 | KL -2342.14 + 51it [00:11, 4.59it/s] 52it [00:11, 4.61it/s] 53it [00:12, 4.63it/s] 54it [00:12, 4.63it/s] 55it [00:12, 4.65it/s] 56it [00:12, 4.65it/s] 57it [00:12, 4.65it/s] 58it [00:13, 4.65it/s] 59it [00:13, 4.65it/s] 60it [00:13, 4.66it/s] 61it [00:13, 4.65it/s] 62it [00:13, 4.65it/s] 63it [00:14, 4.66it/s] 64it [00:14, 4.66it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.64it/s] 67it [00:15, 4.64it/s] 68it [00:15, 4.64it/s] 69it [00:15, 4.64it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.60it/s] 72it [00:16, 4.56it/s] 73it [00:16, 4.45it/s] 74it [00:16, 4.52it/s] 75it [00:16, 4.55it/s] 76it [00:17, 4.59it/s] 77it [00:17, 4.61it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.66it/s] 80it [00:17, 4.65it/s] 81it [00:18, 4.32it/s] 82it [00:18, 4.41it/s] 83it [00:18, 4.47it/s] 84it [00:18, 4.51it/s] 85it [00:18, 4.55it/s] 86it [00:19, 4.56it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.61it/s] 89it [00:19, 4.62it/s] 90it [00:20, 4.63it/s] 91it [00:20, 4.64it/s] 92it [00:20, 4.64it/s] 93it [00:20, 4.65it/s] 94it [00:20, 4.66it/s] 95it [00:21, 4.50it/s] 96it [00:21, 4.56it/s] 97it [00:21, 4.58it/s] 98it [00:21, 4.60it/s] 99it [00:22, 4.61it/s] 100it [00:22, 4.61it/s]2025-05-26 01:59:10,919 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 2982.4482 | mean log_px -0.0107 | KL -2318.40 + 101it [00:22, 4.57it/s] 102it [00:22, 4.59it/s] 103it [00:22, 4.61it/s] 104it [00:23, 4.63it/s] 105it [00:23, 4.65it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.66it/s] 108it [00:23, 4.66it/s] 109it [00:24, 4.67it/s] 110it [00:24, 4.66it/s] 111it [00:24, 4.66it/s] 112it [00:24, 4.66it/s] 113it [00:25, 4.67it/s] 114it [00:25, 4.64it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.64it/s] 117it [00:25, 4.62it/s] 118it [00:26, 4.63it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.48it/s] 121it [00:26, 4.56it/s] 122it [00:27, 4.57it/s] 123it [00:27, 4.60it/s] 124it [00:27, 4.61it/s] 125it [00:27, 4.64it/s] 126it [00:27, 4.64it/s] 127it [00:28, 4.65it/s] 128it [00:28, 4.66it/s] 129it [00:28, 4.67it/s] 130it [00:28, 4.67it/s] 131it [00:28, 4.67it/s] 132it [00:29, 4.67it/s] 133it [00:29, 4.68it/s] 134it [00:29, 4.65it/s] 135it [00:29, 4.64it/s] 136it [00:30, 4.63it/s] 137it [00:30, 4.63it/s] 138it [00:30, 4.59it/s] 139it [00:30, 4.54it/s] 140it [00:30, 4.56it/s] 141it [00:31, 4.56it/s] 142it [00:31, 4.57it/s] 143it [00:31, 4.60it/s] 144it [00:31, 4.61it/s] 145it [00:31, 4.62it/s] 146it [00:32, 4.62it/s] 147it [00:32, 4.62it/s] 148it [00:32, 4.63it/s] 149it [00:32, 4.64it/s] 150it [00:33, 4.63it/s]2025-05-26 01:59:21,721 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 3421.2581 | mean log_px -0.0186 | KL -2299.48 + 151it [00:33, 4.63it/s] 152it [00:33, 4.62it/s] 153it [00:33, 4.61it/s] 154it [00:33, 4.60it/s] 155it [00:34, 4.62it/s] 156it [00:34, 4.62it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.61it/s] 159it [00:35, 4.60it/s] 160it [00:35, 4.60it/s] 161it [00:35, 4.57it/s] 162it [00:35, 4.58it/s] 163it [00:35, 4.58it/s] 164it [00:36, 4.49it/s] 165it [00:36, 4.49it/s] 166it [00:36, 4.50it/s] 167it [00:36, 4.52it/s] 168it [00:36, 4.53it/s] 169it [00:37, 4.56it/s] 170it [00:37, 4.57it/s] 171it [00:37, 4.52it/s] 172it [00:37, 4.55it/s] 173it [00:38, 4.57it/s] 174it [00:38, 4.58it/s] 175it [00:38, 4.59it/s] 176it [00:38, 4.60it/s] 177it [00:38, 4.59it/s] 178it [00:39, 4.58it/s] 179it [00:39, 4.60it/s] 180it [00:39, 4.60it/s] 181it [00:39, 4.60it/s] 182it [00:40, 4.59it/s] 183it [00:40, 4.61it/s] 184it [00:40, 4.52it/s] 185it [00:40, 4.54it/s] 186it [00:40, 4.56it/s] 187it [00:41, 4.59it/s] 188it [00:41, 4.54it/s] 189it [00:41, 4.56it/s] 190it [00:41, 4.57it/s] 191it [00:42, 4.50it/s] 192it [00:42, 4.53it/s] 193it [00:42, 4.57it/s] 194it [00:42, 4.56it/s] 195it [00:42, 4.32it/s] 196it [00:43, 4.44it/s] 196it [00:43, 4.53it/s] +2025-05-26 01:59:31,739 - INFO - Epoch: 15, Objective: tensor([2673.8301], device='cuda:0', grad_fn=), Loss: 0.006941231433302164, KL/n: 46.54920196533203 + 0it [00:00, ?it/s]2025-05-26 01:59:32,120 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 2568.5730 | mean log_px -0.0058 | KL -2277.45 + 1it [00:00, 3.28it/s] 2it [00:00, 3.94it/s] 3it [00:00, 4.21it/s] 4it [00:00, 4.34it/s] 5it [00:01, 4.28it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.39it/s] 8it [00:01, 4.44it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.50it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.44it/s] 13it [00:02, 4.50it/s] 14it [00:03, 4.51it/s] 15it [00:03, 4.56it/s] 16it [00:03, 4.56it/s] 17it [00:03, 4.50it/s] 18it [00:04, 4.38it/s] 19it [00:04, 4.46it/s] 20it [00:04, 4.52it/s] 21it [00:04, 4.55it/s] 22it [00:04, 4.51it/s] 23it [00:05, 4.55it/s] 24it [00:05, 4.39it/s] 25it [00:05, 4.48it/s] 26it [00:05, 4.45it/s] 27it [00:06, 4.46it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.51it/s] 30it [00:06, 4.39it/s] 31it [00:06, 4.46it/s] 32it [00:07, 4.49it/s] 33it [00:07, 4.52it/s] 34it [00:07, 4.53it/s] 35it [00:07, 4.55it/s] 36it [00:08, 4.41it/s] 37it [00:08, 4.48it/s] 38it [00:08, 4.48it/s] 39it [00:08, 4.53it/s] 40it [00:08, 4.50it/s] 41it [00:09, 4.54it/s] 42it [00:09, 4.40it/s] 43it [00:09, 4.47it/s] 44it [00:09, 4.52it/s] 45it [00:10, 4.50it/s] 46it [00:10, 4.52it/s] 47it [00:10, 4.55it/s] 48it [00:10, 4.42it/s] 49it [00:10, 4.49it/s] 50it [00:11, 4.52it/s]2025-05-26 01:59:43,242 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 2469.5354 | mean log_px -0.0050 | KL -2246.70 + 51it [00:11, 4.55it/s] 52it [00:11, 4.52it/s] 53it [00:11, 4.56it/s] 54it [00:12, 4.43it/s] 55it [00:12, 4.50it/s] 56it [00:12, 4.53it/s] 57it [00:12, 4.50it/s] 58it [00:12, 4.50it/s] 59it [00:13, 4.54it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.43it/s] 62it [00:13, 4.51it/s] 63it [00:14, 4.56it/s] 64it [00:14, 4.59it/s] 65it [00:14, 4.61it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.47it/s] 68it [00:15, 4.52it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.56it/s] 71it [00:15, 4.59it/s] 72it [00:16, 4.61it/s] 73it [00:16, 4.48it/s] 74it [00:16, 4.55it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.61it/s] 77it [00:17, 4.63it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.48it/s] 80it [00:17, 4.55it/s] 81it [00:18, 4.58it/s] 82it [00:18, 4.60it/s] 83it [00:18, 4.61it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.49it/s] 86it [00:19, 4.55it/s] 87it [00:19, 4.58it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.61it/s] 90it [00:19, 4.63it/s] 91it [00:20, 4.48it/s] 92it [00:20, 4.54it/s] 93it [00:20, 4.58it/s] 94it [00:20, 4.60it/s] 95it [00:21, 4.61it/s] 96it [00:21, 4.59it/s] 97it [00:21, 4.45it/s] 98it [00:21, 4.49it/s] 99it [00:21, 4.53it/s] 100it [00:22, 4.54it/s]2025-05-26 01:59:54,225 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 2823.7253 | mean log_px -0.0109 | KL -2227.54 + 101it [00:22, 4.56it/s] 102it [00:22, 4.42it/s] 103it [00:22, 4.51it/s] 104it [00:23, 4.54it/s] 105it [00:23, 4.58it/s] 106it [00:23, 4.59it/s] 107it [00:23, 4.62it/s] 108it [00:23, 4.47it/s] 109it [00:24, 4.54it/s] 110it [00:24, 4.57it/s] 111it [00:24, 4.60it/s] 112it [00:24, 4.58it/s] 113it [00:25, 4.60it/s] 114it [00:25, 4.47it/s] 115it [00:25, 4.54it/s] 116it [00:25, 4.57it/s] 117it [00:25, 4.60it/s] 118it [00:26, 4.61it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.48it/s] 121it [00:26, 4.55it/s] 122it [00:27, 4.58it/s] 123it [00:27, 4.61it/s] 124it [00:27, 4.62it/s] 125it [00:27, 4.63it/s] 126it [00:27, 4.48it/s] 127it [00:28, 4.54it/s] 128it [00:28, 4.56it/s] 129it [00:28, 4.60it/s] 130it [00:28, 4.60it/s] 131it [00:28, 4.61it/s] 132it [00:29, 4.47it/s] 133it [00:29, 4.54it/s] 134it [00:29, 4.56it/s] 135it [00:29, 4.59it/s] 136it [00:30, 4.57it/s] 137it [00:30, 4.56it/s] 138it [00:30, 4.44it/s] 139it [00:30, 4.52it/s] 140it [00:30, 4.46it/s] 141it [00:31, 4.49it/s] 142it [00:31, 4.55it/s] 143it [00:31, 4.59it/s] 144it [00:31, 4.45it/s] 145it [00:32, 4.53it/s] 146it [00:32, 4.55it/s] 147it [00:32, 4.59it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.62it/s] 150it [00:33, 4.48it/s]2025-05-26 02:00:05,213 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 2373.7930 | mean log_px -0.0035 | KL -2207.88 + 151it [00:33, 4.54it/s] 152it [00:33, 4.57it/s] 153it [00:33, 4.60it/s] 154it [00:34, 4.61it/s] 155it [00:34, 4.63it/s] 156it [00:34, 4.49it/s] 157it [00:34, 4.56it/s] 158it [00:34, 4.59it/s] 159it [00:35, 4.62it/s] 160it [00:35, 4.62it/s] 161it [00:35, 4.48it/s] 162it [00:35, 4.54it/s] 163it [00:36, 4.58it/s] 164it [00:36, 4.57it/s] 165it [00:36, 4.60it/s] 166it [00:36, 4.60it/s] 167it [00:36, 4.46it/s] 168it [00:37, 4.53it/s] 169it [00:37, 4.56it/s] 170it [00:37, 4.50it/s] 171it [00:37, 4.51it/s] 172it [00:38, 4.54it/s] 173it [00:38, 4.43it/s] 174it [00:38, 4.50it/s] 175it [00:38, 4.54it/s] 176it [00:38, 4.57it/s] 177it [00:39, 4.60it/s] 178it [00:39, 4.54it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.46it/s] 181it [00:39, 4.53it/s] 182it [00:40, 4.56it/s] 183it [00:40, 4.60it/s] 184it [00:40, 4.61it/s] 185it [00:40, 4.63it/s] 186it [00:41, 4.47it/s] 187it [00:41, 4.54it/s] 188it [00:41, 4.57it/s] 189it [00:41, 4.59it/s] 190it [00:41, 4.61it/s] 191it [00:42, 4.60it/s] 192it [00:42, 4.45it/s] 193it [00:42, 4.51it/s] 194it [00:42, 4.53it/s] 195it [00:43, 4.48it/s] 196it [00:43, 4.54it/s] 196it [00:43, 4.52it/s] +2025-05-26 02:00:15,227 - INFO - Epoch: 16, Objective: tensor([2848.4922], device='cuda:0', grad_fn=), Loss: 0.02026955410838127, KL/n: 44.883338928222656 + 0it [00:00, ?it/s]2025-05-26 02:00:15,775 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 2439.9866 | mean log_px -0.0047 | KL -2197.12 + 1it [00:00, 3.38it/s] 2it [00:00, 3.80it/s] 3it [00:00, 4.18it/s] 4it [00:00, 4.35it/s] 5it [00:01, 4.45it/s] 6it [00:01, 4.47it/s] 7it [00:01, 4.55it/s] 8it [00:01, 4.58it/s] 9it [00:02, 4.45it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.47it/s] 15it [00:03, 4.54it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.57it/s] 19it [00:04, 4.46it/s] 20it [00:04, 4.53it/s] 21it [00:04, 4.57it/s] 22it [00:04, 4.60it/s] 23it [00:05, 4.62it/s] 24it [00:05, 4.63it/s] 25it [00:05, 4.49it/s] 26it [00:05, 4.55it/s] 27it [00:05, 4.59it/s] 28it [00:06, 4.60it/s] 29it [00:06, 4.60it/s] 30it [00:06, 4.59it/s] 31it [00:06, 4.45it/s] 32it [00:07, 4.51it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.55it/s] 35it [00:07, 4.57it/s] 36it [00:07, 4.58it/s] 37it [00:08, 4.45it/s] 38it [00:08, 4.52it/s] 39it [00:08, 4.56it/s] 40it [00:08, 4.59it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.47it/s] 44it [00:09, 4.54it/s] 45it [00:09, 4.57it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.46it/s] 48it [00:10, 4.53it/s] 49it [00:10, 4.57it/s] 50it [00:11, 4.60it/s]2025-05-26 02:00:26,748 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 3817.5354 | mean log_px -0.0287 | KL -2182.09 + 51it [00:11, 4.62it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.47it/s] 54it [00:11, 4.54it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.60it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.62it/s] 59it [00:13, 4.48it/s] 60it [00:13, 4.55it/s] 61it [00:13, 4.59it/s] 62it [00:13, 4.61it/s] 63it [00:13, 4.63it/s] 64it [00:14, 4.62it/s] 65it [00:14, 4.49it/s] 66it [00:14, 4.55it/s] 67it [00:14, 4.58it/s] 68it [00:14, 4.60it/s] 69it [00:15, 4.61it/s] 70it [00:15, 4.62it/s] 71it [00:15, 4.45it/s] 72it [00:15, 4.52it/s] 73it [00:16, 4.55it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.57it/s] 77it [00:16, 4.44it/s] 78it [00:17, 4.51it/s] 79it [00:17, 4.40it/s] 80it [00:17, 4.48it/s] 81it [00:17, 4.54it/s] 82it [00:18, 4.57it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.46it/s] 86it [00:18, 4.53it/s] 87it [00:19, 4.54it/s] 88it [00:19, 4.57it/s] 89it [00:19, 4.60it/s] 90it [00:19, 4.62it/s] 91it [00:20, 4.48it/s] 92it [00:20, 4.55it/s] 93it [00:20, 4.58it/s] 94it [00:20, 4.60it/s] 95it [00:20, 4.63it/s] 96it [00:21, 4.64it/s] 97it [00:21, 4.49it/s] 98it [00:21, 4.55it/s] 99it [00:21, 4.59it/s] 100it [00:22, 4.60it/s]2025-05-26 02:00:37,715 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 2449.2668 | mean log_px -0.0059 | KL -2174.15 + 101it [00:22, 4.62it/s] 102it [00:22, 4.63it/s] 103it [00:22, 4.48it/s] 104it [00:22, 4.54it/s] 105it [00:23, 4.57it/s] 106it [00:23, 4.42it/s] 107it [00:23, 4.51it/s] 108it [00:23, 4.56it/s] 109it [00:24, 4.59it/s] 110it [00:24, 4.60it/s] 111it [00:24, 4.62it/s] 112it [00:24, 4.48it/s] 113it [00:24, 4.55it/s] 114it [00:25, 4.56it/s] 115it [00:25, 4.49it/s] 116it [00:25, 4.53it/s] 117it [00:25, 4.56it/s] 118it [00:25, 4.57it/s] 119it [00:26, 4.43it/s] 120it [00:26, 4.48it/s] 121it [00:26, 4.52it/s] 122it [00:26, 4.56it/s] 123it [00:27, 4.56it/s] 124it [00:27, 4.58it/s] 125it [00:27, 4.41it/s] 126it [00:27, 4.50it/s] 127it [00:27, 4.55it/s] 128it [00:28, 4.57it/s] 129it [00:28, 4.60it/s] 130it [00:28, 4.61it/s] 131it [00:28, 4.49it/s] 132it [00:29, 4.53it/s] 133it [00:29, 4.55it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.60it/s] 136it [00:29, 4.49it/s] 137it [00:30, 4.56it/s] 138it [00:30, 4.58it/s] 139it [00:30, 4.60it/s] 140it [00:30, 4.59it/s] 141it [00:31, 4.45it/s] 142it [00:31, 4.50it/s] 143it [00:31, 4.54it/s] 144it [00:31, 4.57it/s] 145it [00:31, 4.57it/s] 146it [00:32, 4.43it/s] 147it [00:32, 4.51it/s] 148it [00:32, 4.54it/s] 149it [00:32, 4.58it/s] 150it [00:33, 4.60it/s]2025-05-26 02:00:48,727 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 2379.8494 | mean log_px -0.0040 | KL -2152.76 + 151it [00:33, 4.61it/s] 152it [00:33, 4.47it/s] 153it [00:33, 4.54it/s] 154it [00:33, 4.58it/s] 155it [00:34, 4.61it/s] 156it [00:34, 4.62it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.48it/s] 159it [00:35, 4.55it/s] 160it [00:35, 4.58it/s] 161it [00:35, 4.60it/s] 162it [00:35, 4.61it/s] 163it [00:35, 4.63it/s] 164it [00:36, 4.48it/s] 165it [00:36, 4.54it/s] 166it [00:36, 4.58it/s] 167it [00:36, 4.60it/s] 168it [00:36, 4.59it/s] 169it [00:37, 4.58it/s] 170it [00:37, 4.42it/s] 171it [00:37, 4.48it/s] 172it [00:37, 4.48it/s] 173it [00:38, 4.53it/s] 174it [00:38, 4.53it/s] 175it [00:38, 4.53it/s] 176it [00:38, 4.41it/s] 177it [00:38, 4.50it/s] 178it [00:39, 4.54it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.60it/s] 181it [00:39, 4.47it/s] 182it [00:40, 4.54it/s] 183it [00:40, 4.57it/s] 184it [00:40, 4.60it/s] 185it [00:40, 4.62it/s] 186it [00:40, 4.63it/s] 187it [00:41, 4.48it/s] 188it [00:41, 4.54it/s] 189it [00:41, 4.58it/s] 190it [00:41, 4.60it/s] 191it [00:42, 4.62it/s] 192it [00:42, 4.63it/s] 193it [00:42, 4.48it/s] 194it [00:42, 4.55it/s] 195it [00:42, 4.50it/s] 196it [00:43, 4.56it/s] 196it [00:43, 4.54it/s] +2025-05-26 02:00:58,749 - INFO - Epoch: 17, Objective: tensor([2270.9153], device='cuda:0', grad_fn=), Loss: 0.004182320553809404, KL/n: 43.6452751159668 + 0it [00:00, ?it/s]2025-05-26 02:00:59,128 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 2706.3704 | mean log_px -0.0173 | KL -2135.82 + 1it [00:00, 3.03it/s] 2it [00:00, 3.84it/s] 3it [00:00, 4.12it/s] 4it [00:00, 4.34it/s] 5it [00:01, 4.45it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.40it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.48it/s] 10it [00:02, 4.43it/s] 11it [00:02, 4.50it/s] 12it [00:02, 4.54it/s] 13it [00:02, 4.59it/s] 14it [00:03, 4.45it/s] 15it [00:03, 4.53it/s] 16it [00:03, 4.55it/s] 17it [00:03, 4.57it/s] 18it [00:04, 4.59it/s] 19it [00:04, 4.61it/s] 20it [00:04, 4.61it/s] 21it [00:04, 4.46it/s] 22it [00:04, 4.53it/s] 23it [00:05, 4.58it/s] 24it [00:05, 4.60it/s] 25it [00:05, 4.46it/s] 26it [00:05, 4.54it/s] 27it [00:06, 4.58it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.61it/s] 30it [00:06, 4.61it/s] 31it [00:06, 4.48it/s] 32it [00:07, 4.55it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.61it/s] 35it [00:07, 4.63it/s] 36it [00:07, 4.62it/s] 37it [00:08, 4.49it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.59it/s] 40it [00:08, 4.61it/s] 41it [00:09, 4.64it/s] 42it [00:09, 4.64it/s] 43it [00:09, 4.49it/s] 44it [00:09, 4.55it/s] 45it [00:09, 4.60it/s] 46it [00:10, 4.61it/s] 47it [00:10, 4.63it/s] 48it [00:10, 4.64it/s] 49it [00:10, 4.48it/s] 50it [00:11, 4.55it/s]2025-05-26 02:01:10,102 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 2571.1865 | mean log_px -0.0093 | KL -2121.10 + 51it [00:11, 4.56it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.63it/s] 54it [00:11, 4.62it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.66it/s] 58it [00:12, 4.48it/s] 59it [00:13, 4.52it/s] 60it [00:13, 4.39it/s] 61it [00:13, 4.44it/s] 62it [00:13, 4.49it/s] 63it [00:13, 4.51it/s] 64it [00:14, 3.64it/s] 65it [00:14, 3.89it/s] 66it [00:14, 4.06it/s] 67it [00:15, 4.05it/s] 68it [00:15, 4.22it/s] 69it [00:15, 4.31it/s] 70it [00:15, 4.41it/s] 71it [00:15, 4.47it/s] 72it [00:16, 4.52it/s] 73it [00:16, 4.57it/s] 74it [00:16, 4.60it/s] 75it [00:16, 4.46it/s] 76it [00:16, 4.53it/s] 77it [00:17, 4.57it/s] 78it [00:17, 4.59it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.59it/s] 81it [00:18, 4.45it/s] 82it [00:18, 4.53it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.56it/s] 85it [00:18, 4.60it/s] 86it [00:19, 4.61it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.47it/s] 89it [00:19, 4.50it/s] 90it [00:20, 4.54it/s] 91it [00:20, 4.57it/s] 92it [00:20, 4.59it/s] 93it [00:20, 4.61it/s] 94it [00:20, 4.63it/s] 95it [00:21, 4.49it/s] 96it [00:21, 4.55it/s] 97it [00:21, 4.57it/s] 98it [00:21, 4.57it/s] 99it [00:22, 4.54it/s] 100it [00:22, 4.55it/s]2025-05-26 02:01:21,268 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 2327.6116 | mean log_px -0.0041 | KL -2106.47 + 101it [00:22, 4.42it/s] 102it [00:22, 4.48it/s] 103it [00:22, 4.45it/s] 104it [00:23, 4.50it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.51it/s] 107it [00:23, 4.36it/s] 108it [00:24, 4.42it/s] 109it [00:24, 4.46it/s] 110it [00:24, 4.48it/s] 111it [00:24, 4.48it/s] 112it [00:24, 4.49it/s] 113it [00:25, 4.45it/s] 114it [00:25, 4.46it/s] 115it [00:25, 4.36it/s] 116it [00:25, 4.41it/s] 117it [00:26, 4.44it/s] 118it [00:26, 4.50it/s] 119it [00:26, 4.51it/s] 120it [00:26, 4.45it/s] 121it [00:26, 4.50it/s] 122it [00:27, 4.50it/s] 123it [00:27, 4.53it/s] 124it [00:27, 4.51it/s] 125it [00:27, 4.48it/s] 126it [00:28, 4.37it/s] 127it [00:28, 4.43it/s] 128it [00:28, 4.43it/s] 129it [00:28, 4.49it/s] 130it [00:28, 4.51it/s] 131it [00:29, 4.51it/s] 132it [00:29, 4.57it/s] 133it [00:29, 4.42it/s] 134it [00:29, 4.48it/s] 135it [00:30, 4.48it/s] 136it [00:30, 4.51it/s] 137it [00:30, 4.54it/s] 138it [00:30, 4.55it/s] 139it [00:30, 4.39it/s] 140it [00:31, 4.45it/s] 141it [00:31, 4.50it/s] 142it [00:31, 4.52it/s] 143it [00:31, 4.57it/s] 144it [00:32, 4.59it/s] 145it [00:32, 4.45it/s] 146it [00:32, 4.52it/s] 147it [00:32, 4.55it/s] 148it [00:32, 4.57it/s] 149it [00:33, 4.59it/s] 150it [00:33, 4.60it/s]2025-05-26 02:01:32,414 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 3520.7913 | mean log_px -0.0254 | KL -2092.53 + 151it [00:33, 4.44it/s] 152it [00:33, 4.51it/s] 153it [00:34, 4.54it/s] 154it [00:34, 4.56it/s] 155it [00:34, 4.57it/s] 156it [00:34, 4.53it/s] 157it [00:34, 4.42it/s] 158it [00:35, 4.45it/s] 159it [00:35, 4.49it/s] 160it [00:35, 4.48it/s] 161it [00:35, 4.39it/s] 162it [00:36, 4.42it/s] 163it [00:36, 4.50it/s] 164it [00:36, 4.54it/s] 165it [00:36, 4.57it/s] 166it [00:36, 4.56it/s] 167it [00:37, 4.44it/s] 168it [00:37, 4.49it/s] 169it [00:37, 4.53it/s] 170it [00:37, 4.55it/s] 171it [00:38, 4.56it/s] 172it [00:38, 4.57it/s] 173it [00:38, 4.57it/s] 174it [00:38, 4.40it/s] 175it [00:38, 4.48it/s] 176it [00:39, 4.52it/s] 177it [00:39, 4.49it/s] 178it [00:39, 4.45it/s] 179it [00:39, 4.52it/s] 180it [00:40, 4.55it/s] 181it [00:40, 4.58it/s] 182it [00:40, 4.43it/s] 183it [00:40, 4.48it/s] 184it [00:40, 4.52it/s] 185it [00:41, 4.56it/s] 186it [00:41, 4.50it/s] 187it [00:41, 4.55it/s] 188it [00:41, 4.41it/s] 189it [00:42, 4.49it/s] 190it [00:42, 4.53it/s] 191it [00:42, 4.56it/s] 192it [00:42, 4.59it/s] 193it [00:42, 4.58it/s] 194it [00:43, 4.44it/s] 195it [00:43, 4.42it/s] 196it [00:43, 4.48it/s] 196it [00:43, 4.49it/s] +2025-05-26 02:01:42,550 - INFO - Epoch: 18, Objective: tensor([2600.6919], device='cuda:0', grad_fn=), Loss: 0.01254788413643837, KL/n: 42.441864013671875 + 0it [00:00, ?it/s]2025-05-26 02:01:42,933 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 2569.3970 | mean log_px -0.0069 | KL -2083.59 + 1it [00:00, 3.22it/s] 2it [00:00, 3.94it/s] 3it [00:00, 4.18it/s] 4it [00:01, 4.08it/s] 5it [00:01, 4.25it/s] 6it [00:01, 4.35it/s] 7it [00:01, 4.44it/s] 8it [00:01, 4.49it/s] 9it [00:02, 4.50it/s] 10it [00:02, 4.37it/s] 11it [00:02, 4.44it/s] 12it [00:02, 4.46it/s] 13it [00:03, 4.43it/s] 14it [00:03, 4.47it/s] 15it [00:03, 4.54it/s] 16it [00:03, 4.55it/s] 17it [00:03, 4.41it/s] 18it [00:04, 4.46it/s] 19it [00:04, 4.51it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.56it/s] 22it [00:05, 4.40it/s] 23it [00:05, 4.48it/s] 24it [00:05, 4.52it/s] 25it [00:05, 4.55it/s] 26it [00:05, 4.56it/s] 27it [00:06, 4.60it/s] 28it [00:06, 4.45it/s] 29it [00:06, 4.51it/s] 30it [00:06, 4.53it/s] 31it [00:06, 4.53it/s] 32it [00:07, 4.57it/s] 33it [00:07, 4.57it/s] 34it [00:07, 4.43it/s] 35it [00:07, 4.49it/s] 36it [00:08, 4.53it/s] 37it [00:08, 4.53it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.57it/s] 40it [00:08, 4.38it/s] 41it [00:09, 4.45it/s] 42it [00:09, 4.50it/s] 43it [00:09, 4.55it/s] 44it [00:09, 4.56it/s] 45it [00:10, 4.57it/s] 46it [00:10, 4.43it/s] 47it [00:10, 4.50it/s] 48it [00:10, 4.48it/s] 49it [00:11, 4.38it/s] 50it [00:11, 4.45it/s]2025-05-26 02:01:54,063 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 2562.2981 | mean log_px -0.0159 | KL -2057.50 + 51it [00:11, 4.49it/s] 52it [00:11, 4.48it/s] 53it [00:11, 4.52it/s] 54it [00:12, 4.54it/s] 55it [00:12, 4.42it/s] 56it [00:12, 4.49it/s] 57it [00:12, 4.48it/s] 58it [00:13, 4.31it/s] 59it [00:13, 4.41it/s] 60it [00:13, 4.40it/s] 61it [00:13, 4.47it/s] 62it [00:13, 4.36it/s] 63it [00:14, 4.44it/s] 64it [00:14, 4.50it/s] 65it [00:14, 4.54it/s] 66it [00:14, 4.56it/s] 67it [00:15, 4.59it/s] 68it [00:15, 4.44it/s] 69it [00:15, 4.51it/s] 70it [00:15, 4.55it/s] 71it [00:15, 4.58it/s] 72it [00:16, 4.59it/s] 73it [00:16, 4.59it/s] 74it [00:16, 4.44it/s] 75it [00:16, 4.51it/s] 76it [00:17, 4.46it/s] 77it [00:17, 4.51it/s] 78it [00:17, 4.54it/s] 79it [00:17, 4.51it/s] 80it [00:17, 4.52it/s] 81it [00:18, 4.40it/s] 82it [00:18, 4.45it/s] 83it [00:18, 4.49it/s] 84it [00:18, 4.49it/s] 85it [00:19, 4.53it/s] 86it [00:19, 4.54it/s] 87it [00:19, 4.42it/s] 88it [00:19, 4.46it/s] 89it [00:19, 4.53it/s] 90it [00:20, 4.56it/s] 91it [00:20, 4.59it/s] 92it [00:20, 4.61it/s] 93it [00:20, 4.48it/s] 94it [00:20, 4.54it/s] 95it [00:21, 4.58it/s] 96it [00:21, 4.60it/s] 97it [00:21, 4.62it/s] 98it [00:21, 4.63it/s] 99it [00:22, 4.48it/s] 100it [00:22, 4.55it/s]2025-05-26 02:02:05,147 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 2413.2510 | mean log_px -0.0084 | KL -2045.86 + 101it [00:22, 4.58it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.62it/s] 104it [00:23, 4.62it/s] 105it [00:23, 4.49it/s] 106it [00:23, 4.54it/s] 107it [00:23, 4.58it/s] 108it [00:24, 4.58it/s] 109it [00:24, 4.61it/s] 110it [00:24, 4.61it/s] 111it [00:24, 4.47it/s] 112it [00:24, 4.54it/s] 113it [00:25, 4.58it/s] 114it [00:25, 4.59it/s] 115it [00:25, 4.61it/s] 116it [00:25, 4.47it/s] 117it [00:26, 4.54it/s] 118it [00:26, 4.57it/s] 119it [00:26, 4.59it/s] 120it [00:26, 4.61it/s] 121it [00:26, 4.63it/s] 122it [00:27, 4.49it/s] 123it [00:27, 4.56it/s] 124it [00:27, 4.59it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.63it/s] 127it [00:28, 4.64it/s] 128it [00:28, 4.49it/s] 129it [00:28, 4.56it/s] 130it [00:28, 4.58it/s] 131it [00:29, 4.51it/s] 132it [00:29, 4.56it/s] 133it [00:29, 4.59it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.62it/s] 136it [00:30, 4.49it/s] 137it [00:30, 4.55it/s] 138it [00:30, 4.57it/s] 139it [00:30, 4.60it/s] 140it [00:31, 4.57it/s] 141it [00:31, 4.59it/s] 142it [00:31, 4.45it/s] 143it [00:31, 4.51it/s] 144it [00:31, 4.50it/s] 145it [00:32, 4.46it/s] 146it [00:32, 4.38it/s] 147it [00:32, 4.47it/s] 148it [00:32, 4.51it/s] 149it [00:33, 4.56it/s] 150it [00:33, 4.44it/s]2025-05-26 02:02:16,139 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 2499.8535 | mean log_px -0.0090 | KL -2029.06 + 151it [00:33, 4.51it/s] 152it [00:33, 4.55it/s] 153it [00:33, 4.57it/s] 154it [00:34, 4.59it/s] 155it [00:34, 4.61it/s] 156it [00:34, 4.47it/s] 157it [00:34, 4.54it/s] 158it [00:35, 4.57it/s] 159it [00:35, 4.61it/s] 160it [00:35, 4.58it/s] 161it [00:35, 4.60it/s] 162it [00:35, 4.62it/s] 163it [00:36, 4.48it/s] 164it [00:36, 4.55it/s] 165it [00:36, 4.59it/s] 166it [00:36, 4.61it/s] 167it [00:36, 4.63it/s] 168it [00:37, 4.64it/s] 169it [00:37, 4.51it/s] 170it [00:37, 4.56it/s] 171it [00:37, 4.59it/s] 172it [00:38, 4.61it/s] 173it [00:38, 4.63it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.49it/s] 176it [00:38, 4.55it/s] 177it [00:39, 4.58it/s] 178it [00:39, 4.58it/s] 179it [00:39, 4.61it/s] 180it [00:39, 4.63it/s] 181it [00:40, 4.48it/s] 182it [00:40, 4.55it/s] 183it [00:40, 4.59it/s] 184it [00:40, 4.60it/s] 185it [00:40, 4.62it/s] 186it [00:41, 4.63it/s] 187it [00:41, 4.49it/s] 188it [00:41, 4.54it/s] 189it [00:41, 4.43it/s] 190it [00:42, 4.51it/s] 191it [00:42, 4.55it/s] 192it [00:42, 4.52it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.61it/s] 195it [00:43, 4.52it/s] 196it [00:43, 4.58it/s] 196it [00:43, 4.51it/s] +2025-05-26 02:02:26,107 - INFO - Epoch: 19, Objective: tensor([2346.0564], device='cuda:0', grad_fn=), Loss: 0.010250546969473362, KL/n: 41.190834045410156 + 0it [00:00, ?it/s]2025-05-26 02:02:26,658 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 2297.0408 | mean log_px -0.0067 | KL -2018.12 + 1it [00:00, 3.08it/s] 2it [00:00, 3.86it/s] 3it [00:00, 4.21it/s] 4it [00:00, 4.39it/s] 5it [00:01, 4.49it/s] 6it [00:01, 4.55it/s] 7it [00:01, 4.60it/s] 8it [00:01, 4.62it/s] 9it [00:02, 4.65it/s] 10it [00:02, 4.65it/s] 11it [00:02, 4.46it/s] 12it [00:02, 4.53it/s] 13it [00:02, 4.58it/s] 14it [00:03, 4.61it/s] 15it [00:03, 4.63it/s] 16it [00:03, 4.62it/s] 17it [00:03, 4.44it/s] 18it [00:04, 4.50it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.56it/s] 21it [00:04, 4.58it/s] 22it [00:04, 4.51it/s] 23it [00:05, 4.38it/s] 24it [00:05, 4.44it/s] 25it [00:05, 4.51it/s] 26it [00:05, 4.40it/s] 27it [00:06, 4.45it/s] 28it [00:06, 4.51it/s] 29it [00:06, 4.56it/s] 30it [00:06, 4.59it/s] 31it [00:06, 4.47it/s] 32it [00:07, 4.52it/s] 33it [00:07, 4.57it/s] 34it [00:07, 4.60it/s] 35it [00:07, 4.62it/s] 36it [00:07, 4.63it/s] 37it [00:08, 4.56it/s] 38it [00:08, 4.46it/s] 39it [00:08, 4.53it/s] 40it [00:08, 4.57it/s] 41it [00:09, 4.60it/s] 42it [00:09, 4.62it/s] 43it [00:09, 4.64it/s] 44it [00:09, 4.48it/s] 45it [00:09, 4.54it/s] 46it [00:10, 4.47it/s] 47it [00:10, 4.51it/s] 48it [00:10, 4.55it/s] 49it [00:10, 4.58it/s] 50it [00:11, 4.44it/s]2025-05-26 02:02:37,668 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 2567.9041 | mean log_px -0.0136 | KL -1997.04 + 51it [00:11, 4.50it/s] 52it [00:11, 4.54it/s] 53it [00:11, 4.57it/s] 54it [00:11, 4.58it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.44it/s] 57it [00:12, 4.52it/s] 58it [00:12, 4.56it/s] 59it [00:13, 4.59it/s] 60it [00:13, 4.54it/s] 61it [00:13, 4.56it/s] 62it [00:13, 4.58it/s] 63it [00:13, 4.61it/s] 64it [00:14, 4.62it/s] 65it [00:14, 4.49it/s] 66it [00:14, 4.55it/s] 67it [00:14, 4.58it/s] 68it [00:15, 4.60it/s] 69it [00:15, 4.62it/s] 70it [00:15, 4.47it/s] 71it [00:15, 4.53it/s] 72it [00:15, 4.56it/s] 73it [00:16, 4.59it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.62it/s] 76it [00:16, 4.39it/s] 77it [00:17, 4.43it/s] 78it [00:17, 4.50it/s] 79it [00:17, 4.55it/s] 80it [00:17, 4.44it/s] 81it [00:17, 4.52it/s] 82it [00:18, 4.54it/s] 83it [00:18, 4.58it/s] 84it [00:18, 4.51it/s] 85it [00:18, 4.54it/s] 86it [00:18, 4.58it/s] 87it [00:19, 4.44it/s] 88it [00:19, 4.51it/s] 89it [00:19, 4.55it/s] 90it [00:19, 4.52it/s] 91it [00:20, 4.43it/s] 92it [00:20, 4.49it/s] 93it [00:20, 4.53it/s] 94it [00:20, 4.56it/s] 95it [00:20, 4.55it/s] 96it [00:21, 4.56it/s] 97it [00:21, 4.59it/s] 98it [00:21, 4.43it/s] 99it [00:21, 4.51it/s] 100it [00:22, 4.54it/s]2025-05-26 02:02:48,678 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 3235.3687 | mean log_px -0.0223 | KL -1973.44 + 101it [00:22, 4.58it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.63it/s] 104it [00:22, 4.64it/s] 105it [00:23, 4.65it/s] 106it [00:23, 4.66it/s] 107it [00:23, 4.50it/s] 108it [00:23, 4.55it/s] 109it [00:24, 4.59it/s] 110it [00:24, 4.61it/s] 111it [00:24, 4.62it/s] 112it [00:24, 4.62it/s] 113it [00:24, 4.48it/s] 114it [00:25, 4.42it/s] 115it [00:25, 4.49it/s] 116it [00:25, 4.54it/s] 117it [00:25, 4.58it/s] 118it [00:26, 4.61it/s] 119it [00:26, 4.47it/s] 120it [00:26, 4.53it/s] 121it [00:26, 4.56it/s] 122it [00:26, 4.60it/s] 123it [00:27, 4.61it/s] 124it [00:27, 4.63it/s] 125it [00:27, 4.64it/s] 126it [00:27, 4.48it/s] 127it [00:28, 4.53it/s] 128it [00:28, 4.56it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.59it/s] 131it [00:28, 4.61it/s] 132it [00:29, 4.62it/s] 133it [00:29, 4.63it/s] 134it [00:29, 4.63it/s] 135it [00:29, 4.49it/s] 136it [00:29, 4.53it/s] 137it [00:30, 4.55it/s] 138it [00:30, 4.58it/s] 139it [00:30, 4.60it/s] 140it [00:30, 4.61it/s] 141it [00:31, 4.61it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.64it/s] 144it [00:31, 4.48it/s] 145it [00:31, 4.54it/s] 146it [00:32, 4.57it/s] 147it [00:32, 4.60it/s] 148it [00:32, 4.60it/s] 149it [00:32, 4.62it/s] 150it [00:33, 4.61it/s]2025-05-26 02:02:59,595 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 2351.8418 | mean log_px -0.0055 | KL -1967.71 + 151it [00:33, 4.61it/s] 152it [00:33, 4.62it/s] 153it [00:33, 4.48it/s] 154it [00:33, 4.52it/s] 155it [00:34, 4.56it/s] 156it [00:34, 4.57it/s] 157it [00:34, 4.44it/s] 158it [00:34, 4.48it/s] 159it [00:35, 4.54it/s] 160it [00:35, 4.55it/s] 161it [00:35, 4.57it/s] 162it [00:35, 4.59it/s] 163it [00:35, 4.60it/s] 164it [00:36, 4.47it/s] 165it [00:36, 4.53it/s] 166it [00:36, 4.56it/s] 167it [00:36, 4.59it/s] 168it [00:36, 4.59it/s] 169it [00:37, 4.61it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.48it/s] 172it [00:37, 4.53it/s] 173it [00:38, 4.42it/s] 174it [00:38, 4.48it/s] 175it [00:38, 4.52it/s] 176it [00:38, 4.54it/s] 177it [00:38, 4.57it/s] 178it [00:39, 4.59it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.46it/s] 181it [00:39, 4.50it/s] 182it [00:40, 4.53it/s] 183it [00:40, 4.57it/s] 184it [00:40, 4.59it/s] 185it [00:40, 4.61it/s] 186it [00:40, 4.60it/s] 187it [00:41, 4.51it/s] 188it [00:41, 4.55it/s] 189it [00:41, 4.57it/s] 190it [00:41, 4.57it/s] 191it [00:42, 4.59it/s] 192it [00:42, 4.47it/s] 193it [00:42, 4.52it/s] 194it [00:42, 4.54it/s] 195it [00:42, 4.44it/s] 196it [00:43, 4.50it/s] 196it [00:43, 4.54it/s] +2025-05-26 02:03:09,634 - INFO - Epoch: 20, Objective: tensor([2321.2383], device='cuda:0', grad_fn=), Loss: 0.013511824421584606, KL/n: 39.98223876953125 + 0it [00:00, ?it/s]2025-05-26 02:03:10,013 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 2518.2864 | mean log_px -0.0100 | KL -1959.45 + 1it [00:00, 3.29it/s] 2it [00:00, 3.97it/s] 3it [00:00, 4.08it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.54it/s] 8it [00:01, 4.57it/s] 9it [00:02, 4.59it/s] 10it [00:02, 4.46it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.56it/s] 13it [00:02, 4.55it/s] 14it [00:03, 3.62it/s] 15it [00:03, 3.89it/s] 16it [00:03, 4.08it/s] 17it [00:04, 4.10it/s] 18it [00:04, 4.25it/s] 19it [00:04, 4.37it/s] 20it [00:04, 4.44it/s] 21it [00:04, 4.49it/s] 22it [00:05, 4.53it/s] 23it [00:05, 4.42it/s] 24it [00:05, 4.48it/s] 25it [00:05, 4.54it/s] 26it [00:05, 4.55it/s] 27it [00:06, 4.57it/s] 28it [00:06, 4.58it/s] 29it [00:06, 4.61it/s] 30it [00:06, 4.47it/s] 31it [00:07, 4.52it/s] 32it [00:07, 4.56it/s] 33it [00:07, 4.59it/s] 34it [00:07, 4.59it/s] 35it [00:07, 4.56it/s] 36it [00:08, 4.52it/s] 37it [00:08, 4.40it/s] 38it [00:08, 4.48it/s] 39it [00:08, 4.52it/s] 40it [00:09, 4.56it/s] 41it [00:09, 4.58it/s] 42it [00:09, 4.59it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.47it/s] 45it [00:10, 4.54it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.59it/s] 49it [00:11, 4.58it/s] 50it [00:11, 4.58it/s]2025-05-26 02:03:21,183 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 2608.6096 | mean log_px -0.0148 | KL -1939.67 + 51it [00:11, 4.45it/s] 52it [00:11, 4.50it/s] 53it [00:11, 4.53it/s] 54it [00:12, 4.57it/s] 55it [00:12, 4.60it/s] 56it [00:12, 4.52it/s] 57it [00:12, 4.56it/s] 58it [00:13, 4.44it/s] 59it [00:13, 4.50it/s] 60it [00:13, 4.54it/s] 61it [00:13, 4.57it/s] 62it [00:13, 4.44it/s] 63it [00:14, 4.50it/s] 64it [00:14, 4.54it/s] 65it [00:14, 4.57it/s] 66it [00:14, 4.59it/s] 67it [00:15, 4.59it/s] 68it [00:15, 4.61it/s] 69it [00:15, 4.47it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.56it/s] 72it [00:16, 4.58it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.60it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.47it/s] 77it [00:17, 4.54it/s] 78it [00:17, 4.57it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.59it/s] 81it [00:18, 4.61it/s] 82it [00:18, 4.47it/s] 83it [00:18, 4.53it/s] 84it [00:18, 4.56it/s] 85it [00:18, 4.58it/s] 86it [00:19, 4.58it/s] 87it [00:19, 4.58it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.43it/s] 90it [00:20, 4.49it/s] 91it [00:20, 4.54it/s] 92it [00:20, 4.57it/s] 93it [00:20, 4.60it/s] 94it [00:20, 4.61it/s] 95it [00:21, 4.61it/s] 96it [00:21, 4.48it/s] 97it [00:21, 4.52it/s] 98it [00:21, 4.55it/s] 99it [00:22, 4.59it/s] 100it [00:22, 4.59it/s]2025-05-26 02:03:32,174 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 2265.2100 | mean log_px -0.0051 | KL -1927.49 + 101it [00:22, 4.59it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.48it/s] 104it [00:23, 4.52it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.57it/s] 107it [00:23, 4.59it/s] 108it [00:24, 4.59it/s] 109it [00:24, 4.62it/s] 110it [00:24, 4.47it/s] 111it [00:24, 4.52it/s] 112it [00:24, 4.55it/s] 113it [00:25, 4.57it/s] 114it [00:25, 4.54it/s] 115it [00:25, 4.59it/s] 116it [00:25, 4.45it/s] 117it [00:25, 4.51it/s] 118it [00:26, 4.57it/s] 119it [00:26, 4.59it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.60it/s] 122it [00:27, 4.62it/s] 123it [00:27, 4.49it/s] 124it [00:27, 4.55it/s] 125it [00:27, 4.59it/s] 126it [00:27, 4.61it/s] 127it [00:28, 4.64it/s] 128it [00:28, 4.64it/s] 129it [00:28, 4.50it/s] 130it [00:28, 4.56it/s] 131it [00:29, 4.59it/s] 132it [00:29, 4.61it/s] 133it [00:29, 4.63it/s] 134it [00:29, 4.63it/s] 135it [00:29, 4.50it/s] 136it [00:30, 4.56it/s] 137it [00:30, 4.59it/s] 138it [00:30, 4.61it/s] 139it [00:30, 4.64it/s] 140it [00:30, 4.64it/s] 141it [00:31, 4.51it/s] 142it [00:31, 4.55it/s] 143it [00:31, 4.59it/s] 144it [00:31, 4.61it/s] 145it [00:32, 4.63it/s] 146it [00:32, 4.62it/s] 147it [00:32, 4.48it/s] 148it [00:32, 4.54it/s] 149it [00:32, 4.56it/s] 150it [00:33, 4.56it/s]2025-05-26 02:03:43,117 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 2249.6196 | mean log_px -0.0076 | KL -1918.02 + 151it [00:33, 4.59it/s] 152it [00:33, 4.60it/s] 153it [00:33, 4.48it/s] 154it [00:34, 4.54it/s] 155it [00:34, 4.58it/s] 156it [00:34, 4.59it/s] 157it [00:34, 4.47it/s] 158it [00:34, 4.52it/s] 159it [00:35, 4.56it/s] 160it [00:35, 4.58it/s] 161it [00:35, 4.57it/s] 162it [00:35, 4.59it/s] 163it [00:36, 4.61it/s] 164it [00:36, 4.46it/s] 165it [00:36, 4.53it/s] 166it [00:36, 4.57it/s] 167it [00:36, 4.46it/s] 168it [00:37, 4.51it/s] 169it [00:37, 4.55it/s] 170it [00:37, 4.58it/s] 171it [00:37, 4.59it/s] 172it [00:38, 4.61it/s] 173it [00:38, 4.61it/s] 174it [00:38, 4.47it/s] 175it [00:38, 4.53it/s] 176it [00:38, 4.56it/s] 177it [00:39, 4.60it/s] 178it [00:39, 4.58it/s] 179it [00:39, 4.51it/s] 180it [00:39, 4.55it/s] 181it [00:39, 4.58it/s] 182it [00:40, 4.47it/s] 183it [00:40, 4.52it/s] 184it [00:40, 4.56it/s] 185it [00:40, 4.60it/s] 186it [00:41, 4.61it/s] 187it [00:41, 4.61it/s] 188it [00:41, 4.63it/s] 189it [00:41, 4.50it/s] 190it [00:41, 4.56it/s] 191it [00:42, 4.59it/s] 192it [00:42, 4.59it/s] 193it [00:42, 4.62it/s] 194it [00:42, 4.61it/s] 195it [00:43, 4.50it/s] 196it [00:43, 4.41it/s] 196it [00:43, 4.52it/s] +2025-05-26 02:03:53,138 - INFO - Epoch: 21, Objective: tensor([2395.0178], device='cuda:0', grad_fn=), Loss: 0.009308933280408382, KL/n: 39.00183868408203 + 0it [00:00, ?it/s]2025-05-26 02:03:53,520 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 2293.9033 | mean log_px -0.0119 | KL -1907.14 + 1it [00:00, 3.35it/s] 2it [00:00, 4.00it/s] 3it [00:00, 4.29it/s] 4it [00:00, 4.43it/s] 5it [00:01, 4.53it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.53it/s] 9it [00:02, 4.57it/s] 10it [00:02, 4.60it/s] 11it [00:02, 4.62it/s] 12it [00:02, 4.64it/s] 13it [00:02, 4.50it/s] 14it [00:03, 4.52it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.56it/s] 17it [00:03, 4.58it/s] 18it [00:04, 4.59it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.53it/s] 21it [00:04, 4.57it/s] 22it [00:04, 4.59it/s] 23it [00:05, 4.61it/s] 24it [00:05, 4.62it/s] 25it [00:05, 4.64it/s] 26it [00:05, 4.64it/s] 27it [00:05, 4.50it/s] 28it [00:06, 4.54it/s] 29it [00:06, 4.58it/s] 30it [00:06, 4.59it/s] 31it [00:06, 4.61it/s] 32it [00:07, 4.63it/s] 33it [00:07, 4.64it/s] 34it [00:07, 4.48it/s] 35it [00:07, 4.54it/s] 36it [00:07, 4.57it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.59it/s] 39it [00:08, 4.62it/s] 40it [00:08, 4.62it/s] 41it [00:09, 4.64it/s] 42it [00:09, 4.64it/s] 43it [00:09, 4.50it/s] 44it [00:09, 4.54it/s] 45it [00:09, 4.58it/s] 46it [00:10, 4.59it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.61it/s] 49it [00:10, 4.62it/s] 50it [00:10, 4.61it/s]2025-05-26 02:04:04,413 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 2142.6248 | mean log_px -0.0071 | KL -1895.51 + 51it [00:11, 4.63it/s] 52it [00:11, 4.48it/s] 53it [00:11, 4.55it/s] 54it [00:11, 4.56it/s] 55it [00:12, 4.59it/s] 56it [00:12, 4.59it/s] 57it [00:12, 4.60it/s] 58it [00:12, 4.61it/s] 59it [00:12, 4.47it/s] 60it [00:13, 4.54it/s] 61it [00:13, 4.57it/s] 62it [00:13, 4.58it/s] 63it [00:13, 4.34it/s] 64it [00:14, 4.40it/s] 65it [00:14, 4.45it/s] 66it [00:14, 4.50it/s] 67it [00:14, 4.54it/s] 68it [00:14, 4.52it/s] 69it [00:15, 4.52it/s] 70it [00:15, 4.56it/s] 71it [00:15, 4.44it/s] 72it [00:15, 4.49it/s] 73it [00:16, 4.54it/s] 74it [00:16, 4.56it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.60it/s] 77it [00:16, 4.61it/s] 78it [00:17, 4.63it/s] 79it [00:17, 4.63it/s] 80it [00:17, 4.65it/s] 81it [00:17, 4.50it/s] 82it [00:18, 4.53it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.57it/s] 85it [00:18, 4.60it/s] 86it [00:18, 4.61it/s] 87it [00:19, 4.62it/s] 88it [00:19, 4.49it/s] 89it [00:19, 4.55it/s] 90it [00:19, 4.57it/s] 91it [00:19, 4.59it/s] 92it [00:20, 4.60it/s] 93it [00:20, 4.49it/s] 94it [00:20, 4.54it/s] 95it [00:20, 4.58it/s] 96it [00:21, 4.58it/s] 97it [00:21, 4.61it/s] 98it [00:21, 4.62it/s] 99it [00:21, 4.48it/s] 100it [00:21, 4.53it/s]2025-05-26 02:04:15,413 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 2433.9939 | mean log_px -0.0126 | KL -1877.79 + 101it [00:22, 4.56it/s] 102it [00:22, 4.42it/s] 103it [00:22, 4.50it/s] 104it [00:22, 4.53it/s] 105it [00:23, 4.56it/s] 106it [00:23, 4.58it/s] 107it [00:23, 4.59it/s] 108it [00:23, 4.60it/s] 109it [00:23, 4.62it/s] 110it [00:24, 4.62it/s] 111it [00:24, 4.47it/s] 112it [00:24, 4.53it/s] 113it [00:24, 4.55it/s] 114it [00:25, 4.58it/s] 115it [00:25, 4.60it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.62it/s] 118it [00:25, 4.47it/s] 119it [00:26, 4.53it/s] 120it [00:26, 4.51it/s] 121it [00:26, 4.48it/s] 122it [00:26, 4.52it/s] 123it [00:27, 4.57it/s] 124it [00:27, 4.37it/s] 125it [00:27, 4.40it/s] 126it [00:27, 4.47it/s] 127it [00:27, 4.52it/s] 128it [00:28, 4.54it/s] 129it [00:28, 4.55it/s] 130it [00:28, 4.58it/s] 131it [00:28, 4.45it/s] 132it [00:29, 4.52it/s] 133it [00:29, 4.56it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.59it/s] 136it [00:29, 4.59it/s] 137it [00:30, 4.61it/s] 138it [00:30, 4.46it/s] 139it [00:30, 4.53it/s] 140it [00:30, 4.54it/s] 141it [00:31, 4.58it/s] 142it [00:31, 4.60it/s] 143it [00:31, 4.60it/s] 144it [00:31, 4.46it/s] 145it [00:31, 4.51it/s] 146it [00:32, 4.51it/s] 147it [00:32, 4.56it/s] 148it [00:32, 4.56it/s] 149it [00:32, 4.59it/s] 150it [00:32, 4.55it/s]2025-05-26 02:04:26,427 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 2279.8452 | mean log_px -0.0095 | KL -1866.57 + 151it [00:33, 4.58it/s] 152it [00:33, 4.57it/s] 153it [00:33, 4.61it/s] 154it [00:33, 4.62it/s] 155it [00:34, 4.57it/s] 156it [00:34, 4.57it/s] 157it [00:34, 4.61it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.48it/s] 160it [00:35, 4.55it/s] 161it [00:35, 4.58it/s] 162it [00:35, 4.58it/s] 163it [00:35, 4.59it/s] 164it [00:36, 4.60it/s] 165it [00:36, 4.57it/s] 166it [00:36, 4.61it/s] 167it [00:36, 4.46it/s] 168it [00:36, 4.51it/s] 169it [00:37, 4.54it/s] 170it [00:37, 4.57it/s] 171it [00:37, 4.60it/s] 172it [00:37, 4.62it/s] 173it [00:38, 4.45it/s] 174it [00:38, 4.52it/s] 175it [00:38, 4.56it/s] 176it [00:38, 4.59it/s] 177it [00:38, 4.61it/s] 178it [00:39, 4.61it/s] 179it [00:39, 4.63it/s] 180it [00:39, 4.63it/s] 181it [00:39, 4.50it/s] 182it [00:39, 4.55it/s] 183it [00:40, 4.58it/s] 184it [00:40, 4.46it/s] 185it [00:40, 4.53it/s] 186it [00:40, 4.56it/s] 187it [00:41, 4.60it/s] 188it [00:41, 4.62it/s] 189it [00:41, 4.62it/s] 190it [00:41, 4.62it/s] 191it [00:41, 4.64it/s] 192it [00:42, 4.64it/s] 193it [00:42, 4.50it/s] 194it [00:42, 4.55it/s] 195it [00:42, 4.45it/s] 196it [00:43, 4.51it/s] 196it [00:43, 4.54it/s] +2025-05-26 02:04:36,410 - INFO - Epoch: 22, Objective: tensor([2321.2053], device='cuda:0', grad_fn=), Loss: 0.0126264663413167, KL/n: 37.90328598022461 + 0it [00:00, ?it/s]2025-05-26 02:04:36,964 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 2031.7919 | mean log_px -0.0048 | KL -1857.27 + 1it [00:00, 3.34it/s] 2it [00:00, 4.02it/s] 3it [00:00, 4.13it/s] 4it [00:00, 4.32it/s] 5it [00:01, 4.45it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.56it/s] 8it [00:01, 4.59it/s] 9it [00:02, 4.62it/s] 10it [00:02, 4.64it/s] 11it [00:02, 4.66it/s] 12it [00:02, 4.66it/s] 13it [00:02, 4.51it/s] 14it [00:03, 4.57it/s] 15it [00:03, 4.56it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.62it/s] 18it [00:03, 4.62it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.64it/s] 22it [00:04, 4.66it/s] 23it [00:05, 4.67it/s] 24it [00:05, 4.67it/s] 25it [00:05, 4.66it/s] 26it [00:05, 4.66it/s] 27it [00:05, 4.48it/s] 28it [00:06, 4.54it/s] 29it [00:06, 4.57it/s] 30it [00:06, 4.60it/s] 31it [00:06, 4.63it/s] 32it [00:07, 4.63it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.66it/s] 36it [00:07, 4.47it/s] 37it [00:08, 4.54it/s] 38it [00:08, 4.57it/s] 39it [00:08, 4.61it/s] 40it [00:08, 4.63it/s] 41it [00:08, 4.49it/s] 42it [00:09, 4.54it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.61it/s] 45it [00:09, 4.63it/s] 46it [00:10, 4.64it/s] 47it [00:10, 4.65it/s] 48it [00:10, 4.66it/s] 49it [00:10, 4.66it/s] 50it [00:10, 4.66it/s]2025-05-26 02:04:47,803 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 2093.6794 | mean log_px -0.0058 | KL -1840.02 + 51it [00:11, 4.51it/s] 52it [00:11, 4.56it/s] 53it [00:11, 4.60it/s] 54it [00:11, 4.62it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.64it/s] 57it [00:12, 4.66it/s] 58it [00:12, 4.66it/s] 59it [00:12, 4.67it/s] 60it [00:13, 4.51it/s] 61it [00:13, 4.57it/s] 62it [00:13, 4.60it/s] 63it [00:13, 4.63it/s] 64it [00:13, 4.65it/s] 65it [00:14, 4.66it/s] 66it [00:14, 4.66it/s] 67it [00:14, 4.67it/s] 68it [00:14, 4.64it/s] 69it [00:15, 4.60it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.57it/s] 72it [00:15, 4.59it/s] 73it [00:15, 4.59it/s] 74it [00:16, 4.45it/s] 75it [00:16, 4.50it/s] 76it [00:16, 4.53it/s] 77it [00:16, 4.58it/s] 78it [00:17, 4.60it/s] 79it [00:17, 4.58it/s] 80it [00:17, 4.60it/s] 81it [00:17, 4.62it/s] 82it [00:17, 4.64it/s] 83it [00:18, 4.49it/s] 84it [00:18, 4.54it/s] 85it [00:18, 4.59it/s] 86it [00:18, 4.61it/s] 87it [00:18, 4.63it/s] 88it [00:19, 4.49it/s] 89it [00:19, 4.55it/s] 90it [00:19, 4.59it/s] 91it [00:19, 4.61it/s] 92it [00:20, 4.61it/s] 93it [00:20, 4.64it/s] 94it [00:20, 4.63it/s] 95it [00:20, 4.49it/s] 96it [00:20, 4.54it/s] 97it [00:21, 4.58it/s] 98it [00:21, 4.60it/s] 99it [00:21, 4.61it/s] 100it [00:21, 4.63it/s]2025-05-26 02:04:58,699 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 2605.1060 | mean log_px -0.0202 | KL -1829.09 + 101it [00:22, 4.64it/s] 102it [00:22, 4.49it/s] 103it [00:22, 4.55it/s] 104it [00:22, 4.58it/s] 105it [00:22, 4.60it/s] 106it [00:23, 4.62it/s] 107it [00:23, 4.64it/s] 108it [00:23, 4.65it/s] 109it [00:23, 4.50it/s] 110it [00:24, 4.54it/s] 111it [00:24, 4.58it/s] 112it [00:24, 4.61it/s] 113it [00:24, 4.61it/s] 114it [00:24, 4.56it/s] 115it [00:25, 4.59it/s] 116it [00:25, 4.46it/s] 117it [00:25, 4.45it/s] 118it [00:25, 4.50it/s] 119it [00:25, 4.56it/s] 120it [00:26, 4.43it/s] 121it [00:26, 4.51it/s] 122it [00:26, 4.55it/s] 123it [00:26, 4.58it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.63it/s] 127it [00:27, 4.49it/s] 128it [00:27, 4.54it/s] 129it [00:28, 4.57it/s] 130it [00:28, 4.59it/s] 131it [00:28, 4.59it/s] 132it [00:28, 4.60it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.64it/s] 135it [00:29, 4.50it/s] 136it [00:29, 4.54it/s] 137it [00:29, 4.57it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.64it/s] 142it [00:31, 4.50it/s] 143it [00:31, 4.56it/s] 144it [00:31, 4.58it/s] 145it [00:31, 4.60it/s] 146it [00:31, 4.62it/s] 147it [00:32, 4.62it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.48it/s] 150it [00:32, 4.54it/s]2025-05-26 02:05:09,658 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 2053.4185 | mean log_px -0.0083 | KL -1817.16 + 151it [00:32, 4.53it/s] 152it [00:33, 4.56it/s] 153it [00:33, 4.59it/s] 154it [00:33, 4.59it/s] 155it [00:33, 4.61it/s] 156it [00:34, 4.47it/s] 157it [00:34, 4.53it/s] 158it [00:34, 4.57it/s] 159it [00:34, 4.60it/s] 160it [00:34, 4.61it/s] 161it [00:35, 4.63it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.51it/s] 164it [00:35, 4.56it/s] 165it [00:36, 4.56it/s] 166it [00:36, 4.59it/s] 167it [00:36, 4.61it/s] 168it [00:36, 4.63it/s] 169it [00:36, 4.50it/s] 170it [00:37, 4.55it/s] 171it [00:37, 4.58it/s] 172it [00:37, 4.56it/s] 173it [00:37, 4.60it/s] 174it [00:38, 4.61it/s] 175it [00:38, 4.49it/s] 176it [00:38, 4.53it/s] 177it [00:38, 4.58it/s] 178it [00:38, 4.59it/s] 179it [00:39, 4.61it/s] 180it [00:39, 4.61it/s] 181it [00:39, 4.63it/s] 182it [00:39, 4.49it/s] 183it [00:39, 4.52it/s] 184it [00:40, 4.56it/s] 185it [00:40, 4.59it/s] 186it [00:40, 4.61it/s] 187it [00:40, 4.62it/s] 188it [00:41, 4.64it/s] 189it [00:41, 4.50it/s] 190it [00:41, 4.54it/s] 191it [00:41, 4.57it/s] 192it [00:41, 4.60it/s] 193it [00:42, 4.47it/s] 194it [00:42, 4.52it/s] 195it [00:42, 4.42it/s] 196it [00:42, 4.50it/s] 196it [00:42, 4.57it/s] +2025-05-26 02:05:19,653 - INFO - Epoch: 23, Objective: tensor([2333.9048], device='cuda:0', grad_fn=), Loss: 0.009835069067776203, KL/n: 36.8824462890625 + 0it [00:00, ?it/s]2025-05-26 02:05:20,048 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 2042.8802 | mean log_px -0.0088 | KL -1806.51 + 1it [00:00, 3.12it/s] 2it [00:00, 3.88it/s] 3it [00:00, 4.22it/s] 4it [00:00, 4.20it/s] 5it [00:01, 4.37it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.52it/s] 8it [00:01, 4.56it/s] 9it [00:02, 4.60it/s] 10it [00:02, 4.47it/s] 11it [00:02, 3.60it/s] 12it [00:02, 3.86it/s] 13it [00:03, 4.07it/s] 14it [00:03, 4.21it/s] 15it [00:03, 4.26it/s] 16it [00:03, 4.35it/s] 17it [00:04, 4.43it/s] 18it [00:04, 4.47it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.43it/s] 22it [00:05, 4.46it/s] 23it [00:05, 4.51it/s] 24it [00:05, 4.56it/s] 25it [00:05, 4.59it/s] 26it [00:05, 4.61it/s] 27it [00:06, 4.63it/s] 28it [00:06, 4.50it/s] 29it [00:06, 4.56it/s] 30it [00:06, 4.58it/s] 31it [00:07, 4.62it/s] 32it [00:07, 4.63it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.50it/s] 35it [00:07, 4.56it/s] 36it [00:08, 4.59it/s] 37it [00:08, 4.58it/s] 38it [00:08, 4.59it/s] 39it [00:08, 4.61it/s] 40it [00:09, 4.60it/s] 41it [00:09, 4.48it/s] 42it [00:09, 4.53it/s] 43it [00:09, 4.56it/s] 44it [00:09, 4.59it/s] 45it [00:10, 4.63it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.50it/s] 48it [00:10, 4.55it/s] 49it [00:11, 4.59it/s] 50it [00:11, 4.60it/s]2025-05-26 02:05:31,167 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 1896.7238 | mean log_px -0.0014 | KL -1796.85 + 51it [00:11, 4.61it/s] 52it [00:11, 4.62it/s] 53it [00:11, 4.49it/s] 54it [00:12, 4.54it/s] 55it [00:12, 4.59it/s] 56it [00:12, 4.60it/s] 57it [00:12, 4.57it/s] 58it [00:13, 4.37it/s] 59it [00:13, 4.46it/s] 60it [00:13, 4.37it/s] 61it [00:13, 4.37it/s] 62it [00:13, 4.47it/s] 63it [00:14, 4.53it/s] 64it [00:14, 4.56it/s] 65it [00:14, 4.60it/s] 66it [00:14, 4.47it/s] 67it [00:15, 4.50it/s] 68it [00:15, 4.55it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.60it/s] 71it [00:15, 4.60it/s] 72it [00:16, 4.48it/s] 73it [00:16, 4.55it/s] 74it [00:16, 4.44it/s] 75it [00:16, 4.46it/s] 76it [00:16, 4.51it/s] 77it [00:17, 4.48it/s] 78it [00:17, 4.52it/s] 79it [00:17, 4.55it/s] 80it [00:17, 4.57it/s] 81it [00:18, 4.45it/s] 82it [00:18, 4.50it/s] 83it [00:18, 4.53it/s] 84it [00:18, 4.56it/s] 85it [00:18, 4.58it/s] 86it [00:19, 4.59it/s] 87it [00:19, 4.47it/s] 88it [00:19, 4.51it/s] 89it [00:19, 4.53it/s] 90it [00:20, 4.43it/s] 91it [00:20, 4.51it/s] 92it [00:20, 4.55it/s] 93it [00:20, 4.59it/s] 94it [00:20, 4.60it/s] 95it [00:21, 4.62it/s] 96it [00:21, 4.49it/s] 97it [00:21, 4.55it/s] 98it [00:21, 4.58it/s] 99it [00:22, 4.59it/s] 100it [00:22, 4.61it/s]2025-05-26 02:05:42,209 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 2474.6335 | mean log_px -0.0208 | KL -1782.80 + 101it [00:22, 4.61it/s] 102it [00:22, 4.46it/s] 103it [00:22, 4.49it/s] 104it [00:23, 4.51it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.57it/s] 107it [00:23, 4.59it/s] 108it [00:24, 4.59it/s] 109it [00:24, 4.48it/s] 110it [00:24, 4.52it/s] 111it [00:24, 4.56it/s] 112it [00:24, 4.57it/s] 113it [00:25, 4.60it/s] 114it [00:25, 4.47it/s] 115it [00:25, 4.54it/s] 116it [00:25, 4.57it/s] 117it [00:26, 4.60it/s] 118it [00:26, 4.61it/s] 119it [00:26, 4.62it/s] 120it [00:26, 4.49it/s] 121it [00:26, 4.55it/s] 122it [00:27, 4.57it/s] 123it [00:27, 4.59it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.62it/s] 127it [00:28, 4.49it/s] 128it [00:28, 4.53it/s] 129it [00:28, 4.57it/s] 130it [00:28, 4.59it/s] 131it [00:29, 4.60it/s] 132it [00:29, 4.61it/s] 133it [00:29, 4.55it/s] 134it [00:29, 4.57it/s] 135it [00:29, 4.60it/s] 136it [00:30, 4.62it/s] 137it [00:30, 4.63it/s] 138it [00:30, 4.51it/s] 139it [00:30, 4.55it/s] 140it [00:31, 4.56it/s] 141it [00:31, 4.56it/s] 142it [00:31, 4.59it/s] 143it [00:31, 4.62it/s] 144it [00:31, 4.50it/s] 145it [00:32, 4.55it/s] 146it [00:32, 4.57it/s] 147it [00:32, 4.60it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.62it/s] 150it [00:33, 4.47it/s]2025-05-26 02:05:53,176 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 2033.4376 | mean log_px -0.0059 | KL -1774.52 + 151it [00:33, 4.52it/s] 152it [00:33, 4.51it/s] 153it [00:33, 4.56it/s] 154it [00:34, 4.58it/s] 155it [00:34, 4.45it/s] 156it [00:34, 4.50it/s] 157it [00:34, 4.53it/s] 158it [00:35, 4.49it/s] 159it [00:35, 4.52it/s] 160it [00:35, 4.54it/s] 161it [00:35, 4.55it/s] 162it [00:35, 4.41it/s] 163it [00:36, 4.45it/s] 164it [00:36, 4.49it/s] 165it [00:36, 4.54it/s] 166it [00:36, 4.57it/s] 167it [00:36, 4.60it/s] 168it [00:37, 4.46it/s] 169it [00:37, 4.53it/s] 170it [00:37, 4.57it/s] 171it [00:37, 4.59it/s] 172it [00:38, 4.60it/s] 173it [00:38, 4.61it/s] 174it [00:38, 4.48it/s] 175it [00:38, 4.52it/s] 176it [00:38, 4.54it/s] 177it [00:39, 4.57it/s] 178it [00:39, 4.59it/s] 179it [00:39, 4.60it/s] 180it [00:39, 4.60it/s] 181it [00:40, 4.44it/s] 182it [00:40, 4.51it/s] 183it [00:40, 4.56it/s] 184it [00:40, 4.58it/s] 185it [00:40, 4.59it/s] 186it [00:41, 4.45it/s] 187it [00:41, 4.52it/s] 188it [00:41, 4.56it/s] 189it [00:41, 4.57it/s] 190it [00:42, 4.59it/s] 191it [00:42, 4.61it/s] 192it [00:42, 4.46it/s] 193it [00:42, 4.51it/s] 194it [00:42, 4.55it/s] 195it [00:43, 4.47it/s] 196it [00:43, 4.54it/s] 196it [00:43, 4.51it/s] +2025-05-26 02:06:03,233 - INFO - Epoch: 24, Objective: tensor([2720.5593], device='cuda:0', grad_fn=), Loss: 0.01608070731163025, KL/n: 36.15454864501953 + 0it [00:00, ?it/s]2025-05-26 02:06:03,611 - INFO - [Epoch 025 | Batch 0000] IWAE-loss 2173.3323 | mean log_px -0.0057 | KL -1770.69 + 1it [00:00, 3.04it/s] 2it [00:00, 3.85it/s] 3it [00:00, 4.20it/s] 4it [00:00, 4.37it/s] 5it [00:01, 4.48it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.42it/s] 8it [00:01, 4.51it/s] 9it [00:02, 4.57it/s] 10it [00:02, 4.59it/s] 11it [00:02, 4.62it/s] 12it [00:02, 4.63it/s] 13it [00:02, 4.49it/s] 14it [00:03, 4.56it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.62it/s] 17it [00:03, 4.64it/s] 18it [00:04, 4.64it/s] 19it [00:04, 4.50it/s] 20it [00:04, 4.56it/s] 21it [00:04, 4.60it/s] 22it [00:04, 4.62it/s] 23it [00:05, 4.53it/s] 24it [00:05, 4.52it/s] 25it [00:05, 4.57it/s] 26it [00:05, 4.59it/s] 27it [00:05, 4.62it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.55it/s] 30it [00:06, 4.58it/s] 31it [00:06, 4.61it/s] 32it [00:07, 4.63it/s] 33it [00:07, 4.64it/s] 34it [00:07, 4.49it/s] 35it [00:07, 4.56it/s] 36it [00:07, 4.59it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.63it/s] 39it [00:08, 4.49it/s] 40it [00:08, 4.55it/s] 41it [00:09, 4.58it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.63it/s] 44it [00:09, 4.63it/s] 45it [00:09, 4.49it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.56it/s] 49it [00:10, 4.60it/s] 50it [00:11, 4.61it/s]2025-05-26 02:06:14,530 - INFO - [Epoch 025 | Batch 0050] IWAE-loss 1950.6661 | mean log_px -0.0028 | KL -1755.02 + 51it [00:11, 4.48it/s] 52it [00:11, 4.54it/s] 53it [00:11, 4.58it/s] 54it [00:11, 4.60it/s] 55it [00:12, 4.62it/s] 56it [00:12, 4.47it/s] 57it [00:12, 4.54it/s] 58it [00:12, 4.58it/s] 59it [00:12, 4.61it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.62it/s] 62it [00:13, 4.47it/s] 63it [00:13, 4.53it/s] 64it [00:14, 4.56it/s] 65it [00:14, 4.59it/s] 66it [00:14, 4.60it/s] 67it [00:14, 4.47it/s] 68it [00:14, 4.54it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.61it/s] 73it [00:16, 4.48it/s] 74it [00:16, 4.54it/s] 75it [00:16, 4.58it/s] 76it [00:16, 4.60it/s] 77it [00:16, 4.62it/s] 78it [00:17, 4.63it/s] 79it [00:17, 4.49it/s] 80it [00:17, 4.54it/s] 81it [00:17, 4.58it/s] 82it [00:18, 4.60it/s] 83it [00:18, 4.62it/s] 84it [00:18, 4.62it/s] 85it [00:18, 4.47it/s] 86it [00:18, 4.53it/s] 87it [00:19, 4.57it/s] 88it [00:19, 4.58it/s] 89it [00:19, 4.60it/s] 90it [00:19, 4.61it/s] 91it [00:20, 4.47it/s] 92it [00:20, 4.53it/s] 93it [00:20, 4.56it/s] 94it [00:20, 4.58it/s] 95it [00:20, 4.59it/s] 96it [00:21, 4.61it/s] 97it [00:21, 4.46it/s] 98it [00:21, 4.53it/s] 99it [00:21, 4.57it/s] 100it [00:21, 4.55it/s]2025-05-26 02:06:25,497 - INFO - [Epoch 025 | Batch 0100] IWAE-loss 1830.5348 | mean log_px -0.0022 | KL -1743.90 + 101it [00:22, 4.59it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.44it/s] 104it [00:22, 4.47it/s] 105it [00:23, 4.53it/s] 106it [00:23, 4.55it/s] 107it [00:23, 4.58it/s] 108it [00:23, 4.59it/s] 109it [00:23, 4.44it/s] 110it [00:24, 4.49it/s] 111it [00:24, 4.54it/s] 112it [00:24, 4.57it/s] 113it [00:24, 4.59it/s] 114it [00:25, 4.58it/s] 115it [00:25, 4.48it/s] 116it [00:25, 4.54it/s] 117it [00:25, 4.59it/s] 118it [00:25, 4.61it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.64it/s] 121it [00:26, 4.50it/s] 122it [00:26, 4.55it/s] 123it [00:27, 4.58it/s] 124it [00:27, 4.60it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.63it/s] 127it [00:27, 4.63it/s] 128it [00:28, 4.50it/s] 129it [00:28, 4.55it/s] 130it [00:28, 4.58it/s] 131it [00:28, 4.61it/s] 132it [00:28, 4.62it/s] 133it [00:29, 4.64it/s] 134it [00:29, 4.47it/s] 135it [00:29, 4.53it/s] 136it [00:29, 4.57it/s] 137it [00:30, 4.59it/s] 138it [00:30, 4.61it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.63it/s] 141it [00:30, 4.63it/s] 142it [00:31, 4.64it/s] 143it [00:31, 4.65it/s] 144it [00:31, 4.50it/s] 145it [00:31, 4.55it/s] 146it [00:32, 4.58it/s] 147it [00:32, 4.60it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.63it/s] 150it [00:32, 4.65it/s]2025-05-26 02:06:36,416 - INFO - [Epoch 025 | Batch 0150] IWAE-loss 2106.1345 | mean log_px -0.0053 | KL -1734.84 + 151it [00:33, 4.66it/s] 152it [00:33, 4.63it/s] 153it [00:33, 4.65it/s] 154it [00:33, 4.66it/s] 155it [00:33, 4.66it/s] 156it [00:34, 4.66it/s] 157it [00:34, 4.66it/s] 158it [00:34, 4.66it/s] 159it [00:34, 4.66it/s] 160it [00:35, 4.66it/s] 161it [00:35, 4.65it/s] 162it [00:35, 4.65it/s] 163it [00:35, 4.64it/s] 164it [00:35, 4.64it/s] 165it [00:36, 4.65it/s] 166it [00:36, 4.64it/s] 167it [00:36, 4.65it/s] 168it [00:36, 4.65it/s] 169it [00:36, 4.66it/s] 170it [00:37, 4.66it/s] 171it [00:37, 4.51it/s] 172it [00:37, 4.55it/s] 173it [00:37, 4.59it/s] 174it [00:38, 4.61it/s] 175it [00:38, 4.63it/s] 176it [00:38, 4.63it/s] 177it [00:38, 4.64it/s] 178it [00:38, 4.64it/s] 179it [00:39, 4.65it/s] 180it [00:39, 4.65it/s] 181it [00:39, 4.65it/s] 182it [00:39, 4.65it/s] 183it [00:40, 4.65it/s] 184it [00:40, 4.64it/s] 185it [00:40, 4.65it/s] 186it [00:40, 4.65it/s] 187it [00:40, 4.66it/s] 188it [00:41, 4.66it/s] 189it [00:41, 4.65it/s] 190it [00:41, 4.50it/s] 191it [00:41, 4.55it/s] 192it [00:41, 4.59it/s] 193it [00:42, 4.61it/s] 194it [00:42, 4.63it/s] 195it [00:42, 4.49it/s] 196it [00:42, 4.53it/s] 196it [00:42, 4.57it/s] +2025-05-26 02:06:46,280 - INFO - Epoch: 25, Objective: tensor([2120.1199], device='cuda:0', grad_fn=), Loss: 0.009839070029556751, KL/n: 35.31795120239258 + 0it [00:00, ?it/s]2025-05-26 02:06:46,847 - INFO - [Epoch 026 | Batch 0000] IWAE-loss 2901.0183 | mean log_px -0.0300 | KL -1724.86 + 1it [00:00, 3.02it/s] 2it [00:00, 3.82it/s] 3it [00:00, 4.16it/s] 4it [00:00, 4.33it/s] 5it [00:01, 4.44it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.36it/s] 8it [00:01, 4.46it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.55it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.46it/s] 15it [00:03, 4.54it/s] 16it [00:03, 4.58it/s] 17it [00:03, 4.59it/s] 18it [00:04, 4.60it/s] 19it [00:04, 4.64it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.64it/s] 22it [00:04, 4.65it/s] 23it [00:05, 4.65it/s] 24it [00:05, 4.65it/s] 25it [00:05, 4.66it/s] 26it [00:05, 4.65it/s] 27it [00:05, 4.62it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.63it/s] 30it [00:06, 4.64it/s] 31it [00:06, 4.63it/s] 32it [00:07, 4.64it/s] 33it [00:07, 4.52it/s] 34it [00:07, 4.55it/s] 35it [00:07, 4.58it/s] 36it [00:07, 4.60it/s] 37it [00:08, 4.63it/s] 38it [00:08, 4.64it/s] 39it [00:08, 4.64it/s] 40it [00:08, 4.64it/s] 41it [00:09, 4.66it/s] 42it [00:09, 4.66it/s] 43it [00:09, 4.67it/s] 44it [00:09, 4.66it/s] 45it [00:09, 4.64it/s] 46it [00:10, 4.65it/s] 47it [00:10, 4.50it/s] 48it [00:10, 4.56it/s] 49it [00:10, 4.54it/s] 50it [00:10, 4.41it/s]2025-05-26 02:06:57,751 - INFO - [Epoch 026 | Batch 0050] IWAE-loss 2016.3051 | mean log_px -0.0103 | KL -1714.56 + 51it [00:11, 4.49it/s] 52it [00:11, 4.55it/s] 53it [00:11, 4.61it/s] 54it [00:11, 4.63it/s] 55it [00:12, 4.62it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.64it/s] 58it [00:12, 4.64it/s] 59it [00:12, 4.62it/s] 60it [00:13, 4.60it/s] 61it [00:13, 4.60it/s] 62it [00:13, 4.59it/s] 63it [00:13, 4.55it/s] 64it [00:14, 4.37it/s] 65it [00:14, 4.45it/s] 66it [00:14, 4.51it/s] 67it [00:14, 4.54it/s] 68it [00:14, 4.57it/s] 69it [00:15, 4.49it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.55it/s] 72it [00:15, 4.59it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.63it/s] 75it [00:16, 4.64it/s] 76it [00:16, 4.65it/s] 77it [00:16, 4.55it/s] 78it [00:17, 4.58it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.62it/s] 81it [00:17, 4.64it/s] 82it [00:17, 4.64it/s] 83it [00:18, 4.48it/s] 84it [00:18, 4.54it/s] 85it [00:18, 4.58it/s] 86it [00:18, 4.60it/s] 87it [00:19, 4.62it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.66it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.66it/s] 92it [00:20, 4.67it/s] 93it [00:20, 4.67it/s] 94it [00:20, 4.66it/s] 95it [00:20, 4.67it/s] 96it [00:20, 4.66it/s] 97it [00:21, 4.67it/s] 98it [00:21, 4.67it/s] 99it [00:21, 4.67it/s] 100it [00:21, 4.66it/s]2025-05-26 02:07:08,598 - INFO - [Epoch 026 | Batch 0100] IWAE-loss 2671.4316 | mean log_px -0.0232 | KL -1705.30 + 101it [00:22, 4.66it/s] 102it [00:22, 4.66it/s] 103it [00:22, 4.67it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.67it/s] 106it [00:23, 4.67it/s] 107it [00:23, 4.66it/s] 108it [00:23, 4.66it/s] 109it [00:23, 4.66it/s] 110it [00:23, 4.66it/s] 111it [00:24, 4.66it/s] 112it [00:24, 4.48it/s] 113it [00:24, 4.54it/s] 114it [00:24, 4.58it/s] 115it [00:25, 4.61it/s] 116it [00:25, 4.62it/s] 117it [00:25, 4.65it/s] 118it [00:25, 4.65it/s] 119it [00:25, 4.66it/s] 120it [00:26, 4.66it/s] 121it [00:26, 4.67it/s] 122it [00:26, 4.66it/s] 123it [00:26, 4.66it/s] 124it [00:27, 4.65it/s] 125it [00:27, 4.65it/s] 126it [00:27, 4.65it/s] 127it [00:27, 4.66it/s] 128it [00:27, 4.66it/s] 129it [00:28, 4.48it/s] 130it [00:28, 4.54it/s] 131it [00:28, 4.58it/s] 132it [00:28, 4.61it/s] 133it [00:28, 4.63it/s] 134it [00:29, 4.64it/s] 135it [00:29, 4.65it/s] 136it [00:29, 4.63it/s] 137it [00:29, 4.66it/s] 138it [00:30, 4.67it/s] 139it [00:30, 4.67it/s] 140it [00:30, 4.67it/s] 141it [00:30, 4.53it/s] 142it [00:30, 4.56it/s] 143it [00:31, 4.59it/s] 144it [00:31, 4.62it/s] 145it [00:31, 4.64it/s] 146it [00:31, 4.65it/s] 147it [00:31, 4.65it/s] 148it [00:32, 4.65it/s] 149it [00:32, 4.67it/s] 150it [00:32, 4.67it/s]2025-05-26 02:07:19,389 - INFO - [Epoch 026 | Batch 0150] IWAE-loss 3300.8362 | mean log_px -0.0360 | KL -1700.18 + 151it [00:32, 4.67it/s] 152it [00:33, 4.51it/s] 153it [00:33, 4.57it/s] 154it [00:33, 4.59it/s] 155it [00:33, 4.61it/s] 156it [00:33, 4.62it/s] 157it [00:34, 4.61it/s] 158it [00:34, 4.63it/s] 159it [00:34, 4.65it/s] 160it [00:34, 4.65it/s] 161it [00:35, 4.66it/s] 162it [00:35, 4.51it/s] 163it [00:35, 4.57it/s] 164it [00:35, 4.56it/s] 165it [00:35, 4.58it/s] 166it [00:36, 4.60it/s] 167it [00:36, 4.63it/s] 168it [00:36, 4.64it/s] 169it [00:36, 4.65it/s] 170it [00:36, 4.65it/s] 171it [00:37, 4.66it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.65it/s] 174it [00:37, 4.65it/s] 175it [00:38, 4.66it/s] 176it [00:38, 4.67it/s] 177it [00:38, 4.67it/s] 178it [00:38, 4.67it/s] 179it [00:38, 4.67it/s] 180it [00:39, 4.67it/s] 181it [00:39, 4.67it/s] 182it [00:39, 4.67it/s] 183it [00:39, 4.68it/s] 184it [00:39, 4.68it/s] 185it [00:40, 4.67it/s] 186it [00:40, 4.67it/s] 187it [00:40, 4.68it/s] 188it [00:40, 4.68it/s] 189it [00:41, 4.58it/s] 190it [00:41, 4.61it/s] 191it [00:41, 4.62it/s] 192it [00:41, 4.63it/s] 193it [00:41, 4.63it/s] 194it [00:42, 4.50it/s] 195it [00:42, 4.27it/s] 196it [00:42, 4.40it/s] 196it [00:42, 4.59it/s] +2025-05-26 02:07:29,299 - INFO - Epoch: 26, Objective: tensor([2170.3135], device='cuda:0', grad_fn=), Loss: 0.008433881215751171, KL/n: 34.64965057373047 + 0it [00:00, ?it/s]2025-05-26 02:07:29,674 - INFO - [Epoch 027 | Batch 0000] IWAE-loss 1838.5685 | mean log_px -0.0048 | KL -1699.11 + 1it [00:00, 3.34it/s] 2it [00:00, 4.00it/s] 3it [00:00, 4.28it/s] 4it [00:00, 4.42it/s] 5it [00:01, 4.51it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.51it/s] 9it [00:02, 3.60it/s] 10it [00:02, 3.86it/s] 11it [00:02, 3.96it/s] 12it [00:02, 3.98it/s] 13it [00:03, 4.03it/s] 14it [00:03, 4.12it/s] 15it [00:03, 4.20it/s] 16it [00:03, 4.20it/s] 17it [00:04, 4.22it/s] 18it [00:04, 4.18it/s] 19it [00:04, 4.20it/s] 20it [00:04, 4.23it/s] 21it [00:05, 4.36it/s] 22it [00:05, 4.17it/s] 23it [00:05, 4.20it/s] 24it [00:05, 4.29it/s] 25it [00:05, 4.29it/s] 26it [00:06, 4.24it/s] 27it [00:06, 4.26it/s] 28it [00:06, 4.24it/s] 29it [00:06, 4.24it/s] 30it [00:07, 4.33it/s] 31it [00:07, 4.29it/s] 32it [00:07, 4.25it/s] 33it [00:07, 4.24it/s] 34it [00:08, 4.37it/s] 35it [00:08, 4.21it/s] 36it [00:08, 4.22it/s] 37it [00:08, 4.32it/s] 38it [00:09, 4.28it/s] 39it [00:09, 4.24it/s] 40it [00:09, 4.35it/s] 41it [00:09, 4.32it/s] 42it [00:09, 4.37it/s] 43it [00:10, 4.28it/s] 44it [00:10, 4.39it/s] 45it [00:10, 4.44it/s] 46it [00:10, 4.50it/s] 47it [00:11, 4.36it/s] 48it [00:11, 4.32it/s] 49it [00:11, 4.40it/s] 50it [00:11, 4.38it/s]2025-05-26 02:07:41,360 - INFO - [Epoch 027 | Batch 0050] IWAE-loss 2172.3386 | mean log_px -0.0069 | KL -1685.88 + 51it [00:11, 4.47it/s] 52it [00:12, 4.52it/s] 53it [00:12, 4.39it/s] 54it [00:12, 4.47it/s] 55it [00:12, 4.40it/s] 56it [00:13, 4.35it/s] 57it [00:13, 4.42it/s] 58it [00:13, 4.38it/s] 59it [00:13, 4.45it/s] 60it [00:14, 4.33it/s] 61it [00:14, 4.30it/s] 62it [00:14, 4.38it/s] 63it [00:14, 4.46it/s] 64it [00:14, 4.44it/s] 65it [00:15, 4.46it/s] 66it [00:15, 4.41it/s] 67it [00:15, 4.22it/s] 68it [00:15, 4.26it/s] 69it [00:16, 4.23it/s] 70it [00:16, 4.23it/s] 71it [00:16, 4.24it/s] 72it [00:16, 4.27it/s] 73it [00:17, 4.15it/s] 74it [00:17, 4.17it/s] 75it [00:17, 4.29it/s] 76it [00:17, 4.39it/s] 77it [00:17, 4.43it/s] 78it [00:18, 4.49it/s] 79it [00:18, 4.43it/s] 80it [00:18, 4.39it/s] 81it [00:18, 4.29it/s] 82it [00:19, 4.32it/s] 83it [00:19, 4.40it/s] 84it [00:19, 4.42it/s] 85it [00:19, 4.49it/s] 86it [00:19, 4.54it/s] 87it [00:20, 4.57it/s] 88it [00:20, 4.59it/s] 89it [00:20, 4.61it/s] 90it [00:20, 4.62it/s] 91it [00:21, 4.64it/s] 92it [00:21, 4.63it/s] 93it [00:21, 4.65it/s] 94it [00:21, 4.65it/s] 95it [00:21, 4.65it/s] 96it [00:22, 4.49it/s] 97it [00:22, 4.55it/s] 98it [00:22, 4.58it/s] 99it [00:22, 4.61it/s] 100it [00:23, 4.61it/s]2025-05-26 02:07:52,621 - INFO - [Epoch 027 | Batch 0100] IWAE-loss 2017.5281 | mean log_px -0.0098 | KL -1670.65 + 101it [00:23, 4.49it/s] 102it [00:23, 4.54it/s] 103it [00:23, 4.58it/s] 104it [00:23, 4.59it/s] 105it [00:24, 4.61it/s] 106it [00:24, 4.62it/s] 107it [00:24, 4.62it/s] 108it [00:24, 4.62it/s] 109it [00:24, 4.64it/s] 110it [00:25, 4.63it/s] 111it [00:25, 4.64it/s] 112it [00:25, 4.64it/s] 113it [00:25, 4.48it/s] 114it [00:26, 4.55it/s] 115it [00:26, 4.59it/s] 116it [00:26, 4.60it/s] 117it [00:26, 4.62it/s] 118it [00:26, 4.60it/s] 119it [00:27, 4.59it/s] 120it [00:27, 4.46it/s] 121it [00:27, 4.52it/s] 122it [00:27, 4.57it/s] 123it [00:28, 4.59it/s] 124it [00:28, 4.60it/s] 125it [00:28, 4.62it/s] 126it [00:28, 4.62it/s] 127it [00:28, 4.64it/s] 128it [00:29, 4.63it/s] 129it [00:29, 4.64it/s] 130it [00:29, 4.65it/s] 131it [00:29, 4.66it/s] 132it [00:29, 4.65it/s] 133it [00:30, 4.66it/s] 134it [00:30, 4.65it/s] 135it [00:30, 4.65it/s] 136it [00:30, 4.43it/s] 137it [00:31, 4.50it/s] 138it [00:31, 4.54it/s] 139it [00:31, 4.57it/s] 140it [00:31, 4.58it/s] 141it [00:31, 4.59it/s] 142it [00:32, 4.61it/s] 143it [00:32, 4.60it/s] 144it [00:32, 4.63it/s] 145it [00:32, 4.64it/s] 146it [00:33, 4.64it/s] 147it [00:33, 4.64it/s] 148it [00:33, 4.63it/s] 149it [00:33, 4.63it/s] 150it [00:33, 4.64it/s]2025-05-26 02:08:03,492 - INFO - [Epoch 027 | Batch 0150] IWAE-loss 2334.5696 | mean log_px -0.0127 | KL -1661.62 + 151it [00:34, 4.64it/s] 152it [00:34, 4.62it/s] 153it [00:34, 4.49it/s] 154it [00:34, 4.54it/s] 155it [00:35, 4.57it/s] 156it [00:35, 4.55it/s] 157it [00:35, 4.58it/s] 158it [00:35, 4.60it/s] 159it [00:35, 4.62it/s] 160it [00:36, 4.64it/s] 161it [00:36, 4.49it/s] 162it [00:36, 4.54it/s] 163it [00:36, 4.58it/s] 164it [00:36, 4.61it/s] 165it [00:37, 4.63it/s] 166it [00:37, 4.63it/s] 167it [00:37, 4.65it/s] 168it [00:37, 4.65it/s] 169it [00:38, 4.65it/s] 170it [00:38, 4.49it/s] 171it [00:38, 4.52it/s] 172it [00:38, 4.56it/s] 173it [00:38, 4.57it/s] 174it [00:39, 4.57it/s] 175it [00:39, 4.57it/s] 176it [00:39, 4.59it/s] 177it [00:39, 4.61it/s] 178it [00:40, 4.63it/s] 179it [00:40, 4.64it/s] 180it [00:40, 4.64it/s] 181it [00:40, 4.64it/s] 182it [00:40, 4.48it/s] 183it [00:41, 4.54it/s] 184it [00:41, 4.57it/s] 185it [00:41, 4.60it/s] 186it [00:41, 4.61it/s] 187it [00:41, 4.63it/s] 188it [00:42, 4.63it/s] 189it [00:42, 4.64it/s] 190it [00:42, 4.65it/s] 191it [00:42, 4.63it/s] 192it [00:43, 4.63it/s] 193it [00:43, 4.63it/s] 194it [00:43, 4.63it/s] 195it [00:43, 4.49it/s] 196it [00:43, 4.56it/s] 196it [00:43, 4.46it/s] +2025-05-26 02:08:13,418 - INFO - Epoch: 27, Objective: tensor([2400.2996], device='cuda:0', grad_fn=), Loss: 0.009168989956378937, KL/n: 33.872135162353516 + 0it [00:00, ?it/s]2025-05-26 02:08:13,768 - INFO - [Epoch 028 | Batch 0000] IWAE-loss 1821.6100 | mean log_px -0.0041 | KL -1660.52 + 1it [00:00, 3.34it/s] 2it [00:00, 4.00it/s] 3it [00:00, 4.31it/s] 4it [00:00, 4.43it/s] 5it [00:01, 4.51it/s] 6it [00:01, 4.54it/s] 7it [00:01, 4.37it/s] 8it [00:01, 4.40it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.39it/s] 12it [00:02, 4.35it/s] 13it [00:02, 4.29it/s] 14it [00:03, 4.28it/s] 15it [00:03, 4.24it/s] 16it [00:03, 4.23it/s] 17it [00:03, 4.21it/s] 18it [00:04, 4.30it/s] 19it [00:04, 4.24it/s] 20it [00:04, 4.35it/s] 21it [00:04, 4.33it/s] 22it [00:05, 4.31it/s] 23it [00:05, 4.42it/s] 24it [00:05, 4.36it/s] 25it [00:05, 4.29it/s] 26it [00:06, 4.36it/s] 27it [00:06, 4.33it/s] 28it [00:06, 4.37it/s] 29it [00:06, 4.28it/s] 30it [00:06, 4.37it/s] 31it [00:07, 4.31it/s] 32it [00:07, 4.25it/s] 33it [00:07, 4.23it/s] 34it [00:07, 4.22it/s] 35it [00:08, 4.34it/s] 36it [00:08, 4.45it/s] 37it [00:08, 4.51it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.60it/s] 40it [00:09, 4.61it/s] 41it [00:09, 4.63it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.62it/s] 44it [00:10, 4.62it/s] 45it [00:10, 4.51it/s] 46it [00:10, 4.56it/s] 47it [00:10, 4.58it/s] 48it [00:10, 4.61it/s] 49it [00:11, 4.61it/s] 50it [00:11, 4.62it/s]2025-05-26 02:08:25,054 - INFO - [Epoch 028 | Batch 0050] IWAE-loss 1886.0216 | mean log_px -0.0034 | KL -1643.58 + 51it [00:11, 4.50it/s] 52it [00:11, 4.55it/s] 53it [00:12, 4.58it/s] 54it [00:12, 4.60it/s] 55it [00:12, 4.63it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.63it/s] 58it [00:13, 4.48it/s] 59it [00:13, 4.53it/s] 60it [00:13, 4.56it/s] 61it [00:13, 4.58it/s] 62it [00:13, 4.59it/s] 63it [00:14, 4.59it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.62it/s] 67it [00:15, 4.64it/s] 68it [00:15, 4.48it/s] 69it [00:15, 4.53it/s] 70it [00:15, 4.58it/s] 71it [00:15, 4.61it/s] 72it [00:16, 4.57it/s] 73it [00:16, 4.60it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.62it/s] 76it [00:17, 4.64it/s] 77it [00:17, 4.45it/s] 78it [00:17, 4.52it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.57it/s] 81it [00:18, 4.51it/s] 82it [00:18, 4.55it/s] 83it [00:18, 4.57it/s] 84it [00:18, 4.59it/s] 85it [00:19, 4.60it/s] 86it [00:19, 4.59it/s] 87it [00:19, 4.61it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.63it/s] 90it [00:20, 4.64it/s] 91it [00:20, 4.65it/s] 92it [00:20, 4.64it/s] 93it [00:20, 4.64it/s] 94it [00:20, 4.64it/s] 95it [00:21, 4.64it/s] 96it [00:21, 4.64it/s] 97it [00:21, 4.65it/s] 98it [00:21, 4.64it/s] 99it [00:22, 4.63it/s] 100it [00:22, 4.48it/s]2025-05-26 02:08:35,967 - INFO - [Epoch 028 | Batch 0100] IWAE-loss 1992.9895 | mean log_px -0.0080 | KL -1643.61 + 101it [00:22, 4.55it/s] 102it [00:22, 4.57it/s] 103it [00:22, 4.60it/s] 104it [00:23, 4.62it/s] 105it [00:23, 4.64it/s] 106it [00:23, 4.64it/s] 107it [00:23, 4.65it/s] 108it [00:23, 4.64it/s] 109it [00:24, 4.48it/s] 110it [00:24, 4.53it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.58it/s] 113it [00:25, 4.61it/s] 114it [00:25, 4.61it/s] 115it [00:25, 4.62it/s] 116it [00:25, 4.47it/s] 117it [00:25, 4.53it/s] 118it [00:26, 4.54it/s] 119it [00:26, 4.58it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.62it/s] 122it [00:27, 4.63it/s] 123it [00:27, 4.63it/s] 124it [00:27, 4.64it/s] 125it [00:27, 4.64it/s] 126it [00:27, 4.64it/s] 127it [00:28, 4.65it/s] 128it [00:28, 4.63it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.62it/s] 131it [00:28, 4.63it/s] 132it [00:29, 4.63it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.62it/s] 135it [00:29, 4.63it/s] 136it [00:30, 4.62it/s] 137it [00:30, 4.64it/s] 138it [00:30, 4.65it/s] 139it [00:30, 4.64it/s] 140it [00:30, 4.64it/s] 141it [00:31, 4.66it/s] 142it [00:31, 4.52it/s] 143it [00:31, 4.57it/s] 144it [00:31, 4.57it/s] 145it [00:32, 4.59it/s] 146it [00:32, 4.59it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.63it/s] 149it [00:32, 4.64it/s] 150it [00:33, 4.64it/s]2025-05-26 02:08:46,808 - INFO - [Epoch 028 | Batch 0150] IWAE-loss 1948.8407 | mean log_px -0.0090 | KL -1636.46 + 151it [00:33, 4.64it/s] 152it [00:33, 4.64it/s] 153it [00:33, 4.66it/s] 154it [00:33, 4.66it/s] 155it [00:34, 4.51it/s] 156it [00:34, 4.56it/s] 157it [00:34, 4.60it/s] 158it [00:34, 4.60it/s] 159it [00:35, 4.63it/s] 160it [00:35, 4.63it/s] 161it [00:35, 4.65it/s] 162it [00:35, 4.65it/s] 163it [00:35, 4.64it/s] 164it [00:36, 4.64it/s] 165it [00:36, 4.66it/s] 166it [00:36, 4.65it/s] 167it [00:36, 4.67it/s] 168it [00:36, 4.67it/s] 169it [00:37, 4.67it/s] 170it [00:37, 4.67it/s] 171it [00:37, 4.66it/s] 172it [00:37, 4.67it/s] 173it [00:38, 4.67it/s] 174it [00:38, 4.66it/s] 175it [00:38, 4.66it/s] 176it [00:38, 4.65it/s] 177it [00:38, 4.66it/s] 178it [00:39, 4.65it/s] 179it [00:39, 4.64it/s] 180it [00:39, 4.64it/s] 181it [00:39, 4.61it/s] 182it [00:39, 4.60it/s] 183it [00:40, 4.62it/s] 184it [00:40, 4.61it/s] 185it [00:40, 4.62it/s] 186it [00:40, 4.63it/s] 187it [00:41, 4.63it/s] 188it [00:41, 4.60it/s] 189it [00:41, 4.62it/s] 190it [00:41, 4.61it/s] 191it [00:41, 4.63it/s] 192it [00:42, 4.48it/s] 193it [00:42, 4.54it/s] 194it [00:42, 4.57it/s] 195it [00:42, 4.46it/s] 196it [00:43, 4.51it/s] 196it [00:43, 4.54it/s] +2025-05-26 02:08:56,688 - INFO - Epoch: 28, Objective: tensor([2206.5891], device='cuda:0', grad_fn=), Loss: 0.015577034093439579, KL/n: 33.273502349853516 + 0it [00:00, ?it/s]2025-05-26 02:08:57,228 - INFO - [Epoch 029 | Batch 0000] IWAE-loss 1807.6621 | mean log_px -0.0057 | KL -1630.16 + 1it [00:00, 3.56it/s] 2it [00:00, 3.94it/s] 3it [00:00, 4.23it/s] 4it [00:00, 4.39it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.46it/s] 7it [00:01, 4.42it/s] 8it [00:01, 4.38it/s] 9it [00:02, 4.25it/s] 10it [00:02, 4.24it/s] 11it [00:02, 4.40it/s] 12it [00:02, 4.48it/s] 13it [00:02, 4.47it/s] 14it [00:03, 4.38it/s] 15it [00:03, 4.48it/s] 16it [00:03, 4.48it/s] 17it [00:03, 4.29it/s] 18it [00:04, 4.39it/s] 19it [00:04, 4.37it/s] 20it [00:04, 4.34it/s] 21it [00:04, 4.34it/s] 22it [00:05, 4.30it/s] 23it [00:05, 4.21it/s] 24it [00:05, 4.23it/s] 25it [00:05, 4.25it/s] 26it [00:06, 4.27it/s] 27it [00:06, 4.35it/s] 28it [00:06, 4.45it/s] 29it [00:06, 4.42it/s] 30it [00:06, 4.42it/s] 31it [00:07, 4.47it/s] 32it [00:07, 4.37it/s] 33it [00:07, 4.32it/s] 34it [00:07, 4.30it/s] 35it [00:08, 4.37it/s] 36it [00:08, 4.46it/s] 37it [00:08, 4.53it/s] 38it [00:08, 4.58it/s] 39it [00:08, 4.63it/s] 40it [00:09, 4.55it/s] 41it [00:09, 4.48it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.57it/s] 44it [00:10, 4.48it/s] 45it [00:10, 4.43it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.45it/s] 48it [00:10, 4.51it/s] 49it [00:11, 4.51it/s] 50it [00:11, 4.34it/s]2025-05-26 02:09:08,571 - INFO - [Epoch 029 | Batch 0050] IWAE-loss 1674.5372 | mean log_px -0.0011 | KL -1614.30 + 51it [00:11, 4.32it/s] 52it [00:11, 4.30it/s] 53it [00:12, 4.33it/s] 54it [00:12, 4.43it/s] 55it [00:12, 4.51it/s] 56it [00:12, 4.26it/s] 57it [00:13, 4.19it/s] 58it [00:13, 4.07it/s] 59it [00:13, 4.09it/s] 60it [00:13, 4.16it/s] 61it [00:14, 4.13it/s] 62it [00:14, 4.28it/s] 63it [00:14, 4.27it/s] 64it [00:14, 4.30it/s] 65it [00:14, 4.22it/s] 66it [00:15, 4.23it/s] 67it [00:15, 4.21it/s] 68it [00:15, 4.23it/s] 69it [00:15, 4.19it/s] 70it [00:16, 4.20it/s] 71it [00:16, 4.33it/s] 72it [00:16, 4.33it/s] 73it [00:16, 4.44it/s] 74it [00:16, 4.52it/s] 75it [00:17, 4.54it/s] 76it [00:17, 4.60it/s] 77it [00:17, 4.51it/s] 78it [00:17, 4.45it/s] 79it [00:18, 4.50it/s] 80it [00:18, 4.40it/s] 81it [00:18, 4.38it/s] 82it [00:18, 4.43it/s] 83it [00:19, 4.41it/s] 84it [00:19, 4.46it/s] 85it [00:19, 4.44it/s] 86it [00:19, 4.46it/s] 87it [00:19, 4.46it/s] 88it [00:20, 4.50it/s] 89it [00:20, 4.57it/s] 90it [00:20, 4.58it/s] 91it [00:20, 4.47it/s] 92it [00:21, 4.42it/s] 93it [00:21, 4.40it/s] 94it [00:21, 4.48it/s] 95it [00:21, 4.50it/s] 96it [00:21, 4.46it/s] 97it [00:22, 4.40it/s] 98it [00:22, 4.45it/s] 99it [00:22, 4.53it/s] 100it [00:22, 4.47it/s]2025-05-26 02:09:19,995 - INFO - [Epoch 029 | Batch 0100] IWAE-loss 1752.5222 | mean log_px -0.0047 | KL -1603.06 + 101it [00:23, 4.40it/s] 102it [00:23, 4.47it/s] 103it [00:23, 4.54it/s] 104it [00:23, 4.58it/s] 105it [00:23, 4.47it/s] 106it [00:24, 4.40it/s] 107it [00:24, 4.43it/s] 108it [00:24, 4.50it/s] 109it [00:24, 4.42it/s] 110it [00:25, 4.36it/s] 111it [00:25, 4.35it/s] 112it [00:25, 4.32it/s] 113it [00:25, 4.29it/s] 114it [00:25, 4.32it/s] 115it [00:26, 4.31it/s] 116it [00:26, 4.30it/s] 117it [00:26, 4.30it/s] 118it [00:26, 4.40it/s] 119it [00:27, 4.35it/s] 120it [00:27, 4.35it/s] 121it [00:27, 4.33it/s] 122it [00:27, 4.34it/s] 123it [00:28, 4.16it/s] 124it [00:28, 4.20it/s] 125it [00:28, 4.34it/s] 126it [00:28, 4.27it/s] 127it [00:29, 4.27it/s] 128it [00:29, 4.30it/s] 129it [00:29, 4.31it/s] 130it [00:29, 4.30it/s] 131it [00:29, 4.29it/s] 132it [00:30, 4.29it/s] 133it [00:30, 4.29it/s] 134it [00:30, 4.25it/s] 135it [00:30, 4.33it/s] 136it [00:31, 4.44it/s] 137it [00:31, 4.51it/s] 138it [00:31, 4.55it/s] 139it [00:31, 4.59it/s] 140it [00:31, 4.46it/s] 141it [00:32, 4.55it/s] 142it [00:32, 4.59it/s] 143it [00:32, 4.63it/s] 144it [00:32, 4.65it/s] 145it [00:33, 4.67it/s] 146it [00:33, 4.68it/s] 147it [00:33, 4.69it/s] 148it [00:33, 4.69it/s] 149it [00:33, 4.54it/s] 150it [00:34, 4.59it/s]2025-05-26 02:09:31,285 - INFO - [Epoch 029 | Batch 0150] IWAE-loss 1698.8661 | mean log_px -0.0024 | KL -1595.82 + 151it [00:34, 4.61it/s] 152it [00:34, 4.63it/s] 153it [00:34, 4.66it/s] 154it [00:34, 4.67it/s] 155it [00:35, 4.68it/s] 156it [00:35, 4.68it/s] 157it [00:35, 4.69it/s] 158it [00:35, 4.69it/s] 159it [00:36, 4.69it/s] 160it [00:36, 4.70it/s] 161it [00:36, 4.70it/s] 162it [00:36, 4.70it/s] 163it [00:36, 4.70it/s] 164it [00:37, 4.69it/s] 165it [00:37, 4.67it/s] 166it [00:37, 4.48it/s] 167it [00:37, 4.51it/s] 168it [00:38, 4.52it/s] 169it [00:38, 4.54it/s] 170it [00:38, 4.54it/s] 171it [00:38, 4.57it/s] 172it [00:38, 4.43it/s] 173it [00:39, 4.52it/s] 174it [00:39, 4.56it/s] 175it [00:39, 4.61it/s] 176it [00:39, 4.63it/s] 177it [00:39, 4.65it/s] 178it [00:40, 4.50it/s] 179it [00:40, 4.58it/s] 180it [00:40, 4.60it/s] 181it [00:40, 4.62it/s] 182it [00:41, 4.55it/s] 183it [00:41, 4.59it/s] 184it [00:41, 4.51it/s] 185it [00:41, 4.56it/s] 186it [00:41, 4.56it/s] 187it [00:42, 4.56it/s] 188it [00:42, 4.56it/s] 189it [00:42, 4.58it/s] 190it [00:42, 4.42it/s] 191it [00:43, 4.51it/s] 192it [00:43, 4.55it/s] 193it [00:43, 4.58it/s] 194it [00:43, 4.60it/s] 195it [00:43, 4.50it/s] 196it [00:44, 4.55it/s] 196it [00:44, 4.43it/s] +2025-05-26 02:09:41,231 - INFO - Epoch: 29, Objective: tensor([2066.5352], device='cuda:0', grad_fn=), Loss: 0.007869544439017773, KL/n: 32.472476959228516 + 0it [00:00, ?it/s]2025-05-26 02:09:41,594 - INFO - [Epoch 030 | Batch 0000] IWAE-loss 1742.8804 | mean log_px -0.0048 | KL -1591.28 + 1it [00:00, 3.37it/s] 2it [00:00, 4.02it/s] 3it [00:00, 4.31it/s] 4it [00:00, 4.25it/s] 5it [00:01, 4.40it/s] 6it [00:01, 4.48it/s] 7it [00:01, 4.54it/s] 8it [00:01, 4.58it/s] 9it [00:02, 4.60it/s] 10it [00:02, 4.60it/s] 11it [00:02, 4.62it/s] 12it [00:02, 4.63it/s] 13it [00:02, 4.49it/s] 14it [00:03, 4.52it/s] 15it [00:03, 4.54it/s] 16it [00:03, 4.55it/s] 17it [00:03, 4.59it/s] 18it [00:04, 4.58it/s] 19it [00:04, 4.46it/s] 20it [00:04, 4.51it/s] 21it [00:04, 4.52it/s] 22it [00:04, 4.53it/s] 23it [00:05, 4.56it/s] 24it [00:05, 4.50it/s] 25it [00:05, 4.54it/s] 26it [00:05, 4.55it/s] 27it [00:05, 4.57it/s] 28it [00:06, 4.59it/s] 29it [00:06, 4.51it/s] 30it [00:06, 4.55it/s] 31it [00:06, 4.52it/s] 32it [00:07, 4.48it/s] 33it [00:07, 4.54it/s] 34it [00:07, 4.48it/s] 35it [00:07, 4.55it/s] 36it [00:07, 4.58it/s] 37it [00:08, 4.59it/s] 38it [00:08, 4.60it/s] 39it [00:08, 4.59it/s] 40it [00:08, 4.59it/s] 41it [00:09, 4.60it/s] 42it [00:09, 4.57it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.45it/s] 45it [00:09, 4.53it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.53it/s] 48it [00:10, 4.56it/s] 49it [00:10, 4.56it/s] 50it [00:11, 4.57it/s]2025-05-26 02:09:52,568 - INFO - [Epoch 030 | Batch 0050] IWAE-loss 1974.8240 | mean log_px -0.0085 | KL -1577.82 + 51it [00:11, 4.58it/s] 52it [00:11, 4.43it/s] 53it [00:11, 4.49it/s] 54it [00:11, 4.48it/s] 55it [00:12, 4.47it/s] 56it [00:12, 4.41it/s] 57it [00:12, 4.36it/s] 58it [00:12, 4.41it/s] 59it [00:13, 4.45it/s] 60it [00:13, 4.43it/s] 61it [00:13, 4.46it/s] 62it [00:13, 4.35it/s] 63it [00:13, 4.42it/s] 64it [00:14, 4.47it/s] 65it [00:14, 4.46it/s] 66it [00:14, 4.52it/s] 67it [00:14, 4.55it/s] 68it [00:15, 4.54it/s] 69it [00:15, 4.55it/s] 70it [00:15, 4.56it/s] 71it [00:15, 4.58it/s] 72it [00:15, 4.58it/s] 73it [00:16, 4.59it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.60it/s] 77it [00:17, 3.57it/s] 78it [00:17, 3.82it/s] 79it [00:17, 4.03it/s] 80it [00:17, 4.17it/s] 81it [00:18, 4.22it/s] 82it [00:18, 4.34it/s] 83it [00:18, 4.28it/s] 84it [00:18, 4.36it/s] 85it [00:19, 4.38it/s] 86it [00:19, 4.45it/s] 87it [00:19, 4.49it/s] 88it [00:19, 4.53it/s] 89it [00:19, 4.54it/s] 90it [00:20, 4.55it/s] 91it [00:20, 4.58it/s] 92it [00:20, 4.44it/s] 93it [00:20, 4.40it/s] 94it [00:21, 4.46it/s] 95it [00:21, 4.51it/s] 96it [00:21, 4.42it/s] 97it [00:21, 4.44it/s] 98it [00:21, 4.47it/s] 99it [00:22, 4.51it/s] 100it [00:22, 4.53it/s]2025-05-26 02:10:03,886 - INFO - [Epoch 030 | Batch 0100] IWAE-loss 1863.1838 | mean log_px -0.0062 | KL -1573.59 + 101it [00:22, 4.56it/s] 102it [00:22, 4.42it/s] 103it [00:23, 4.48it/s] 104it [00:23, 4.52it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.53it/s] 107it [00:23, 4.56it/s] 108it [00:24, 4.57it/s] 109it [00:24, 4.39it/s] 110it [00:24, 4.26it/s] 111it [00:24, 4.37it/s] 112it [00:25, 4.37it/s] 113it [00:25, 4.45it/s] 114it [00:25, 4.48it/s] 115it [00:25, 4.51it/s] 116it [00:25, 4.52it/s] 117it [00:26, 4.54it/s] 118it [00:26, 4.53it/s] 119it [00:26, 4.54it/s] 120it [00:26, 4.52it/s] 121it [00:27, 4.39it/s] 122it [00:27, 4.46it/s] 123it [00:27, 4.49it/s] 124it [00:27, 4.52it/s] 125it [00:27, 4.54it/s] 126it [00:28, 4.54it/s] 127it [00:28, 4.58it/s] 128it [00:28, 4.60it/s] 129it [00:28, 4.59it/s] 130it [00:29, 4.46it/s] 131it [00:29, 4.52it/s] 132it [00:29, 4.55it/s] 133it [00:29, 4.56it/s] 134it [00:29, 4.54it/s] 135it [00:30, 4.56it/s] 136it [00:30, 4.54it/s] 137it [00:30, 4.56it/s] 138it [00:30, 4.57it/s] 139it [00:31, 4.45it/s] 140it [00:31, 4.50it/s] 141it [00:31, 4.53it/s] 142it [00:31, 4.50it/s] 143it [00:31, 4.54it/s] 144it [00:32, 4.50it/s] 145it [00:32, 4.52it/s] 146it [00:32, 4.41it/s] 147it [00:32, 4.47it/s] 148it [00:33, 4.50it/s] 149it [00:33, 4.47it/s] 150it [00:33, 4.51it/s]2025-05-26 02:10:14,997 - INFO - [Epoch 030 | Batch 0150] IWAE-loss 2044.0123 | mean log_px -0.0121 | KL -1569.41 + 151it [00:33, 4.53it/s] 152it [00:33, 4.46it/s] 153it [00:34, 4.50it/s] 154it [00:34, 4.54it/s] 155it [00:34, 4.56it/s] 156it [00:34, 4.53it/s] 157it [00:35, 4.56it/s] 158it [00:35, 4.56it/s] 159it [00:35, 4.59it/s] 160it [00:35, 4.59it/s] 161it [00:35, 4.60it/s] 162it [00:36, 4.59it/s] 163it [00:36, 4.46it/s] 164it [00:36, 4.51it/s] 165it [00:36, 4.54it/s] 166it [00:36, 4.55it/s] 167it [00:37, 4.53it/s] 168it [00:37, 4.54it/s] 169it [00:37, 4.56it/s] 170it [00:37, 4.56it/s] 171it [00:38, 4.58it/s] 172it [00:38, 4.58it/s] 173it [00:38, 4.60it/s] 174it [00:38, 4.59it/s] 175it [00:38, 4.46it/s] 176it [00:39, 4.51it/s] 177it [00:39, 4.55it/s] 178it [00:39, 4.56it/s] 179it [00:39, 4.57it/s] 180it [00:40, 4.58it/s] 181it [00:40, 4.45it/s] 182it [00:40, 4.51it/s] 183it [00:40, 4.54it/s] 184it [00:40, 4.55it/s] 185it [00:41, 4.57it/s] 186it [00:41, 4.56it/s] 187it [00:41, 4.57it/s] 188it [00:41, 4.55it/s] 189it [00:42, 4.57it/s] 190it [00:42, 4.57it/s] 191it [00:42, 4.57it/s] 192it [00:42, 4.57it/s] 193it [00:42, 4.53it/s] 194it [00:43, 4.54it/s] 195it [00:43, 4.43it/s] 196it [00:43, 4.46it/s] 196it [00:43, 4.49it/s] +2025-05-26 02:10:25,041 - INFO - Epoch: 30, Objective: tensor([1660.5792], device='cuda:0', grad_fn=), Loss: 0.002282704459503293, KL/n: 31.856414794921875 + 0it [00:00, ?it/s]2025-05-26 02:10:25,417 - INFO - [Epoch 031 | Batch 0000] IWAE-loss 1722.8004 | mean log_px -0.0030 | KL -1562.43 + 1it [00:00, 3.31it/s] 2it [00:00, 3.84it/s] 3it [00:00, 4.17it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.45it/s] 7it [00:01, 4.50it/s] 8it [00:01, 4.53it/s] 9it [00:02, 4.53it/s] 10it [00:02, 4.55it/s] 11it [00:02, 4.55it/s] 12it [00:02, 4.56it/s] 13it [00:02, 4.48it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.57it/s] 17it [00:03, 4.60it/s] 18it [00:04, 4.60it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.62it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.63it/s] 23it [00:05, 4.64it/s] 24it [00:05, 4.64it/s] 25it [00:05, 4.64it/s] 26it [00:05, 4.63it/s] 27it [00:05, 4.65it/s] 28it [00:06, 4.48it/s] 29it [00:06, 4.54it/s] 30it [00:06, 4.55it/s] 31it [00:06, 4.58it/s] 32it [00:07, 4.59it/s] 33it [00:07, 4.58it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.43it/s] 36it [00:07, 4.49it/s] 37it [00:08, 4.53it/s] 38it [00:08, 4.55it/s] 39it [00:08, 4.54it/s] 40it [00:08, 4.56it/s] 41it [00:09, 4.59it/s] 42it [00:09, 4.59it/s] 43it [00:09, 4.58it/s] 44it [00:09, 4.59it/s] 45it [00:09, 4.60it/s] 46it [00:10, 4.40it/s] 47it [00:10, 4.48it/s] 48it [00:10, 4.52it/s] 49it [00:10, 4.55it/s] 50it [00:11, 4.53it/s]2025-05-26 02:10:36,383 - INFO - [Epoch 031 | Batch 0050] IWAE-loss 1696.5232 | mean log_px -0.0034 | KL -1540.58 + 51it [00:11, 4.55it/s] 52it [00:11, 4.58it/s] 53it [00:11, 4.53it/s] 54it [00:11, 4.41it/s] 55it [00:12, 4.44it/s] 56it [00:12, 4.48it/s] 57it [00:12, 4.52it/s] 58it [00:12, 4.50it/s] 59it [00:13, 4.53it/s] 60it [00:13, 4.50it/s] 61it [00:13, 4.52it/s] 62it [00:13, 4.54it/s] 63it [00:13, 4.56it/s] 64it [00:14, 4.43it/s] 65it [00:14, 4.49it/s] 66it [00:14, 4.52it/s] 67it [00:14, 4.55it/s] 68it [00:15, 4.57it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.60it/s] 72it [00:15, 4.59it/s] 73it [00:16, 4.45it/s] 74it [00:16, 4.50it/s] 75it [00:16, 4.49it/s] 76it [00:16, 4.43it/s] 77it [00:17, 4.45it/s] 78it [00:17, 4.49it/s] 79it [00:17, 4.53it/s] 80it [00:17, 4.55it/s] 81it [00:17, 4.58it/s] 82it [00:18, 4.44it/s] 83it [00:18, 4.48it/s] 84it [00:18, 4.50it/s] 85it [00:18, 4.54it/s] 86it [00:19, 4.56it/s] 87it [00:19, 4.59it/s] 88it [00:19, 4.60it/s] 89it [00:19, 4.61it/s] 90it [00:19, 4.62it/s] 91it [00:20, 4.42it/s] 92it [00:20, 4.49it/s] 93it [00:20, 4.54it/s] 94it [00:20, 4.57it/s] 95it [00:20, 4.59it/s] 96it [00:21, 4.58it/s] 97it [00:21, 4.59it/s] 98it [00:21, 4.51it/s] 99it [00:21, 4.41it/s] 100it [00:22, 4.47it/s]2025-05-26 02:10:47,447 - INFO - [Epoch 031 | Batch 0100] IWAE-loss 1671.5338 | mean log_px -0.0022 | KL -1533.55 + 101it [00:22, 4.50it/s] 102it [00:22, 4.32it/s] 103it [00:22, 4.42it/s] 104it [00:23, 4.46it/s] 105it [00:23, 4.47it/s] 106it [00:23, 4.52it/s] 107it [00:23, 4.53it/s] 108it [00:23, 4.55it/s] 109it [00:24, 4.42it/s] 110it [00:24, 4.49it/s] 111it [00:24, 4.52it/s] 112it [00:24, 4.54it/s] 113it [00:24, 4.57it/s] 114it [00:25, 4.58it/s] 115it [00:25, 4.59it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.45it/s] 118it [00:26, 4.51it/s] 119it [00:26, 4.55it/s] 120it [00:26, 4.57it/s] 121it [00:26, 4.60it/s] 122it [00:26, 4.60it/s] 123it [00:27, 4.47it/s] 124it [00:27, 4.51it/s] 125it [00:27, 4.52it/s] 126it [00:27, 4.56it/s] 127it [00:28, 4.57it/s] 128it [00:28, 4.49it/s] 129it [00:28, 4.53it/s] 130it [00:28, 4.49it/s] 131it [00:28, 4.52it/s] 132it [00:29, 4.56it/s] 133it [00:29, 4.57it/s] 134it [00:29, 4.42it/s] 135it [00:29, 4.49it/s] 136it [00:30, 4.52it/s] 137it [00:30, 4.55it/s] 138it [00:30, 4.56it/s] 139it [00:30, 4.58it/s] 140it [00:30, 4.59it/s] 141it [00:31, 4.51it/s] 142it [00:31, 4.54it/s] 143it [00:31, 4.57it/s] 144it [00:31, 4.59it/s] 145it [00:32, 4.45it/s] 146it [00:32, 4.52it/s] 147it [00:32, 4.55it/s] 148it [00:32, 4.57it/s] 149it [00:32, 4.60it/s] 150it [00:33, 4.61it/s]2025-05-26 02:10:58,475 - INFO - [Epoch 031 | Batch 0150] IWAE-loss 1709.1289 | mean log_px -0.0036 | KL -1533.10 + 151it [00:33, 4.62it/s] 152it [00:33, 4.62it/s] 153it [00:33, 4.59it/s] 154it [00:34, 4.42it/s] 155it [00:34, 4.49it/s] 156it [00:34, 4.51it/s] 157it [00:34, 4.53it/s] 158it [00:34, 4.56it/s] 159it [00:35, 4.59it/s] 160it [00:35, 4.60it/s] 161it [00:35, 4.62it/s] 162it [00:35, 4.62it/s] 163it [00:35, 4.61it/s] 164it [00:36, 4.45it/s] 165it [00:36, 4.43it/s] 166it [00:36, 4.44it/s] 167it [00:36, 4.51it/s] 168it [00:37, 4.53it/s] 169it [00:37, 4.56it/s] 170it [00:37, 4.58it/s] 171it [00:37, 4.59it/s] 172it [00:38, 4.44it/s] 173it [00:38, 4.48it/s] 174it [00:38, 4.53it/s] 175it [00:38, 4.56it/s] 176it [00:38, 4.59it/s] 177it [00:39, 4.61it/s] 178it [00:39, 4.60it/s] 179it [00:39, 4.61it/s] 180it [00:39, 4.45it/s] 181it [00:39, 4.45it/s] 182it [00:40, 4.44it/s] 183it [00:40, 4.51it/s] 184it [00:40, 4.53it/s] 185it [00:40, 4.58it/s] 186it [00:41, 4.59it/s] 187it [00:41, 4.60it/s] 188it [00:41, 4.61it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.62it/s] 191it [00:42, 4.61it/s] 192it [00:42, 4.62it/s] 193it [00:42, 4.61it/s] 194it [00:42, 4.63it/s] 195it [00:43, 4.52it/s] 196it [00:43, 4.50it/s] 196it [00:43, 4.52it/s] +2025-05-26 02:11:08,507 - INFO - Epoch: 31, Objective: tensor([1998.8662], device='cuda:0', grad_fn=), Loss: 0.011031880974769592, KL/n: 31.218055725097656 + 0it [00:00, ?it/s]2025-05-26 02:11:09,070 - INFO - [Epoch 032 | Batch 0000] IWAE-loss 1605.7083 | mean log_px -0.0011 | KL -1530.47 + 1it [00:00, 3.16it/s] 2it [00:00, 3.89it/s] 3it [00:00, 4.14it/s] 4it [00:00, 4.30it/s] 5it [00:01, 4.41it/s] 6it [00:01, 4.42it/s] 7it [00:01, 4.48it/s] 8it [00:01, 4.52it/s] 9it [00:02, 4.44it/s] 10it [00:02, 4.50it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.54it/s] 13it [00:02, 4.54it/s] 14it [00:03, 4.58it/s] 15it [00:03, 4.62it/s] 16it [00:03, 4.47it/s] 17it [00:03, 4.55it/s] 18it [00:04, 4.58it/s] 19it [00:04, 4.61it/s] 20it [00:04, 4.63it/s] 21it [00:04, 4.64it/s] 22it [00:04, 4.65it/s] 23it [00:05, 4.67it/s] 24it [00:05, 4.67it/s] 25it [00:05, 4.52it/s] 26it [00:05, 4.58it/s] 27it [00:05, 4.61it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.67it/s] 32it [00:07, 4.67it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.52it/s] 35it [00:07, 4.58it/s] 36it [00:07, 4.60it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.67it/s] 40it [00:08, 4.62it/s] 41it [00:09, 4.64it/s] 42it [00:09, 4.65it/s] 43it [00:09, 4.50it/s] 44it [00:09, 4.56it/s] 45it [00:09, 4.58it/s] 46it [00:10, 4.63it/s] 47it [00:10, 4.65it/s] 48it [00:10, 4.65it/s] 49it [00:10, 4.67it/s] 50it [00:10, 4.51it/s]2025-05-26 02:11:19,968 - INFO - [Epoch 032 | Batch 0050] IWAE-loss 1871.9933 | mean log_px -0.0139 | KL -1516.54 + 51it [00:11, 4.56it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.62it/s] 54it [00:11, 4.64it/s] 55it [00:12, 4.66it/s] 56it [00:12, 4.50it/s] 57it [00:12, 4.57it/s] 58it [00:12, 4.61it/s] 59it [00:12, 4.63it/s] 60it [00:13, 4.63it/s] 61it [00:13, 4.65it/s] 62it [00:13, 4.51it/s] 63it [00:13, 4.58it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.65it/s] 68it [00:14, 4.50it/s] 69it [00:15, 4.53it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.62it/s] 72it [00:15, 4.60it/s] 73it [00:15, 4.62it/s] 74it [00:16, 4.64it/s] 75it [00:16, 4.65it/s] 76it [00:16, 4.65it/s] 77it [00:16, 4.66it/s] 78it [00:17, 4.63it/s] 79it [00:17, 4.62it/s] 80it [00:17, 4.62it/s] 81it [00:17, 4.64it/s] 82it [00:17, 4.51it/s] 83it [00:18, 4.56it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.60it/s] 86it [00:18, 4.62it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.65it/s] 89it [00:19, 4.66it/s] 90it [00:19, 4.56it/s] 91it [00:19, 4.61it/s] 92it [00:20, 4.63it/s] 93it [00:20, 4.64it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.67it/s] 96it [00:20, 4.65it/s] 97it [00:21, 4.66it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.52it/s] 100it [00:21, 4.56it/s]2025-05-26 02:11:30,812 - INFO - [Epoch 032 | Batch 0100] IWAE-loss 2199.9558 | mean log_px -0.0137 | KL -1505.77 + 101it [00:22, 4.59it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.63it/s] 105it [00:22, 4.64it/s] 106it [00:23, 4.65it/s] 107it [00:23, 4.64it/s] 108it [00:23, 4.47it/s] 109it [00:23, 4.53it/s] 110it [00:24, 4.55it/s] 111it [00:24, 4.59it/s] 112it [00:24, 4.55it/s] 113it [00:24, 4.56it/s] 114it [00:24, 4.58it/s] 115it [00:25, 4.61it/s] 116it [00:25, 4.62it/s] 117it [00:25, 4.49it/s] 118it [00:25, 4.55it/s] 119it [00:25, 4.58it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.63it/s] 122it [00:26, 4.63it/s] 123it [00:26, 4.51it/s] 124it [00:27, 4.57it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.59it/s] 127it [00:27, 4.63it/s] 128it [00:27, 4.64it/s] 129it [00:28, 4.65it/s] 130it [00:28, 4.66it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.65it/s] 133it [00:28, 4.63it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.52it/s] 137it [00:29, 4.57it/s] 138it [00:30, 4.59it/s] 139it [00:30, 4.63it/s] 140it [00:30, 4.64it/s] 141it [00:30, 4.64it/s] 142it [00:30, 4.49it/s] 143it [00:31, 4.48it/s] 144it [00:31, 4.52it/s] 145it [00:31, 4.55it/s] 146it [00:31, 4.53it/s] 147it [00:32, 4.52it/s] 148it [00:32, 4.36it/s] 149it [00:32, 4.45it/s] 150it [00:32, 4.50it/s]2025-05-26 02:11:41,742 - INFO - [Epoch 032 | Batch 0150] IWAE-loss 1934.8878 | mean log_px -0.0096 | KL -1507.10 + 151it [00:32, 4.54it/s] 152it [00:33, 4.56it/s] 153it [00:33, 4.58it/s] 154it [00:33, 4.59it/s] 155it [00:33, 4.47it/s] 156it [00:34, 4.51it/s] 157it [00:34, 4.56it/s] 158it [00:34, 4.59it/s] 159it [00:34, 4.60it/s] 160it [00:34, 4.48it/s] 161it [00:35, 4.54it/s] 162it [00:35, 4.55it/s] 163it [00:35, 4.60it/s] 164it [00:35, 4.57it/s] 165it [00:36, 4.61it/s] 166it [00:36, 4.62it/s] 167it [00:36, 4.49it/s] 168it [00:36, 4.55it/s] 169it [00:36, 4.58it/s] 170it [00:37, 4.60it/s] 171it [00:37, 4.64it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.65it/s] 174it [00:38, 4.51it/s] 175it [00:38, 4.57it/s] 176it [00:38, 4.59it/s] 177it [00:38, 4.61it/s] 178it [00:38, 4.46it/s] 179it [00:39, 4.53it/s] 180it [00:39, 4.55it/s] 181it [00:39, 4.59it/s] 182it [00:39, 4.57it/s] 183it [00:39, 4.58it/s] 184it [00:40, 4.59it/s] 185it [00:40, 4.47it/s] 186it [00:40, 4.54it/s] 187it [00:40, 4.54it/s] 188it [00:41, 4.59it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.62it/s] 191it [00:41, 4.63it/s] 192it [00:41, 4.50it/s] 193it [00:42, 4.55it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.47it/s] 196it [00:42, 4.53it/s] 196it [00:42, 4.57it/s] +2025-05-26 02:11:51,722 - INFO - Epoch: 32, Objective: tensor([1967.3446], device='cuda:0', grad_fn=), Loss: 0.012947743758559227, KL/n: 30.607524871826172 + 0it [00:00, ?it/s]2025-05-26 02:11:52,100 - INFO - [Epoch 033 | Batch 0000] IWAE-loss 1662.4415 | mean log_px -0.0023 | KL -1498.38 + 1it [00:00, 3.30it/s] 2it [00:00, 3.94it/s] 3it [00:00, 4.25it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.49it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.57it/s] 8it [00:01, 4.59it/s] 9it [00:02, 4.62it/s] 10it [00:02, 4.63it/s] 11it [00:02, 4.65it/s] 12it [00:02, 4.65it/s] 13it [00:02, 4.65it/s] 14it [00:03, 4.65it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.66it/s] 17it [00:03, 4.65it/s] 18it [00:03, 4.66it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.65it/s] 22it [00:04, 4.51it/s] 23it [00:05, 4.56it/s] 24it [00:05, 4.57it/s] 25it [00:05, 4.57it/s] 26it [00:05, 4.58it/s] 27it [00:06, 3.65it/s] 28it [00:06, 3.90it/s] 29it [00:06, 3.98it/s] 30it [00:06, 4.16it/s] 31it [00:06, 4.30it/s] 32it [00:07, 4.40it/s] 33it [00:07, 4.48it/s] 34it [00:07, 4.53it/s] 35it [00:07, 4.57it/s] 36it [00:08, 4.58it/s] 37it [00:08, 4.61it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.63it/s] 40it [00:08, 4.48it/s] 41it [00:09, 4.55it/s] 42it [00:09, 4.53it/s] 43it [00:09, 4.53it/s] 44it [00:09, 4.56it/s] 45it [00:10, 4.58it/s] 46it [00:10, 4.60it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.63it/s] 50it [00:11, 4.64it/s]2025-05-26 02:12:03,134 - INFO - [Epoch 033 | Batch 0050] IWAE-loss 1766.8324 | mean log_px -0.0126 | KL -1488.90 + 51it [00:11, 4.63it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.48it/s] 54it [00:12, 4.53it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.55it/s] 57it [00:12, 4.55it/s] 58it [00:12, 4.58it/s] 59it [00:13, 4.50it/s] 60it [00:13, 4.46it/s] 61it [00:13, 4.53it/s] 62it [00:13, 4.56it/s] 63it [00:13, 4.59it/s] 64it [00:14, 4.61it/s] 65it [00:14, 4.62it/s] 66it [00:14, 4.49it/s] 67it [00:14, 4.55it/s] 68it [00:15, 4.57it/s] 69it [00:15, 4.60it/s] 70it [00:15, 4.58it/s] 71it [00:15, 4.60it/s] 72it [00:15, 4.61it/s] 73it [00:16, 4.48it/s] 74it [00:16, 4.53it/s] 75it [00:16, 4.57it/s] 76it [00:16, 4.58it/s] 77it [00:17, 4.60it/s] 78it [00:17, 4.47it/s] 79it [00:17, 4.53it/s] 80it [00:17, 4.57it/s] 81it [00:17, 4.58it/s] 82it [00:18, 4.56it/s] 83it [00:18, 4.58it/s] 84it [00:18, 4.57it/s] 85it [00:18, 4.60it/s] 86it [00:19, 4.40it/s] 87it [00:19, 4.43it/s] 88it [00:19, 4.39it/s] 89it [00:19, 4.46it/s] 90it [00:19, 4.49it/s] 91it [00:20, 4.52it/s] 92it [00:20, 4.53it/s] 93it [00:20, 4.39it/s] 94it [00:20, 4.40it/s] 95it [00:21, 4.37it/s] 96it [00:21, 4.47it/s] 97it [00:21, 4.52it/s] 98it [00:21, 4.55it/s] 99it [00:21, 4.58it/s] 100it [00:22, 4.61it/s]2025-05-26 02:12:14,172 - INFO - [Epoch 033 | Batch 0100] IWAE-loss 1801.3687 | mean log_px -0.0054 | KL -1479.41 + 101it [00:22, 4.45it/s] 102it [00:22, 4.51it/s] 103it [00:22, 4.52it/s] 104it [00:23, 4.54it/s] 105it [00:23, 4.55it/s] 106it [00:23, 4.41it/s] 107it [00:23, 4.48it/s] 108it [00:23, 4.50it/s] 109it [00:24, 4.54it/s] 110it [00:24, 4.55it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.52it/s] 113it [00:25, 4.39it/s] 114it [00:25, 4.43it/s] 115it [00:25, 4.48it/s] 116it [00:25, 4.50it/s] 117it [00:25, 4.54it/s] 118it [00:26, 4.56it/s] 119it [00:26, 4.35it/s] 120it [00:26, 4.43it/s] 121it [00:26, 4.44it/s] 122it [00:27, 4.45it/s] 123it [00:27, 4.42it/s] 124it [00:27, 4.50it/s] 125it [00:27, 4.38it/s] 126it [00:27, 4.46it/s] 127it [00:28, 4.51it/s] 128it [00:28, 4.51it/s] 129it [00:28, 4.56it/s] 130it [00:28, 4.57it/s] 131it [00:29, 4.56it/s] 132it [00:29, 4.53it/s] 133it [00:29, 4.45it/s] 134it [00:29, 4.51it/s] 135it [00:29, 4.54it/s] 136it [00:30, 4.55it/s] 137it [00:30, 4.50it/s] 138it [00:30, 4.37it/s] 139it [00:30, 4.45it/s] 140it [00:31, 4.50it/s] 141it [00:31, 4.53it/s] 142it [00:31, 4.55it/s] 143it [00:31, 4.58it/s] 144it [00:31, 4.43it/s] 145it [00:32, 4.50it/s] 146it [00:32, 4.52it/s] 147it [00:32, 4.52it/s] 148it [00:32, 4.55it/s] 149it [00:33, 4.49it/s] 150it [00:33, 4.37it/s]2025-05-26 02:12:25,331 - INFO - [Epoch 033 | Batch 0150] IWAE-loss 1976.7753 | mean log_px -0.0103 | KL -1475.10 + 151it [00:33, 4.43it/s] 152it [00:33, 4.45it/s] 153it [00:33, 4.51it/s] 154it [00:34, 4.55it/s] 155it [00:34, 4.55it/s] 156it [00:34, 4.47it/s] 157it [00:34, 4.52it/s] 158it [00:35, 4.55it/s] 159it [00:35, 4.56it/s] 160it [00:35, 4.43it/s] 161it [00:35, 4.53it/s] 162it [00:35, 4.57it/s] 163it [00:36, 4.62it/s] 164it [00:36, 4.64it/s] 165it [00:36, 4.66it/s] 166it [00:36, 4.66it/s] 167it [00:37, 4.67it/s] 168it [00:37, 4.67it/s] 169it [00:37, 4.69it/s] 170it [00:37, 4.70it/s] 171it [00:37, 4.71it/s] 172it [00:38, 4.70it/s] 173it [00:38, 4.53it/s] 174it [00:38, 4.57it/s] 175it [00:38, 4.62it/s] 176it [00:38, 4.63it/s] 177it [00:39, 4.65it/s] 178it [00:39, 4.66it/s] 179it [00:39, 4.68it/s] 180it [00:39, 4.68it/s] 181it [00:40, 4.68it/s] 182it [00:40, 4.66it/s] 183it [00:40, 4.67it/s] 184it [00:40, 4.67it/s] 185it [00:40, 4.58it/s] 186it [00:41, 4.63it/s] 187it [00:41, 4.65it/s] 188it [00:41, 4.67it/s] 189it [00:41, 4.52it/s] 190it [00:41, 4.58it/s] 191it [00:42, 4.62it/s] 192it [00:42, 4.64it/s] 193it [00:42, 4.67it/s] 194it [00:42, 4.68it/s] 195it [00:43, 4.57it/s] 196it [00:43, 4.62it/s] 196it [00:43, 4.52it/s] +2025-05-26 02:12:35,198 - INFO - Epoch: 33, Objective: tensor([2188.4385], device='cuda:0', grad_fn=), Loss: 0.011592795141041279, KL/n: 29.990604400634766 + 0it [00:00, ?it/s]2025-05-26 02:12:35,553 - INFO - [Epoch 034 | Batch 0000] IWAE-loss 1666.0902 | mean log_px -0.0050 | KL -1469.55 + 1it [00:00, 3.29it/s] 2it [00:00, 4.00it/s] 3it [00:00, 4.30it/s] 4it [00:00, 4.44it/s] 5it [00:01, 4.54it/s] 6it [00:01, 4.59it/s] 7it [00:01, 4.63it/s] 8it [00:01, 4.64it/s] 9it [00:02, 4.68it/s] 10it [00:02, 4.67it/s] 11it [00:02, 4.69it/s] 12it [00:02, 4.69it/s] 13it [00:02, 4.51it/s] 14it [00:03, 4.58it/s] 15it [00:03, 4.61it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.65it/s] 18it [00:03, 4.66it/s] 19it [00:04, 4.67it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.67it/s] 22it [00:04, 4.66it/s] 23it [00:05, 4.67it/s] 24it [00:05, 4.68it/s] 25it [00:05, 4.69it/s] 26it [00:05, 4.69it/s] 27it [00:05, 4.70it/s] 28it [00:06, 4.69it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.66it/s] 31it [00:06, 4.67it/s] 32it [00:06, 4.67it/s] 33it [00:07, 4.55it/s] 34it [00:07, 4.51it/s] 35it [00:07, 4.56it/s] 36it [00:07, 4.59it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.48it/s] 39it [00:08, 4.56it/s] 40it [00:08, 4.60it/s] 41it [00:08, 4.63it/s] 42it [00:09, 4.64it/s] 43it [00:09, 4.66it/s] 44it [00:09, 4.67it/s] 45it [00:09, 4.69it/s] 46it [00:09, 4.65it/s] 47it [00:10, 4.66it/s] 48it [00:10, 4.51it/s] 49it [00:10, 4.58it/s] 50it [00:10, 4.61it/s]2025-05-26 02:12:46,355 - INFO - [Epoch 034 | Batch 0050] IWAE-loss 1685.5781 | mean log_px -0.0031 | KL -1466.24 + 51it [00:11, 4.63it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.43it/s] 54it [00:11, 4.38it/s] 55it [00:12, 4.28it/s] 56it [00:12, 4.28it/s] 57it [00:12, 4.38it/s] 58it [00:12, 4.31it/s] 59it [00:12, 4.40it/s] 60it [00:13, 4.45it/s] 61it [00:13, 4.50it/s] 62it [00:13, 4.52it/s] 63it [00:13, 4.53it/s] 64it [00:14, 4.55it/s] 65it [00:14, 4.56it/s] 66it [00:14, 4.57it/s] 67it [00:14, 4.59it/s] 68it [00:14, 4.59it/s] 69it [00:15, 4.60it/s] 70it [00:15, 4.39it/s] 71it [00:15, 4.46it/s] 72it [00:15, 4.51it/s] 73it [00:16, 4.55it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.60it/s] 76it [00:16, 4.61it/s] 77it [00:16, 4.48it/s] 78it [00:17, 4.53it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.57it/s] 81it [00:17, 4.57it/s] 82it [00:17, 4.57it/s] 83it [00:18, 4.59it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.50it/s] 86it [00:18, 4.54it/s] 87it [00:19, 4.58it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.59it/s] 90it [00:19, 4.43it/s] 91it [00:19, 4.51it/s] 92it [00:20, 4.56it/s] 93it [00:20, 4.61it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.63it/s] 96it [00:21, 4.65it/s] 97it [00:21, 4.67it/s] 98it [00:21, 4.68it/s] 99it [00:21, 4.69it/s] 100it [00:21, 4.70it/s]2025-05-26 02:12:57,365 - INFO - [Epoch 034 | Batch 0100] IWAE-loss 4595.9902 | mean log_px -0.0572 | KL -1454.45 + 101it [00:22, 4.70it/s] 102it [00:22, 4.70it/s] 103it [00:22, 4.71it/s] 104it [00:22, 4.71it/s] 105it [00:22, 4.72it/s] 106it [00:23, 4.72it/s] 107it [00:23, 4.72it/s] 108it [00:23, 4.71it/s] 109it [00:23, 4.73it/s] 110it [00:23, 4.74it/s] 111it [00:24, 4.72it/s] 112it [00:24, 4.72it/s] 113it [00:24, 4.73it/s] 114it [00:24, 4.72it/s] 115it [00:25, 4.73it/s] 116it [00:25, 4.72it/s] 117it [00:25, 4.72it/s] 118it [00:25, 4.72it/s] 119it [00:25, 4.71it/s] 120it [00:26, 4.70it/s] 121it [00:26, 4.70it/s] 122it [00:26, 4.70it/s] 123it [00:26, 4.69it/s] 124it [00:26, 4.69it/s] 125it [00:27, 4.70it/s] 126it [00:27, 4.70it/s] 127it [00:27, 4.71it/s] 128it [00:27, 4.71it/s] 129it [00:28, 4.72it/s] 130it [00:28, 4.71it/s] 131it [00:28, 4.72it/s] 132it [00:28, 4.72it/s] 133it [00:28, 4.72it/s] 134it [00:29, 4.69it/s] 135it [00:29, 4.70it/s] 136it [00:29, 4.67it/s] 137it [00:29, 4.69it/s] 138it [00:29, 4.70it/s] 139it [00:30, 4.71it/s] 140it [00:30, 4.71it/s] 141it [00:30, 4.72it/s] 142it [00:30, 4.71it/s] 143it [00:31, 4.72it/s] 144it [00:31, 4.72it/s] 145it [00:31, 4.73it/s] 146it [00:31, 4.72it/s] 147it [00:31, 4.72it/s] 148it [00:32, 4.70it/s] 149it [00:32, 4.71it/s] 150it [00:32, 4.71it/s]2025-05-26 02:13:07,976 - INFO - [Epoch 034 | Batch 0150] IWAE-loss 1796.6715 | mean log_px -0.0049 | KL -1448.83 + 151it [00:32, 4.71it/s] 152it [00:32, 4.69it/s] 153it [00:33, 4.70it/s] 154it [00:33, 4.70it/s] 155it [00:33, 4.70it/s] 156it [00:33, 4.70it/s] 157it [00:33, 4.71it/s] 158it [00:34, 4.71it/s] 159it [00:34, 4.71it/s] 160it [00:34, 4.72it/s] 161it [00:34, 4.72it/s] 162it [00:35, 4.72it/s] 163it [00:35, 4.72it/s] 164it [00:35, 4.72it/s] 165it [00:35, 4.73it/s] 166it [00:35, 4.72it/s] 167it [00:36, 4.73it/s] 168it [00:36, 4.72it/s] 169it [00:36, 4.73it/s] 170it [00:36, 4.72it/s] 171it [00:36, 4.73it/s] 172it [00:37, 4.73it/s] 173it [00:37, 4.72it/s] 174it [00:37, 4.72it/s] 175it [00:37, 4.72it/s] 176it [00:38, 4.72it/s] 177it [00:38, 4.72it/s] 178it [00:38, 4.72it/s] 179it [00:38, 4.73it/s] 180it [00:38, 4.65it/s] 181it [00:39, 4.61it/s] 182it [00:39, 4.62it/s] 183it [00:39, 4.63it/s] 184it [00:39, 4.62it/s] 185it [00:39, 4.62it/s] 186it [00:40, 4.62it/s] 187it [00:40, 4.63it/s] 188it [00:40, 4.64it/s] 189it [00:40, 4.66it/s] 190it [00:41, 4.68it/s] 191it [00:41, 4.69it/s] 192it [00:41, 4.70it/s] 193it [00:41, 4.71it/s] 194it [00:41, 4.71it/s] 195it [00:42, 4.59it/s] 196it [00:42, 4.64it/s] 196it [00:42, 4.63it/s] +2025-05-26 02:13:17,700 - INFO - Epoch: 34, Objective: tensor([1598.8741], device='cuda:0', grad_fn=), Loss: 0.003922741860151291, KL/n: 29.56195640563965 + 0it [00:00, ?it/s]2025-05-26 02:13:18,259 - INFO - [Epoch 035 | Batch 0000] IWAE-loss 1601.3729 | mean log_px -0.0040 | KL -1447.12 + 1it [00:00, 3.42it/s] 2it [00:00, 4.05it/s] 3it [00:00, 4.33it/s] 4it [00:00, 4.48it/s] 5it [00:01, 4.58it/s] 6it [00:01, 4.62it/s] 7it [00:01, 4.66it/s] 8it [00:01, 4.61it/s] 9it [00:01, 4.66it/s] 10it [00:02, 4.67it/s] 11it [00:02, 4.70it/s] 12it [00:02, 4.70it/s] 13it [00:02, 4.72it/s] 14it [00:03, 4.72it/s] 15it [00:03, 4.73it/s] 16it [00:03, 4.72it/s] 17it [00:03, 4.73it/s] 18it [00:03, 4.73it/s] 19it [00:04, 4.73it/s] 20it [00:04, 4.73it/s] 21it [00:04, 4.73it/s] 22it [00:04, 4.72it/s] 23it [00:04, 4.72it/s] 24it [00:05, 4.72it/s] 25it [00:05, 4.70it/s] 26it [00:05, 4.69it/s] 27it [00:05, 4.70it/s] 28it [00:06, 4.69it/s] 29it [00:06, 4.69it/s] 30it [00:06, 4.68it/s] 31it [00:06, 4.69it/s] 32it [00:06, 4.69it/s] 33it [00:07, 4.70it/s] 34it [00:07, 4.70it/s] 35it [00:07, 4.71it/s] 36it [00:07, 4.71it/s] 37it [00:07, 4.71it/s] 38it [00:08, 4.72it/s] 39it [00:08, 4.72it/s] 40it [00:08, 4.72it/s] 41it [00:08, 4.72it/s] 42it [00:08, 4.72it/s] 43it [00:09, 4.69it/s] 44it [00:09, 4.68it/s] 45it [00:09, 4.70it/s] 46it [00:09, 4.70it/s] 47it [00:10, 4.70it/s] 48it [00:10, 4.70it/s] 49it [00:10, 4.70it/s] 50it [00:10, 4.70it/s]2025-05-26 02:13:28,879 - INFO - [Epoch 035 | Batch 0050] IWAE-loss 1802.3173 | mean log_px -0.0079 | KL -1440.26 + 51it [00:10, 4.70it/s] 52it [00:11, 4.67it/s] 53it [00:11, 4.68it/s] 54it [00:11, 4.65it/s] 55it [00:11, 4.69it/s] 56it [00:11, 4.68it/s] 57it [00:12, 4.70it/s] 58it [00:12, 4.70it/s] 59it [00:12, 4.72it/s] 60it [00:12, 4.65it/s] 61it [00:13, 4.67it/s] 62it [00:13, 4.68it/s] 63it [00:13, 4.70it/s] 64it [00:13, 4.69it/s] 65it [00:13, 4.70it/s] 66it [00:14, 4.71it/s] 67it [00:14, 4.71it/s] 68it [00:14, 4.71it/s] 69it [00:14, 4.71it/s] 70it [00:14, 4.69it/s] 71it [00:15, 4.69it/s] 72it [00:15, 4.69it/s] 73it [00:15, 4.70it/s] 74it [00:15, 4.73it/s] 75it [00:16, 4.71it/s] 76it [00:16, 4.71it/s] 77it [00:16, 4.71it/s] 78it [00:16, 4.71it/s] 79it [00:16, 4.71it/s] 80it [00:17, 4.71it/s] 81it [00:17, 4.72it/s] 82it [00:17, 4.71it/s] 83it [00:17, 4.72it/s] 84it [00:17, 4.72it/s] 85it [00:18, 4.72it/s] 86it [00:18, 4.72it/s] 87it [00:18, 4.72it/s] 88it [00:18, 4.72it/s] 89it [00:18, 4.72it/s] 90it [00:19, 4.71it/s] 91it [00:19, 4.74it/s] 92it [00:19, 4.73it/s] 93it [00:19, 4.70it/s] 94it [00:20, 4.70it/s] 95it [00:20, 4.68it/s] 96it [00:20, 4.52it/s] 97it [00:20, 4.56it/s] 98it [00:20, 4.59it/s] 99it [00:21, 4.63it/s] 100it [00:21, 4.66it/s]2025-05-26 02:13:39,546 - INFO - [Epoch 035 | Batch 0100] IWAE-loss 1988.3760 | mean log_px -0.0165 | KL -1428.70 + 101it [00:21, 4.67it/s] 102it [00:21, 4.68it/s] 103it [00:22, 4.69it/s] 104it [00:22, 4.69it/s] 105it [00:22, 4.71it/s] 106it [00:22, 4.70it/s] 107it [00:22, 4.70it/s] 108it [00:23, 4.70it/s] 109it [00:23, 4.71it/s] 110it [00:23, 4.70it/s] 111it [00:23, 4.71it/s] 112it [00:23, 4.71it/s] 113it [00:24, 4.72it/s] 114it [00:24, 4.71it/s] 115it [00:24, 4.71it/s] 116it [00:24, 4.71it/s] 117it [00:25, 4.55it/s] 118it [00:25, 4.61it/s] 119it [00:25, 4.64it/s] 120it [00:25, 4.66it/s] 121it [00:25, 4.67it/s] 122it [00:26, 4.66it/s] 123it [00:26, 4.56it/s] 124it [00:26, 4.62it/s] 125it [00:26, 4.65it/s] 126it [00:26, 4.65it/s] 127it [00:27, 4.50it/s] 128it [00:27, 4.57it/s] 129it [00:27, 4.46it/s] 130it [00:27, 4.52it/s] 131it [00:28, 4.56it/s] 132it [00:28, 4.61it/s] 133it [00:28, 4.48it/s] 134it [00:28, 4.53it/s] 135it [00:28, 4.59it/s] 136it [00:29, 4.63it/s] 137it [00:29, 4.65it/s] 138it [00:29, 4.67it/s] 139it [00:29, 4.68it/s] 140it [00:29, 4.69it/s] 141it [00:30, 4.70it/s] 142it [00:30, 4.70it/s] 143it [00:30, 4.71it/s] 144it [00:30, 4.71it/s] 145it [00:31, 4.71it/s] 146it [00:31, 4.71it/s] 147it [00:31, 4.72it/s] 148it [00:31, 4.71it/s] 149it [00:31, 4.69it/s] 150it [00:32, 4.71it/s]2025-05-26 02:13:50,287 - INFO - [Epoch 035 | Batch 0150] IWAE-loss 1613.8336 | mean log_px -0.0041 | KL -1433.86 + 151it [00:32, 4.71it/s] 152it [00:32, 4.71it/s] 153it [00:32, 4.71it/s] 154it [00:32, 4.71it/s] 155it [00:33, 4.71it/s] 156it [00:33, 4.71it/s] 157it [00:33, 4.71it/s] 158it [00:33, 4.71it/s] 159it [00:34, 4.72it/s] 160it [00:34, 4.71it/s] 161it [00:34, 4.55it/s] 162it [00:34, 4.61it/s] 163it [00:34, 4.64it/s] 164it [00:35, 4.66it/s] 165it [00:35, 4.67it/s] 166it [00:35, 4.68it/s] 167it [00:35, 4.68it/s] 168it [00:35, 4.67it/s] 169it [00:36, 4.67it/s] 170it [00:36, 4.51it/s] 171it [00:36, 4.54it/s] 172it [00:36, 4.58it/s] 173it [00:37, 4.63it/s] 174it [00:37, 4.65it/s] 175it [00:37, 4.67it/s] 176it [00:37, 4.68it/s] 177it [00:37, 4.69it/s] 178it [00:38, 4.70it/s] 179it [00:38, 4.70it/s] 180it [00:38, 4.68it/s] 181it [00:38, 4.69it/s] 182it [00:38, 4.71it/s] 183it [00:39, 4.71it/s] 184it [00:39, 4.71it/s] 185it [00:39, 4.54it/s] 186it [00:39, 4.61it/s] 187it [00:40, 4.64it/s] 188it [00:40, 4.66it/s] 189it [00:40, 4.68it/s] 190it [00:40, 4.69it/s] 191it [00:40, 4.70it/s] 192it [00:41, 4.70it/s] 193it [00:41, 4.71it/s] 194it [00:41, 4.71it/s] 195it [00:41, 4.37it/s] 196it [00:42, 4.48it/s] 196it [00:42, 4.66it/s] +2025-05-26 02:14:00,105 - INFO - Epoch: 35, Objective: tensor([2143.9568], device='cuda:0', grad_fn=), Loss: 0.021683480590581894, KL/n: 29.22657012939453 + 0it [00:00, ?it/s]2025-05-26 02:14:00,501 - INFO - [Epoch 036 | Batch 0000] IWAE-loss 1631.0413 | mean log_px -0.0034 | KL -1429.53 + 1it [00:00, 3.14it/s] 2it [00:00, 3.66it/s] 3it [00:00, 3.89it/s] 4it [00:01, 4.15it/s] 5it [00:01, 4.28it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.53it/s] 9it [00:02, 4.58it/s] 10it [00:02, 4.44it/s] 11it [00:02, 4.51it/s] 12it [00:02, 4.47it/s] 13it [00:03, 4.47it/s] 14it [00:03, 4.35it/s] 15it [00:03, 4.39it/s] 16it [00:03, 4.26it/s] 17it [00:03, 4.40it/s] 18it [00:04, 4.32it/s] 19it [00:04, 4.43it/s] 20it [00:04, 4.48it/s] 21it [00:04, 4.46it/s] 22it [00:05, 4.37it/s] 23it [00:05, 4.41it/s] 24it [00:05, 4.33it/s] 25it [00:05, 4.21it/s] 26it [00:06, 3.44it/s] 27it [00:06, 3.75it/s] 28it [00:06, 3.96it/s] 29it [00:06, 4.16it/s] 30it [00:07, 4.17it/s] 31it [00:07, 4.32it/s] 32it [00:07, 4.19it/s] 33it [00:07, 4.29it/s] 34it [00:07, 4.33it/s] 35it [00:08, 4.29it/s] 36it [00:08, 4.32it/s] 37it [00:08, 4.43it/s] 38it [00:08, 4.35it/s] 39it [00:09, 4.31it/s] 40it [00:09, 4.28it/s] 41it [00:09, 4.40it/s] 42it [00:09, 4.30it/s] 43it [00:10, 4.21it/s] 44it [00:10, 4.33it/s] 45it [00:10, 4.29it/s] 46it [00:10, 4.39it/s] 47it [00:10, 4.41it/s] 48it [00:11, 4.48it/s] 49it [00:11, 4.47it/s] 50it [00:11, 4.38it/s]2025-05-26 02:14:12,069 - INFO - [Epoch 036 | Batch 0050] IWAE-loss 1841.2819 | mean log_px -0.0059 | KL -1423.28 + 51it [00:11, 4.26it/s] 52it [00:12, 4.39it/s] 53it [00:12, 4.41it/s] 54it [00:12, 4.29it/s] 55it [00:12, 4.28it/s] 56it [00:13, 4.26it/s] 57it [00:13, 4.30it/s] 58it [00:13, 4.25it/s] 59it [00:13, 4.25it/s] 60it [00:14, 4.29it/s] 61it [00:14, 4.32it/s] 62it [00:14, 4.44it/s] 63it [00:14, 4.36it/s] 64it [00:14, 4.45it/s] 65it [00:15, 4.52it/s] 66it [00:15, 4.57it/s] 67it [00:15, 4.62it/s] 68it [00:15, 4.30it/s] 69it [00:16, 4.31it/s] 70it [00:16, 4.28it/s] 71it [00:16, 4.37it/s] 72it [00:16, 4.34it/s] 73it [00:16, 4.25it/s] 74it [00:17, 4.08it/s] 75it [00:17, 3.95it/s] 76it [00:17, 4.00it/s] 77it [00:17, 4.04it/s] 78it [00:18, 4.13it/s] 79it [00:18, 4.26it/s] 80it [00:18, 4.22it/s] 81it [00:18, 4.28it/s] 82it [00:19, 4.24it/s] 83it [00:19, 4.23it/s] 84it [00:19, 4.22it/s] 85it [00:19, 4.23it/s] 86it [00:20, 4.35it/s] 87it [00:20, 4.45it/s] 88it [00:20, 4.35it/s] 89it [00:20, 4.38it/s] 90it [00:20, 4.30it/s] 91it [00:21, 4.28it/s] 92it [00:21, 4.28it/s] 93it [00:21, 4.36it/s] 94it [00:21, 4.38it/s] 95it [00:22, 4.35it/s] 96it [00:22, 4.32it/s] 97it [00:22, 4.30it/s] 98it [00:22, 4.29it/s] 99it [00:23, 4.39it/s] 100it [00:23, 4.46it/s]2025-05-26 02:14:23,675 - INFO - [Epoch 036 | Batch 0100] IWAE-loss 1601.9835 | mean log_px -0.0026 | KL -1416.70 + 101it [00:23, 4.53it/s] 102it [00:23, 4.58it/s] 103it [00:23, 4.48it/s] 104it [00:24, 4.54it/s] 105it [00:24, 4.58it/s] 106it [00:24, 4.44it/s] 107it [00:24, 4.40it/s] 108it [00:25, 4.34it/s] 109it [00:25, 4.20it/s] 110it [00:25, 4.33it/s] 111it [00:25, 4.28it/s] 112it [00:26, 4.27it/s] 113it [00:26, 4.26it/s] 114it [00:26, 4.30it/s] 115it [00:26, 4.30it/s] 116it [00:26, 4.28it/s] 117it [00:27, 4.26it/s] 118it [00:27, 4.13it/s] 119it [00:27, 4.18it/s] 120it [00:27, 4.20it/s] 121it [00:28, 4.26it/s] 122it [00:28, 4.24it/s] 123it [00:28, 4.23it/s] 124it [00:28, 4.25it/s] 125it [00:29, 4.22it/s] 126it [00:29, 4.24it/s] 127it [00:29, 4.37it/s] 128it [00:29, 4.39it/s] 129it [00:29, 4.45it/s] 130it [00:30, 4.43it/s] 131it [00:30, 4.36it/s] 132it [00:30, 4.34it/s] 133it [00:30, 4.26it/s] 134it [00:31, 4.20it/s] 135it [00:31, 4.29it/s] 136it [00:31, 4.37it/s] 137it [00:31, 4.30it/s] 138it [00:32, 4.39it/s] 139it [00:32, 4.46it/s] 140it [00:32, 4.44it/s] 141it [00:32, 4.34it/s] 142it [00:32, 4.30it/s] 143it [00:33, 4.27it/s] 144it [00:33, 4.28it/s] 145it [00:33, 4.31it/s] 146it [00:33, 4.29it/s] 147it [00:34, 4.33it/s] 148it [00:34, 4.13it/s] 149it [00:34, 4.18it/s] 150it [00:34, 4.18it/s]2025-05-26 02:14:35,312 - INFO - [Epoch 036 | Batch 0150] IWAE-loss 1938.5652 | mean log_px -0.0120 | KL -1410.55 + 151it [00:35, 4.20it/s] 152it [00:35, 4.16it/s] 153it [00:35, 4.08it/s] 154it [00:35, 4.13it/s] 155it [00:36, 4.16it/s] 156it [00:36, 4.27it/s] 157it [00:36, 4.39it/s] 158it [00:36, 4.24it/s] 159it [00:37, 4.29it/s] 160it [00:37, 4.29it/s] 161it [00:37, 4.27it/s] 162it [00:37, 4.32it/s] 163it [00:37, 4.23it/s] 164it [00:38, 4.29it/s] 165it [00:38, 4.38it/s] 166it [00:38, 4.32it/s] 167it [00:38, 4.42it/s] 168it [00:39, 4.36it/s] 169it [00:39, 4.48it/s] 170it [00:39, 4.51it/s] 171it [00:39, 4.59it/s] 172it [00:39, 4.50it/s] 173it [00:40, 4.43it/s] 174it [00:40, 4.42it/s] 175it [00:40, 4.35it/s] 176it [00:40, 4.29it/s] 177it [00:41, 4.40it/s] 178it [00:41, 4.44it/s] 179it [00:41, 4.41it/s] 180it [00:41, 4.37it/s] 181it [00:42, 4.47it/s] 182it [00:42, 4.53it/s] 183it [00:42, 4.43it/s] 184it [00:42, 4.37it/s] 185it [00:42, 4.46it/s] 186it [00:43, 4.52it/s] 187it [00:43, 4.44it/s] 188it [00:43, 4.41it/s] 189it [00:43, 4.37it/s] 190it [00:44, 4.20it/s] 191it [00:44, 4.29it/s] 192it [00:44, 4.25it/s] 193it [00:44, 4.30it/s] 194it [00:45, 4.30it/s] 195it [00:45, 4.30it/s] 196it [00:45, 4.27it/s] 196it [00:45, 4.30it/s] +2025-05-26 02:14:45,791 - INFO - Epoch: 36, Objective: tensor([1572.9171], device='cuda:0', grad_fn=), Loss: 0.004463386721909046, KL/n: 28.696121215820312 + 0it [00:00, ?it/s]2025-05-26 02:14:46,176 - INFO - [Epoch 037 | Batch 0000] IWAE-loss 1712.1151 | mean log_px -0.0071 | KL -1405.82 + 1it [00:00, 3.30it/s] 2it [00:00, 4.01it/s] 3it [00:00, 4.31it/s] 4it [00:00, 4.45it/s] 5it [00:01, 4.51it/s] 6it [00:01, 4.57it/s] 7it [00:01, 4.62it/s] 8it [00:01, 4.65it/s] 9it [00:02, 4.67it/s] 10it [00:02, 4.67it/s] 11it [00:02, 4.60it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.61it/s] 14it [00:03, 4.62it/s] 15it [00:03, 4.63it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.64it/s] 18it [00:03, 4.66it/s] 19it [00:04, 4.69it/s] 20it [00:04, 4.69it/s] 21it [00:04, 4.69it/s] 22it [00:04, 4.70it/s] 23it [00:05, 4.70it/s] 24it [00:05, 4.70it/s] 25it [00:05, 4.70it/s] 26it [00:05, 4.68it/s] 27it [00:05, 4.69it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.68it/s] 30it [00:06, 4.69it/s] 31it [00:06, 4.68it/s] 32it [00:06, 4.67it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.67it/s] 35it [00:07, 4.68it/s] 36it [00:07, 4.68it/s] 37it [00:08, 4.70it/s] 38it [00:08, 4.70it/s] 39it [00:08, 4.70it/s] 40it [00:08, 4.70it/s] 41it [00:08, 4.71it/s] 42it [00:09, 4.71it/s] 43it [00:09, 4.71it/s] 44it [00:09, 4.70it/s] 45it [00:09, 4.71it/s] 46it [00:09, 4.71it/s] 47it [00:10, 4.71it/s] 48it [00:10, 4.70it/s] 49it [00:10, 4.69it/s] 50it [00:10, 4.53it/s]2025-05-26 02:14:56,885 - INFO - [Epoch 037 | Batch 0050] IWAE-loss 1829.0848 | mean log_px -0.0077 | KL -1399.44 + 51it [00:11, 4.54it/s] 52it [00:11, 4.60it/s] 53it [00:11, 4.62it/s] 54it [00:11, 4.63it/s] 55it [00:11, 4.65it/s] 56it [00:12, 4.66it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.48it/s] 59it [00:12, 4.57it/s] 60it [00:12, 4.60it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.66it/s] 63it [00:13, 4.67it/s] 64it [00:13, 4.52it/s] 65it [00:14, 4.59it/s] 66it [00:14, 4.62it/s] 67it [00:14, 4.65it/s] 68it [00:14, 4.67it/s] 69it [00:14, 4.55it/s] 70it [00:15, 4.61it/s] 71it [00:15, 4.64it/s] 72it [00:15, 4.65it/s] 73it [00:15, 4.63it/s] 74it [00:16, 4.44it/s] 75it [00:16, 4.50it/s] 76it [00:16, 4.55it/s] 77it [00:16, 4.49it/s] 78it [00:16, 4.51it/s] 79it [00:17, 4.47it/s] 80it [00:17, 4.36it/s] 81it [00:17, 4.36it/s] 82it [00:17, 4.44it/s] 83it [00:18, 4.50it/s] 84it [00:18, 4.53it/s] 85it [00:18, 4.56it/s] 86it [00:18, 4.57it/s] 87it [00:18, 4.46it/s] 88it [00:19, 4.52it/s] 89it [00:19, 4.55it/s] 90it [00:19, 4.57it/s] 91it [00:19, 4.59it/s] 92it [00:19, 4.59it/s] 93it [00:20, 4.61it/s] 94it [00:20, 4.60it/s] 95it [00:20, 4.58it/s] 96it [00:20, 4.60it/s] 97it [00:21, 4.61it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.60it/s] 100it [00:21, 4.61it/s]2025-05-26 02:15:07,819 - INFO - [Epoch 037 | Batch 0100] IWAE-loss 1828.0680 | mean log_px -0.0090 | KL -1395.64 + 101it [00:21, 4.61it/s] 102it [00:22, 4.58it/s] 103it [00:22, 4.45it/s] 104it [00:22, 4.50it/s] 105it [00:22, 4.54it/s] 106it [00:23, 4.55it/s] 107it [00:23, 4.59it/s] 108it [00:23, 4.61it/s] 109it [00:23, 4.46it/s] 110it [00:23, 4.49it/s] 111it [00:24, 4.45it/s] 112it [00:24, 4.49it/s] 113it [00:24, 4.53it/s] 114it [00:24, 4.56it/s] 115it [00:25, 4.57it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.61it/s] 118it [00:25, 4.60it/s] 119it [00:25, 4.60it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.61it/s] 122it [00:26, 4.62it/s] 123it [00:26, 4.63it/s] 124it [00:26, 4.62it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.62it/s] 128it [00:27, 4.62it/s] 129it [00:28, 4.63it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.63it/s] 132it [00:28, 4.63it/s] 133it [00:28, 4.63it/s] 134it [00:29, 4.48it/s] 135it [00:29, 4.54it/s] 136it [00:29, 4.56it/s] 137it [00:29, 4.59it/s] 138it [00:30, 4.60it/s] 139it [00:30, 4.61it/s] 140it [00:30, 4.47it/s] 141it [00:30, 4.54it/s] 142it [00:30, 4.56it/s] 143it [00:31, 4.56it/s] 144it [00:31, 4.59it/s] 145it [00:31, 4.61it/s] 146it [00:31, 4.47it/s] 147it [00:32, 4.51it/s] 148it [00:32, 4.54it/s] 149it [00:32, 4.57it/s] 150it [00:32, 4.58it/s]2025-05-26 02:15:18,766 - INFO - [Epoch 037 | Batch 0150] IWAE-loss 2035.0342 | mean log_px -0.0140 | KL -1391.93 + 151it [00:32, 4.59it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.60it/s] 154it [00:33, 4.61it/s] 155it [00:33, 4.60it/s] 156it [00:34, 4.36it/s] 157it [00:34, 4.41it/s] 158it [00:34, 4.43it/s] 159it [00:34, 4.46it/s] 160it [00:34, 4.47it/s] 161it [00:35, 4.47it/s] 162it [00:35, 4.50it/s] 163it [00:35, 4.50it/s] 164it [00:35, 4.54it/s] 165it [00:36, 4.56it/s] 166it [00:36, 4.43it/s] 167it [00:36, 4.51it/s] 168it [00:36, 4.53it/s] 169it [00:36, 4.56it/s] 170it [00:37, 4.58it/s] 171it [00:37, 4.59it/s] 172it [00:37, 4.48it/s] 173it [00:37, 4.53it/s] 174it [00:37, 4.56it/s] 175it [00:38, 4.56it/s] 176it [00:38, 4.57it/s] 177it [00:38, 4.60it/s] 178it [00:38, 4.47it/s] 179it [00:39, 4.52it/s] 180it [00:39, 4.56it/s] 181it [00:39, 4.58it/s] 182it [00:39, 4.59it/s] 183it [00:39, 4.61it/s] 184it [00:40, 4.62it/s] 185it [00:40, 4.64it/s] 186it [00:40, 4.62it/s] 187it [00:40, 4.63it/s] 188it [00:41, 4.63it/s] 189it [00:41, 4.63it/s] 190it [00:41, 4.63it/s] 191it [00:41, 4.64it/s] 192it [00:41, 4.63it/s] 193it [00:42, 4.63it/s] 194it [00:42, 4.62it/s] 195it [00:42, 4.49it/s] 196it [00:42, 4.55it/s] 196it [00:42, 4.58it/s] +2025-05-26 02:15:28,764 - INFO - Epoch: 37, Objective: tensor([1723.5656], device='cuda:0', grad_fn=), Loss: 0.004755986854434013, KL/n: 28.372997283935547 + 0it [00:00, ?it/s]2025-05-26 02:15:29,320 - INFO - [Epoch 038 | Batch 0000] IWAE-loss 1650.8577 | mean log_px -0.0084 | KL -1389.24 + 1it [00:00, 3.33it/s] 2it [00:00, 4.01it/s] 3it [00:00, 4.29it/s] 4it [00:00, 4.43it/s] 5it [00:01, 4.50it/s] 6it [00:01, 4.56it/s] 7it [00:01, 4.60it/s] 8it [00:01, 4.44it/s] 9it [00:02, 4.52it/s] 10it [00:02, 4.55it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.59it/s] 13it [00:02, 4.62it/s] 14it [00:03, 4.60it/s] 15it [00:03, 4.58it/s] 16it [00:03, 4.60it/s] 17it [00:03, 4.62it/s] 18it [00:03, 4.61it/s] 19it [00:04, 4.64it/s] 20it [00:04, 4.56it/s] 21it [00:04, 4.60it/s] 22it [00:04, 4.62it/s] 23it [00:05, 4.65it/s] 24it [00:05, 4.65it/s] 25it [00:05, 4.53it/s] 26it [00:05, 4.59it/s] 27it [00:05, 4.62it/s] 28it [00:06, 4.62it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.65it/s] 31it [00:06, 4.67it/s] 32it [00:07, 4.67it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.68it/s] 35it [00:07, 4.68it/s] 36it [00:07, 4.68it/s] 37it [00:08, 4.68it/s] 38it [00:08, 4.68it/s] 39it [00:08, 4.69it/s] 40it [00:08, 4.69it/s] 41it [00:08, 4.68it/s] 42it [00:09, 4.68it/s] 43it [00:09, 4.45it/s] 44it [00:09, 4.52it/s] 45it [00:09, 4.57it/s] 46it [00:10, 4.57it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.56it/s] 49it [00:10, 4.48it/s] 50it [00:10, 4.54it/s]2025-05-26 02:15:40,162 - INFO - [Epoch 038 | Batch 0050] IWAE-loss 1416.7461 | mean log_px -0.0029 | KL -1381.36 + 51it [00:11, 4.56it/s] 52it [00:11, 4.57it/s] 53it [00:11, 4.57it/s] 54it [00:11, 4.39it/s] 55it [00:12, 4.46it/s] 56it [00:12, 4.47it/s] 57it [00:12, 4.49it/s] 58it [00:12, 4.49it/s] 59it [00:12, 4.50it/s] 60it [00:13, 4.50it/s] 61it [00:13, 4.38it/s] 62it [00:13, 4.46it/s] 63it [00:13, 4.51it/s] 64it [00:14, 4.52it/s] 65it [00:14, 4.54it/s] 66it [00:14, 4.56it/s] 67it [00:14, 4.44it/s] 68it [00:14, 4.49it/s] 69it [00:15, 4.50it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.56it/s] 72it [00:15, 4.57it/s] 73it [00:16, 4.58it/s] 74it [00:16, 4.45it/s] 75it [00:16, 4.50it/s] 76it [00:16, 4.52it/s] 77it [00:16, 4.56it/s] 78it [00:17, 4.55it/s] 79it [00:17, 4.56it/s] 80it [00:17, 4.56it/s] 81it [00:17, 4.43it/s] 82it [00:18, 4.45it/s] 83it [00:18, 4.48it/s] 84it [00:18, 4.50it/s] 85it [00:18, 4.54it/s] 86it [00:18, 4.56it/s] 87it [00:19, 4.57it/s] 88it [00:19, 4.45it/s] 89it [00:19, 4.50it/s] 90it [00:19, 4.49it/s] 91it [00:20, 4.54it/s] 92it [00:20, 4.54it/s] 93it [00:20, 4.56it/s] 94it [00:20, 4.56it/s] 95it [00:20, 4.47it/s] 96it [00:21, 4.52it/s] 97it [00:21, 4.45it/s] 98it [00:21, 4.49it/s] 99it [00:21, 4.51it/s] 100it [00:22, 4.49it/s]2025-05-26 02:15:51,271 - INFO - [Epoch 038 | Batch 0100] IWAE-loss 1494.8090 | mean log_px -0.0030 | KL -1374.98 + 101it [00:22, 4.45it/s] 102it [00:22, 4.34it/s] 103it [00:22, 4.38it/s] 104it [00:22, 4.42it/s] 105it [00:23, 4.44it/s] 106it [00:23, 4.45it/s] 107it [00:23, 4.49it/s] 108it [00:23, 4.52it/s] 109it [00:24, 4.39it/s] 110it [00:24, 4.43it/s] 111it [00:24, 4.48it/s] 112it [00:24, 4.50it/s] 113it [00:24, 4.53it/s] 114it [00:25, 4.49it/s] 115it [00:25, 4.48it/s] 116it [00:25, 4.39it/s] 117it [00:25, 4.46it/s] 118it [00:26, 4.46it/s] 119it [00:26, 4.52it/s] 120it [00:26, 4.47it/s] 121it [00:26, 4.53it/s] 122it [00:26, 4.55it/s] 123it [00:27, 4.44it/s] 124it [00:27, 4.48it/s] 125it [00:27, 4.52it/s] 126it [00:27, 4.55it/s] 127it [00:28, 4.57it/s] 128it [00:28, 4.57it/s] 129it [00:28, 4.44it/s] 130it [00:28, 4.49it/s] 131it [00:28, 4.50it/s] 132it [00:29, 4.45it/s] 133it [00:29, 4.51it/s] 134it [00:29, 4.52it/s] 135it [00:29, 4.42it/s] 136it [00:30, 4.48it/s] 137it [00:30, 4.51it/s] 138it [00:30, 4.52it/s] 139it [00:30, 4.55it/s] 140it [00:30, 4.57it/s] 141it [00:31, 4.45it/s] 142it [00:31, 4.49it/s] 143it [00:31, 4.52it/s] 144it [00:31, 4.48it/s] 145it [00:32, 4.52it/s] 146it [00:32, 4.54it/s] 147it [00:32, 4.56it/s] 148it [00:32, 4.43it/s] 149it [00:32, 4.50it/s] 150it [00:33, 4.45it/s]2025-05-26 02:16:02,418 - INFO - [Epoch 038 | Batch 0150] IWAE-loss 2008.2279 | mean log_px -0.0121 | KL -1368.49 + 151it [00:33, 4.50it/s] 152it [00:33, 4.46it/s] 153it [00:33, 4.51it/s] 154it [00:34, 4.39it/s] 155it [00:34, 4.44it/s] 156it [00:34, 4.44it/s] 157it [00:34, 4.51it/s] 158it [00:34, 4.53it/s] 159it [00:35, 4.55it/s] 160it [00:35, 4.44it/s] 161it [00:35, 4.49it/s] 162it [00:35, 4.52it/s] 163it [00:36, 4.50it/s] 164it [00:36, 4.51it/s] 165it [00:36, 4.52it/s] 166it [00:36, 4.36it/s] 167it [00:36, 4.43it/s] 168it [00:37, 4.49it/s] 169it [00:37, 4.50it/s] 170it [00:37, 4.37it/s] 171it [00:37, 4.42it/s] 172it [00:38, 4.43it/s] 173it [00:38, 4.48it/s] 174it [00:38, 4.48it/s] 175it [00:38, 4.52it/s] 176it [00:38, 4.53it/s] 177it [00:39, 4.56it/s] 178it [00:39, 4.54it/s] 179it [00:39, 4.56it/s] 180it [00:39, 4.55it/s] 181it [00:40, 4.59it/s] 182it [00:40, 4.59it/s] 183it [00:40, 4.60it/s] 184it [00:40, 4.46it/s] 185it [00:40, 4.43it/s] 186it [00:41, 4.43it/s] 187it [00:41, 4.48it/s] 188it [00:41, 4.50it/s] 189it [00:41, 4.51it/s] 190it [00:42, 4.54it/s] 191it [00:42, 4.53it/s] 192it [00:42, 4.53it/s] 193it [00:42, 4.45it/s] 194it [00:42, 4.48it/s] 195it [00:43, 4.40it/s] 196it [00:43, 4.46it/s] 196it [00:43, 4.51it/s] +2025-05-26 02:16:12,579 - INFO - Epoch: 38, Objective: tensor([1541.9781], device='cuda:0', grad_fn=), Loss: 0.006994233466684818, KL/n: 27.92793846130371 + 0it [00:00, ?it/s]2025-05-26 02:16:12,975 - INFO - [Epoch 039 | Batch 0000] IWAE-loss 2019.2355 | mean log_px -0.0157 | KL -1369.24 + 1it [00:00, 3.11it/s] 2it [00:00, 3.47it/s] 3it [00:00, 3.90it/s] 4it [00:01, 4.13it/s] 5it [00:01, 4.27it/s] 6it [00:01, 4.28it/s] 7it [00:01, 4.34it/s] 8it [00:01, 4.14it/s] 9it [00:02, 4.27it/s] 10it [00:02, 4.19it/s] 11it [00:02, 3.47it/s] 12it [00:03, 3.68it/s] 13it [00:03, 3.83it/s] 14it [00:03, 3.84it/s] 15it [00:03, 4.00it/s] 16it [00:04, 4.04it/s] 17it [00:04, 4.08it/s] 18it [00:04, 4.10it/s] 19it [00:04, 4.24it/s] 20it [00:04, 4.20it/s] 21it [00:05, 4.18it/s] 22it [00:05, 4.08it/s] 23it [00:05, 4.22it/s] 24it [00:05, 4.17it/s] 25it [00:06, 4.22it/s] 26it [00:06, 4.25it/s] 27it [00:06, 4.32it/s] 28it [00:06, 4.26it/s] 29it [00:07, 4.35it/s] 30it [00:07, 4.41it/s] 31it [00:07, 4.44it/s] 32it [00:07, 4.44it/s] 33it [00:07, 4.50it/s] 34it [00:08, 4.31it/s] 35it [00:08, 4.40it/s] 36it [00:08, 4.29it/s] 37it [00:08, 4.30it/s] 38it [00:09, 4.26it/s] 39it [00:09, 4.27it/s] 40it [00:09, 4.14it/s] 41it [00:09, 4.11it/s] 42it [00:10, 4.07it/s] 43it [00:10, 4.06it/s] 44it [00:10, 4.08it/s] 45it [00:10, 3.98it/s] 46it [00:11, 4.11it/s] 47it [00:11, 4.00it/s] 48it [00:11, 3.91it/s] 49it [00:11, 3.97it/s] 50it [00:12, 4.03it/s]2025-05-26 02:16:25,021 - INFO - [Epoch 039 | Batch 0050] IWAE-loss 1660.3208 | mean log_px -0.0043 | KL -1355.90 + 51it [00:12, 4.15it/s] 52it [00:12, 4.23it/s] 53it [00:12, 4.21it/s] 54it [00:13, 4.34it/s] 55it [00:13, 4.33it/s] 56it [00:13, 4.31it/s] 57it [00:13, 4.38it/s] 58it [00:13, 4.45it/s] 59it [00:14, 4.38it/s] 60it [00:14, 4.31it/s] 61it [00:14, 4.28it/s] 62it [00:14, 4.18it/s] 63it [00:15, 4.31it/s] 64it [00:15, 4.32it/s] 65it [00:15, 4.31it/s] 66it [00:15, 4.32it/s] 67it [00:16, 4.35it/s] 68it [00:16, 4.29it/s] 69it [00:16, 4.24it/s] 70it [00:16, 4.34it/s] 71it [00:16, 4.43it/s] 72it [00:17, 4.43it/s] 73it [00:17, 4.45it/s] 74it [00:17, 4.41it/s] 75it [00:17, 4.40it/s] 76it [00:18, 4.32it/s] 77it [00:18, 4.30it/s] 78it [00:18, 4.27it/s] 79it [00:18, 4.30it/s] 80it [00:19, 4.41it/s] 81it [00:19, 4.35it/s] 82it [00:19, 4.30it/s] 83it [00:19, 4.26it/s] 84it [00:19, 4.37it/s] 85it [00:20, 4.45it/s] 86it [00:20, 4.47it/s] 87it [00:20, 4.38it/s] 88it [00:20, 4.35it/s] 89it [00:21, 4.41it/s] 90it [00:21, 4.37it/s] 91it [00:21, 4.32it/s] 92it [00:21, 4.26it/s] 93it [00:22, 4.29it/s] 94it [00:22, 4.24it/s] 95it [00:22, 4.25it/s] 96it [00:22, 4.22it/s] 97it [00:23, 4.09it/s] 98it [00:23, 4.11it/s] 99it [00:23, 4.22it/s] 100it [00:23, 4.18it/s]2025-05-26 02:16:36,590 - INFO - [Epoch 039 | Batch 0100] IWAE-loss 2246.3765 | mean log_px -0.0212 | KL -1355.14 + 101it [00:23, 4.31it/s] 102it [00:24, 4.39it/s] 103it [00:24, 4.33it/s] 104it [00:24, 4.37it/s] 105it [00:24, 4.41it/s] 106it [00:25, 4.37it/s] 107it [00:25, 4.44it/s] 108it [00:25, 4.35it/s] 109it [00:25, 4.32it/s] 110it [00:26, 4.20it/s] 111it [00:26, 4.19it/s] 112it [00:26, 4.32it/s] 113it [00:26, 4.28it/s] 114it [00:26, 4.36it/s] 115it [00:27, 4.34it/s] 116it [00:27, 4.29it/s] 117it [00:27, 4.28it/s] 118it [00:27, 4.25it/s] 119it [00:28, 4.25it/s] 120it [00:28, 4.21it/s] 121it [00:28, 4.30it/s] 122it [00:28, 4.40it/s] 123it [00:29, 4.47it/s] 124it [00:29, 4.36it/s] 125it [00:29, 4.32it/s] 126it [00:29, 4.28it/s] 127it [00:29, 4.29it/s] 128it [00:30, 4.36it/s] 129it [00:30, 4.44it/s] 130it [00:30, 4.33it/s] 131it [00:30, 4.30it/s] 132it [00:31, 4.28it/s] 133it [00:31, 4.39it/s] 134it [00:31, 4.24it/s] 135it [00:31, 4.33it/s] 136it [00:32, 4.39it/s] 137it [00:32, 4.46it/s] 138it [00:32, 4.44it/s] 139it [00:32, 4.51it/s] 140it [00:32, 4.25it/s] 141it [00:33, 4.34it/s] 142it [00:33, 4.28it/s] 143it [00:33, 4.25it/s] 144it [00:33, 4.23it/s] 145it [00:34, 4.34it/s] 146it [00:34, 4.30it/s] 147it [00:34, 4.37it/s] 148it [00:34, 4.34it/s] 149it [00:35, 4.30it/s] 150it [00:35, 4.37it/s]2025-05-26 02:16:48,117 - INFO - [Epoch 039 | Batch 0150] IWAE-loss 1432.8291 | mean log_px -0.0022 | KL -1358.02 + 151it [00:35, 4.44it/s] 152it [00:35, 4.18it/s] 153it [00:35, 4.19it/s] 154it [00:36, 4.29it/s] 155it [00:36, 4.38it/s] 156it [00:36, 4.28it/s] 157it [00:36, 4.24it/s] 158it [00:37, 4.32it/s] 159it [00:37, 4.30it/s] 160it [00:37, 4.28it/s] 161it [00:37, 4.28it/s] 162it [00:38, 4.17it/s] 163it [00:38, 4.24it/s] 164it [00:38, 4.28it/s] 165it [00:38, 4.25it/s] 166it [00:39, 4.22it/s] 167it [00:39, 4.34it/s] 168it [00:39, 4.40it/s] 169it [00:39, 4.33it/s] 170it [00:39, 4.24it/s] 171it [00:40, 4.31it/s] 172it [00:40, 4.38it/s] 173it [00:40, 4.45it/s] 174it [00:40, 4.50it/s] 175it [00:41, 4.50it/s] 176it [00:41, 4.39it/s] 177it [00:41, 4.36it/s] 178it [00:41, 4.41it/s] 179it [00:41, 4.47it/s] 180it [00:42, 4.33it/s] 181it [00:42, 4.29it/s] 182it [00:42, 4.24it/s] 183it [00:42, 4.26it/s] 184it [00:43, 4.37it/s] 185it [00:43, 4.39it/s] 186it [00:43, 4.33it/s] 187it [00:43, 4.31it/s] 188it [00:44, 4.37it/s] 189it [00:44, 4.44it/s] 190it [00:44, 4.46it/s] 191it [00:44, 4.40it/s] 192it [00:44, 4.46it/s] 193it [00:45, 4.44it/s] 194it [00:45, 4.38it/s] 195it [00:45, 4.34it/s] 196it [00:45, 4.41it/s] 196it [00:45, 4.27it/s] +2025-05-26 02:16:58,629 - INFO - Epoch: 39, Objective: tensor([1496.1766], device='cuda:0', grad_fn=), Loss: 0.00248352880589664, KL/n: 27.671977996826172 + 0it [00:00, ?it/s]2025-05-26 02:16:58,997 - INFO - [Epoch 040 | Batch 0000] IWAE-loss 1431.6737 | mean log_px -0.0017 | KL -1354.64 + 1it [00:00, 3.10it/s] 2it [00:00, 3.89it/s] 3it [00:00, 4.21it/s] 4it [00:00, 4.37it/s] 5it [00:01, 4.47it/s] 6it [00:01, 4.54it/s] 7it [00:01, 4.43it/s] 8it [00:01, 4.51it/s] 9it [00:02, 4.55it/s] 10it [00:02, 4.57it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.58it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.61it/s] 15it [00:03, 4.62it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.64it/s] 18it [00:04, 4.63it/s] 19it [00:04, 4.63it/s] 20it [00:04, 4.64it/s] 21it [00:04, 4.65it/s] 22it [00:04, 4.49it/s] 23it [00:05, 4.54it/s] 24it [00:05, 4.52it/s] 25it [00:05, 4.56it/s] 26it [00:05, 4.59it/s] 27it [00:05, 4.62it/s] 28it [00:06, 4.45it/s] 29it [00:06, 4.51it/s] 30it [00:06, 4.53it/s] 31it [00:06, 4.55it/s] 32it [00:07, 4.59it/s] 33it [00:07, 4.61it/s] 34it [00:07, 4.61it/s] 35it [00:07, 4.62it/s] 36it [00:07, 4.63it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.63it/s] 39it [00:08, 4.65it/s] 40it [00:08, 4.65it/s] 41it [00:09, 4.67it/s] 42it [00:09, 4.65it/s] 43it [00:09, 4.50it/s] 44it [00:09, 4.55it/s] 45it [00:09, 4.59it/s] 46it [00:10, 4.59it/s] 47it [00:10, 4.60it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.61it/s] 50it [00:10, 4.62it/s]2025-05-26 02:17:09,897 - INFO - [Epoch 040 | Batch 0050] IWAE-loss 1473.0669 | mean log_px -0.0033 | KL -1345.21 + 51it [00:11, 4.60it/s] 52it [00:11, 4.62it/s] 53it [00:11, 4.62it/s] 54it [00:11, 4.62it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.63it/s] 57it [00:12, 4.50it/s] 58it [00:12, 4.56it/s] 59it [00:12, 4.59it/s] 60it [00:13, 4.60it/s] 61it [00:13, 4.62it/s] 62it [00:13, 4.62it/s] 63it [00:13, 4.63it/s] 64it [00:14, 4.63it/s] 65it [00:14, 4.64it/s] 66it [00:14, 4.64it/s] 67it [00:14, 4.65it/s] 68it [00:14, 4.63it/s] 69it [00:15, 4.65it/s] 70it [00:15, 4.63it/s] 71it [00:15, 4.64it/s] 72it [00:15, 4.63it/s] 73it [00:15, 4.61it/s] 74it [00:16, 4.61it/s] 75it [00:16, 4.63it/s] 76it [00:16, 4.61it/s] 77it [00:16, 4.61it/s] 78it [00:17, 4.47it/s] 79it [00:17, 4.52it/s] 80it [00:17, 4.55it/s] 81it [00:17, 4.57it/s] 82it [00:17, 4.59it/s] 83it [00:18, 4.59it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.61it/s] 86it [00:18, 4.62it/s] 87it [00:19, 4.63it/s] 88it [00:19, 4.62it/s] 89it [00:19, 4.47it/s] 90it [00:19, 4.51it/s] 91it [00:19, 4.52it/s] 92it [00:20, 4.52it/s] 93it [00:20, 4.53it/s] 94it [00:20, 4.50it/s] 95it [00:20, 4.50it/s] 96it [00:21, 4.50it/s] 97it [00:21, 4.51it/s] 98it [00:21, 4.54it/s] 99it [00:21, 4.55it/s] 100it [00:21, 4.51it/s]2025-05-26 02:17:20,822 - INFO - [Epoch 040 | Batch 0100] IWAE-loss 1605.0006 | mean log_px -0.0037 | KL -1343.43 + 101it [00:22, 4.50it/s] 102it [00:22, 4.38it/s] 103it [00:22, 4.45it/s] 104it [00:22, 4.49it/s] 105it [00:23, 4.52it/s] 106it [00:23, 4.54it/s] 107it [00:23, 4.57it/s] 108it [00:23, 4.58it/s] 109it [00:23, 4.45it/s] 110it [00:24, 4.49it/s] 111it [00:24, 4.53it/s] 112it [00:24, 4.55it/s] 113it [00:24, 4.57it/s] 114it [00:25, 4.41it/s] 115it [00:25, 4.47it/s] 116it [00:25, 4.51it/s] 117it [00:25, 4.55it/s] 118it [00:25, 4.56it/s] 119it [00:26, 4.58it/s] 120it [00:26, 4.58it/s] 121it [00:26, 4.42it/s] 122it [00:26, 4.44it/s] 123it [00:27, 4.47it/s] 124it [00:27, 4.51it/s] 125it [00:27, 4.53it/s] 126it [00:27, 4.55it/s] 127it [00:27, 4.59it/s] 128it [00:28, 4.59it/s] 129it [00:28, 4.59it/s] 130it [00:28, 4.59it/s] 131it [00:28, 4.46it/s] 132it [00:28, 4.52it/s] 133it [00:29, 4.55it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.59it/s] 136it [00:29, 4.60it/s] 137it [00:30, 4.61it/s] 138it [00:30, 4.61it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.61it/s] 141it [00:30, 4.62it/s] 142it [00:31, 4.62it/s] 143it [00:31, 4.61it/s] 144it [00:31, 4.62it/s] 145it [00:31, 4.62it/s] 146it [00:32, 4.62it/s] 147it [00:32, 4.63it/s] 148it [00:32, 4.62it/s] 149it [00:32, 4.63it/s] 150it [00:32, 4.50it/s]2025-05-26 02:17:31,813 - INFO - [Epoch 040 | Batch 0150] IWAE-loss 1694.4125 | mean log_px -0.0137 | KL -1343.96 + 151it [00:33, 4.54it/s] 152it [00:33, 4.55it/s] 153it [00:33, 4.59it/s] 154it [00:33, 4.59it/s] 155it [00:33, 4.60it/s] 156it [00:34, 4.60it/s] 157it [00:34, 4.62it/s] 158it [00:34, 4.63it/s] 159it [00:34, 4.62it/s] 160it [00:35, 4.64it/s] 161it [00:35, 4.64it/s] 162it [00:35, 4.63it/s] 163it [00:35, 4.65it/s] 164it [00:35, 4.63it/s] 165it [00:36, 4.64it/s] 166it [00:36, 4.49it/s] 167it [00:36, 4.54it/s] 168it [00:36, 4.56it/s] 169it [00:37, 4.58it/s] 170it [00:37, 4.59it/s] 171it [00:37, 4.44it/s] 172it [00:37, 4.48it/s] 173it [00:37, 4.53it/s] 174it [00:38, 4.54it/s] 175it [00:38, 4.56it/s] 176it [00:38, 4.56it/s] 177it [00:38, 4.57it/s] 178it [00:39, 4.44it/s] 179it [00:39, 4.51it/s] 180it [00:39, 4.54it/s] 181it [00:39, 4.51it/s] 182it [00:39, 4.56it/s] 183it [00:40, 4.57it/s] 184it [00:40, 4.60it/s] 185it [00:40, 4.61it/s] 186it [00:40, 4.58it/s] 187it [00:40, 4.56it/s] 188it [00:41, 4.44it/s] 189it [00:41, 4.50it/s] 190it [00:41, 4.52it/s] 191it [00:41, 4.55it/s] 192it [00:42, 4.57it/s] 193it [00:42, 4.58it/s] 194it [00:42, 4.59it/s] 195it [00:42, 4.33it/s] 196it [00:43, 4.43it/s] 196it [00:43, 4.55it/s] +2025-05-26 02:17:41,833 - INFO - Epoch: 40, Objective: tensor([1448.3232], device='cuda:0', grad_fn=), Loss: 0.0037635706830769777, KL/n: 27.25246238708496 + 0it [00:00, ?it/s]2025-05-26 02:17:42,407 - INFO - [Epoch 041 | Batch 0000] IWAE-loss 1551.8910 | mean log_px -0.0058 | KL -1334.23 + 1it [00:00, 3.10it/s] 2it [00:00, 3.70it/s] 3it [00:00, 3.92it/s] 4it [00:01, 4.12it/s] 5it [00:01, 4.13it/s] 6it [00:01, 4.26it/s] 7it [00:01, 4.27it/s] 8it [00:01, 4.12it/s] 9it [00:02, 4.14it/s] 10it [00:02, 4.17it/s] 11it [00:02, 4.17it/s] 12it [00:02, 4.18it/s] 13it [00:03, 4.19it/s] 14it [00:03, 4.16it/s] 15it [00:03, 4.23it/s] 16it [00:03, 4.18it/s] 17it [00:04, 4.31it/s] 18it [00:04, 4.40it/s] 19it [00:04, 4.40it/s] 20it [00:04, 4.46it/s] 21it [00:05, 4.35it/s] 22it [00:05, 4.41it/s] 23it [00:05, 4.37it/s] 24it [00:05, 4.17it/s] 25it [00:05, 4.17it/s] 26it [00:06, 4.27it/s] 27it [00:06, 4.36it/s] 28it [00:06, 4.30it/s] 29it [00:06, 4.27it/s] 30it [00:07, 4.24it/s] 31it [00:07, 4.35it/s] 32it [00:07, 4.40it/s] 33it [00:07, 4.30it/s] 34it [00:08, 4.31it/s] 35it [00:08, 4.37it/s] 36it [00:08, 4.36it/s] 37it [00:08, 4.37it/s] 38it [00:08, 4.36it/s] 39it [00:09, 4.30it/s] 40it [00:09, 4.28it/s] 41it [00:09, 4.13it/s] 42it [00:09, 4.15it/s] 43it [00:10, 4.21it/s] 44it [00:10, 4.20it/s] 45it [00:10, 4.24it/s] 46it [00:10, 4.21it/s] 47it [00:11, 4.27it/s] 48it [00:11, 4.35it/s] 49it [00:11, 4.20it/s] 50it [00:11, 4.18it/s]2025-05-26 02:17:54,126 - INFO - [Epoch 041 | Batch 0050] IWAE-loss 1382.9540 | mean log_px -0.0018 | KL -1326.47 + 51it [00:12, 4.17it/s] 52it [00:12, 4.17it/s] 53it [00:12, 4.15it/s] 54it [00:12, 4.13it/s] 55it [00:13, 4.15it/s] 56it [00:13, 4.14it/s] 57it [00:13, 4.14it/s] 58it [00:13, 3.94it/s] 59it [00:14, 4.01it/s] 60it [00:14, 4.00it/s] 61it [00:14, 4.13it/s] 62it [00:14, 4.05it/s] 63it [00:14, 4.08it/s] 64it [00:15, 4.15it/s] 65it [00:15, 4.28it/s] 66it [00:15, 4.23it/s] 67it [00:15, 4.11it/s] 68it [00:16, 4.26it/s] 69it [00:16, 4.38it/s] 70it [00:16, 4.30it/s] 71it [00:16, 4.39it/s] 72it [00:17, 4.44it/s] 73it [00:17, 4.36it/s] 74it [00:17, 4.28it/s] 75it [00:17, 4.26it/s] 76it [00:17, 4.33it/s] 77it [00:18, 4.40it/s] 78it [00:18, 4.29it/s] 79it [00:18, 4.15it/s] 80it [00:18, 4.23it/s] 81it [00:19, 4.22it/s] 82it [00:19, 4.21it/s] 83it [00:19, 4.34it/s] 84it [00:19, 4.25it/s] 85it [00:20, 4.37it/s] 86it [00:20, 4.27it/s] 87it [00:20, 4.26it/s] 88it [00:20, 4.21it/s] 89it [00:21, 4.33it/s] 90it [00:21, 4.27it/s] 91it [00:21, 4.22it/s] 92it [00:21, 4.22it/s] 93it [00:21, 4.34it/s] 94it [00:22, 4.39it/s] 95it [00:22, 4.32it/s] 96it [00:22, 4.29it/s] 97it [00:22, 4.33it/s] 98it [00:23, 4.33it/s] 99it [00:23, 4.27it/s] 100it [00:23, 4.24it/s]2025-05-26 02:18:05,924 - INFO - [Epoch 041 | Batch 0100] IWAE-loss 1411.5579 | mean log_px -0.0019 | KL -1321.44 + 101it [00:23, 4.12it/s] 102it [00:24, 4.14it/s] 103it [00:24, 4.24it/s] 104it [00:24, 4.20it/s] 105it [00:24, 4.21it/s] 106it [00:25, 4.20it/s] 107it [00:25, 4.07it/s] 108it [00:25, 4.20it/s] 109it [00:25, 4.31it/s] 110it [00:25, 4.38it/s] 111it [00:26, 4.44it/s] 112it [00:26, 4.26it/s] 113it [00:26, 4.25it/s] 114it [00:26, 4.31it/s] 115it [00:27, 4.34it/s] 116it [00:27, 4.42it/s] 117it [00:27, 4.46it/s] 118it [00:27, 4.37it/s] 119it [00:28, 4.39it/s] 120it [00:28, 4.42it/s] 121it [00:28, 4.41it/s] 122it [00:28, 4.39it/s] 123it [00:28, 4.21it/s] 124it [00:29, 4.23it/s] 125it [00:29, 4.20it/s] 126it [00:29, 4.17it/s] 127it [00:29, 4.13it/s] 128it [00:30, 4.22it/s] 129it [00:30, 4.32it/s] 130it [00:30, 4.15it/s] 131it [00:30, 4.27it/s] 132it [00:31, 4.30it/s] 133it [00:31, 4.29it/s] 134it [00:31, 4.37it/s] 135it [00:31, 4.34it/s] 136it [00:32, 4.29it/s] 137it [00:32, 4.38it/s] 138it [00:32, 4.38it/s] 139it [00:32, 4.32it/s] 140it [00:32, 4.27it/s] 141it [00:33, 4.27it/s] 142it [00:33, 4.34it/s] 143it [00:33, 4.41it/s] 144it [00:33, 4.31it/s] 145it [00:34, 4.41it/s] 146it [00:34, 4.37it/s] 147it [00:34, 4.34it/s] 148it [00:34, 4.27it/s] 149it [00:35, 4.33it/s] 150it [00:35, 4.28it/s]2025-05-26 02:18:17,572 - INFO - [Epoch 041 | Batch 0150] IWAE-loss 1899.3881 | mean log_px -0.0105 | KL -1315.73 + 151it [00:35, 4.25it/s] 152it [00:35, 4.26it/s] 153it [00:35, 4.13it/s] 154it [00:36, 4.14it/s] 155it [00:36, 4.21it/s] 156it [00:36, 4.21it/s] 157it [00:36, 4.21it/s] 158it [00:37, 4.21it/s] 159it [00:37, 4.32it/s] 160it [00:37, 4.43it/s] 161it [00:37, 4.48it/s] 162it [00:38, 4.27it/s] 163it [00:38, 4.39it/s] 164it [00:38, 4.43it/s] 165it [00:38, 4.47it/s] 166it [00:38, 4.37it/s] 167it [00:39, 4.34it/s] 168it [00:39, 4.32it/s] 169it [00:39, 4.42it/s] 170it [00:39, 4.21it/s] 171it [00:40, 4.29it/s] 172it [00:40, 4.39it/s] 173it [00:40, 4.35it/s] 174it [00:40, 4.30it/s] 175it [00:41, 4.30it/s] 176it [00:41, 4.26it/s] 177it [00:41, 4.34it/s] 178it [00:41, 4.27it/s] 179it [00:41, 4.27it/s] 180it [00:42, 4.36it/s] 181it [00:42, 4.42it/s] 182it [00:42, 4.48it/s] 183it [00:42, 4.43it/s] 184it [00:43, 4.50it/s] 185it [00:43, 4.40it/s] 186it [00:43, 4.19it/s] 187it [00:43, 4.19it/s] 188it [00:44, 4.16it/s] 189it [00:44, 4.27it/s] 190it [00:44, 4.31it/s] 191it [00:44, 4.27it/s] 192it [00:44, 4.26it/s] 193it [00:45, 4.23it/s] 194it [00:45, 4.33it/s] 195it [00:45, 4.29it/s] 196it [00:45, 4.35it/s] 196it [00:45, 4.26it/s] +2025-05-26 02:18:28,139 - INFO - Epoch: 41, Objective: tensor([1496.4008], device='cuda:0', grad_fn=), Loss: 0.004434915725141764, KL/n: 26.789295196533203 + 0it [00:00, ?it/s]2025-05-26 02:18:28,524 - INFO - [Epoch 042 | Batch 0000] IWAE-loss 1575.5166 | mean log_px -0.0100 | KL -1312.57 + 1it [00:00, 3.29it/s] 2it [00:00, 3.94it/s] 3it [00:00, 4.21it/s] 4it [00:00, 4.35it/s] 5it [00:01, 4.27it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.45it/s] 8it [00:01, 4.33it/s] 9it [00:02, 4.44it/s] 10it [00:02, 3.57it/s] 11it [00:02, 3.84it/s] 12it [00:02, 4.04it/s] 13it [00:03, 4.20it/s] 14it [00:03, 4.31it/s] 15it [00:03, 4.41it/s] 16it [00:03, 4.47it/s] 17it [00:04, 4.52it/s] 18it [00:04, 4.57it/s] 19it [00:04, 4.59it/s] 20it [00:04, 4.60it/s] 21it [00:04, 4.50it/s] 22it [00:05, 4.49it/s] 23it [00:05, 4.56it/s] 24it [00:05, 4.56it/s] 25it [00:05, 4.42it/s] 26it [00:06, 4.43it/s] 27it [00:06, 4.51it/s] 28it [00:06, 4.56it/s] 29it [00:06, 4.61it/s] 30it [00:06, 4.63it/s] 31it [00:07, 4.64it/s] 32it [00:07, 4.62it/s] 33it [00:07, 4.64it/s] 34it [00:07, 4.65it/s] 35it [00:07, 4.66it/s] 36it [00:08, 4.65it/s] 37it [00:08, 4.66it/s] 38it [00:08, 4.49it/s] 39it [00:08, 4.56it/s] 40it [00:09, 4.58it/s] 41it [00:09, 4.59it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.62it/s] 44it [00:09, 4.48it/s] 45it [00:10, 4.55it/s] 46it [00:10, 4.57it/s] 47it [00:10, 4.61it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.64it/s] 50it [00:11, 4.65it/s]2025-05-26 02:18:39,640 - INFO - [Epoch 042 | Batch 0050] IWAE-loss 1876.5878 | mean log_px -0.0155 | KL -1306.35 + 51it [00:11, 4.66it/s] 52it [00:11, 4.65it/s] 53it [00:11, 4.66it/s] 54it [00:12, 4.66it/s] 55it [00:12, 4.67it/s] 56it [00:12, 4.64it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.65it/s] 59it [00:13, 4.65it/s] 60it [00:13, 4.65it/s] 61it [00:13, 4.65it/s] 62it [00:13, 4.65it/s] 63it [00:14, 4.51it/s] 64it [00:14, 4.56it/s] 65it [00:14, 4.59it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.62it/s] 68it [00:15, 4.61it/s] 69it [00:15, 4.48it/s] 70it [00:15, 4.55it/s] 71it [00:15, 4.58it/s] 72it [00:15, 4.58it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.62it/s] 75it [00:16, 4.51it/s] 76it [00:16, 4.56it/s] 77it [00:17, 4.60it/s] 78it [00:17, 4.61it/s] 79it [00:17, 4.63it/s] 80it [00:17, 4.48it/s] 81it [00:17, 4.55it/s] 82it [00:18, 4.57it/s] 83it [00:18, 4.60it/s] 84it [00:18, 4.60it/s] 85it [00:18, 4.59it/s] 86it [00:19, 4.61it/s] 87it [00:19, 4.62it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.64it/s] 90it [00:19, 4.64it/s] 91it [00:20, 4.49it/s] 92it [00:20, 4.54it/s] 93it [00:20, 4.59it/s] 94it [00:20, 4.60it/s] 95it [00:20, 4.62it/s] 96it [00:21, 4.63it/s] 97it [00:21, 4.49it/s] 98it [00:21, 4.55it/s] 99it [00:21, 4.58it/s] 100it [00:22, 4.59it/s]2025-05-26 02:18:50,522 - INFO - [Epoch 042 | Batch 0100] IWAE-loss 1476.0132 | mean log_px -0.0030 | KL -1307.70 + 101it [00:22, 4.61it/s] 102it [00:22, 4.61it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.62it/s] 105it [00:23, 4.63it/s] 106it [00:23, 4.44it/s] 107it [00:23, 4.52it/s] 108it [00:23, 4.55it/s] 109it [00:24, 4.57it/s] 110it [00:24, 4.59it/s] 111it [00:24, 4.57it/s] 112it [00:24, 4.56it/s] 113it [00:24, 4.55it/s] 114it [00:25, 4.55it/s] 115it [00:25, 4.42it/s] 116it [00:25, 4.49it/s] 117it [00:25, 4.53it/s] 118it [00:26, 4.56it/s] 119it [00:26, 4.59it/s] 120it [00:26, 4.55it/s] 121it [00:26, 4.58it/s] 122it [00:26, 4.59it/s] 123it [00:27, 4.60it/s] 124it [00:27, 4.61it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.63it/s] 127it [00:27, 4.64it/s] 128it [00:28, 4.63it/s] 129it [00:28, 4.64it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.53it/s] 132it [00:29, 4.58it/s] 133it [00:29, 4.61it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.61it/s] 136it [00:29, 4.48it/s] 137it [00:30, 4.53it/s] 138it [00:30, 4.57it/s] 139it [00:30, 4.59it/s] 140it [00:30, 4.61it/s] 141it [00:31, 4.63it/s] 142it [00:31, 4.46it/s] 143it [00:31, 4.43it/s] 144it [00:31, 4.49it/s] 145it [00:31, 4.54it/s] 146it [00:32, 4.57it/s] 147it [00:32, 4.61it/s] 148it [00:32, 4.46it/s] 149it [00:32, 4.52it/s] 150it [00:33, 4.55it/s]2025-05-26 02:19:01,484 - INFO - [Epoch 042 | Batch 0150] IWAE-loss 1960.0638 | mean log_px -0.0210 | KL -1302.23 + 151it [00:33, 4.55it/s] 152it [00:33, 4.58it/s] 153it [00:33, 4.60it/s] 154it [00:33, 4.47it/s] 155it [00:34, 4.54it/s] 156it [00:34, 4.57it/s] 157it [00:34, 4.59it/s] 158it [00:34, 4.60it/s] 159it [00:35, 4.61it/s] 160it [00:35, 4.47it/s] 161it [00:35, 4.51it/s] 162it [00:35, 4.55it/s] 163it [00:35, 4.59it/s] 164it [00:36, 4.59it/s] 165it [00:36, 4.60it/s] 166it [00:36, 4.46it/s] 167it [00:36, 4.53it/s] 168it [00:36, 4.56it/s] 169it [00:37, 4.59it/s] 170it [00:37, 4.59it/s] 171it [00:37, 4.61it/s] 172it [00:37, 4.48it/s] 173it [00:38, 4.53it/s] 174it [00:38, 4.56it/s] 175it [00:38, 4.59it/s] 176it [00:38, 4.60it/s] 177it [00:38, 4.62it/s] 178it [00:39, 4.63it/s] 179it [00:39, 4.49it/s] 180it [00:39, 4.53it/s] 181it [00:39, 4.56it/s] 182it [00:40, 4.58it/s] 183it [00:40, 4.60it/s] 184it [00:40, 4.46it/s] 185it [00:40, 4.50it/s] 186it [00:40, 4.55it/s] 187it [00:41, 4.58it/s] 188it [00:41, 4.59it/s] 189it [00:41, 4.61it/s] 190it [00:41, 4.57it/s] 191it [00:42, 4.44it/s] 192it [00:42, 4.51it/s] 193it [00:42, 4.54it/s] 194it [00:42, 4.56it/s] 195it [00:42, 4.46it/s] 196it [00:43, 4.52it/s] 196it [00:43, 4.54it/s] +2025-05-26 02:19:11,486 - INFO - Epoch: 42, Objective: tensor([1482.2252], device='cuda:0', grad_fn=), Loss: 0.007103536278009415, KL/n: 26.547670364379883 + 0it [00:00, ?it/s]2025-05-26 02:19:11,882 - INFO - [Epoch 043 | Batch 0000] IWAE-loss 1369.3737 | mean log_px -0.0017 | KL -1301.93 + 1it [00:00, 3.11it/s] 2it [00:00, 3.87it/s] 3it [00:00, 4.20it/s] 4it [00:00, 4.37it/s] 5it [00:01, 4.47it/s] 6it [00:01, 4.50it/s] 7it [00:01, 4.41it/s] 8it [00:01, 4.47it/s] 9it [00:02, 4.52it/s] 10it [00:02, 4.54it/s] 11it [00:02, 4.43it/s] 12it [00:02, 4.48it/s] 13it [00:02, 4.53it/s] 14it [00:03, 4.55it/s] 15it [00:03, 4.58it/s] 16it [00:03, 4.60it/s] 17it [00:03, 4.62it/s] 18it [00:04, 4.61it/s] 19it [00:04, 4.61it/s] 20it [00:04, 4.62it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.62it/s] 23it [00:05, 4.49it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.56it/s] 26it [00:05, 4.57it/s] 27it [00:06, 4.59it/s] 28it [00:06, 4.60it/s] 29it [00:06, 4.62it/s] 30it [00:06, 4.62it/s] 31it [00:06, 4.63it/s] 32it [00:07, 4.63it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.63it/s] 35it [00:07, 4.63it/s] 36it [00:07, 4.63it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.49it/s] 39it [00:08, 4.54it/s] 40it [00:08, 4.56it/s] 41it [00:09, 4.58it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.61it/s] 44it [00:09, 4.58it/s] 45it [00:09, 4.58it/s] 46it [00:10, 4.57it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.59it/s] 49it [00:10, 4.61it/s] 50it [00:11, 4.61it/s]2025-05-26 02:19:22,781 - INFO - [Epoch 043 | Batch 0050] IWAE-loss 1440.7559 | mean log_px -0.0027 | KL -1296.14 + 51it [00:11, 4.63it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.63it/s] 54it [00:11, 4.61it/s] 55it [00:12, 4.61it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.63it/s] 58it [00:12, 4.49it/s] 59it [00:12, 4.55it/s] 60it [00:13, 4.57it/s] 61it [00:13, 4.59it/s] 62it [00:13, 4.58it/s] 63it [00:13, 4.55it/s] 64it [00:14, 4.57it/s] 65it [00:14, 4.60it/s] 66it [00:14, 4.60it/s] 67it [00:14, 4.60it/s] 68it [00:14, 4.61it/s] 69it [00:15, 4.62it/s] 70it [00:15, 4.62it/s] 71it [00:15, 4.62it/s] 72it [00:15, 4.61it/s] 73it [00:16, 4.47it/s] 74it [00:16, 4.53it/s] 75it [00:16, 4.56it/s] 76it [00:16, 4.57it/s] 77it [00:16, 4.59it/s] 78it [00:17, 4.60it/s] 79it [00:17, 4.60it/s] 80it [00:17, 4.48it/s] 81it [00:17, 4.54it/s] 82it [00:17, 4.56it/s] 83it [00:18, 4.58it/s] 84it [00:18, 4.59it/s] 85it [00:18, 4.61it/s] 86it [00:18, 4.60it/s] 87it [00:19, 4.47it/s] 88it [00:19, 4.51it/s] 89it [00:19, 4.43it/s] 90it [00:19, 4.47it/s] 91it [00:19, 4.49it/s] 92it [00:20, 4.49it/s] 93it [00:20, 4.50it/s] 94it [00:20, 4.48it/s] 95it [00:20, 4.52it/s] 96it [00:21, 4.41it/s] 97it [00:21, 4.48it/s] 98it [00:21, 4.47it/s] 99it [00:21, 4.52it/s] 100it [00:21, 4.55it/s]2025-05-26 02:19:33,766 - INFO - [Epoch 043 | Batch 0100] IWAE-loss 1553.6163 | mean log_px -0.0052 | KL -1291.85 + 101it [00:22, 4.58it/s] 102it [00:22, 4.58it/s] 103it [00:22, 4.60it/s] 104it [00:22, 4.61it/s] 105it [00:23, 4.61it/s] 106it [00:23, 4.61it/s] 107it [00:23, 4.62it/s] 108it [00:23, 4.62it/s] 109it [00:23, 4.63it/s] 110it [00:24, 4.48it/s] 111it [00:24, 4.54it/s] 112it [00:24, 4.55it/s] 113it [00:24, 4.58it/s] 114it [00:25, 4.60it/s] 115it [00:25, 4.61it/s] 116it [00:25, 4.62it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.62it/s] 119it [00:26, 4.63it/s] 120it [00:26, 4.64it/s] 121it [00:26, 4.48it/s] 122it [00:26, 4.53it/s] 123it [00:27, 4.55it/s] 124it [00:27, 4.56it/s] 125it [00:27, 4.59it/s] 126it [00:27, 4.60it/s] 127it [00:27, 4.61it/s] 128it [00:28, 4.60it/s] 129it [00:28, 4.62it/s] 130it [00:28, 4.61it/s] 131it [00:28, 4.62it/s] 132it [00:28, 4.62it/s] 133it [00:29, 4.62it/s] 134it [00:29, 4.63it/s] 135it [00:29, 4.63it/s] 136it [00:29, 4.62it/s] 137it [00:30, 4.64it/s] 138it [00:30, 4.62it/s] 139it [00:30, 4.64it/s] 140it [00:30, 4.62it/s] 141it [00:30, 4.63it/s] 142it [00:31, 4.48it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.58it/s] 145it [00:31, 4.59it/s] 146it [00:31, 4.60it/s] 147it [00:32, 4.62it/s] 148it [00:32, 4.61it/s] 149it [00:32, 4.62it/s] 150it [00:32, 4.60it/s]2025-05-26 02:19:44,637 - INFO - [Epoch 043 | Batch 0150] IWAE-loss 2060.3196 | mean log_px -0.0110 | KL -1286.15 + 151it [00:33, 4.46it/s] 152it [00:33, 4.49it/s] 153it [00:33, 4.55it/s] 154it [00:33, 4.57it/s] 155it [00:33, 4.60it/s] 156it [00:34, 4.61it/s] 157it [00:34, 4.47it/s] 158it [00:34, 4.53it/s] 159it [00:34, 4.55it/s] 160it [00:35, 4.57it/s] 161it [00:35, 4.59it/s] 162it [00:35, 4.60it/s] 163it [00:35, 4.62it/s] 164it [00:35, 4.47it/s] 165it [00:36, 4.53it/s] 166it [00:36, 4.56it/s] 167it [00:36, 4.58it/s] 168it [00:36, 4.59it/s] 169it [00:37, 4.60it/s] 170it [00:37, 4.61it/s] 171it [00:37, 4.63it/s] 172it [00:37, 4.62it/s] 173it [00:37, 4.62it/s] 174it [00:38, 4.63it/s] 175it [00:38, 4.47it/s] 176it [00:38, 4.53it/s] 177it [00:38, 4.57it/s] 178it [00:38, 4.58it/s] 179it [00:39, 4.59it/s] 180it [00:39, 4.59it/s] 181it [00:39, 4.62it/s] 182it [00:39, 4.63it/s] 183it [00:40, 4.49it/s] 184it [00:40, 4.55it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.59it/s] 187it [00:40, 4.60it/s] 188it [00:41, 4.59it/s] 189it [00:41, 4.60it/s] 190it [00:41, 4.61it/s] 191it [00:41, 4.61it/s] 192it [00:42, 4.61it/s] 193it [00:42, 4.62it/s] 194it [00:42, 4.62it/s] 195it [00:42, 4.37it/s] 196it [00:42, 4.46it/s] 196it [00:43, 4.56it/s] +2025-05-26 02:19:54,629 - INFO - Epoch: 43, Objective: tensor([1422.8802], device='cuda:0', grad_fn=), Loss: 0.004217221401631832, KL/n: 26.26324462890625 + 0it [00:00, ?it/s]2025-05-26 02:19:55,181 - INFO - [Epoch 044 | Batch 0000] IWAE-loss 1640.3896 | mean log_px -0.0097 | KL -1284.26 + 1it [00:00, 3.33it/s] 2it [00:00, 3.95it/s] 3it [00:00, 4.20it/s] 4it [00:00, 4.28it/s] 5it [00:01, 4.42it/s] 6it [00:01, 4.47it/s] 7it [00:01, 4.51it/s] 8it [00:01, 4.51it/s] 9it [00:02, 4.52it/s] 10it [00:02, 4.48it/s] 11it [00:02, 4.52it/s] 12it [00:02, 4.54it/s] 13it [00:02, 4.53it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.54it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.48it/s] 18it [00:04, 4.56it/s] 19it [00:04, 4.62it/s] 20it [00:04, 4.65it/s] 21it [00:04, 4.68it/s] 22it [00:04, 4.69it/s] 23it [00:05, 4.71it/s] 24it [00:05, 4.71it/s] 25it [00:05, 4.73it/s] 26it [00:05, 4.72it/s] 27it [00:05, 4.74it/s] 28it [00:06, 4.49it/s] 29it [00:06, 4.43it/s] 30it [00:06, 4.51it/s] 31it [00:06, 4.53it/s] 32it [00:07, 4.58it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.55it/s] 35it [00:07, 4.44it/s] 36it [00:07, 4.35it/s] 37it [00:08, 4.45it/s] 38it [00:08, 4.50it/s] 39it [00:08, 4.52it/s] 40it [00:08, 4.56it/s] 41it [00:09, 4.61it/s] 42it [00:09, 4.61it/s] 43it [00:09, 4.50it/s] 44it [00:09, 4.46it/s] 45it [00:09, 4.54it/s] 46it [00:10, 4.51it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.63it/s] 50it [00:11, 4.63it/s]2025-05-26 02:20:06,125 - INFO - [Epoch 044 | Batch 0050] IWAE-loss 1426.9062 | mean log_px -0.0024 | KL -1280.41 + 51it [00:11, 4.65it/s] 52it [00:11, 4.51it/s] 53it [00:11, 4.58it/s] 54it [00:11, 4.62it/s] 55it [00:12, 4.64it/s] 56it [00:12, 4.59it/s] 57it [00:12, 4.64it/s] 58it [00:12, 4.51it/s] 59it [00:12, 4.58it/s] 60it [00:13, 4.61it/s] 61it [00:13, 4.63it/s] 62it [00:13, 4.66it/s] 63it [00:13, 4.67it/s] 64it [00:14, 4.67it/s] 65it [00:14, 4.68it/s] 66it [00:14, 4.53it/s] 67it [00:14, 4.54it/s] 68it [00:14, 4.59it/s] 69it [00:15, 4.61it/s] 70it [00:15, 4.65it/s] 71it [00:15, 4.65it/s] 72it [00:15, 4.67it/s] 73it [00:16, 4.69it/s] 74it [00:16, 4.54it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.60it/s] 77it [00:16, 4.60it/s] 78it [00:17, 4.64it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.67it/s] 81it [00:17, 4.53it/s] 82it [00:17, 4.59it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.64it/s] 85it [00:18, 4.67it/s] 86it [00:18, 4.66it/s] 87it [00:19, 4.69it/s] 88it [00:19, 4.70it/s] 89it [00:19, 4.70it/s] 90it [00:19, 4.54it/s] 91it [00:19, 4.61it/s] 92it [00:20, 4.64it/s] 93it [00:20, 4.66it/s] 94it [00:20, 4.65it/s] 95it [00:20, 4.69it/s] 96it [00:20, 4.69it/s] 97it [00:21, 4.67it/s] 98it [00:21, 4.54it/s] 99it [00:21, 4.60it/s] 100it [00:21, 4.62it/s]2025-05-26 02:20:16,940 - INFO - [Epoch 044 | Batch 0100] IWAE-loss 1384.5699 | mean log_px -0.0015 | KL -1274.65 + 101it [00:22, 4.62it/s] 102it [00:22, 4.64it/s] 103it [00:22, 4.68it/s] 104it [00:22, 4.69it/s] 105it [00:22, 4.69it/s] 106it [00:23, 4.69it/s] 107it [00:23, 4.70it/s] 108it [00:23, 4.70it/s] 109it [00:23, 4.67it/s] 110it [00:23, 4.66it/s] 111it [00:24, 4.69it/s] 112it [00:24, 4.52it/s] 113it [00:24, 4.59it/s] 114it [00:24, 4.61it/s] 115it [00:25, 4.64it/s] 116it [00:25, 4.65it/s] 117it [00:25, 4.67it/s] 118it [00:25, 4.51it/s] 119it [00:25, 4.57it/s] 120it [00:26, 4.62it/s] 121it [00:26, 4.65it/s] 122it [00:26, 4.66it/s] 123it [00:26, 4.68it/s] 124it [00:27, 4.68it/s] 125it [00:27, 4.69it/s] 126it [00:27, 4.52it/s] 127it [00:27, 4.57it/s] 128it [00:27, 4.63it/s] 129it [00:28, 4.66it/s] 130it [00:28, 4.67it/s] 131it [00:28, 4.68it/s] 132it [00:28, 4.69it/s] 133it [00:28, 4.70it/s] 134it [00:29, 4.67it/s] 135it [00:29, 4.54it/s] 136it [00:29, 4.61it/s] 137it [00:29, 4.64it/s] 138it [00:30, 4.66it/s] 139it [00:30, 4.68it/s] 140it [00:30, 4.68it/s] 141it [00:30, 4.59it/s] 142it [00:30, 4.61it/s] 143it [00:31, 4.64it/s] 144it [00:31, 4.68it/s] 145it [00:31, 4.69it/s] 146it [00:31, 4.54it/s] 147it [00:31, 4.61it/s] 148it [00:32, 4.63it/s] 149it [00:32, 4.65it/s] 150it [00:32, 4.63it/s]2025-05-26 02:20:27,715 - INFO - [Epoch 044 | Batch 0150] IWAE-loss 1477.1619 | mean log_px -0.0045 | KL -1270.62 + 151it [00:32, 4.49it/s] 152it [00:33, 4.56it/s] 153it [00:33, 4.62it/s] 154it [00:33, 4.64it/s] 155it [00:33, 4.65it/s] 156it [00:33, 4.66it/s] 157it [00:34, 4.64it/s] 158it [00:34, 4.66it/s] 159it [00:34, 4.51it/s] 160it [00:34, 4.58it/s] 161it [00:35, 4.62it/s] 162it [00:35, 4.62it/s] 163it [00:35, 4.64it/s] 164it [00:35, 4.66it/s] 165it [00:35, 4.51it/s] 166it [00:36, 4.58it/s] 167it [00:36, 4.62it/s] 168it [00:36, 4.63it/s] 169it [00:36, 4.65it/s] 170it [00:36, 4.66it/s] 171it [00:37, 4.67it/s] 172it [00:37, 4.68it/s] 173it [00:37, 4.69it/s] 174it [00:37, 4.69it/s] 175it [00:38, 4.54it/s] 176it [00:38, 4.60it/s] 177it [00:38, 4.63it/s] 178it [00:38, 4.65it/s] 179it [00:38, 4.62it/s] 180it [00:39, 4.41it/s] 181it [00:39, 4.51it/s] 182it [00:39, 4.56it/s] 183it [00:39, 4.61it/s] 184it [00:39, 4.63it/s] 185it [00:40, 4.49it/s] 186it [00:40, 4.53it/s] 187it [00:40, 4.59it/s] 188it [00:40, 4.62it/s] 189it [00:41, 4.65it/s] 190it [00:41, 4.66it/s] 191it [00:41, 4.67it/s] 192it [00:41, 4.53it/s] 193it [00:41, 4.60it/s] 194it [00:42, 4.63it/s] 195it [00:42, 4.51it/s] 196it [00:42, 4.58it/s] 196it [00:42, 4.59it/s] +2025-05-26 02:20:37,631 - INFO - Epoch: 44, Objective: tensor([1421.5844], device='cuda:0', grad_fn=), Loss: 0.0031296706292778254, KL/n: 25.87446403503418 + 0it [00:00, ?it/s]2025-05-26 02:20:38,028 - INFO - [Epoch 045 | Batch 0000] IWAE-loss 1360.7262 | mean log_px -0.0022 | KL -1263.72 + 1it [00:00, 2.89it/s] 2it [00:00, 3.52it/s] 3it [00:00, 3.76it/s] 4it [00:01, 3.96it/s] 5it [00:01, 4.02it/s] 6it [00:01, 4.09it/s] 7it [00:01, 4.12it/s] 8it [00:02, 4.15it/s] 9it [00:02, 4.20it/s] 10it [00:02, 4.35it/s] 11it [00:02, 4.45it/s] 12it [00:02, 4.39it/s] 13it [00:03, 4.40it/s] 14it [00:03, 4.35it/s] 15it [00:03, 4.30it/s] 16it [00:03, 4.29it/s] 17it [00:04, 4.26it/s] 18it [00:04, 4.16it/s] 19it [00:04, 4.31it/s] 20it [00:04, 4.33it/s] 21it [00:05, 4.30it/s] 22it [00:05, 4.38it/s] 23it [00:05, 4.21it/s] 24it [00:05, 4.17it/s] 25it [00:05, 4.14it/s] 26it [00:06, 4.24it/s] 27it [00:06, 4.36it/s] 28it [00:06, 4.45it/s] 29it [00:06, 4.34it/s] 30it [00:07, 4.45it/s] 31it [00:07, 4.40it/s] 32it [00:07, 4.42it/s] 33it [00:07, 4.48it/s] 34it [00:07, 4.41it/s] 35it [00:08, 4.47it/s] 36it [00:08, 4.26it/s] 37it [00:08, 4.28it/s] 38it [00:08, 4.41it/s] 39it [00:09, 4.36it/s] 40it [00:09, 4.32it/s] 41it [00:09, 4.34it/s] 42it [00:09, 4.28it/s] 43it [00:10, 4.30it/s] 44it [00:10, 4.34it/s] 45it [00:10, 4.42it/s] 46it [00:10, 4.47it/s] 47it [00:10, 4.40it/s] 48it [00:11, 4.33it/s] 49it [00:11, 4.40it/s] 50it [00:11, 4.48it/s]2025-05-26 02:20:49,596 - INFO - [Epoch 045 | Batch 0050] IWAE-loss 1378.6949 | mean log_px -0.0038 | KL -1256.42 + 51it [00:11, 4.40it/s] 52it [00:12, 4.34it/s] 53it [00:12, 4.30it/s] 54it [00:12, 4.24it/s] 55it [00:12, 4.38it/s] 56it [00:13, 4.31it/s] 57it [00:13, 4.30it/s] 58it [00:13, 4.29it/s] 59it [00:13, 4.42it/s] 60it [00:13, 4.35it/s] 61it [00:14, 4.44it/s] 62it [00:14, 4.50it/s] 63it [00:14, 4.46it/s] 64it [00:14, 4.26it/s] 65it [00:15, 4.32it/s] 66it [00:15, 4.32it/s] 67it [00:15, 4.37it/s] 68it [00:15, 4.45it/s] 69it [00:16, 4.43it/s] 70it [00:16, 4.35it/s] 71it [00:16, 4.20it/s] 72it [00:16, 4.30it/s] 73it [00:16, 4.28it/s] 74it [00:17, 4.28it/s] 75it [00:17, 4.26it/s] 76it [00:17, 4.33it/s] 77it [00:17, 4.27it/s] 78it [00:18, 4.36it/s] 79it [00:18, 4.35it/s] 80it [00:18, 4.28it/s] 81it [00:18, 4.25it/s] 82it [00:19, 4.28it/s] 83it [00:19, 4.27it/s] 84it [00:19, 4.25it/s] 85it [00:19, 4.14it/s] 86it [00:20, 4.27it/s] 87it [00:20, 4.28it/s] 88it [00:20, 4.27it/s] 89it [00:20, 4.27it/s] 90it [00:20, 4.36it/s] 91it [00:21, 4.39it/s] 92it [00:21, 3.47it/s] 93it [00:21, 3.73it/s] 94it [00:22, 3.86it/s] 95it [00:22, 4.03it/s] 96it [00:22, 4.21it/s] 97it [00:22, 4.23it/s] 98it [00:22, 4.24it/s] 99it [00:23, 4.24it/s] 100it [00:23, 4.21it/s]2025-05-26 02:21:01,365 - INFO - [Epoch 045 | Batch 0100] IWAE-loss 1430.3690 | mean log_px -0.0046 | KL -1253.53 + 101it [00:23, 4.22it/s] 102it [00:23, 4.33it/s] 103it [00:24, 4.40it/s] 104it [00:24, 4.46it/s] 105it [00:24, 4.25it/s] 106it [00:24, 4.35it/s] 107it [00:25, 4.41it/s] 108it [00:25, 4.49it/s] 109it [00:25, 4.56it/s] 110it [00:25, 4.42it/s] 111it [00:25, 4.32it/s] 112it [00:26, 4.42it/s] 113it [00:26, 4.48it/s] 114it [00:26, 4.50it/s] 115it [00:26, 4.25it/s] 116it [00:27, 4.25it/s] 117it [00:27, 4.34it/s] 118it [00:27, 4.40it/s] 119it [00:27, 4.39it/s] 120it [00:27, 4.30it/s] 121it [00:28, 4.23it/s] 122it [00:28, 4.11it/s] 123it [00:28, 4.19it/s] 124it [00:28, 4.21it/s] 125it [00:29, 4.33it/s] 126it [00:29, 4.32it/s] 127it [00:29, 4.30it/s] 128it [00:29, 4.14it/s] 129it [00:30, 4.30it/s] 130it [00:30, 4.29it/s] 131it [00:30, 4.40it/s] 132it [00:30, 4.35it/s] 133it [00:31, 4.31it/s] 134it [00:31, 4.17it/s] 135it [00:31, 4.32it/s] 136it [00:31, 4.40it/s] 137it [00:31, 4.47it/s] 138it [00:32, 4.53it/s] 139it [00:32, 4.57it/s] 140it [00:32, 4.45it/s] 141it [00:32, 4.53it/s] 142it [00:33, 4.58it/s] 143it [00:33, 4.61it/s] 144it [00:33, 4.63it/s] 145it [00:33, 4.65it/s] 146it [00:33, 4.49it/s] 147it [00:34, 4.57it/s] 148it [00:34, 4.60it/s] 149it [00:34, 4.63it/s] 150it [00:34, 4.64it/s]2025-05-26 02:21:12,679 - INFO - [Epoch 045 | Batch 0150] IWAE-loss 1851.1366 | mean log_px -0.0243 | KL -1258.04 + 151it [00:34, 4.65it/s] 152it [00:35, 4.64it/s] 153it [00:35, 4.65it/s] 154it [00:35, 4.66it/s] 155it [00:35, 4.50it/s] 156it [00:36, 4.55it/s] 157it [00:36, 4.61it/s] 158it [00:36, 4.63it/s] 159it [00:36, 4.65it/s] 160it [00:36, 4.65it/s] 161it [00:37, 4.67it/s] 162it [00:37, 4.68it/s] 163it [00:37, 4.69it/s] 164it [00:37, 4.45it/s] 165it [00:38, 4.52it/s] 166it [00:38, 4.56it/s] 167it [00:38, 4.60it/s] 168it [00:38, 4.63it/s] 169it [00:38, 4.65it/s] 170it [00:39, 4.66it/s] 171it [00:39, 4.51it/s] 172it [00:39, 4.57it/s] 173it [00:39, 4.61it/s] 174it [00:39, 4.63it/s] 175it [00:40, 4.63it/s] 176it [00:40, 4.64it/s] 177it [00:40, 4.49it/s] 178it [00:40, 4.56it/s] 179it [00:41, 4.60it/s] 180it [00:41, 4.63it/s] 181it [00:41, 4.64it/s] 182it [00:41, 4.65it/s] 183it [00:41, 4.67it/s] 184it [00:42, 4.68it/s] 185it [00:42, 4.69it/s] 186it [00:42, 4.69it/s] 187it [00:42, 4.69it/s] 188it [00:42, 4.69it/s] 189it [00:43, 4.69it/s] 190it [00:43, 4.69it/s] 191it [00:43, 4.70it/s] 192it [00:43, 4.69it/s] 193it [00:44, 4.70it/s] 194it [00:44, 4.69it/s] 195it [00:44, 4.56it/s] 196it [00:44, 4.61it/s] 196it [00:44, 4.38it/s] +2025-05-26 02:21:22,538 - INFO - Epoch: 45, Objective: tensor([1544.8090], device='cuda:0', grad_fn=), Loss: 0.005014732480049133, KL/n: 25.61770248413086 + 0it [00:00, ?it/s]2025-05-26 02:21:22,889 - INFO - [Epoch 046 | Batch 0000] IWAE-loss 1496.1056 | mean log_px -0.0046 | KL -1254.61 + 1it [00:00, 3.31it/s] 2it [00:00, 4.01it/s] 3it [00:00, 4.30it/s] 4it [00:00, 4.43it/s] 5it [00:01, 4.53it/s] 6it [00:01, 4.56it/s] 7it [00:01, 4.61it/s] 8it [00:01, 4.65it/s] 9it [00:02, 4.64it/s] 10it [00:02, 4.65it/s] 11it [00:02, 4.67it/s] 12it [00:02, 4.68it/s] 13it [00:02, 4.65it/s] 14it [00:03, 4.62it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.55it/s] 17it [00:03, 4.57it/s] 18it [00:03, 4.55it/s] 19it [00:04, 4.42it/s] 20it [00:04, 4.50it/s] 21it [00:04, 4.55it/s] 22it [00:04, 4.52it/s] 23it [00:05, 4.52it/s] 24it [00:05, 4.55it/s] 25it [00:05, 4.60it/s] 26it [00:05, 4.63it/s] 27it [00:05, 4.65it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.66it/s] 31it [00:06, 4.68it/s] 32it [00:07, 4.68it/s] 33it [00:07, 4.69it/s] 34it [00:07, 4.69it/s] 35it [00:07, 4.70it/s] 36it [00:07, 4.70it/s] 37it [00:08, 4.70it/s] 38it [00:08, 4.70it/s] 39it [00:08, 4.70it/s] 40it [00:08, 4.70it/s] 41it [00:08, 4.70it/s] 42it [00:09, 4.69it/s] 43it [00:09, 4.69it/s] 44it [00:09, 4.52it/s] 45it [00:09, 4.59it/s] 46it [00:10, 4.55it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.65it/s] 50it [00:10, 4.66it/s]2025-05-26 02:21:33,707 - INFO - [Epoch 046 | Batch 0050] IWAE-loss 1504.4362 | mean log_px -0.0047 | KL -1249.88 + 51it [00:11, 4.47it/s] 52it [00:11, 4.55it/s] 53it [00:11, 4.59it/s] 54it [00:11, 4.61it/s] 55it [00:11, 4.64it/s] 56it [00:12, 4.65it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.68it/s] 59it [00:12, 4.69it/s] 60it [00:13, 4.69it/s] 61it [00:13, 4.69it/s] 62it [00:13, 4.69it/s] 63it [00:13, 4.70it/s] 64it [00:13, 4.69it/s] 65it [00:14, 4.39it/s] 66it [00:14, 4.32it/s] 67it [00:14, 4.28it/s] 68it [00:14, 4.23it/s] 69it [00:15, 4.21it/s] 70it [00:15, 4.17it/s] 71it [00:15, 4.30it/s] 72it [00:15, 4.41it/s] 73it [00:16, 4.50it/s] 74it [00:16, 4.55it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.62it/s] 77it [00:16, 4.65it/s] 78it [00:17, 4.50it/s] 79it [00:17, 4.55it/s] 80it [00:17, 4.60it/s] 81it [00:17, 4.63it/s] 82it [00:17, 4.65it/s] 83it [00:18, 4.66it/s] 84it [00:18, 4.66it/s] 85it [00:18, 4.67it/s] 86it [00:18, 4.67it/s] 87it [00:19, 4.69it/s] 88it [00:19, 4.58it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.65it/s] 91it [00:19, 4.67it/s] 92it [00:20, 4.67it/s] 93it [00:20, 4.68it/s] 94it [00:20, 4.69it/s] 95it [00:20, 4.69it/s] 96it [00:20, 4.69it/s] 97it [00:21, 4.70it/s] 98it [00:21, 4.53it/s] 99it [00:21, 4.60it/s] 100it [00:21, 4.63it/s]2025-05-26 02:21:44,642 - INFO - [Epoch 046 | Batch 0100] IWAE-loss 2131.2534 | mean log_px -0.0194 | KL -1246.14 + 101it [00:22, 4.65it/s] 102it [00:22, 4.65it/s] 103it [00:22, 4.66it/s] 104it [00:22, 4.54it/s] 105it [00:22, 4.61it/s] 106it [00:23, 4.63it/s] 107it [00:23, 4.65it/s] 108it [00:23, 4.66it/s] 109it [00:23, 4.68it/s] 110it [00:23, 4.67it/s] 111it [00:24, 4.68it/s] 112it [00:24, 4.68it/s] 113it [00:24, 4.69it/s] 114it [00:24, 4.69it/s] 115it [00:25, 4.54it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.65it/s] 119it [00:25, 4.67it/s] 120it [00:26, 4.66it/s] 121it [00:26, 4.69it/s] 122it [00:26, 4.53it/s] 123it [00:26, 4.59it/s] 124it [00:26, 4.59it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.62it/s] 127it [00:27, 4.65it/s] 128it [00:27, 4.66it/s] 129it [00:28, 4.66it/s] 130it [00:28, 4.67it/s] 131it [00:28, 4.68it/s] 132it [00:28, 4.52it/s] 133it [00:28, 4.58it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.64it/s] 136it [00:29, 4.65it/s] 137it [00:29, 4.67it/s] 138it [00:30, 4.64it/s] 139it [00:30, 4.60it/s] 140it [00:30, 4.50it/s] 141it [00:30, 4.56it/s] 142it [00:30, 4.44it/s] 143it [00:31, 4.53it/s] 144it [00:31, 4.56it/s] 145it [00:31, 4.61it/s] 146it [00:31, 4.64it/s] 147it [00:31, 4.66it/s] 148it [00:32, 4.67it/s] 149it [00:32, 4.69it/s] 150it [00:32, 4.69it/s]2025-05-26 02:21:55,448 - INFO - [Epoch 046 | Batch 0150] IWAE-loss 1519.1067 | mean log_px -0.0050 | KL -1243.51 + 151it [00:32, 4.69it/s] 152it [00:33, 4.52it/s] 153it [00:33, 4.58it/s] 154it [00:33, 4.61it/s] 155it [00:33, 4.62it/s] 156it [00:33, 4.56it/s] 157it [00:34, 4.59it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.47it/s] 160it [00:34, 4.53it/s] 161it [00:35, 4.57it/s] 162it [00:35, 4.59it/s] 163it [00:35, 4.62it/s] 164it [00:35, 4.63it/s] 165it [00:35, 4.65it/s] 166it [00:36, 4.66it/s] 167it [00:36, 4.67it/s] 168it [00:36, 4.67it/s] 169it [00:36, 4.68it/s] 170it [00:36, 4.68it/s] 171it [00:37, 4.69it/s] 172it [00:37, 4.69it/s] 173it [00:37, 4.70it/s] 174it [00:37, 4.70it/s] 175it [00:38, 4.70it/s] 176it [00:38, 4.68it/s] 177it [00:38, 4.68it/s] 178it [00:38, 4.65it/s] 179it [00:38, 4.66it/s] 180it [00:39, 4.65it/s] 181it [00:39, 4.67it/s] 182it [00:39, 4.68it/s] 183it [00:39, 4.68it/s] 184it [00:39, 4.51it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.61it/s] 187it [00:40, 4.61it/s] 188it [00:40, 4.56it/s] 189it [00:41, 4.57it/s] 190it [00:41, 4.59it/s] 191it [00:41, 4.59it/s] 192it [00:41, 4.60it/s] 193it [00:41, 4.45it/s] 194it [00:42, 4.44it/s] 195it [00:42, 4.41it/s] 196it [00:42, 4.47it/s] 196it [00:42, 4.59it/s] +2025-05-26 02:22:05,358 - INFO - Epoch: 46, Objective: tensor([1405.0212], device='cuda:0', grad_fn=), Loss: 0.008077585138380527, KL/n: 25.350950241088867 + 0it [00:00, ?it/s]2025-05-26 02:22:05,912 - INFO - [Epoch 047 | Batch 0000] IWAE-loss 1908.2433 | mean log_px -0.0132 | KL -1241.40 + 1it [00:00, 3.30it/s] 2it [00:00, 3.96it/s] 3it [00:00, 4.25it/s] 4it [00:00, 4.39it/s] 5it [00:01, 4.31it/s] 6it [00:01, 4.42it/s] 7it [00:01, 4.50it/s] 8it [00:01, 4.53it/s] 9it [00:02, 4.57it/s] 10it [00:02, 4.58it/s] 11it [00:02, 4.40it/s] 12it [00:02, 4.40it/s] 13it [00:02, 4.45it/s] 14it [00:03, 4.49it/s] 15it [00:03, 4.54it/s] 16it [00:03, 4.56it/s] 17it [00:03, 4.43it/s] 18it [00:04, 4.50it/s] 19it [00:04, 4.54it/s] 20it [00:04, 4.55it/s] 21it [00:04, 4.56it/s] 22it [00:04, 4.57it/s] 23it [00:05, 4.57it/s] 24it [00:05, 4.57it/s] 25it [00:05, 4.57it/s] 26it [00:05, 4.57it/s] 27it [00:06, 4.56it/s] 28it [00:06, 4.57it/s] 29it [00:06, 4.58it/s] 30it [00:06, 4.43it/s] 31it [00:06, 4.48it/s] 32it [00:07, 4.52it/s] 33it [00:07, 4.56it/s] 34it [00:07, 4.57it/s] 35it [00:07, 4.59it/s] 36it [00:08, 4.59it/s] 37it [00:08, 4.60it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.61it/s] 40it [00:08, 4.60it/s] 41it [00:09, 4.56it/s] 42it [00:09, 4.60it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.59it/s] 45it [00:09, 4.48it/s] 46it [00:10, 4.54it/s] 47it [00:10, 4.57it/s] 48it [00:10, 4.58it/s] 49it [00:10, 4.56it/s] 50it [00:11, 4.56it/s]2025-05-26 02:22:16,902 - INFO - [Epoch 047 | Batch 0050] IWAE-loss 1597.2115 | mean log_px -0.0160 | KL -1236.86 + 51it [00:11, 4.57it/s] 52it [00:11, 4.57it/s] 53it [00:11, 4.58it/s] 54it [00:11, 4.43it/s] 55it [00:12, 4.50it/s] 56it [00:12, 4.51it/s] 57it [00:12, 4.53it/s] 58it [00:12, 4.54it/s] 59it [00:13, 4.55it/s] 60it [00:13, 4.56it/s] 61it [00:13, 4.58it/s] 62it [00:13, 4.58it/s] 63it [00:13, 4.45it/s] 64it [00:14, 4.50it/s] 65it [00:14, 4.53it/s] 66it [00:14, 4.55it/s] 67it [00:14, 4.57it/s] 68it [00:15, 4.58it/s] 69it [00:15, 4.60it/s] 70it [00:15, 4.45it/s] 71it [00:15, 4.52it/s] 72it [00:15, 4.55it/s] 73it [00:16, 4.58it/s] 74it [00:16, 4.59it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.31it/s] 77it [00:17, 4.39it/s] 78it [00:17, 4.43it/s] 79it [00:17, 4.34it/s] 80it [00:17, 4.24it/s] 81it [00:18, 4.19it/s] 82it [00:18, 4.30it/s] 83it [00:18, 4.38it/s] 84it [00:18, 4.28it/s] 85it [00:18, 4.40it/s] 86it [00:19, 4.45it/s] 87it [00:19, 4.48it/s] 88it [00:19, 4.51it/s] 89it [00:19, 4.50it/s] 90it [00:20, 4.52it/s] 91it [00:20, 4.53it/s] 92it [00:20, 4.54it/s] 93it [00:20, 4.41it/s] 94it [00:20, 4.45it/s] 95it [00:21, 4.51it/s] 96it [00:21, 4.52it/s] 97it [00:21, 4.54it/s] 98it [00:21, 4.57it/s] 99it [00:21, 4.58it/s] 100it [00:22, 4.59it/s]2025-05-26 02:22:28,036 - INFO - [Epoch 047 | Batch 0100] IWAE-loss 2198.4983 | mean log_px -0.0194 | KL -1234.72 + 101it [00:22, 4.61it/s] 102it [00:22, 4.60it/s] 103it [00:22, 4.60it/s] 104it [00:23, 4.60it/s] 105it [00:23, 4.61it/s] 106it [00:23, 4.62it/s] 107it [00:23, 4.62it/s] 108it [00:23, 4.47it/s] 109it [00:24, 4.53it/s] 110it [00:24, 4.54it/s] 111it [00:24, 4.55it/s] 112it [00:24, 4.56it/s] 113it [00:25, 4.57it/s] 114it [00:25, 4.57it/s] 115it [00:25, 4.60it/s] 116it [00:25, 4.60it/s] 117it [00:25, 4.46it/s] 118it [00:26, 4.52it/s] 119it [00:26, 4.55it/s] 120it [00:26, 4.57it/s] 121it [00:26, 4.60it/s] 122it [00:27, 4.61it/s] 123it [00:27, 4.61it/s] 124it [00:27, 4.61it/s] 125it [00:27, 4.62it/s] 126it [00:27, 4.47it/s] 127it [00:28, 4.53it/s] 128it [00:28, 4.56it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.55it/s] 131it [00:28, 4.57it/s] 132it [00:29, 4.58it/s] 133it [00:29, 4.59it/s] 134it [00:29, 4.58it/s] 135it [00:29, 4.43it/s] 136it [00:30, 4.48it/s] 137it [00:30, 4.53it/s] 138it [00:30, 4.55it/s] 139it [00:30, 4.57it/s] 140it [00:30, 4.58it/s] 141it [00:31, 4.59it/s] 142it [00:31, 4.60it/s] 143it [00:31, 4.60it/s] 144it [00:31, 4.45it/s] 145it [00:32, 4.50it/s] 146it [00:32, 4.53it/s] 147it [00:32, 4.55it/s] 148it [00:32, 4.55it/s] 149it [00:32, 4.55it/s] 150it [00:33, 4.42it/s]2025-05-26 02:22:39,028 - INFO - [Epoch 047 | Batch 0150] IWAE-loss 1541.9181 | mean log_px -0.0085 | KL -1228.83 + 151it [00:33, 4.47it/s] 152it [00:33, 4.51it/s] 153it [00:33, 4.49it/s] 154it [00:34, 4.48it/s] 155it [00:34, 4.53it/s] 156it [00:34, 4.56it/s] 157it [00:34, 4.58it/s] 158it [00:34, 4.60it/s] 159it [00:35, 4.45it/s] 160it [00:35, 4.50it/s] 161it [00:35, 4.51it/s] 162it [00:35, 4.54it/s] 163it [00:36, 4.56it/s] 164it [00:36, 4.57it/s] 165it [00:36, 4.57it/s] 166it [00:36, 4.58it/s] 167it [00:36, 4.59it/s] 168it [00:37, 4.44it/s] 169it [00:37, 4.50it/s] 170it [00:37, 4.53it/s] 171it [00:37, 4.55it/s] 172it [00:38, 4.57it/s] 173it [00:38, 4.57it/s] 174it [00:38, 4.58it/s] 175it [00:38, 4.59it/s] 176it [00:38, 4.60it/s] 177it [00:39, 4.46it/s] 178it [00:39, 4.49it/s] 179it [00:39, 4.53it/s] 180it [00:39, 4.54it/s] 181it [00:40, 4.56it/s] 182it [00:40, 4.58it/s] 183it [00:40, 4.58it/s] 184it [00:40, 4.59it/s] 185it [00:40, 4.46it/s] 186it [00:41, 4.50it/s] 187it [00:41, 4.53it/s] 188it [00:41, 4.55it/s] 189it [00:41, 4.57it/s] 190it [00:41, 4.58it/s] 191it [00:42, 4.59it/s] 192it [00:42, 4.59it/s] 193it [00:42, 4.60it/s] 194it [00:42, 4.61it/s] 195it [00:43, 4.34it/s] 196it [00:43, 4.45it/s] 196it [00:43, 4.52it/s] +2025-05-26 02:22:49,075 - INFO - Epoch: 47, Objective: tensor([1696.6771], device='cuda:0', grad_fn=), Loss: 0.011943808756768703, KL/n: 25.065183639526367 + 0it [00:00, ?it/s]2025-05-26 02:22:49,456 - INFO - [Epoch 048 | Batch 0000] IWAE-loss 2080.8501 | mean log_px -0.0122 | KL -1227.69 + 1it [00:00, 3.31it/s] 2it [00:00, 3.97it/s] 3it [00:00, 4.27it/s] 4it [00:00, 4.39it/s] 5it [00:01, 4.48it/s] 6it [00:01, 4.53it/s] 7it [00:01, 4.40it/s] 8it [00:01, 4.45it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.55it/s] 12it [00:02, 4.55it/s] 13it [00:02, 4.56it/s] 14it [00:03, 4.57it/s] 15it [00:03, 4.59it/s] 16it [00:03, 4.59it/s] 17it [00:03, 4.61it/s] 18it [00:04, 4.61it/s] 19it [00:04, 4.48it/s] 20it [00:04, 4.54it/s] 21it [00:04, 4.57it/s] 22it [00:04, 4.58it/s] 23it [00:05, 4.60it/s] 24it [00:05, 4.60it/s] 25it [00:05, 4.52it/s] 26it [00:05, 4.56it/s] 27it [00:05, 4.59it/s] 28it [00:06, 4.60it/s] 29it [00:06, 4.61it/s] 30it [00:06, 4.60it/s] 31it [00:06, 4.61it/s] 32it [00:07, 4.60it/s] 33it [00:07, 4.60it/s] 34it [00:07, 4.46it/s] 35it [00:07, 4.51it/s] 36it [00:07, 4.55it/s] 37it [00:08, 4.58it/s] 38it [00:08, 4.58it/s] 39it [00:08, 4.59it/s] 40it [00:08, 4.60it/s] 41it [00:09, 4.45it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.56it/s] 44it [00:09, 4.58it/s] 45it [00:09, 4.59it/s] 46it [00:10, 4.60it/s] 47it [00:10, 4.48it/s] 48it [00:10, 4.53it/s] 49it [00:10, 4.57it/s] 50it [00:11, 4.52it/s]2025-05-26 02:23:00,410 - INFO - [Epoch 048 | Batch 0050] IWAE-loss 1285.0804 | mean log_px -0.0012 | KL -1222.04 + 51it [00:11, 4.57it/s] 52it [00:11, 4.53it/s] 53it [00:11, 4.55it/s] 54it [00:11, 4.55it/s] 55it [00:12, 4.56it/s] 56it [00:12, 4.42it/s] 57it [00:12, 4.47it/s] 58it [00:12, 4.51it/s] 59it [00:13, 4.52it/s] 60it [00:13, 4.52it/s] 61it [00:13, 4.53it/s] 62it [00:13, 4.55it/s] 63it [00:13, 4.56it/s] 64it [00:14, 3.63it/s] 65it [00:14, 3.87it/s] 66it [00:14, 4.04it/s] 67it [00:14, 4.19it/s] 68it [00:15, 4.30it/s] 69it [00:15, 4.37it/s] 70it [00:15, 4.39it/s] 71it [00:15, 4.47it/s] 72it [00:16, 4.50it/s] 73it [00:16, 4.51it/s] 74it [00:16, 4.53it/s] 75it [00:16, 4.40it/s] 76it [00:16, 4.45it/s] 77it [00:17, 4.49it/s] 78it [00:17, 4.51it/s] 79it [00:17, 4.53it/s] 80it [00:17, 4.54it/s] 81it [00:18, 4.56it/s] 82it [00:18, 4.51it/s] 83it [00:18, 4.42it/s] 84it [00:18, 4.47it/s] 85it [00:18, 4.49it/s] 86it [00:19, 4.50it/s] 87it [00:19, 4.52it/s] 88it [00:19, 4.53it/s] 89it [00:19, 4.53it/s] 90it [00:20, 4.52it/s] 91it [00:20, 4.54it/s] 92it [00:20, 4.53it/s] 93it [00:20, 4.54it/s] 94it [00:20, 4.53it/s] 95it [00:21, 4.55it/s] 96it [00:21, 4.56it/s] 97it [00:21, 4.41it/s] 98it [00:21, 4.42it/s] 99it [00:22, 4.46it/s] 100it [00:22, 4.51it/s]2025-05-26 02:23:11,665 - INFO - [Epoch 048 | Batch 0100] IWAE-loss 1300.4762 | mean log_px -0.0050 | KL -1212.15 + 101it [00:22, 4.50it/s] 102it [00:22, 4.54it/s] 103it [00:22, 4.56it/s] 104it [00:23, 4.57it/s] 105it [00:23, 4.58it/s] 106it [00:23, 4.60it/s] 107it [00:23, 4.59it/s] 108it [00:24, 4.60it/s] 109it [00:24, 4.61it/s] 110it [00:24, 4.56it/s] 111it [00:24, 4.58it/s] 112it [00:24, 4.52it/s] 113it [00:25, 4.55it/s] 114it [00:25, 4.55it/s] 115it [00:25, 4.44it/s] 116it [00:25, 4.47it/s] 117it [00:26, 4.51it/s] 118it [00:26, 4.51it/s] 119it [00:26, 4.54it/s] 120it [00:26, 4.54it/s] 121it [00:26, 4.55it/s] 122it [00:27, 4.52it/s] 123it [00:27, 4.55it/s] 124it [00:27, 4.46it/s] 125it [00:27, 4.52it/s] 126it [00:28, 4.53it/s] 127it [00:28, 4.50it/s] 128it [00:28, 4.52it/s] 129it [00:28, 4.54it/s] 130it [00:28, 4.54it/s] 131it [00:29, 4.55it/s] 132it [00:29, 4.56it/s] 133it [00:29, 4.48it/s] 134it [00:29, 4.52it/s] 135it [00:29, 4.54it/s] 136it [00:30, 4.56it/s] 137it [00:30, 4.56it/s] 138it [00:30, 4.43it/s] 139it [00:30, 4.48it/s] 140it [00:31, 4.52it/s] 141it [00:31, 4.54it/s] 142it [00:31, 4.55it/s] 143it [00:31, 4.55it/s] 144it [00:31, 4.55it/s] 145it [00:32, 4.55it/s] 146it [00:32, 4.41it/s] 147it [00:32, 4.47it/s] 148it [00:32, 4.51it/s] 149it [00:33, 4.54it/s] 150it [00:33, 4.53it/s]2025-05-26 02:23:22,694 - INFO - [Epoch 048 | Batch 0150] IWAE-loss 1771.9763 | mean log_px -0.0080 | KL -1212.38 + 151it [00:33, 4.55it/s] 152it [00:33, 4.56it/s] 153it [00:33, 4.57it/s] 154it [00:34, 4.56it/s] 155it [00:34, 4.54it/s] 156it [00:34, 4.55it/s] 157it [00:34, 4.54it/s] 158it [00:35, 4.48it/s] 159it [00:35, 4.43it/s] 160it [00:35, 4.41it/s] 161it [00:35, 4.45it/s] 162it [00:35, 4.49it/s] 163it [00:36, 4.46it/s] 164it [00:36, 4.49it/s] 165it [00:36, 4.52it/s] 166it [00:36, 4.53it/s] 167it [00:37, 4.55it/s] 168it [00:37, 4.43it/s] 169it [00:37, 4.49it/s] 170it [00:37, 4.50it/s] 171it [00:37, 4.53it/s] 172it [00:38, 4.53it/s] 173it [00:38, 4.54it/s] 174it [00:38, 4.54it/s] 175it [00:38, 4.56it/s] 176it [00:39, 4.55it/s] 177it [00:39, 4.56it/s] 178it [00:39, 4.44it/s] 179it [00:39, 4.47it/s] 180it [00:39, 4.50it/s] 181it [00:40, 4.52it/s] 182it [00:40, 4.49it/s] 183it [00:40, 4.52it/s] 184it [00:40, 4.40it/s] 185it [00:41, 4.46it/s] 186it [00:41, 4.49it/s] 187it [00:41, 4.52it/s] 188it [00:41, 4.55it/s] 189it [00:41, 4.55it/s] 190it [00:42, 4.55it/s] 191it [00:42, 4.43it/s] 192it [00:42, 4.47it/s] 193it [00:42, 4.50it/s] 194it [00:43, 4.53it/s] 195it [00:43, 4.41it/s] 196it [00:43, 4.28it/s] 196it [00:43, 4.49it/s] +2025-05-26 02:23:32,857 - INFO - Epoch: 48, Objective: tensor([1534.0585], device='cuda:0', grad_fn=), Loss: 0.016182228922843933, KL/n: 24.804851531982422 + 0it [00:00, ?it/s]2025-05-26 02:23:33,233 - INFO - [Epoch 049 | Batch 0000] IWAE-loss 1611.0990 | mean log_px -0.0056 | KL -1216.53 + 1it [00:00, 3.30it/s] 2it [00:00, 3.73it/s] 3it [00:00, 4.09it/s] 4it [00:00, 4.26it/s] 5it [00:01, 4.36it/s] 6it [00:01, 4.43it/s] 7it [00:01, 4.44it/s] 8it [00:01, 4.48it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.54it/s] 12it [00:02, 4.54it/s] 13it [00:02, 4.42it/s] 14it [00:03, 4.45it/s] 15it [00:03, 4.49it/s] 16it [00:03, 4.52it/s] 17it [00:03, 4.53it/s] 18it [00:04, 4.54it/s] 19it [00:04, 4.55it/s] 20it [00:04, 4.42it/s] 21it [00:04, 4.48it/s] 22it [00:04, 4.50it/s] 23it [00:05, 4.50it/s] 24it [00:05, 4.38it/s] 25it [00:05, 4.39it/s] 26it [00:05, 4.45it/s] 27it [00:06, 4.48it/s] 28it [00:06, 4.47it/s] 29it [00:06, 4.37it/s] 30it [00:06, 4.40it/s] 31it [00:07, 4.43it/s] 32it [00:07, 4.47it/s] 33it [00:07, 4.50it/s] 34it [00:07, 4.51it/s] 35it [00:07, 4.54it/s] 36it [00:08, 4.53it/s] 37it [00:08, 4.54it/s] 38it [00:08, 4.34it/s] 39it [00:08, 4.42it/s] 40it [00:09, 4.46it/s] 41it [00:09, 4.48it/s] 42it [00:09, 4.44it/s] 43it [00:09, 4.44it/s] 44it [00:09, 4.49it/s] 45it [00:10, 4.53it/s] 46it [00:10, 4.53it/s] 47it [00:10, 4.56it/s] 48it [00:10, 4.56it/s] 49it [00:11, 4.41it/s] 50it [00:11, 4.44it/s]2025-05-26 02:23:44,399 - INFO - [Epoch 049 | Batch 0050] IWAE-loss 1382.5945 | mean log_px -0.0030 | KL -1212.96 + 51it [00:11, 4.48it/s] 52it [00:11, 4.50it/s] 53it [00:11, 4.51it/s] 54it [00:12, 4.52it/s] 55it [00:12, 4.39it/s] 56it [00:12, 4.45it/s] 57it [00:12, 4.49it/s] 58it [00:13, 4.47it/s] 59it [00:13, 4.50it/s] 60it [00:13, 4.48it/s] 61it [00:13, 4.51it/s] 62it [00:13, 4.54it/s] 63it [00:14, 4.50it/s] 64it [00:14, 4.53it/s] 65it [00:14, 4.41it/s] 66it [00:14, 4.45it/s] 67it [00:15, 4.44it/s] 68it [00:15, 4.49it/s] 69it [00:15, 4.52it/s] 70it [00:15, 4.53it/s] 71it [00:15, 4.52it/s] 72it [00:16, 4.55it/s] 73it [00:16, 4.55it/s] 74it [00:16, 4.56it/s] 75it [00:16, 4.41it/s] 76it [00:17, 4.41it/s] 77it [00:17, 4.46it/s] 78it [00:17, 4.47it/s] 79it [00:17, 4.48it/s] 80it [00:17, 4.50it/s] 81it [00:18, 4.51it/s] 82it [00:18, 4.44it/s] 83it [00:18, 4.49it/s] 84it [00:18, 4.51it/s] 85it [00:19, 4.52it/s] 86it [00:19, 4.55it/s] 87it [00:19, 4.51it/s] 88it [00:19, 4.53it/s] 89it [00:19, 4.55it/s] 90it [00:20, 4.56it/s] 91it [00:20, 4.57it/s] 92it [00:20, 4.54it/s] 93it [00:20, 4.55it/s] 94it [00:21, 4.55it/s] 95it [00:21, 4.43it/s] 96it [00:21, 4.48it/s] 97it [00:21, 4.49it/s] 98it [00:21, 4.53it/s] 99it [00:22, 4.54it/s] 100it [00:22, 4.50it/s]2025-05-26 02:23:55,508 - INFO - [Epoch 049 | Batch 0100] IWAE-loss 1519.3214 | mean log_px -0.0086 | KL -1206.96 + 101it [00:22, 4.37it/s] 102it [00:22, 4.42it/s] 103it [00:23, 4.47it/s] 104it [00:23, 4.44it/s] 105it [00:23, 4.50it/s] 106it [00:23, 4.44it/s] 107it [00:23, 4.49it/s] 108it [00:24, 4.51it/s] 109it [00:24, 4.34it/s] 110it [00:24, 4.38it/s] 111it [00:24, 4.43it/s] 112it [00:25, 4.44it/s] 113it [00:25, 4.45it/s] 114it [00:25, 4.49it/s] 115it [00:25, 4.50it/s] 116it [00:25, 4.53it/s] 117it [00:26, 4.54it/s] 118it [00:26, 4.55it/s] 119it [00:26, 4.43it/s] 120it [00:26, 4.49it/s] 121it [00:27, 4.51it/s] 122it [00:27, 4.50it/s] 123it [00:27, 4.48it/s] 124it [00:27, 4.50it/s] 125it [00:27, 4.51it/s] 126it [00:28, 4.53it/s] 127it [00:28, 4.55it/s] 128it [00:28, 4.43it/s] 129it [00:28, 4.44it/s] 130it [00:29, 4.46it/s] 131it [00:29, 4.49it/s] 132it [00:29, 4.51it/s] 133it [00:29, 4.54it/s] 134it [00:29, 4.54it/s] 135it [00:30, 4.55it/s] 136it [00:30, 4.56it/s] 137it [00:30, 4.44it/s] 138it [00:30, 4.49it/s] 139it [00:31, 4.51it/s] 140it [00:31, 4.52it/s] 141it [00:31, 4.53it/s] 142it [00:31, 4.52it/s] 143it [00:31, 4.54it/s] 144it [00:32, 4.56it/s] 145it [00:32, 4.41it/s] 146it [00:32, 4.44it/s] 147it [00:32, 4.48it/s] 148it [00:33, 4.50it/s] 149it [00:33, 4.51it/s] 150it [00:33, 4.52it/s]2025-05-26 02:24:06,655 - INFO - [Epoch 049 | Batch 0150] IWAE-loss 1296.9624 | mean log_px -0.0015 | KL -1203.38 + 151it [00:33, 4.50it/s] 152it [00:33, 4.43it/s] 153it [00:34, 4.49it/s] 154it [00:34, 4.50it/s] 155it [00:34, 4.52it/s] 156it [00:34, 4.47it/s] 157it [00:35, 4.44it/s] 158it [00:35, 4.49it/s] 159it [00:35, 4.53it/s] 160it [00:35, 4.34it/s] 161it [00:35, 4.42it/s] 162it [00:36, 4.42it/s] 163it [00:36, 4.46it/s] 164it [00:36, 4.50it/s] 165it [00:36, 4.52it/s] 166it [00:37, 4.52it/s] 167it [00:37, 4.51it/s] 168it [00:37, 4.53it/s] 169it [00:37, 4.41it/s] 170it [00:37, 4.46it/s] 171it [00:38, 4.49it/s] 172it [00:38, 4.50it/s] 173it [00:38, 4.50it/s] 174it [00:38, 4.51it/s] 175it [00:39, 4.52it/s] 176it [00:39, 4.53it/s] 177it [00:39, 4.55it/s] 178it [00:39, 4.40it/s] 179it [00:39, 4.47it/s] 180it [00:40, 4.45it/s] 181it [00:40, 4.48it/s] 182it [00:40, 4.48it/s] 183it [00:40, 4.40it/s] 184it [00:41, 4.45it/s] 185it [00:41, 4.48it/s] 186it [00:41, 4.51it/s] 187it [00:41, 4.54it/s] 188it [00:42, 4.41it/s] 189it [00:42, 4.46it/s] 190it [00:42, 4.50it/s] 191it [00:42, 4.52it/s] 192it [00:42, 4.54it/s] 193it [00:43, 4.55it/s] 194it [00:43, 4.54it/s] 195it [00:43, 4.28it/s] 196it [00:43, 4.36it/s] 196it [00:43, 4.47it/s] +2025-05-26 02:24:16,855 - INFO - Epoch: 49, Objective: tensor([1426.3483], device='cuda:0', grad_fn=), Loss: 0.002869151998311281, KL/n: 24.51639175415039 + 0it [00:00, ?it/s]2025-05-26 02:24:17,419 - INFO - [Epoch 050 | Batch 0000] IWAE-loss 1417.0724 | mean log_px -0.0090 | KL -1203.12 + 1it [00:00, 3.30it/s] 2it [00:00, 3.90it/s] 3it [00:00, 4.18it/s] 4it [00:00, 4.34it/s] 5it [00:01, 4.38it/s] 6it [00:01, 4.39it/s] 7it [00:01, 4.46it/s] 8it [00:01, 4.49it/s] 9it [00:02, 4.51it/s] 10it [00:02, 4.53it/s] 11it [00:02, 4.38it/s] 12it [00:02, 4.43it/s] 13it [00:02, 4.50it/s] 14it [00:03, 4.52it/s] 15it [00:03, 4.55it/s] 16it [00:03, 4.49it/s] 17it [00:03, 4.47it/s] 18it [00:04, 4.36it/s] 19it [00:04, 4.40it/s] 20it [00:04, 4.42it/s] 21it [00:04, 4.45it/s] 22it [00:04, 4.48it/s] 23it [00:05, 4.49it/s] 24it [00:05, 4.50it/s] 25it [00:05, 4.54it/s] 26it [00:05, 4.52it/s] 27it [00:06, 4.38it/s] 28it [00:06, 4.34it/s] 29it [00:06, 4.40it/s] 30it [00:06, 4.46it/s] 31it [00:07, 4.47it/s] 32it [00:07, 4.51it/s] 33it [00:07, 4.53it/s] 34it [00:07, 4.40it/s] 35it [00:07, 4.44it/s] 36it [00:08, 4.49it/s] 37it [00:08, 4.53it/s] 38it [00:08, 4.54it/s] 39it [00:08, 4.55it/s] 40it [00:08, 4.56it/s] 41it [00:09, 4.58it/s] 42it [00:09, 4.57it/s] 43it [00:09, 4.57it/s] 44it [00:09, 4.53it/s] 45it [00:10, 4.55it/s] 46it [00:10, 4.56it/s] 47it [00:10, 4.55it/s] 48it [00:10, 4.38it/s] 49it [00:11, 4.44it/s] 50it [00:11, 4.48it/s]2025-05-26 02:24:28,556 - INFO - [Epoch 050 | Batch 0050] IWAE-loss 1422.3885 | mean log_px -0.0056 | KL -1198.54 + 51it [00:11, 4.51it/s] 52it [00:11, 4.50it/s] 53it [00:11, 4.54it/s] 54it [00:12, 4.36it/s] 55it [00:12, 4.40it/s] 56it [00:12, 4.45it/s] 57it [00:12, 4.49it/s] 58it [00:13, 4.50it/s] 59it [00:13, 4.53it/s] 60it [00:13, 4.55it/s] 61it [00:13, 4.55it/s] 62it [00:13, 4.55it/s] 63it [00:14, 4.58it/s] 64it [00:14, 4.46it/s] 65it [00:14, 4.51it/s] 66it [00:14, 4.54it/s] 67it [00:14, 4.54it/s] 68it [00:15, 4.55it/s] 69it [00:15, 4.56it/s] 70it [00:15, 4.57it/s] 71it [00:15, 4.44it/s] 72it [00:16, 4.49it/s] 73it [00:16, 4.52it/s] 74it [00:16, 4.41it/s] 75it [00:16, 4.47it/s] 76it [00:16, 4.50it/s] 77it [00:17, 4.54it/s] 78it [00:17, 4.54it/s] 79it [00:17, 4.52it/s] 80it [00:17, 4.52it/s] 81it [00:18, 4.54it/s] 82it [00:18, 4.55it/s] 83it [00:18, 4.37it/s] 84it [00:18, 4.40it/s] 85it [00:19, 4.42it/s] 86it [00:19, 4.47it/s] 87it [00:19, 4.50it/s] 88it [00:19, 4.53it/s] 89it [00:19, 4.55it/s] 90it [00:20, 4.55it/s] 91it [00:20, 4.45it/s] 92it [00:20, 4.50it/s] 93it [00:20, 4.53it/s] 94it [00:20, 4.54it/s] 95it [00:21, 4.50it/s] 96it [00:21, 4.52it/s] 97it [00:21, 4.40it/s] 98it [00:21, 4.46it/s] 99it [00:22, 4.49it/s] 100it [00:22, 4.51it/s]2025-05-26 02:24:39,665 - INFO - [Epoch 050 | Batch 0100] IWAE-loss 1353.2869 | mean log_px -0.0037 | KL -1194.16 + 101it [00:22, 4.54it/s] 102it [00:22, 4.54it/s] 103it [00:22, 4.56it/s] 104it [00:23, 4.53it/s] 105it [00:23, 4.54it/s] 106it [00:23, 4.53it/s] 107it [00:23, 4.56it/s] 108it [00:24, 4.56it/s] 109it [00:24, 4.57it/s] 110it [00:24, 4.44it/s] 111it [00:24, 4.49it/s] 112it [00:24, 4.50it/s] 113it [00:25, 4.53it/s] 114it [00:25, 4.53it/s] 115it [00:25, 4.54it/s] 116it [00:25, 4.54it/s] 117it [00:26, 4.55it/s] 118it [00:26, 4.43it/s] 119it [00:26, 4.43it/s] 120it [00:26, 4.48it/s] 121it [00:26, 4.52it/s] 122it [00:27, 4.52it/s] 123it [00:27, 4.54it/s] 124it [00:27, 4.52it/s] 125it [00:27, 4.56it/s] 126it [00:28, 4.32it/s] 127it [00:28, 4.42it/s] 128it [00:28, 4.47it/s] 129it [00:28, 4.51it/s] 130it [00:28, 4.49it/s] 131it [00:29, 4.51it/s] 132it [00:29, 4.54it/s] 133it [00:29, 4.56it/s] 134it [00:29, 4.41it/s] 135it [00:30, 4.48it/s] 136it [00:30, 4.43it/s] 137it [00:30, 4.35it/s] 138it [00:30, 4.42it/s] 139it [00:31, 4.42it/s] 140it [00:31, 4.44it/s] 141it [00:31, 4.44it/s] 142it [00:31, 4.49it/s] 143it [00:31, 4.53it/s] 144it [00:32, 4.54it/s] 145it [00:32, 4.42it/s] 146it [00:32, 4.46it/s] 147it [00:32, 4.50it/s] 148it [00:33, 4.52it/s] 149it [00:33, 4.49it/s] 150it [00:33, 4.51it/s]2025-05-26 02:24:50,790 - INFO - [Epoch 050 | Batch 0150] IWAE-loss 1559.9613 | mean log_px -0.0173 | KL -1188.04 + 151it [00:33, 4.56it/s] 152it [00:33, 4.56it/s] 153it [00:34, 4.57it/s] 154it [00:34, 4.57it/s] 155it [00:34, 4.45it/s] 156it [00:34, 4.48it/s] 157it [00:35, 4.43it/s] 158it [00:35, 4.45it/s] 159it [00:35, 4.49it/s] 160it [00:35, 4.52it/s] 161it [00:35, 4.53it/s] 162it [00:36, 4.46it/s] 163it [00:36, 4.38it/s] 164it [00:36, 4.43it/s] 165it [00:36, 4.46it/s] 166it [00:37, 4.44it/s] 167it [00:37, 4.49it/s] 168it [00:37, 4.48it/s] 169it [00:37, 4.52it/s] 170it [00:37, 4.39it/s] 171it [00:38, 4.45it/s] 172it [00:38, 4.46it/s] 173it [00:38, 4.50it/s] 174it [00:38, 4.50it/s] 175it [00:39, 4.53it/s] 176it [00:39, 4.54it/s] 177it [00:39, 4.56it/s] 178it [00:39, 4.42it/s] 179it [00:39, 4.48it/s] 180it [00:40, 4.42it/s] 181it [00:40, 4.48it/s] 182it [00:40, 4.50it/s] 183it [00:40, 4.53it/s] 184it [00:41, 4.54it/s] 185it [00:41, 4.49it/s] 186it [00:41, 4.39it/s] 187it [00:41, 4.45it/s] 188it [00:41, 4.43it/s] 189it [00:42, 4.48it/s] 190it [00:42, 4.51it/s] 191it [00:42, 4.53it/s] 192it [00:42, 4.54it/s] 193it [00:43, 4.55it/s] 194it [00:43, 4.56it/s] 195it [00:43, 4.42it/s] 196it [00:43, 4.35it/s] 196it [00:43, 4.48it/s] +2025-05-26 02:25:00,966 - INFO - Epoch: 50, Objective: tensor([1407.9646], device='cuda:0', grad_fn=), Loss: 0.00830838456749916, KL/n: 24.236207962036133 + 0it [00:00, ?it/s]2025-05-26 02:25:01,374 - INFO - [Epoch 051 | Batch 0000] IWAE-loss 1334.0294 | mean log_px -0.0045 | KL -1185.92 + 1it [00:00, 2.98it/s] 2it [00:00, 3.67it/s] 3it [00:00, 4.04it/s] 4it [00:01, 4.06it/s] 5it [00:01, 4.18it/s] 6it [00:01, 4.33it/s] 7it [00:01, 4.33it/s] 8it [00:01, 4.30it/s] 9it [00:02, 4.41it/s] 10it [00:02, 4.23it/s] 11it [00:02, 4.22it/s] 12it [00:02, 4.23it/s] 13it [00:03, 4.26it/s] 14it [00:03, 4.17it/s] 15it [00:03, 4.26it/s] 16it [00:03, 4.28it/s] 17it [00:04, 4.26it/s] 18it [00:04, 4.26it/s] 19it [00:04, 4.15it/s] 20it [00:04, 4.18it/s] 21it [00:05, 4.23it/s] 22it [00:05, 4.36it/s] 23it [00:05, 4.46it/s] 24it [00:05, 4.50it/s] 25it [00:06, 3.46it/s] 26it [00:06, 3.67it/s] 27it [00:06, 3.84it/s] 28it [00:06, 3.96it/s] 29it [00:07, 4.13it/s] 30it [00:07, 4.02it/s] 31it [00:07, 4.21it/s] 32it [00:07, 4.20it/s] 33it [00:07, 4.22it/s] 34it [00:08, 4.23it/s] 35it [00:08, 4.13it/s] 36it [00:08, 4.20it/s] 37it [00:08, 4.27it/s] 38it [00:09, 4.32it/s] 39it [00:09, 4.39it/s] 40it [00:09, 4.41it/s] 41it [00:09, 4.50it/s] 42it [00:09, 4.56it/s] 43it [00:10, 4.36it/s] 44it [00:10, 4.32it/s] 45it [00:10, 4.27it/s] 46it [00:10, 4.24it/s] 47it [00:11, 4.24it/s] 48it [00:11, 4.21it/s] 49it [00:11, 4.34it/s] 50it [00:11, 4.39it/s]2025-05-26 02:25:13,155 - INFO - [Epoch 051 | Batch 0050] IWAE-loss 1236.7412 | mean log_px -0.0013 | KL -1183.91 + 51it [00:12, 4.39it/s] 52it [00:12, 4.47it/s] 53it [00:12, 4.24it/s] 54it [00:12, 4.23it/s] 55it [00:13, 4.22it/s] 56it [00:13, 4.27it/s] 57it [00:13, 4.34it/s] 58it [00:13, 4.30it/s] 59it [00:13, 4.34it/s] 60it [00:14, 4.19it/s] 61it [00:14, 4.35it/s] 62it [00:14, 4.41it/s] 63it [00:14, 4.37it/s] 64it [00:15, 4.36it/s] 65it [00:15, 4.39it/s] 66it [00:15, 4.09it/s] 67it [00:15, 4.18it/s] 68it [00:16, 4.19it/s] 69it [00:16, 4.24it/s] 70it [00:16, 4.24it/s] 71it [00:16, 4.31it/s] 72it [00:17, 4.31it/s] 73it [00:17, 4.40it/s] 74it [00:17, 4.46it/s] 75it [00:17, 4.47it/s] 76it [00:17, 4.47it/s] 77it [00:18, 4.47it/s] 78it [00:18, 4.48it/s] 79it [00:18, 4.34it/s] 80it [00:18, 4.35it/s] 81it [00:19, 4.33it/s] 82it [00:19, 4.37it/s] 83it [00:19, 4.47it/s] 84it [00:19, 4.39it/s] 85it [00:19, 4.37it/s] 86it [00:20, 4.36it/s] 87it [00:20, 4.31it/s] 88it [00:20, 4.15it/s] 89it [00:20, 4.26it/s] 90it [00:21, 4.23it/s] 91it [00:21, 4.30it/s] 92it [00:21, 4.31it/s] 93it [00:21, 4.41it/s] 94it [00:22, 4.49it/s] 95it [00:22, 4.29it/s] 96it [00:22, 4.24it/s] 97it [00:22, 4.23it/s] 98it [00:23, 4.24it/s] 99it [00:23, 4.26it/s] 100it [00:23, 4.28it/s]2025-05-26 02:25:24,742 - INFO - [Epoch 051 | Batch 0100] IWAE-loss 1498.0203 | mean log_px -0.0071 | KL -1184.13 + 101it [00:23, 4.28it/s] 102it [00:23, 4.29it/s] 103it [00:24, 4.11it/s] 104it [00:24, 4.14it/s] 105it [00:24, 4.26it/s] 106it [00:24, 4.36it/s] 107it [00:25, 4.37it/s] 108it [00:25, 4.43it/s] 109it [00:25, 4.35it/s] 110it [00:25, 4.14it/s] 111it [00:26, 4.21it/s] 112it [00:26, 4.35it/s] 113it [00:26, 4.43it/s] 114it [00:26, 4.36it/s] 115it [00:26, 4.30it/s] 116it [00:27, 4.28it/s] 117it [00:27, 4.33it/s] 118it [00:27, 4.42it/s] 119it [00:27, 4.35it/s] 120it [00:28, 4.45it/s] 121it [00:28, 4.50it/s] 122it [00:28, 4.39it/s] 123it [00:28, 4.32it/s] 124it [00:29, 4.28it/s] 125it [00:29, 4.20it/s] 126it [00:29, 4.21it/s] 127it [00:29, 4.30it/s] 128it [00:29, 4.30it/s] 129it [00:30, 4.33it/s] 130it [00:30, 4.31it/s] 131it [00:30, 4.20it/s] 132it [00:30, 4.22it/s] 133it [00:31, 4.21it/s] 134it [00:31, 4.29it/s] 135it [00:31, 4.32it/s] 136it [00:31, 4.31it/s] 137it [00:32, 4.34it/s] 138it [00:32, 4.38it/s] 139it [00:32, 4.22it/s] 140it [00:32, 4.26it/s] 141it [00:33, 4.28it/s] 142it [00:33, 4.28it/s] 143it [00:33, 4.41it/s] 144it [00:33, 4.29it/s] 145it [00:33, 4.39it/s] 146it [00:34, 4.39it/s] 147it [00:34, 4.34it/s] 148it [00:34, 4.33it/s] 149it [00:34, 4.30it/s] 150it [00:35, 4.27it/s]2025-05-26 02:25:36,355 - INFO - [Epoch 051 | Batch 0150] IWAE-loss 1679.6946 | mean log_px -0.0117 | KL -1184.98 + 151it [00:35, 4.29it/s] 152it [00:35, 4.25it/s] 153it [00:35, 4.22it/s] 154it [00:36, 4.33it/s] 155it [00:36, 4.42it/s] 156it [00:36, 4.21it/s] 157it [00:36, 4.24it/s] 158it [00:36, 4.29it/s] 159it [00:37, 4.26it/s] 160it [00:37, 4.27it/s] 161it [00:37, 4.21it/s] 162it [00:37, 4.23it/s] 163it [00:38, 4.35it/s] 164it [00:38, 4.33it/s] 165it [00:38, 4.30it/s] 166it [00:38, 4.27it/s] 167it [00:39, 4.39it/s] 168it [00:39, 4.41it/s] 169it [00:39, 4.49it/s] 170it [00:39, 4.45it/s] 171it [00:39, 4.46it/s] 172it [00:40, 4.43it/s] 173it [00:40, 4.43it/s] 174it [00:40, 4.51it/s] 175it [00:40, 4.57it/s] 176it [00:41, 4.54it/s] 177it [00:41, 4.59it/s] 178it [00:41, 4.58it/s] 179it [00:41, 4.48it/s] 180it [00:41, 4.40it/s] 181it [00:42, 4.46it/s] 182it [00:42, 4.54it/s] 183it [00:42, 4.42it/s] 184it [00:42, 4.49it/s] 185it [00:43, 4.54it/s] 186it [00:43, 4.57it/s] 187it [00:43, 4.55it/s] 188it [00:43, 4.51it/s] 189it [00:43, 4.45it/s] 190it [00:44, 4.35it/s] 191it [00:44, 4.42it/s] 192it [00:44, 4.45it/s] 193it [00:44, 4.50it/s] 194it [00:45, 4.33it/s] 195it [00:45, 4.33it/s] 196it [00:45, 4.42it/s] 196it [00:45, 4.30it/s] +2025-05-26 02:25:46,689 - INFO - Epoch: 51, Objective: tensor([1720.4115], device='cuda:0', grad_fn=), Loss: 0.011251946911215782, KL/n: 24.17317771911621 + 0it [00:00, ?it/s]2025-05-26 02:25:47,061 - INFO - [Epoch 052 | Batch 0000] IWAE-loss 1308.6581 | mean log_px -0.0024 | KL -1183.32 + 1it [00:00, 3.37it/s] 2it [00:00, 4.06it/s] 3it [00:00, 4.35it/s] 4it [00:00, 4.32it/s] 5it [00:01, 4.26it/s] 6it [00:01, 4.38it/s] 7it [00:01, 4.48it/s] 8it [00:01, 4.53it/s] 9it [00:02, 4.58it/s] 10it [00:02, 4.59it/s] 11it [00:02, 4.64it/s] 12it [00:02, 4.62it/s] 13it [00:02, 4.67it/s] 14it [00:03, 4.68it/s] 15it [00:03, 4.70it/s] 16it [00:03, 4.54it/s] 17it [00:03, 4.62it/s] 18it [00:03, 4.65it/s] 19it [00:04, 4.66it/s] 20it [00:04, 4.69it/s] 21it [00:04, 4.70it/s] 22it [00:04, 4.70it/s] 23it [00:05, 4.54it/s] 24it [00:05, 4.60it/s] 25it [00:05, 4.64it/s] 26it [00:05, 4.65it/s] 27it [00:05, 4.67it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.68it/s] 30it [00:06, 4.68it/s] 31it [00:06, 4.69it/s] 32it [00:06, 4.70it/s] 33it [00:07, 4.70it/s] 34it [00:07, 4.70it/s] 35it [00:07, 4.71it/s] 36it [00:07, 4.71it/s] 37it [00:08, 4.72it/s] 38it [00:08, 4.71it/s] 39it [00:08, 4.71it/s] 40it [00:08, 4.54it/s] 41it [00:08, 4.60it/s] 42it [00:09, 4.63it/s] 43it [00:09, 4.66it/s] 44it [00:09, 4.68it/s] 45it [00:09, 4.70it/s] 46it [00:09, 4.69it/s] 47it [00:10, 4.70it/s] 48it [00:10, 4.54it/s] 49it [00:10, 4.61it/s] 50it [00:10, 4.63it/s]2025-05-26 02:25:57,828 - INFO - [Epoch 052 | Batch 0050] IWAE-loss 1253.5378 | mean log_px -0.0022 | KL -1182.44 + 51it [00:11, 4.65it/s] 52it [00:11, 4.66it/s] 53it [00:11, 4.68it/s] 54it [00:11, 4.67it/s] 55it [00:11, 4.69it/s] 56it [00:12, 4.69it/s] 57it [00:12, 4.70it/s] 58it [00:12, 4.53it/s] 59it [00:12, 4.54it/s] 60it [00:13, 4.58it/s] 61it [00:13, 4.62it/s] 62it [00:13, 4.64it/s] 63it [00:13, 4.66it/s] 64it [00:13, 4.67it/s] 65it [00:14, 4.63it/s] 66it [00:14, 4.65it/s] 67it [00:14, 4.68it/s] 68it [00:14, 4.67it/s] 69it [00:14, 4.68it/s] 70it [00:15, 4.67it/s] 71it [00:15, 4.68it/s] 72it [00:15, 4.68it/s] 73it [00:15, 4.69it/s] 74it [00:16, 4.68it/s] 75it [00:16, 4.69it/s] 76it [00:16, 4.67it/s] 77it [00:16, 4.68it/s] 78it [00:16, 4.64it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.68it/s] 81it [00:17, 4.59it/s] 82it [00:17, 4.62it/s] 83it [00:17, 4.64it/s] 84it [00:18, 4.65it/s] 85it [00:18, 4.50it/s] 86it [00:18, 4.55it/s] 87it [00:18, 4.61it/s] 88it [00:19, 4.63it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.66it/s] 91it [00:19, 4.68it/s] 92it [00:19, 4.68it/s] 93it [00:20, 4.71it/s] 94it [00:20, 4.54it/s] 95it [00:20, 4.61it/s] 96it [00:20, 4.62it/s] 97it [00:20, 4.64it/s] 98it [00:21, 4.65it/s] 99it [00:21, 4.67it/s] 100it [00:21, 4.68it/s]2025-05-26 02:26:08,585 - INFO - [Epoch 052 | Batch 0100] IWAE-loss 1299.2296 | mean log_px -0.0027 | KL -1181.27 + 101it [00:21, 4.52it/s] 102it [00:22, 4.59it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.64it/s] 105it [00:22, 4.67it/s] 106it [00:22, 4.67it/s] 107it [00:23, 4.69it/s] 108it [00:23, 4.68it/s] 109it [00:23, 4.70it/s] 110it [00:23, 4.69it/s] 111it [00:23, 4.71it/s] 112it [00:24, 4.72it/s] 113it [00:24, 4.72it/s] 114it [00:24, 4.71it/s] 115it [00:24, 4.71it/s] 116it [00:25, 4.72it/s] 117it [00:25, 4.68it/s] 118it [00:25, 4.49it/s] 119it [00:25, 4.58it/s] 120it [00:25, 4.62it/s] 121it [00:26, 4.65it/s] 122it [00:26, 4.66it/s] 123it [00:26, 4.68it/s] 124it [00:26, 4.69it/s] 125it [00:26, 4.70it/s] 126it [00:27, 4.69it/s] 127it [00:27, 4.71it/s] 128it [00:27, 4.54it/s] 129it [00:27, 4.60it/s] 130it [00:28, 4.63it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.67it/s] 133it [00:28, 4.68it/s] 134it [00:28, 4.67it/s] 135it [00:29, 4.52it/s] 136it [00:29, 4.60it/s] 137it [00:29, 4.62it/s] 138it [00:29, 4.65it/s] 139it [00:29, 4.65it/s] 140it [00:30, 4.66it/s] 141it [00:30, 4.67it/s] 142it [00:30, 4.66it/s] 143it [00:30, 4.70it/s] 144it [00:31, 4.53it/s] 145it [00:31, 4.59it/s] 146it [00:31, 4.62it/s] 147it [00:31, 4.65it/s] 148it [00:31, 4.67it/s] 149it [00:32, 4.69it/s] 150it [00:32, 4.65it/s]2025-05-26 02:26:19,354 - INFO - [Epoch 052 | Batch 0150] IWAE-loss 1224.5007 | mean log_px -0.0009 | KL -1180.44 + 151it [00:32, 4.39it/s] 152it [00:32, 4.48it/s] 153it [00:33, 4.56it/s] 154it [00:33, 4.60it/s] 155it [00:33, 4.63it/s] 156it [00:33, 4.65it/s] 157it [00:33, 4.68it/s] 158it [00:34, 4.65it/s] 159it [00:34, 4.66it/s] 160it [00:34, 4.67it/s] 161it [00:34, 4.70it/s] 162it [00:34, 4.70it/s] 163it [00:35, 4.54it/s] 164it [00:35, 4.59it/s] 165it [00:35, 4.64it/s] 166it [00:35, 4.65it/s] 167it [00:36, 4.67it/s] 168it [00:36, 4.68it/s] 169it [00:36, 4.68it/s] 170it [00:36, 4.52it/s] 171it [00:36, 4.60it/s] 172it [00:37, 4.63it/s] 173it [00:37, 4.65it/s] 174it [00:37, 4.67it/s] 175it [00:37, 4.68it/s] 176it [00:37, 4.65it/s] 177it [00:38, 4.69it/s] 178it [00:38, 4.69it/s] 179it [00:38, 4.70it/s] 180it [00:38, 4.70it/s] 181it [00:39, 4.72it/s] 182it [00:39, 4.72it/s] 183it [00:39, 4.69it/s] 184it [00:39, 4.71it/s] 185it [00:39, 4.55it/s] 186it [00:40, 4.61it/s] 187it [00:40, 4.64it/s] 188it [00:40, 4.66it/s] 189it [00:40, 4.68it/s] 190it [00:40, 4.56it/s] 191it [00:41, 4.62it/s] 192it [00:41, 4.63it/s] 193it [00:41, 4.67it/s] 194it [00:41, 4.68it/s] 195it [00:42, 4.59it/s] 196it [00:42, 4.64it/s] 196it [00:42, 4.63it/s] +2025-05-26 02:26:29,172 - INFO - Epoch: 52, Objective: tensor([1489.6241], device='cuda:0', grad_fn=), Loss: 0.0029403548687696457, KL/n: 23.974336624145508 + 0it [00:00, ?it/s]2025-05-26 02:26:29,733 - INFO - [Epoch 053 | Batch 0000] IWAE-loss 1426.3737 | mean log_px -0.0070 | KL -1176.55 + 1it [00:00, 3.06it/s] 2it [00:00, 3.87it/s] 3it [00:00, 4.23it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.52it/s] 6it [00:01, 4.58it/s] 7it [00:01, 4.63it/s] 8it [00:01, 4.66it/s] 9it [00:02, 4.68it/s] 10it [00:02, 4.69it/s] 11it [00:02, 4.71it/s] 12it [00:02, 4.70it/s] 13it [00:02, 4.72it/s] 14it [00:03, 4.71it/s] 15it [00:03, 4.70it/s] 16it [00:03, 4.72it/s] 17it [00:03, 4.72it/s] 18it [00:03, 4.71it/s] 19it [00:04, 4.71it/s] 20it [00:04, 4.50it/s] 21it [00:04, 4.53it/s] 22it [00:04, 4.57it/s] 23it [00:05, 4.48it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.56it/s] 26it [00:05, 4.60it/s] 27it [00:05, 4.59it/s] 28it [00:06, 4.61it/s] 29it [00:06, 4.48it/s] 30it [00:06, 4.56it/s] 31it [00:06, 4.60it/s] 32it [00:07, 4.64it/s] 33it [00:07, 4.66it/s] 34it [00:07, 4.47it/s] 35it [00:07, 4.55it/s] 36it [00:07, 4.59it/s] 37it [00:08, 4.63it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.68it/s] 41it [00:08, 4.49it/s] 42it [00:09, 4.57it/s] 43it [00:09, 4.60it/s] 44it [00:09, 4.63it/s] 45it [00:09, 4.62it/s] 46it [00:10, 4.62it/s] 47it [00:10, 4.67it/s] 48it [00:10, 4.67it/s] 49it [00:10, 4.69it/s] 50it [00:10, 4.70it/s]2025-05-26 02:26:40,537 - INFO - [Epoch 053 | Batch 0050] IWAE-loss 1257.6678 | mean log_px -0.0016 | KL -1169.34 + 51it [00:11, 4.53it/s] 52it [00:11, 4.58it/s] 53it [00:11, 4.63it/s] 54it [00:11, 4.63it/s] 55it [00:11, 4.68it/s] 56it [00:12, 4.70it/s] 57it [00:12, 4.70it/s] 58it [00:12, 4.53it/s] 59it [00:12, 4.60it/s] 60it [00:13, 4.63it/s] 61it [00:13, 4.64it/s] 62it [00:13, 4.65it/s] 63it [00:13, 4.69it/s] 64it [00:13, 4.69it/s] 65it [00:14, 4.69it/s] 66it [00:14, 4.70it/s] 67it [00:14, 4.70it/s] 68it [00:14, 4.71it/s] 69it [00:14, 4.71it/s] 70it [00:15, 4.69it/s] 71it [00:15, 4.72it/s] 72it [00:15, 4.71it/s] 73it [00:15, 4.72it/s] 74it [00:16, 4.72it/s] 75it [00:16, 4.72it/s] 76it [00:16, 4.71it/s] 77it [00:16, 4.71it/s] 78it [00:16, 4.73it/s] 79it [00:17, 4.73it/s] 80it [00:17, 4.70it/s] 81it [00:17, 4.70it/s] 82it [00:17, 4.70it/s] 83it [00:17, 4.71it/s] 84it [00:18, 4.71it/s] 85it [00:18, 4.72it/s] 86it [00:18, 4.72it/s] 87it [00:18, 4.72it/s] 88it [00:19, 4.72it/s] 89it [00:19, 4.73it/s] 90it [00:19, 4.72it/s] 91it [00:19, 4.72it/s] 92it [00:19, 4.71it/s] 93it [00:20, 4.68it/s] 94it [00:20, 4.69it/s] 95it [00:20, 4.70it/s] 96it [00:20, 4.70it/s] 97it [00:20, 4.71it/s] 98it [00:21, 4.68it/s] 99it [00:21, 4.63it/s] 100it [00:21, 4.64it/s]2025-05-26 02:26:51,217 - INFO - [Epoch 053 | Batch 0100] IWAE-loss 1240.2892 | mean log_px -0.0014 | KL -1168.91 + 101it [00:21, 4.49it/s] 102it [00:22, 4.56it/s] 103it [00:22, 4.59it/s] 104it [00:22, 4.62it/s] 105it [00:22, 4.64it/s] 106it [00:22, 4.49it/s] 107it [00:23, 4.57it/s] 108it [00:23, 4.59it/s] 109it [00:23, 4.63it/s] 110it [00:23, 4.66it/s] 111it [00:23, 4.67it/s] 112it [00:24, 4.55it/s] 113it [00:24, 4.61it/s] 114it [00:24, 4.63it/s] 115it [00:24, 4.52it/s] 116it [00:25, 4.59it/s] 117it [00:25, 4.63it/s] 118it [00:25, 4.65it/s] 119it [00:25, 4.68it/s] 120it [00:25, 4.68it/s] 121it [00:26, 4.70it/s] 122it [00:26, 4.70it/s] 123it [00:26, 4.70it/s] 124it [00:26, 4.70it/s] 125it [00:26, 4.71it/s] 126it [00:27, 4.71it/s] 127it [00:27, 4.71it/s] 128it [00:27, 4.72it/s] 129it [00:27, 4.55it/s] 130it [00:28, 4.60it/s] 131it [00:28, 4.65it/s] 132it [00:28, 4.66it/s] 133it [00:28, 4.64it/s] 134it [00:28, 4.66it/s] 135it [00:29, 4.68it/s] 136it [00:29, 4.68it/s] 137it [00:29, 4.53it/s] 138it [00:29, 4.59it/s] 139it [00:29, 4.63it/s] 140it [00:30, 4.65it/s] 141it [00:30, 4.67it/s] 142it [00:30, 4.68it/s] 143it [00:30, 4.69it/s] 144it [00:31, 4.70it/s] 145it [00:31, 4.70it/s] 146it [00:31, 4.70it/s] 147it [00:31, 4.53it/s] 148it [00:31, 4.59it/s] 149it [00:32, 4.63it/s] 150it [00:32, 4.65it/s]2025-05-26 02:27:02,007 - INFO - [Epoch 053 | Batch 0150] IWAE-loss 1517.0568 | mean log_px -0.0129 | KL -1162.64 + 151it [00:32, 4.65it/s] 152it [00:32, 4.67it/s] 153it [00:32, 4.68it/s] 154it [00:33, 4.52it/s] 155it [00:33, 4.59it/s] 156it [00:33, 4.62it/s] 157it [00:33, 4.65it/s] 158it [00:34, 4.66it/s] 159it [00:34, 4.67it/s] 160it [00:34, 4.68it/s] 161it [00:34, 4.70it/s] 162it [00:34, 4.70it/s] 163it [00:35, 4.70it/s] 164it [00:35, 4.70it/s] 165it [00:35, 4.71it/s] 166it [00:35, 4.71it/s] 167it [00:35, 4.72it/s] 168it [00:36, 4.71it/s] 169it [00:36, 4.72it/s] 170it [00:36, 4.72it/s] 171it [00:36, 4.71it/s] 172it [00:37, 4.71it/s] 173it [00:37, 4.72it/s] 174it [00:37, 4.71it/s] 175it [00:37, 4.71it/s] 176it [00:37, 4.72it/s] 177it [00:38, 4.72it/s] 178it [00:38, 4.71it/s] 179it [00:38, 4.72it/s] 180it [00:38, 4.71it/s] 181it [00:38, 4.70it/s] 182it [00:39, 4.54it/s] 183it [00:39, 4.56it/s] 184it [00:39, 4.62it/s] 185it [00:39, 4.66it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.65it/s] 188it [00:40, 4.66it/s] 189it [00:40, 4.68it/s] 190it [00:40, 4.64it/s] 191it [00:41, 4.51it/s] 192it [00:41, 4.58it/s] 193it [00:41, 4.63it/s] 194it [00:41, 4.65it/s] 195it [00:42, 4.58it/s] 196it [00:42, 4.64it/s] 196it [00:42, 4.63it/s] +2025-05-26 02:27:11,783 - INFO - Epoch: 53, Objective: tensor([1300.9849], device='cuda:0', grad_fn=), Loss: 0.0023734073620289564, KL/n: 23.757631301879883 + 0it [00:00, ?it/s]2025-05-26 02:27:12,158 - INFO - [Epoch 054 | Batch 0000] IWAE-loss 1428.1246 | mean log_px -0.0070 | KL -1163.56 + 1it [00:00, 3.09it/s] 2it [00:00, 3.89it/s] 3it [00:00, 4.23it/s] 4it [00:00, 4.41it/s] 5it [00:01, 4.52it/s] 6it [00:01, 4.58it/s] 7it [00:01, 4.60it/s] 8it [00:01, 4.63it/s] 9it [00:02, 4.65it/s] 10it [00:02, 4.66it/s] 11it [00:02, 4.59it/s] 12it [00:02, 3.63it/s] 13it [00:03, 3.89it/s] 14it [00:03, 4.07it/s] 15it [00:03, 4.23it/s] 16it [00:03, 4.33it/s] 17it [00:03, 4.19it/s] 18it [00:04, 4.27it/s] 19it [00:04, 4.35it/s] 20it [00:04, 4.44it/s] 21it [00:04, 4.52it/s] 22it [00:05, 4.57it/s] 23it [00:05, 4.62it/s] 24it [00:05, 4.65it/s] 25it [00:05, 4.68it/s] 26it [00:05, 4.52it/s] 27it [00:06, 4.59it/s] 28it [00:06, 4.62it/s] 29it [00:06, 4.66it/s] 30it [00:06, 4.67it/s] 31it [00:07, 4.69it/s] 32it [00:07, 4.70it/s] 33it [00:07, 4.71it/s] 34it [00:07, 4.49it/s] 35it [00:07, 4.56it/s] 36it [00:08, 4.61it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.66it/s] 39it [00:08, 4.68it/s] 40it [00:08, 4.68it/s] 41it [00:09, 4.50it/s] 42it [00:09, 4.57it/s] 43it [00:09, 4.62it/s] 44it [00:09, 4.64it/s] 45it [00:10, 4.65it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.62it/s] 48it [00:10, 4.62it/s] 49it [00:10, 4.66it/s] 50it [00:11, 4.67it/s]2025-05-26 02:27:23,194 - INFO - [Epoch 054 | Batch 0050] IWAE-loss 1222.4982 | mean log_px -0.0012 | KL -1156.77 + 51it [00:11, 4.53it/s] 52it [00:11, 4.58it/s] 53it [00:11, 4.57it/s] 54it [00:12, 4.45it/s] 55it [00:12, 4.52it/s] 56it [00:12, 4.58it/s] 57it [00:12, 4.62it/s] 58it [00:12, 4.63it/s] 59it [00:13, 4.65it/s] 60it [00:13, 4.67it/s] 61it [00:13, 4.66it/s] 62it [00:13, 4.52it/s] 63it [00:13, 4.59it/s] 64it [00:14, 4.62it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.67it/s] 67it [00:14, 4.66it/s] 68it [00:15, 4.67it/s] 69it [00:15, 4.68it/s] 70it [00:15, 4.68it/s] 71it [00:15, 4.70it/s] 72it [00:15, 4.54it/s] 73it [00:16, 4.61it/s] 74it [00:16, 4.64it/s] 75it [00:16, 4.67it/s] 76it [00:16, 4.67it/s] 77it [00:16, 4.69it/s] 78it [00:17, 4.68it/s] 79it [00:17, 4.70it/s] 80it [00:17, 4.70it/s] 81it [00:17, 4.54it/s] 82it [00:18, 4.59it/s] 83it [00:18, 4.63it/s] 84it [00:18, 4.64it/s] 85it [00:18, 4.68it/s] 86it [00:18, 4.66it/s] 87it [00:19, 4.52it/s] 88it [00:19, 4.58it/s] 89it [00:19, 4.62it/s] 90it [00:19, 4.63it/s] 91it [00:19, 4.65it/s] 92it [00:20, 4.67it/s] 93it [00:20, 4.68it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.57it/s] 96it [00:21, 4.63it/s] 97it [00:21, 4.65it/s] 98it [00:21, 4.67it/s] 99it [00:21, 4.51it/s] 100it [00:21, 4.57it/s]2025-05-26 02:27:34,022 - INFO - [Epoch 054 | Batch 0100] IWAE-loss 1336.7174 | mean log_px -0.0042 | KL -1150.52 + 101it [00:22, 4.61it/s] 102it [00:22, 4.64it/s] 103it [00:22, 4.65it/s] 104it [00:22, 4.68it/s] 105it [00:23, 4.68it/s] 106it [00:23, 4.69it/s] 107it [00:23, 4.70it/s] 108it [00:23, 4.69it/s] 109it [00:23, 4.53it/s] 110it [00:24, 4.59it/s] 111it [00:24, 4.63it/s] 112it [00:24, 4.66it/s] 113it [00:24, 4.68it/s] 114it [00:24, 4.68it/s] 115it [00:25, 4.69it/s] 116it [00:25, 4.70it/s] 117it [00:25, 4.62it/s] 118it [00:25, 4.66it/s] 119it [00:26, 4.68it/s] 120it [00:26, 4.69it/s] 121it [00:26, 4.57it/s] 122it [00:26, 4.59it/s] 123it [00:26, 4.60it/s] 124it [00:27, 4.59it/s] 125it [00:27, 4.61it/s] 126it [00:27, 4.61it/s] 127it [00:27, 4.60it/s] 128it [00:27, 4.59it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.60it/s] 131it [00:28, 4.48it/s] 132it [00:28, 4.52it/s] 133it [00:29, 4.53it/s] 134it [00:29, 4.56it/s] 135it [00:29, 4.58it/s] 136it [00:29, 4.60it/s] 137it [00:29, 4.45it/s] 138it [00:30, 4.54it/s] 139it [00:30, 4.59it/s] 140it [00:30, 4.59it/s] 141it [00:30, 4.61it/s] 142it [00:31, 4.48it/s] 143it [00:31, 4.56it/s] 144it [00:31, 4.60it/s] 145it [00:31, 4.64it/s] 146it [00:31, 4.62it/s] 147it [00:32, 4.64it/s] 148it [00:32, 4.50it/s] 149it [00:32, 4.58it/s] 150it [00:32, 4.60it/s]2025-05-26 02:27:44,872 - INFO - [Epoch 054 | Batch 0150] IWAE-loss 1233.8479 | mean log_px -0.0012 | KL -1151.34 + 151it [00:33, 4.47it/s] 152it [00:33, 4.55it/s] 153it [00:33, 4.58it/s] 154it [00:33, 4.62it/s] 155it [00:33, 4.65it/s] 156it [00:34, 4.66it/s] 157it [00:34, 4.69it/s] 158it [00:34, 4.53it/s] 159it [00:34, 4.59it/s] 160it [00:34, 4.62it/s] 161it [00:35, 4.65it/s] 162it [00:35, 4.67it/s] 163it [00:35, 4.69it/s] 164it [00:35, 4.69it/s] 165it [00:36, 4.71it/s] 166it [00:36, 4.71it/s] 167it [00:36, 4.55it/s] 168it [00:36, 4.60it/s] 169it [00:36, 4.64it/s] 170it [00:37, 4.66it/s] 171it [00:37, 4.68it/s] 172it [00:37, 4.53it/s] 173it [00:37, 4.60it/s] 174it [00:37, 4.61it/s] 175it [00:38, 4.65it/s] 176it [00:38, 4.66it/s] 177it [00:38, 4.68it/s] 178it [00:38, 4.52it/s] 179it [00:39, 4.58it/s] 180it [00:39, 4.62it/s] 181it [00:39, 4.65it/s] 182it [00:39, 4.67it/s] 183it [00:39, 4.52it/s] 184it [00:40, 4.59it/s] 185it [00:40, 4.62it/s] 186it [00:40, 4.65it/s] 187it [00:40, 4.67it/s] 188it [00:41, 4.52it/s] 189it [00:41, 4.60it/s] 190it [00:41, 4.58it/s] 191it [00:41, 4.55it/s] 192it [00:41, 4.59it/s] 193it [00:42, 4.62it/s] 194it [00:42, 4.48it/s] 195it [00:42, 4.45it/s] 196it [00:42, 4.52it/s] 196it [00:42, 4.57it/s] +2025-05-26 02:27:54,780 - INFO - Epoch: 54, Objective: tensor([1524.9691], device='cuda:0', grad_fn=), Loss: 0.006559988018125296, KL/n: 23.41026496887207 + 0it [00:00, ?it/s]2025-05-26 02:27:55,162 - INFO - [Epoch 055 | Batch 0000] IWAE-loss 1968.7968 | mean log_px -0.0207 | KL -1144.99 + 1it [00:00, 3.26it/s] 2it [00:00, 3.99it/s] 3it [00:00, 4.30it/s] 4it [00:00, 4.06it/s] 5it [00:01, 4.21it/s] 6it [00:01, 4.19it/s] 7it [00:01, 4.28it/s] 8it [00:01, 4.35it/s] 9it [00:02, 4.29it/s] 10it [00:02, 4.27it/s] 11it [00:02, 4.16it/s] 12it [00:02, 4.21it/s] 13it [00:03, 4.23it/s] 14it [00:03, 4.37it/s] 15it [00:03, 4.39it/s] 16it [00:03, 4.34it/s] 17it [00:04, 4.18it/s] 18it [00:04, 4.29it/s] 19it [00:04, 4.41it/s] 20it [00:04, 4.47it/s] 21it [00:04, 4.53it/s] 22it [00:05, 4.58it/s] 23it [00:05, 4.64it/s] 24it [00:05, 4.49it/s] 25it [00:05, 4.44it/s] 26it [00:06, 4.51it/s] 27it [00:06, 4.53it/s] 28it [00:06, 4.47it/s] 29it [00:06, 4.53it/s] 30it [00:06, 4.27it/s] 31it [00:07, 4.30it/s] 32it [00:07, 4.41it/s] 33it [00:07, 4.38it/s] 34it [00:07, 4.47it/s] 35it [00:08, 4.38it/s] 36it [00:08, 4.47it/s] 37it [00:08, 4.42it/s] 38it [00:08, 4.35it/s] 39it [00:08, 4.29it/s] 40it [00:09, 4.28it/s] 41it [00:09, 4.36it/s] 42it [00:09, 4.15it/s] 43it [00:09, 4.18it/s] 44it [00:10, 4.19it/s] 45it [00:10, 4.18it/s] 46it [00:10, 4.20it/s] 47it [00:10, 4.06it/s] 48it [00:11, 4.11it/s] 49it [00:11, 4.16it/s] 50it [00:11, 4.18it/s]2025-05-26 02:28:06,714 - INFO - [Epoch 055 | Batch 0050] IWAE-loss 1384.5171 | mean log_px -0.0034 | KL -1144.44 + 51it [00:11, 4.21it/s] 52it [00:12, 4.11it/s] 53it [00:12, 4.16it/s] 54it [00:12, 4.30it/s] 55it [00:12, 4.27it/s] 56it [00:13, 4.21it/s] 57it [00:13, 4.25it/s] 58it [00:13, 4.29it/s] 59it [00:13, 4.27it/s] 60it [00:13, 4.21it/s] 61it [00:14, 4.19it/s] 62it [00:14, 4.19it/s] 63it [00:14, 4.15it/s] 64it [00:14, 4.17it/s] 65it [00:15, 4.29it/s] 66it [00:15, 4.15it/s] 67it [00:15, 4.16it/s] 68it [00:15, 4.23it/s] 69it [00:16, 4.26it/s] 70it [00:16, 4.26it/s] 71it [00:16, 4.25it/s] 72it [00:16, 4.24it/s] 73it [00:17, 4.35it/s] 74it [00:17, 4.29it/s] 75it [00:17, 4.15it/s] 76it [00:17, 4.14it/s] 77it [00:18, 4.27it/s] 78it [00:18, 4.35it/s] 79it [00:18, 4.35it/s] 80it [00:18, 4.30it/s] 81it [00:18, 4.26it/s] 82it [00:19, 4.26it/s] 83it [00:19, 4.14it/s] 84it [00:19, 4.12it/s] 85it [00:19, 4.20it/s] 86it [00:20, 4.31it/s] 87it [00:20, 4.35it/s] 88it [00:20, 4.34it/s] 89it [00:20, 4.30it/s] 90it [00:21, 4.26it/s] 91it [00:21, 4.32it/s] 92it [00:21, 4.27it/s] 93it [00:21, 4.34it/s] 94it [00:21, 4.18it/s] 95it [00:22, 4.31it/s] 96it [00:22, 4.40it/s] 97it [00:22, 4.37it/s] 98it [00:22, 4.31it/s] 99it [00:23, 4.31it/s] 100it [00:23, 4.28it/s]2025-05-26 02:28:18,459 - INFO - [Epoch 055 | Batch 0100] IWAE-loss 1683.7357 | mean log_px -0.0097 | KL -1142.95 + 101it [00:23, 4.20it/s] 102it [00:23, 4.31it/s] 103it [00:24, 4.41it/s] 104it [00:24, 4.35it/s] 105it [00:24, 4.40it/s] 106it [00:24, 4.33it/s] 107it [00:24, 4.26it/s] 108it [00:25, 4.37it/s] 109it [00:25, 4.38it/s] 110it [00:25, 4.41it/s] 111it [00:25, 4.44it/s] 112it [00:26, 4.42it/s] 113it [00:26, 4.33it/s] 114it [00:26, 4.32it/s] 115it [00:26, 4.40it/s] 116it [00:27, 4.46it/s] 117it [00:27, 4.42it/s] 118it [00:27, 4.37it/s] 119it [00:27, 4.35it/s] 120it [00:27, 4.29it/s] 121it [00:28, 4.29it/s] 122it [00:28, 4.35it/s] 123it [00:28, 4.43it/s] 124it [00:28, 4.46it/s] 125it [00:29, 4.47it/s] 126it [00:29, 4.24it/s] 127it [00:29, 4.32it/s] 128it [00:29, 4.41it/s] 129it [00:29, 4.43it/s] 130it [00:30, 4.39it/s] 131it [00:30, 4.46it/s] 132it [00:30, 4.37it/s] 133it [00:30, 4.45it/s] 134it [00:31, 4.51it/s] 135it [00:31, 4.48it/s] 136it [00:31, 4.52it/s] 137it [00:31, 4.55it/s] 138it [00:32, 4.42it/s] 139it [00:32, 4.32it/s] 140it [00:32, 4.20it/s] 141it [00:32, 4.19it/s] 142it [00:32, 4.16it/s] 143it [00:33, 4.21it/s] 144it [00:33, 4.28it/s] 145it [00:33, 4.31it/s] 146it [00:33, 4.25it/s] 147it [00:34, 4.22it/s] 148it [00:34, 4.27it/s] 149it [00:34, 4.33it/s] 150it [00:34, 4.36it/s]2025-05-26 02:28:29,912 - INFO - [Epoch 055 | Batch 0150] IWAE-loss 1441.7352 | mean log_px -0.0088 | KL -1140.60 + 151it [00:35, 4.42it/s] 152it [00:35, 4.41it/s] 153it [00:35, 4.35it/s] 154it [00:35, 4.28it/s] 155it [00:36, 4.25it/s] 156it [00:36, 4.33it/s] 157it [00:36, 4.22it/s] 158it [00:36, 4.19it/s] 159it [00:36, 4.19it/s] 160it [00:37, 4.17it/s] 161it [00:37, 4.23it/s] 162it [00:37, 4.10it/s] 163it [00:37, 4.16it/s] 164it [00:38, 4.28it/s] 165it [00:38, 4.24it/s] 166it [00:38, 4.20it/s] 167it [00:38, 4.31it/s] 168it [00:39, 4.22it/s] 169it [00:39, 4.15it/s] 170it [00:39, 4.15it/s] 171it [00:39, 4.04it/s] 172it [00:40, 4.13it/s] 173it [00:40, 4.16it/s] 174it [00:40, 4.21it/s] 175it [00:40, 4.23it/s] 176it [00:41, 4.21it/s] 177it [00:41, 4.25it/s] 178it [00:41, 4.33it/s] 179it [00:41, 4.15it/s] 180it [00:41, 4.12it/s] 181it [00:42, 4.08it/s] 182it [00:42, 4.11it/s] 183it [00:42, 4.07it/s] 184it [00:42, 4.08it/s] 185it [00:43, 4.13it/s] 186it [00:43, 4.08it/s] 187it [00:43, 4.09it/s] 188it [00:43, 4.13it/s] 189it [00:44, 4.11it/s] 190it [00:44, 4.07it/s] 191it [00:44, 4.12it/s] 192it [00:44, 4.23it/s] 193it [00:45, 4.25it/s] 194it [00:45, 4.22it/s] 195it [00:45, 3.95it/s] 196it [00:45, 4.08it/s] 196it [00:45, 4.27it/s] +2025-05-26 02:28:40,855 - INFO - Epoch: 55, Objective: tensor([2532.4099], device='cuda:0', grad_fn=), Loss: 0.026845891028642654, KL/n: 23.29350471496582 + 0it [00:00, ?it/s]2025-05-26 02:28:41,433 - INFO - [Epoch 056 | Batch 0000] IWAE-loss 1829.8907 | mean log_px -0.0137 | KL -1141.24 + 1it [00:00, 3.01it/s] 2it [00:00, 3.66it/s] 3it [00:00, 3.87it/s] 4it [00:01, 4.00it/s] 5it [00:01, 3.93it/s] 6it [00:01, 4.02it/s] 7it [00:01, 3.96it/s] 8it [00:02, 4.04it/s] 9it [00:02, 4.13it/s] 10it [00:02, 4.13it/s] 11it [00:02, 4.14it/s] 12it [00:02, 4.16it/s] 13it [00:03, 4.15it/s] 14it [00:03, 4.07it/s] 15it [00:03, 4.12it/s] 16it [00:03, 4.22it/s] 17it [00:04, 4.23it/s] 18it [00:04, 4.22it/s] 19it [00:04, 4.30it/s] 20it [00:04, 4.14it/s] 21it [00:05, 4.21it/s] 22it [00:05, 4.22it/s] 23it [00:05, 4.31it/s] 24it [00:05, 4.28it/s] 25it [00:06, 4.25it/s] 26it [00:06, 4.14it/s] 27it [00:06, 4.27it/s] 28it [00:06, 4.24it/s] 29it [00:07, 4.23it/s] 30it [00:07, 4.26it/s] 31it [00:07, 4.24it/s] 32it [00:07, 4.09it/s] 33it [00:07, 4.13it/s] 34it [00:08, 4.15it/s] 35it [00:08, 4.17it/s] 36it [00:08, 4.18it/s] 37it [00:08, 4.29it/s] 38it [00:09, 4.24it/s] 39it [00:09, 4.13it/s] 40it [00:09, 4.24it/s] 41it [00:09, 4.21it/s] 42it [00:10, 4.17it/s] 43it [00:10, 4.18it/s] 44it [00:10, 4.14it/s] 45it [00:10, 4.14it/s] 46it [00:11, 4.17it/s] 47it [00:11, 4.18it/s] 48it [00:11, 4.17it/s] 49it [00:11, 4.05it/s] 50it [00:12, 4.10it/s]2025-05-26 02:28:53,411 - INFO - [Epoch 056 | Batch 0050] IWAE-loss 1205.6969 | mean log_px -0.0039 | KL -1133.87 + 51it [00:12, 4.11it/s] 52it [00:12, 4.16it/s] 53it [00:12, 4.05it/s] 54it [00:13, 4.06it/s] 55it [00:13, 4.10it/s] 56it [00:13, 4.09it/s] 57it [00:13, 4.14it/s] 58it [00:13, 4.26it/s] 59it [00:14, 4.22it/s] 60it [00:14, 4.09it/s] 61it [00:14, 4.14it/s] 62it [00:14, 4.20it/s] 63it [00:15, 4.21it/s] 64it [00:15, 4.20it/s] 65it [00:15, 4.18it/s] 66it [00:15, 4.20it/s] 67it [00:16, 4.23it/s] 68it [00:16, 4.08it/s] 69it [00:16, 4.15it/s] 70it [00:16, 4.17it/s] 71it [00:17, 4.29it/s] 72it [00:17, 4.34it/s] 73it [00:17, 4.31it/s] 74it [00:17, 4.30it/s] 75it [00:18, 4.30it/s] 76it [00:18, 4.29it/s] 77it [00:18, 4.14it/s] 78it [00:18, 4.19it/s] 79it [00:18, 4.27it/s] 80it [00:19, 4.28it/s] 81it [00:19, 4.28it/s] 82it [00:19, 4.14it/s] 83it [00:19, 4.18it/s] 84it [00:20, 4.19it/s] 85it [00:20, 4.21it/s] 86it [00:20, 4.23it/s] 87it [00:20, 4.24it/s] 88it [00:21, 4.27it/s] 89it [00:21, 4.31it/s] 90it [00:21, 4.39it/s] 91it [00:21, 4.35it/s] 92it [00:22, 4.16it/s] 93it [00:22, 4.24it/s] 94it [00:22, 4.35it/s] 95it [00:22, 4.44it/s] 96it [00:22, 4.49it/s] 97it [00:23, 4.42it/s] 98it [00:23, 4.39it/s] 99it [00:23, 4.38it/s] 100it [00:23, 4.31it/s]2025-05-26 02:29:05,198 - INFO - [Epoch 056 | Batch 0100] IWAE-loss 1527.7909 | mean log_px -0.0108 | KL -1131.17 + 101it [00:24, 4.28it/s] 102it [00:24, 4.25it/s] 103it [00:24, 4.12it/s] 104it [00:24, 4.26it/s] 105it [00:25, 4.36it/s] 106it [00:25, 4.33it/s] 107it [00:25, 4.32it/s] 108it [00:25, 4.30it/s] 109it [00:25, 4.31it/s] 110it [00:26, 4.34it/s] 111it [00:26, 4.18it/s] 112it [00:26, 4.30it/s] 113it [00:26, 4.37it/s] 114it [00:27, 4.37it/s] 115it [00:27, 4.43it/s] 116it [00:27, 4.37it/s] 117it [00:27, 4.31it/s] 118it [00:28, 4.32it/s] 119it [00:28, 4.33it/s] 120it [00:28, 4.37it/s] 121it [00:28, 4.31it/s] 122it [00:28, 4.29it/s] 123it [00:29, 4.32it/s] 124it [00:29, 4.32it/s] 125it [00:29, 4.30it/s] 126it [00:29, 4.32it/s] 127it [00:30, 4.39it/s] 128it [00:30, 4.34it/s] 129it [00:30, 4.18it/s] 130it [00:30, 4.21it/s] 131it [00:31, 4.24it/s] 132it [00:31, 4.27it/s] 133it [00:31, 4.27it/s] 134it [00:31, 4.31it/s] 135it [00:31, 4.32it/s] 136it [00:32, 4.41it/s] 137it [00:32, 4.43it/s] 138it [00:32, 4.40it/s] 139it [00:32, 4.40it/s] 140it [00:33, 4.36it/s] 141it [00:33, 4.32it/s] 142it [00:33, 4.38it/s] 143it [00:33, 4.34it/s] 144it [00:34, 4.33it/s] 145it [00:34, 4.39it/s] 146it [00:34, 4.23it/s] 147it [00:34, 4.34it/s] 148it [00:34, 4.31it/s] 149it [00:35, 4.30it/s] 150it [00:35, 4.32it/s]2025-05-26 02:29:16,776 - INFO - [Epoch 056 | Batch 0150] IWAE-loss 1384.1519 | mean log_px -0.0041 | KL -1127.91 + 151it [00:35, 4.33it/s] 152it [00:35, 4.29it/s] 153it [00:36, 4.32it/s] 154it [00:36, 4.29it/s] 155it [00:36, 4.15it/s] 156it [00:36, 4.26it/s] 157it [00:37, 4.24it/s] 158it [00:37, 4.28it/s] 159it [00:37, 4.26it/s] 160it [00:37, 4.31it/s] 161it [00:38, 4.35it/s] 162it [00:38, 4.34it/s] 163it [00:38, 4.14it/s] 164it [00:38, 4.24it/s] 165it [00:38, 4.32it/s] 166it [00:39, 4.32it/s] 167it [00:39, 4.38it/s] 168it [00:39, 4.31it/s] 169it [00:39, 4.31it/s] 170it [00:40, 4.33it/s] 171it [00:40, 4.20it/s] 172it [00:40, 4.21it/s] 173it [00:40, 4.24it/s] 174it [00:41, 4.27it/s] 175it [00:41, 4.27it/s] 176it [00:41, 4.39it/s] 177it [00:41, 4.25it/s] 178it [00:41, 4.25it/s] 179it [00:42, 4.36it/s] 180it [00:42, 4.37it/s] 181it [00:42, 4.33it/s] 182it [00:42, 4.32it/s] 183it [00:43, 4.16it/s] 184it [00:43, 4.19it/s] 185it [00:43, 4.19it/s] 186it [00:43, 4.20it/s] 187it [00:44, 4.27it/s] 188it [00:44, 4.27it/s] 189it [00:44, 4.11it/s] 190it [00:44, 4.18it/s] 191it [00:45, 4.19it/s] 192it [00:45, 4.22it/s] 193it [00:45, 4.21it/s] 194it [00:45, 4.25it/s] 195it [00:46, 4.08it/s] 196it [00:46, 4.12it/s] 196it [00:46, 4.23it/s] +2025-05-26 02:29:27,513 - INFO - Epoch: 56, Objective: tensor([1635.1464], device='cuda:0', grad_fn=), Loss: 0.0118552902713418, KL/n: 23.14141273498535 + 0it [00:00, ?it/s]2025-05-26 02:29:27,931 - INFO - [Epoch 057 | Batch 0000] IWAE-loss 1257.1718 | mean log_px -0.0018 | KL -1129.48 + 1it [00:00, 2.94it/s] 2it [00:00, 3.72it/s] 3it [00:00, 4.11it/s] 4it [00:01, 4.10it/s] 5it [00:01, 4.15it/s] 6it [00:01, 4.13it/s] 7it [00:01, 4.18it/s] 8it [00:02, 3.26it/s] 9it [00:02, 3.58it/s] 10it [00:02, 3.79it/s] 11it [00:02, 3.93it/s] 12it [00:03, 4.10it/s] 13it [00:03, 4.04it/s] 14it [00:03, 4.09it/s] 15it [00:03, 4.18it/s] 16it [00:04, 4.19it/s] 17it [00:04, 4.23it/s] 18it [00:04, 4.27it/s] 19it [00:04, 4.29it/s] 20it [00:04, 4.16it/s] 21it [00:05, 4.17it/s] 22it [00:05, 4.14it/s] 23it [00:05, 4.15it/s] 24it [00:05, 4.20it/s] 25it [00:06, 4.25it/s] 26it [00:06, 4.11it/s] 27it [00:06, 4.16it/s] 28it [00:06, 4.16it/s] 29it [00:07, 4.22it/s] 30it [00:07, 4.19it/s] 31it [00:07, 4.14it/s] 32it [00:07, 4.14it/s] 33it [00:08, 4.16it/s] 34it [00:08, 4.25it/s] 35it [00:08, 4.24it/s] 36it [00:08, 4.16it/s] 37it [00:09, 4.20it/s] 38it [00:09, 4.23it/s] 39it [00:09, 4.23it/s] 40it [00:09, 4.20it/s] 41it [00:09, 4.20it/s] 42it [00:10, 4.16it/s] 43it [00:10, 4.28it/s] 44it [00:10, 4.36it/s] 45it [00:10, 4.33it/s] 46it [00:11, 4.16it/s] 47it [00:11, 4.16it/s] 48it [00:11, 4.19it/s] 49it [00:11, 4.19it/s] 50it [00:12, 4.22it/s]2025-05-26 02:29:39,936 - INFO - [Epoch 057 | Batch 0050] IWAE-loss 1460.0142 | mean log_px -0.0058 | KL -1131.17 + 51it [00:12, 4.34it/s] 52it [00:12, 4.28it/s] 53it [00:12, 4.21it/s] 54it [00:13, 4.27it/s] 55it [00:13, 4.39it/s] 56it [00:13, 4.25it/s] 57it [00:13, 4.11it/s] 58it [00:14, 4.15it/s] 59it [00:14, 4.24it/s] 60it [00:14, 4.25it/s] 61it [00:14, 4.36it/s] 62it [00:14, 4.33it/s] 63it [00:15, 4.33it/s] 64it [00:15, 4.36it/s] 65it [00:15, 4.38it/s] 66it [00:15, 4.17it/s] 67it [00:16, 4.21it/s] 68it [00:16, 4.19it/s] 69it [00:16, 4.18it/s] 70it [00:16, 4.25it/s] 71it [00:17, 4.12it/s] 72it [00:17, 4.13it/s] 73it [00:17, 4.18it/s] 74it [00:17, 4.12it/s] 75it [00:18, 4.27it/s] 76it [00:18, 4.32it/s] 77it [00:18, 4.40it/s] 78it [00:18, 4.32it/s] 79it [00:18, 4.23it/s] 80it [00:19, 4.10it/s] 81it [00:19, 4.13it/s] 82it [00:19, 4.17it/s] 83it [00:19, 4.22it/s] 84it [00:20, 4.20it/s] 85it [00:20, 4.21it/s] 86it [00:20, 4.05it/s] 87it [00:20, 4.07it/s] 88it [00:21, 4.12it/s] 89it [00:21, 4.15it/s] 90it [00:21, 4.13it/s] 91it [00:21, 4.11it/s] 92it [00:22, 4.00it/s] 93it [00:22, 4.12it/s] 94it [00:22, 4.17it/s] 95it [00:22, 4.29it/s] 96it [00:23, 4.28it/s] 97it [00:23, 4.24it/s] 98it [00:23, 4.09it/s] 99it [00:23, 4.18it/s] 100it [00:24, 4.19it/s]2025-05-26 02:29:51,841 - INFO - [Epoch 057 | Batch 0100] IWAE-loss 1242.8251 | mean log_px -0.0040 | KL -1129.03 + 101it [00:24, 4.17it/s] 102it [00:24, 4.12it/s] 103it [00:24, 4.12it/s] 104it [00:25, 4.01it/s] 105it [00:25, 4.10it/s] 106it [00:25, 4.10it/s] 107it [00:25, 4.12it/s] 108it [00:25, 4.13it/s] 109it [00:26, 4.24it/s] 110it [00:26, 4.16it/s] 111it [00:26, 4.16it/s] 112it [00:26, 4.04it/s] 113it [00:27, 4.11it/s] 114it [00:27, 4.06it/s] 115it [00:27, 4.11it/s] 116it [00:27, 4.13it/s] 117it [00:28, 4.22it/s] 118it [00:28, 4.19it/s] 119it [00:28, 4.19it/s] 120it [00:28, 4.30it/s] 121it [00:29, 4.22it/s] 122it [00:29, 4.33it/s] 123it [00:29, 4.25it/s] 124it [00:29, 4.22it/s] 125it [00:30, 4.10it/s] 126it [00:30, 4.16it/s] 127it [00:30, 4.16it/s] 128it [00:30, 4.15it/s] 129it [00:30, 4.14it/s] 130it [00:31, 4.18it/s] 131it [00:31, 4.00it/s] 132it [00:31, 4.01it/s] 133it [00:31, 4.07it/s] 134it [00:32, 4.16it/s] 135it [00:32, 4.26it/s] 136it [00:32, 4.30it/s] 137it [00:32, 4.27it/s] 138it [00:33, 4.09it/s] 139it [00:33, 4.10it/s] 140it [00:33, 4.07it/s] 141it [00:33, 4.10it/s] 142it [00:34, 4.14it/s] 143it [00:34, 4.17it/s] 144it [00:34, 4.03it/s] 145it [00:34, 4.05it/s] 146it [00:35, 4.09it/s] 147it [00:35, 4.01it/s] 148it [00:35, 4.02it/s] 149it [00:35, 4.09it/s] 150it [00:36, 4.03it/s]2025-05-26 02:30:03,955 - INFO - [Epoch 057 | Batch 0150] IWAE-loss 1292.4027 | mean log_px -0.0033 | KL -1125.85 + 151it [00:36, 4.07it/s] 152it [00:36, 4.14it/s] 153it [00:36, 4.13it/s] 154it [00:37, 4.11it/s] 155it [00:37, 4.11it/s] 156it [00:37, 4.10it/s] 157it [00:37, 4.12it/s] 158it [00:38, 4.00it/s] 159it [00:38, 4.16it/s] 160it [00:38, 4.16it/s] 161it [00:38, 4.29it/s] 162it [00:38, 4.34it/s] 163it [00:39, 4.43it/s] 164it [00:39, 4.17it/s] 165it [00:39, 4.20it/s] 166it [00:39, 4.20it/s] 167it [00:40, 4.24it/s] 168it [00:40, 4.14it/s] 169it [00:40, 4.10it/s] 170it [00:40, 4.09it/s] 171it [00:41, 4.06it/s] 172it [00:41, 3.94it/s] 173it [00:41, 4.11it/s] 174it [00:41, 4.23it/s] 175it [00:42, 4.16it/s] 176it [00:42, 4.17it/s] 177it [00:42, 4.15it/s] 178it [00:42, 4.28it/s] 179it [00:43, 4.24it/s] 180it [00:43, 4.35it/s] 181it [00:43, 4.24it/s] 182it [00:43, 4.22it/s] 183it [00:44, 4.21it/s] 184it [00:44, 4.22it/s] 185it [00:44, 4.23it/s] 186it [00:44, 4.27it/s] 187it [00:44, 4.28it/s] 188it [00:45, 4.28it/s] 189it [00:45, 4.29it/s] 190it [00:45, 4.28it/s] 191it [00:45, 4.23it/s] 192it [00:46, 4.13it/s] 193it [00:46, 4.27it/s] 194it [00:46, 4.20it/s] 195it [00:46, 4.11it/s] 196it [00:47, 4.26it/s] 196it [00:47, 4.16it/s] +2025-05-26 02:30:14,803 - INFO - Epoch: 57, Objective: tensor([1774.2374], device='cuda:0', grad_fn=), Loss: 0.010805794037878513, KL/n: 22.974790573120117 + 0it [00:00, ?it/s]2025-05-26 02:30:15,206 - INFO - [Epoch 058 | Batch 0000] IWAE-loss 1154.4401 | mean log_px -0.0014 | KL -1126.00 + 1it [00:00, 2.79it/s] 2it [00:00, 3.49it/s] 3it [00:00, 3.92it/s] 4it [00:01, 4.02it/s] 5it [00:01, 4.24it/s] 6it [00:01, 4.36it/s] 7it [00:01, 4.40it/s] 8it [00:01, 4.23it/s] 9it [00:02, 4.26it/s] 10it [00:02, 4.20it/s] 11it [00:02, 4.22it/s] 12it [00:02, 4.21it/s] 13it [00:03, 4.30it/s] 14it [00:03, 4.16it/s] 15it [00:03, 4.26it/s] 16it [00:03, 4.26it/s] 17it [00:04, 4.34it/s] 18it [00:04, 4.34it/s] 19it [00:04, 4.31it/s] 20it [00:04, 4.18it/s] 21it [00:05, 4.32it/s] 22it [00:05, 4.23it/s] 23it [00:05, 4.22it/s] 24it [00:05, 4.31it/s] 25it [00:05, 4.41it/s] 26it [00:06, 4.47it/s] 27it [00:06, 4.23it/s] 28it [00:06, 4.21it/s] 29it [00:06, 4.23it/s] 30it [00:07, 4.23it/s] 31it [00:07, 4.21it/s] 32it [00:07, 4.23it/s] 33it [00:07, 4.29it/s] 34it [00:08, 4.26it/s] 35it [00:08, 4.21it/s] 36it [00:08, 4.22it/s] 37it [00:08, 4.09it/s] 38it [00:09, 4.10it/s] 39it [00:09, 4.25it/s] 40it [00:09, 4.20it/s] 41it [00:09, 4.20it/s] 42it [00:09, 4.17it/s] 43it [00:10, 4.19it/s] 44it [00:10, 4.07it/s] 45it [00:10, 4.19it/s] 46it [00:10, 4.19it/s] 47it [00:11, 4.27it/s] 48it [00:11, 4.27it/s] 49it [00:11, 4.24it/s] 50it [00:11, 4.33it/s]2025-05-26 02:30:26,964 - INFO - [Epoch 058 | Batch 0050] IWAE-loss 1403.6750 | mean log_px -0.0124 | KL -1118.93 + 51it [00:12, 4.35it/s] 52it [00:12, 4.25it/s] 53it [00:12, 4.14it/s] 54it [00:12, 4.13it/s] 55it [00:13, 4.12it/s] 56it [00:13, 4.15it/s] 57it [00:13, 4.16it/s] 58it [00:13, 4.29it/s] 59it [00:14, 4.23it/s] 60it [00:14, 4.26it/s] 61it [00:14, 4.23it/s] 62it [00:14, 4.20it/s] 63it [00:14, 4.07it/s] 64it [00:15, 4.14it/s] 65it [00:15, 4.14it/s] 66it [00:15, 4.06it/s] 67it [00:15, 4.13it/s] 68it [00:16, 4.24it/s] 69it [00:16, 4.21it/s] 70it [00:16, 4.07it/s] 71it [00:16, 4.10it/s] 72it [00:17, 4.12it/s] 73it [00:17, 4.13it/s] 74it [00:17, 4.14it/s] 75it [00:17, 4.18it/s] 76it [00:18, 4.21it/s] 77it [00:18, 4.21it/s] 78it [00:18, 4.15it/s] 79it [00:18, 4.17it/s] 80it [00:19, 4.15it/s] 81it [00:19, 4.17it/s] 82it [00:19, 4.15it/s] 83it [00:19, 3.98it/s] 84it [00:20, 4.03it/s] 85it [00:20, 4.06it/s] 86it [00:20, 4.10it/s] 87it [00:20, 4.15it/s] 88it [00:21, 4.16it/s] 89it [00:21, 4.20it/s] 90it [00:21, 4.23it/s] 91it [00:21, 4.28it/s] 92it [00:21, 4.32it/s] 93it [00:22, 4.39it/s] 94it [00:22, 4.34it/s] 95it [00:22, 4.29it/s] 96it [00:22, 4.28it/s] 97it [00:23, 4.26it/s] 98it [00:23, 4.21it/s] 99it [00:23, 4.24it/s] 100it [00:23, 4.22it/s]2025-05-26 02:30:38,943 - INFO - [Epoch 058 | Batch 0100] IWAE-loss 1223.3649 | mean log_px -0.0015 | KL -1114.54 + 101it [00:24, 4.21it/s] 102it [00:24, 4.24it/s] 103it [00:24, 4.34it/s] 104it [00:24, 4.36it/s] 105it [00:24, 4.28it/s] 106it [00:25, 4.13it/s] 107it [00:25, 4.14it/s] 108it [00:25, 4.19it/s] 109it [00:25, 4.21it/s] 110it [00:26, 4.26it/s] 111it [00:26, 4.29it/s] 112it [00:26, 4.39it/s] 113it [00:26, 4.38it/s] 114it [00:27, 4.23it/s] 115it [00:27, 4.25it/s] 116it [00:27, 4.36it/s] 117it [00:27, 4.30it/s] 118it [00:28, 4.36it/s] 119it [00:28, 4.28it/s] 120it [00:28, 4.29it/s] 121it [00:28, 4.30it/s] 122it [00:28, 4.23it/s] 123it [00:29, 4.24it/s] 124it [00:29, 4.36it/s] 125it [00:29, 4.36it/s] 126it [00:29, 4.40it/s] 127it [00:30, 4.37it/s] 128it [00:30, 4.31it/s] 129it [00:30, 4.23it/s] 130it [00:30, 4.20it/s] 131it [00:31, 4.21it/s] 132it [00:31, 4.32it/s] 133it [00:31, 4.24it/s] 134it [00:31, 4.21it/s] 135it [00:32, 4.17it/s] 136it [00:32, 4.20it/s] 137it [00:32, 4.24it/s] 138it [00:32, 4.21it/s] 139it [00:32, 4.05it/s] 140it [00:33, 4.11it/s] 141it [00:33, 4.26it/s] 142it [00:33, 4.20it/s] 143it [00:33, 4.22it/s] 144it [00:34, 4.22it/s] 145it [00:34, 4.14it/s] 146it [00:34, 4.15it/s] 147it [00:34, 4.21it/s] 148it [00:35, 4.24it/s] 149it [00:35, 4.23it/s] 150it [00:35, 4.33it/s]2025-05-26 02:30:50,693 - INFO - [Epoch 058 | Batch 0150] IWAE-loss 1539.7325 | mean log_px -0.0100 | KL -1111.33 + 151it [00:35, 4.27it/s] 152it [00:36, 4.16it/s] 153it [00:36, 4.17it/s] 154it [00:36, 4.18it/s] 155it [00:36, 4.22it/s] 156it [00:37, 4.24it/s] 157it [00:37, 4.32it/s] 158it [00:37, 4.20it/s] 159it [00:37, 4.30it/s] 160it [00:37, 4.34it/s] 161it [00:38, 4.10it/s] 162it [00:38, 4.10it/s] 163it [00:38, 4.23it/s] 164it [00:38, 4.22it/s] 165it [00:39, 4.27it/s] 166it [00:39, 4.10it/s] 167it [00:39, 4.11it/s] 168it [00:39, 4.16it/s] 169it [00:40, 4.27it/s] 170it [00:40, 4.21it/s] 171it [00:40, 4.20it/s] 172it [00:40, 4.03it/s] 173it [00:41, 4.06it/s] 174it [00:41, 4.20it/s] 175it [00:41, 4.32it/s] 176it [00:41, 4.29it/s] 177it [00:42, 4.25it/s] 178it [00:42, 4.21it/s] 179it [00:42, 4.19it/s] 180it [00:42, 4.09it/s] 181it [00:42, 4.13it/s] 182it [00:43, 4.23it/s] 183it [00:43, 4.31it/s] 184it [00:43, 4.27it/s] 185it [00:43, 4.37it/s] 186it [00:44, 4.33it/s] 187it [00:44, 4.44it/s] 188it [00:44, 4.46it/s] 189it [00:44, 4.34it/s] 190it [00:45, 4.32it/s] 191it [00:45, 4.43it/s] 192it [00:45, 4.45it/s] 193it [00:45, 4.46it/s] 194it [00:45, 4.36it/s] 195it [00:46, 4.17it/s] 196it [00:46, 4.31it/s] 196it [00:46, 4.22it/s] +2025-05-26 02:31:01,404 - INFO - Epoch: 58, Objective: tensor([1163.4995], device='cuda:0', grad_fn=), Loss: 0.0014143032021820545, KL/n: 22.712282180786133 + 0it [00:00, ?it/s]2025-05-26 02:31:01,974 - INFO - [Epoch 059 | Batch 0000] IWAE-loss 1306.7094 | mean log_px -0.0034 | KL -1115.00 + 1it [00:00, 2.98it/s] 2it [00:00, 3.75it/s] 3it [00:00, 4.09it/s] 4it [00:00, 4.26it/s] 5it [00:01, 4.38it/s] 6it [00:01, 4.27it/s] 7it [00:01, 4.36it/s] 8it [00:01, 4.44it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.52it/s] 11it [00:02, 4.52it/s] 12it [00:02, 4.54it/s] 13it [00:02, 4.54it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.53it/s] 16it [00:03, 4.56it/s] 17it [00:03, 4.62it/s] 18it [00:04, 4.49it/s] 19it [00:04, 4.57it/s] 20it [00:04, 4.60it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.66it/s] 23it [00:05, 4.68it/s] 24it [00:05, 4.69it/s] 25it [00:05, 4.70it/s] 26it [00:05, 4.71it/s] 27it [00:05, 4.71it/s] 28it [00:06, 4.71it/s] 29it [00:06, 4.71it/s] 30it [00:06, 4.70it/s] 31it [00:06, 4.71it/s] 32it [00:07, 4.70it/s] 33it [00:07, 4.70it/s] 34it [00:07, 4.69it/s] 35it [00:07, 4.71it/s] 36it [00:07, 4.70it/s] 37it [00:08, 4.51it/s] 38it [00:08, 4.59it/s] 39it [00:08, 4.62it/s] 40it [00:08, 4.64it/s] 41it [00:09, 4.67it/s] 42it [00:09, 4.52it/s] 43it [00:09, 4.59it/s] 44it [00:09, 4.63it/s] 45it [00:09, 4.66it/s] 46it [00:10, 4.66it/s] 47it [00:10, 4.67it/s] 48it [00:10, 4.68it/s] 49it [00:10, 4.68it/s] 50it [00:10, 4.58it/s]2025-05-26 02:31:12,828 - INFO - [Epoch 059 | Batch 0050] IWAE-loss 1501.0148 | mean log_px -0.0083 | KL -1108.41 + 51it [00:11, 4.63it/s] 52it [00:11, 4.64it/s] 53it [00:11, 4.66it/s] 54it [00:11, 4.66it/s] 55it [00:12, 4.68it/s] 56it [00:12, 4.68it/s] 57it [00:12, 4.69it/s] 58it [00:12, 4.69it/s] 59it [00:12, 4.70it/s] 60it [00:13, 4.70it/s] 61it [00:13, 4.70it/s] 62it [00:13, 4.55it/s] 63it [00:13, 4.61it/s] 64it [00:13, 4.63it/s] 65it [00:14, 4.66it/s] 66it [00:14, 4.67it/s] 67it [00:14, 4.68it/s] 68it [00:14, 4.58it/s] 69it [00:15, 4.64it/s] 70it [00:15, 4.65it/s] 71it [00:15, 4.66it/s] 72it [00:15, 4.67it/s] 73it [00:15, 4.68it/s] 74it [00:16, 4.69it/s] 75it [00:16, 4.70it/s] 76it [00:16, 4.70it/s] 77it [00:16, 4.71it/s] 78it [00:16, 4.70it/s] 79it [00:17, 4.70it/s] 80it [00:17, 4.70it/s] 81it [00:17, 4.70it/s] 82it [00:17, 4.70it/s] 83it [00:18, 4.71it/s] 84it [00:18, 4.70it/s] 85it [00:18, 4.71it/s] 86it [00:18, 4.70it/s] 87it [00:18, 4.71it/s] 88it [00:19, 4.70it/s] 89it [00:19, 4.71it/s] 90it [00:19, 4.51it/s] 91it [00:19, 4.57it/s] 92it [00:19, 4.61it/s] 93it [00:20, 4.64it/s] 94it [00:20, 4.64it/s] 95it [00:20, 4.66it/s] 96it [00:20, 4.50it/s] 97it [00:21, 4.58it/s] 98it [00:21, 4.61it/s] 99it [00:21, 4.64it/s] 100it [00:21, 4.64it/s]2025-05-26 02:31:23,557 - INFO - [Epoch 059 | Batch 0100] IWAE-loss 1170.6613 | mean log_px -0.0009 | KL -1106.82 + 101it [00:21, 4.65it/s] 102it [00:22, 4.66it/s] 103it [00:22, 4.67it/s] 104it [00:22, 4.51it/s] 105it [00:22, 4.56it/s] 106it [00:22, 4.56it/s] 107it [00:23, 4.58it/s] 108it [00:23, 4.61it/s] 109it [00:23, 4.64it/s] 110it [00:23, 4.65it/s] 111it [00:24, 4.51it/s] 112it [00:24, 4.58it/s] 113it [00:24, 4.61it/s] 114it [00:24, 4.63it/s] 115it [00:24, 4.66it/s] 116it [00:25, 4.66it/s] 117it [00:25, 4.67it/s] 118it [00:25, 4.68it/s] 119it [00:25, 4.69it/s] 120it [00:26, 4.70it/s] 121it [00:26, 4.70it/s] 122it [00:26, 4.71it/s] 123it [00:26, 4.70it/s] 124it [00:26, 4.70it/s] 125it [00:27, 4.70it/s] 126it [00:27, 4.70it/s] 127it [00:27, 4.70it/s] 128it [00:27, 4.70it/s] 129it [00:27, 4.69it/s] 130it [00:28, 4.69it/s] 131it [00:28, 4.71it/s] 132it [00:28, 4.70it/s] 133it [00:28, 4.70it/s] 134it [00:28, 4.67it/s] 135it [00:29, 4.69it/s] 136it [00:29, 4.69it/s] 137it [00:29, 4.54it/s] 138it [00:29, 4.59it/s] 139it [00:30, 4.62it/s] 140it [00:30, 4.64it/s] 141it [00:30, 4.66it/s] 142it [00:30, 4.64it/s] 143it [00:30, 4.48it/s] 144it [00:31, 4.48it/s] 145it [00:31, 4.42it/s] 146it [00:31, 4.38it/s] 147it [00:31, 4.45it/s] 148it [00:32, 4.50it/s] 149it [00:32, 4.53it/s] 150it [00:32, 4.55it/s]2025-05-26 02:31:34,388 - INFO - [Epoch 059 | Batch 0150] IWAE-loss 1656.5128 | mean log_px -0.0145 | KL -1106.05 + 151it [00:32, 4.59it/s] 152it [00:32, 4.62it/s] 153it [00:33, 4.65it/s] 154it [00:33, 4.67it/s] 155it [00:33, 4.68it/s] 156it [00:33, 4.68it/s] 157it [00:34, 4.68it/s] 158it [00:34, 4.67it/s] 159it [00:34, 4.67it/s] 160it [00:34, 4.67it/s] 161it [00:34, 4.62it/s] 162it [00:35, 4.61it/s] 163it [00:35, 4.64it/s] 164it [00:35, 4.61it/s] 165it [00:35, 4.62it/s] 166it [00:35, 4.63it/s] 167it [00:36, 4.67it/s] 168it [00:36, 4.66it/s] 169it [00:36, 4.67it/s] 170it [00:36, 4.70it/s] 171it [00:37, 4.69it/s] 172it [00:37, 4.67it/s] 173it [00:37, 4.69it/s] 174it [00:37, 4.70it/s] 175it [00:37, 4.69it/s] 176it [00:38, 4.69it/s] 177it [00:38, 4.72it/s] 178it [00:38, 4.71it/s] 179it [00:38, 4.69it/s] 180it [00:38, 4.71it/s] 181it [00:39, 4.67it/s] 182it [00:39, 4.70it/s] 183it [00:39, 4.67it/s] 184it [00:39, 4.68it/s] 185it [00:39, 4.66it/s] 186it [00:40, 4.65it/s] 187it [00:40, 4.65it/s] 188it [00:40, 4.64it/s] 189it [00:40, 4.65it/s] 190it [00:41, 4.63it/s] 191it [00:41, 4.64it/s] 192it [00:41, 4.64it/s] 193it [00:41, 4.62it/s] 194it [00:41, 4.62it/s] 195it [00:42, 4.51it/s] 196it [00:42, 4.54it/s] 196it [00:42, 4.62it/s] +2025-05-26 02:31:44,188 - INFO - Epoch: 59, Objective: tensor([1502.0814], device='cuda:0', grad_fn=), Loss: 0.015234545804560184, KL/n: 22.524457931518555 + 0it [00:00, ?it/s]2025-05-26 02:31:44,570 - INFO - [Epoch 060 | Batch 0000] IWAE-loss 1251.1169 | mean log_px -0.0041 | KL -1102.64 + 1it [00:00, 3.32it/s] 2it [00:00, 3.89it/s] 3it [00:00, 4.21it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.52it/s] 6it [00:01, 4.58it/s] 7it [00:01, 4.47it/s] 8it [00:01, 4.51it/s] 9it [00:02, 4.41it/s] 10it [00:02, 4.35it/s] 11it [00:02, 4.33it/s] 12it [00:02, 4.43it/s] 13it [00:02, 4.31it/s] 14it [00:03, 4.37it/s] 15it [00:03, 4.47it/s] 16it [00:03, 4.55it/s] 17it [00:03, 4.48it/s] 18it [00:04, 4.40it/s] 19it [00:04, 4.41it/s] 20it [00:04, 4.34it/s] 21it [00:04, 4.44it/s] 22it [00:05, 4.34it/s] 23it [00:05, 4.29it/s] 24it [00:05, 4.39it/s] 25it [00:05, 4.38it/s] 26it [00:05, 4.35it/s] 27it [00:06, 4.41it/s] 28it [00:06, 4.39it/s] 29it [00:06, 4.48it/s] 30it [00:06, 4.52it/s] 31it [00:07, 4.47it/s] 32it [00:07, 4.39it/s] 33it [00:07, 4.39it/s] 34it [00:07, 4.34it/s] 35it [00:07, 4.44it/s] 36it [00:08, 4.48it/s] 37it [00:08, 4.45it/s] 38it [00:08, 4.48it/s] 39it [00:08, 4.42it/s] 40it [00:09, 4.48it/s] 41it [00:09, 4.53it/s] 42it [00:09, 4.42it/s] 43it [00:09, 4.50it/s] 44it [00:09, 4.42it/s] 45it [00:10, 4.36it/s] 46it [00:10, 4.30it/s] 47it [00:10, 4.30it/s] 48it [00:10, 4.27it/s] 49it [00:11, 4.17it/s] 50it [00:11, 4.17it/s]2025-05-26 02:31:55,932 - INFO - [Epoch 060 | Batch 0050] IWAE-loss 1318.0186 | mean log_px -0.0060 | KL -1099.36 + 51it [00:11, 4.19it/s] 52it [00:11, 4.19it/s] 53it [00:12, 4.20it/s] 54it [00:12, 4.28it/s] 55it [00:12, 4.26it/s] 56it [00:12, 4.26it/s] 57it [00:13, 4.26it/s] 58it [00:13, 4.39it/s] 59it [00:13, 4.42it/s] 60it [00:13, 4.38it/s] 61it [00:13, 4.29it/s] 62it [00:14, 4.26it/s] 63it [00:14, 4.22it/s] 64it [00:14, 4.25it/s] 65it [00:14, 4.23it/s] 66it [00:15, 4.21it/s] 67it [00:15, 4.23it/s] 68it [00:15, 4.21it/s] 69it [00:15, 4.25it/s] 70it [00:16, 4.36it/s] 71it [00:16, 4.37it/s] 72it [00:16, 4.45it/s] 73it [00:16, 4.39it/s] 74it [00:17, 4.32it/s] 75it [00:17, 4.27it/s] 76it [00:17, 4.36it/s] 77it [00:17, 4.43it/s] 78it [00:17, 4.48it/s] 79it [00:18, 4.35it/s] 80it [00:18, 4.31it/s] 81it [00:18, 4.26it/s] 82it [00:18, 4.37it/s] 83it [00:19, 4.40it/s] 84it [00:19, 4.46it/s] 85it [00:19, 4.38it/s] 86it [00:19, 4.31it/s] 87it [00:19, 4.32it/s] 88it [00:20, 4.38it/s] 89it [00:20, 4.26it/s] 90it [00:20, 4.36it/s] 91it [00:20, 4.46it/s] 92it [00:21, 3.59it/s] 93it [00:21, 3.84it/s] 94it [00:21, 4.06it/s] 95it [00:21, 4.23it/s] 96it [00:22, 4.36it/s] 97it [00:22, 4.45it/s] 98it [00:22, 4.49it/s] 99it [00:22, 4.54it/s] 100it [00:23, 4.58it/s]2025-05-26 02:32:07,501 - INFO - [Epoch 060 | Batch 0100] IWAE-loss 1443.9005 | mean log_px -0.0049 | KL -1095.84 + 101it [00:23, 4.61it/s] 102it [00:23, 4.62it/s] 103it [00:23, 4.62it/s] 104it [00:23, 4.64it/s] 105it [00:24, 4.64it/s] 106it [00:24, 4.64it/s] 107it [00:24, 4.65it/s] 108it [00:24, 4.66it/s] 109it [00:24, 4.67it/s] 110it [00:25, 4.67it/s] 111it [00:25, 4.68it/s] 112it [00:25, 4.67it/s] 113it [00:25, 4.68it/s] 114it [00:26, 4.69it/s] 115it [00:26, 4.69it/s] 116it [00:26, 4.67it/s] 117it [00:26, 4.69it/s] 118it [00:26, 4.69it/s] 119it [00:27, 4.68it/s] 120it [00:27, 4.68it/s] 121it [00:27, 4.68it/s] 122it [00:27, 4.67it/s] 123it [00:27, 4.67it/s] 124it [00:28, 4.68it/s] 125it [00:28, 4.67it/s] 126it [00:28, 4.65it/s] 127it [00:28, 4.66it/s] 128it [00:29, 4.65it/s] 129it [00:29, 4.65it/s] 130it [00:29, 4.67it/s] 131it [00:29, 4.67it/s] 132it [00:29, 4.65it/s] 133it [00:30, 4.62it/s] 134it [00:30, 4.64it/s] 135it [00:30, 4.62it/s] 136it [00:30, 4.62it/s] 137it [00:30, 4.64it/s] 138it [00:31, 4.63it/s] 139it [00:31, 4.65it/s] 140it [00:31, 4.65it/s] 141it [00:31, 4.65it/s] 142it [00:32, 4.65it/s] 143it [00:32, 4.66it/s] 144it [00:32, 4.65it/s] 145it [00:32, 4.67it/s] 146it [00:32, 4.68it/s] 147it [00:33, 4.68it/s] 148it [00:33, 4.68it/s] 149it [00:33, 4.68it/s] 150it [00:33, 4.67it/s]2025-05-26 02:32:18,223 - INFO - [Epoch 060 | Batch 0150] IWAE-loss 1876.3032 | mean log_px -0.0125 | KL -1099.04 + 151it [00:33, 4.67it/s] 152it [00:34, 4.66it/s] 153it [00:34, 4.68it/s] 154it [00:34, 4.67it/s] 155it [00:34, 4.68it/s] 156it [00:35, 4.68it/s] 157it [00:35, 4.66it/s] 158it [00:35, 4.52it/s] 159it [00:35, 4.59it/s] 160it [00:35, 4.60it/s] 161it [00:36, 4.63it/s] 162it [00:36, 4.65it/s] 163it [00:36, 4.67it/s] 164it [00:36, 4.69it/s] 165it [00:36, 4.67it/s] 166it [00:37, 4.68it/s] 167it [00:37, 4.52it/s] 168it [00:37, 4.59it/s] 169it [00:37, 4.63it/s] 170it [00:38, 4.65it/s] 171it [00:38, 4.67it/s] 172it [00:38, 4.68it/s] 173it [00:38, 4.69it/s] 174it [00:38, 4.70it/s] 175it [00:39, 4.71it/s] 176it [00:39, 4.57it/s] 177it [00:39, 4.63it/s] 178it [00:39, 4.65it/s] 179it [00:39, 4.68it/s] 180it [00:40, 4.52it/s] 181it [00:40, 4.58it/s] 182it [00:40, 4.62it/s] 183it [00:40, 4.65it/s] 184it [00:41, 4.66it/s] 185it [00:41, 4.69it/s] 186it [00:41, 4.69it/s] 187it [00:41, 4.70it/s] 188it [00:41, 4.70it/s] 189it [00:42, 4.54it/s] 190it [00:42, 4.59it/s] 191it [00:42, 4.64it/s] 192it [00:42, 4.66it/s] 193it [00:42, 4.67it/s] 194it [00:43, 4.69it/s] 195it [00:43, 4.44it/s] 196it [00:43, 4.55it/s] 196it [00:43, 4.48it/s] +2025-05-26 02:32:28,072 - INFO - Epoch: 60, Objective: tensor([1335.1680], device='cuda:0', grad_fn=), Loss: 0.0030267671681940556, KL/n: 22.3603515625 + 0it [00:00, ?it/s]2025-05-26 02:32:28,474 - INFO - [Epoch 061 | Batch 0000] IWAE-loss 1409.4937 | mean log_px -0.0081 | KL -1098.50 + 1it [00:00, 3.09it/s] 2it [00:00, 3.76it/s] 3it [00:00, 3.92it/s] 4it [00:01, 4.03it/s] 5it [00:01, 4.24it/s] 6it [00:01, 4.23it/s] 7it [00:01, 4.26it/s] 8it [00:01, 4.29it/s] 9it [00:02, 4.26it/s] 10it [00:02, 4.32it/s] 11it [00:02, 4.31it/s] 12it [00:02, 4.27it/s] 13it [00:03, 4.39it/s] 14it [00:03, 4.22it/s] 15it [00:03, 4.27it/s] 16it [00:03, 4.30it/s] 17it [00:04, 4.35it/s] 18it [00:04, 4.21it/s] 19it [00:04, 4.26it/s] 20it [00:04, 4.31it/s] 21it [00:04, 4.30it/s] 22it [00:05, 4.29it/s] 23it [00:05, 4.35it/s] 24it [00:05, 4.44it/s] 25it [00:05, 4.52it/s] 26it [00:06, 4.53it/s] 27it [00:06, 4.43it/s] 28it [00:06, 4.42it/s] 29it [00:06, 4.49it/s] 30it [00:06, 4.39it/s] 31it [00:07, 4.48it/s] 32it [00:07, 4.30it/s] 33it [00:07, 4.40it/s] 34it [00:07, 4.26it/s] 35it [00:08, 4.37it/s] 36it [00:08, 4.30it/s] 37it [00:08, 4.41it/s] 38it [00:08, 4.20it/s] 39it [00:09, 4.23it/s] 40it [00:09, 4.34it/s] 41it [00:09, 4.33it/s] 42it [00:09, 4.45it/s] 43it [00:09, 4.51it/s] 44it [00:10, 4.41it/s] 45it [00:10, 4.50it/s] 46it [00:10, 4.41it/s] 47it [00:10, 4.44it/s] 48it [00:11, 4.43it/s] 49it [00:11, 4.29it/s] 50it [00:11, 4.33it/s]2025-05-26 02:32:39,947 - INFO - [Epoch 061 | Batch 0050] IWAE-loss 1398.4414 | mean log_px -0.0127 | KL -1090.44 + 51it [00:11, 4.41it/s] 52it [00:12, 4.34it/s] 53it [00:12, 4.31it/s] 54it [00:12, 4.28it/s] 55it [00:12, 4.40it/s] 56it [00:12, 4.29it/s] 57it [00:13, 4.28it/s] 58it [00:13, 4.32it/s] 59it [00:13, 4.29it/s] 60it [00:13, 4.31it/s] 61it [00:14, 4.16it/s] 62it [00:14, 4.17it/s] 63it [00:14, 4.21it/s] 64it [00:14, 4.26it/s] 65it [00:15, 4.30it/s] 66it [00:15, 4.27it/s] 67it [00:15, 4.27it/s] 68it [00:15, 4.22it/s] 69it [00:16, 4.24it/s] 70it [00:16, 4.08it/s] 71it [00:16, 4.15it/s] 72it [00:16, 4.17it/s] 73it [00:16, 4.32it/s] 74it [00:17, 4.42it/s] 75it [00:17, 4.41it/s] 76it [00:17, 4.35it/s] 77it [00:17, 4.42it/s] 78it [00:18, 4.49it/s] 79it [00:18, 4.28it/s] 80it [00:18, 4.40it/s] 81it [00:18, 4.41it/s] 82it [00:19, 4.37it/s] 83it [00:19, 4.33it/s] 84it [00:19, 4.31it/s] 85it [00:19, 4.42it/s] 86it [00:19, 4.33it/s] 87it [00:20, 4.29it/s] 88it [00:20, 4.30it/s] 89it [00:20, 4.30it/s] 90it [00:20, 4.31it/s] 91it [00:21, 4.28it/s] 92it [00:21, 4.32it/s] 93it [00:21, 4.16it/s] 94it [00:21, 4.18it/s] 95it [00:22, 4.31it/s] 96it [00:22, 4.38it/s] 97it [00:22, 4.48it/s] 98it [00:22, 4.50it/s] 99it [00:22, 4.43it/s] 100it [00:23, 4.32it/s]2025-05-26 02:32:51,573 - INFO - [Epoch 061 | Batch 0100] IWAE-loss 1398.7993 | mean log_px -0.0086 | KL -1086.49 + 101it [00:23, 4.29it/s] 102it [00:23, 4.14it/s] 103it [00:23, 4.31it/s] 104it [00:24, 4.26it/s] 105it [00:24, 4.32it/s] 106it [00:24, 4.25it/s] 107it [00:24, 4.39it/s] 108it [00:25, 4.16it/s] 109it [00:25, 4.32it/s] 110it [00:25, 4.20it/s] 111it [00:25, 4.34it/s] 112it [00:25, 4.39it/s] 113it [00:26, 4.42it/s] 114it [00:26, 4.39it/s] 115it [00:26, 4.40it/s] 116it [00:26, 4.36it/s] 117it [00:27, 4.46it/s] 118it [00:27, 4.49it/s] 119it [00:27, 4.37it/s] 120it [00:27, 4.34it/s] 121it [00:28, 4.44it/s] 122it [00:28, 4.51it/s] 123it [00:28, 4.57it/s] 124it [00:28, 4.57it/s] 125it [00:28, 4.49it/s] 126it [00:29, 4.41it/s] 127it [00:29, 4.42it/s] 128it [00:29, 4.44it/s] 129it [00:29, 4.34it/s] 130it [00:30, 4.31it/s] 131it [00:30, 4.39it/s] 132it [00:30, 4.48it/s] 133it [00:30, 4.49it/s] 134it [00:30, 4.29it/s] 135it [00:31, 4.26it/s] 136it [00:31, 4.29it/s] 137it [00:31, 4.27it/s] 138it [00:31, 4.29it/s] 139it [00:32, 4.24it/s] 140it [00:32, 4.13it/s] 141it [00:32, 4.15it/s] 142it [00:32, 4.27it/s] 143it [00:33, 4.24it/s] 144it [00:33, 4.19it/s] 145it [00:33, 4.21it/s] 146it [00:33, 4.20it/s] 147it [00:34, 4.18it/s] 148it [00:34, 4.20it/s] 149it [00:34, 4.24it/s] 150it [00:34, 4.36it/s]2025-05-26 02:33:03,127 - INFO - [Epoch 061 | Batch 0150] IWAE-loss 1164.0669 | mean log_px -0.0021 | KL -1089.75 + 151it [00:34, 4.30it/s] 152it [00:35, 4.34it/s] 153it [00:35, 4.31it/s] 154it [00:35, 4.30it/s] 155it [00:35, 4.20it/s] 156it [00:36, 4.21it/s] 157it [00:36, 4.20it/s] 158it [00:36, 4.22it/s] 159it [00:36, 4.24it/s] 160it [00:37, 4.24it/s] 161it [00:37, 4.20it/s] 162it [00:37, 4.16it/s] 163it [00:37, 4.25it/s] 164it [00:38, 4.24it/s] 165it [00:38, 4.33it/s] 166it [00:38, 4.42it/s] 167it [00:38, 4.43it/s] 168it [00:38, 4.51it/s] 169it [00:39, 4.57it/s] 170it [00:39, 4.29it/s] 171it [00:39, 4.36it/s] 172it [00:39, 4.34it/s] 173it [00:40, 4.33it/s] 174it [00:40, 4.32it/s] 175it [00:40, 4.41it/s] 176it [00:40, 4.50it/s] 177it [00:40, 4.36it/s] 178it [00:41, 4.46it/s] 179it [00:41, 4.35it/s] 180it [00:41, 4.44it/s] 181it [00:41, 4.37it/s] 182it [00:42, 4.46it/s] 183it [00:42, 4.37it/s] 184it [00:42, 4.36it/s] 185it [00:42, 4.33it/s] 186it [00:43, 4.33it/s] 187it [00:43, 4.32it/s] 188it [00:43, 4.32it/s] 189it [00:43, 4.26it/s] 190it [00:43, 4.30it/s] 191it [00:44, 4.27it/s] 192it [00:44, 4.25it/s] 193it [00:44, 4.22it/s] 194it [00:44, 4.08it/s] 195it [00:45, 4.03it/s] 196it [00:45, 4.22it/s] 196it [00:45, 4.31it/s] +2025-05-26 02:33:13,711 - INFO - Epoch: 61, Objective: tensor([2204.2148], device='cuda:0', grad_fn=), Loss: 0.01952478662133217, KL/n: 22.221717834472656 + 0it [00:00, ?it/s]2025-05-26 02:33:14,278 - INFO - [Epoch 062 | Batch 0000] IWAE-loss 1198.3219 | mean log_px -0.0081 | KL -1089.96 + 1it [00:00, 3.34it/s] 2it [00:00, 4.00it/s] 3it [00:00, 4.24it/s] 4it [00:00, 4.40it/s] 5it [00:01, 4.33it/s] 6it [00:01, 4.41it/s] 7it [00:01, 4.53it/s] 8it [00:01, 4.58it/s] 9it [00:02, 4.63it/s] 10it [00:02, 4.48it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.61it/s] 13it [00:02, 4.60it/s] 14it [00:03, 4.65it/s] 15it [00:03, 4.67it/s] 16it [00:03, 4.68it/s] 17it [00:03, 4.70it/s] 18it [00:03, 4.53it/s] 19it [00:04, 4.59it/s] 20it [00:04, 4.58it/s] 21it [00:04, 4.62it/s] 22it [00:04, 4.64it/s] 23it [00:05, 4.65it/s] 24it [00:05, 4.67it/s] 25it [00:05, 4.69it/s] 26it [00:05, 4.70it/s] 27it [00:05, 4.70it/s] 28it [00:06, 4.71it/s] 29it [00:06, 4.54it/s] 30it [00:06, 4.61it/s] 31it [00:06, 4.65it/s] 32it [00:07, 4.66it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.69it/s] 35it [00:07, 4.54it/s] 36it [00:07, 4.61it/s] 37it [00:08, 4.64it/s] 38it [00:08, 4.65it/s] 39it [00:08, 4.67it/s] 40it [00:08, 4.68it/s] 41it [00:08, 4.69it/s] 42it [00:09, 4.69it/s] 43it [00:09, 4.70it/s] 44it [00:09, 4.52it/s] 45it [00:09, 4.60it/s] 46it [00:10, 4.62it/s] 47it [00:10, 4.66it/s] 48it [00:10, 4.66it/s] 49it [00:10, 4.52it/s] 50it [00:10, 4.59it/s]2025-05-26 02:33:25,088 - INFO - [Epoch 062 | Batch 0050] IWAE-loss 1275.6980 | mean log_px -0.0043 | KL -1085.77 + 51it [00:11, 4.62it/s] 52it [00:11, 4.63it/s] 53it [00:11, 4.67it/s] 54it [00:11, 4.51it/s] 55it [00:11, 4.57it/s] 56it [00:12, 4.62it/s] 57it [00:12, 4.65it/s] 58it [00:12, 4.67it/s] 59it [00:12, 4.64it/s] 60it [00:13, 4.66it/s] 61it [00:13, 4.68it/s] 62it [00:13, 4.69it/s] 63it [00:13, 4.69it/s] 64it [00:13, 4.70it/s] 65it [00:14, 4.70it/s] 66it [00:14, 4.54it/s] 67it [00:14, 4.61it/s] 68it [00:14, 4.64it/s] 69it [00:14, 4.67it/s] 70it [00:15, 4.67it/s] 71it [00:15, 4.52it/s] 72it [00:15, 4.54it/s] 73it [00:15, 4.59it/s] 74it [00:16, 4.63it/s] 75it [00:16, 4.65it/s] 76it [00:16, 4.67it/s] 77it [00:16, 4.68it/s] 78it [00:16, 4.69it/s] 79it [00:17, 4.53it/s] 80it [00:17, 4.60it/s] 81it [00:17, 4.64it/s] 82it [00:17, 4.65it/s] 83it [00:18, 4.68it/s] 84it [00:18, 4.68it/s] 85it [00:18, 4.70it/s] 86it [00:18, 4.69it/s] 87it [00:18, 4.70it/s] 88it [00:19, 4.51it/s] 89it [00:19, 4.59it/s] 90it [00:19, 4.62it/s] 91it [00:19, 4.65it/s] 92it [00:19, 4.51it/s] 93it [00:20, 4.58it/s] 94it [00:20, 4.62it/s] 95it [00:20, 4.66it/s] 96it [00:20, 4.67it/s] 97it [00:21, 4.69it/s] 98it [00:21, 4.69it/s] 99it [00:21, 4.70it/s] 100it [00:21, 4.70it/s]2025-05-26 02:33:35,859 - INFO - [Epoch 062 | Batch 0100] IWAE-loss 1882.4122 | mean log_px -0.0167 | KL -1085.27 + 101it [00:21, 4.53it/s] 102it [00:22, 4.59it/s] 103it [00:22, 4.61it/s] 104it [00:22, 4.64it/s] 105it [00:22, 4.66it/s] 106it [00:22, 4.67it/s] 107it [00:23, 4.68it/s] 108it [00:23, 4.70it/s] 109it [00:23, 4.54it/s] 110it [00:23, 4.60it/s] 111it [00:24, 4.63it/s] 112it [00:24, 4.58it/s] 113it [00:24, 4.63it/s] 114it [00:24, 4.47it/s] 115it [00:24, 4.49it/s] 116it [00:25, 4.55it/s] 117it [00:25, 4.59it/s] 118it [00:25, 4.61it/s] 119it [00:25, 4.63it/s] 120it [00:26, 4.51it/s] 121it [00:26, 4.59it/s] 122it [00:26, 4.62it/s] 123it [00:26, 4.65it/s] 124it [00:26, 4.66it/s] 125it [00:27, 4.68it/s] 126it [00:27, 4.69it/s] 127it [00:27, 4.53it/s] 128it [00:27, 4.60it/s] 129it [00:27, 4.63it/s] 130it [00:28, 4.65it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.54it/s] 133it [00:28, 4.61it/s] 134it [00:29, 4.63it/s] 135it [00:29, 4.66it/s] 136it [00:29, 4.52it/s] 137it [00:29, 4.59it/s] 138it [00:29, 4.63it/s] 139it [00:30, 4.64it/s] 140it [00:30, 4.66it/s] 141it [00:30, 4.69it/s] 142it [00:30, 4.69it/s] 143it [00:30, 4.70it/s] 144it [00:31, 4.71it/s] 145it [00:31, 4.71it/s] 146it [00:31, 4.70it/s] 147it [00:31, 4.71it/s] 148it [00:32, 4.70it/s] 149it [00:32, 4.71it/s] 150it [00:32, 4.70it/s]2025-05-26 02:33:46,666 - INFO - [Epoch 062 | Batch 0150] IWAE-loss 1197.9325 | mean log_px -0.0030 | KL -1087.20 + 151it [00:32, 4.70it/s] 152it [00:32, 4.69it/s] 153it [00:33, 4.53it/s] 154it [00:33, 4.59it/s] 155it [00:33, 4.63it/s] 156it [00:33, 4.65it/s] 157it [00:33, 4.66it/s] 158it [00:34, 4.66it/s] 159it [00:34, 4.68it/s] 160it [00:34, 4.69it/s] 161it [00:34, 4.69it/s] 162it [00:35, 4.51it/s] 163it [00:35, 4.59it/s] 164it [00:35, 4.62it/s] 165it [00:35, 4.61it/s] 166it [00:35, 4.63it/s] 167it [00:36, 4.66it/s] 168it [00:36, 4.50it/s] 169it [00:36, 4.58it/s] 170it [00:36, 4.61it/s] 171it [00:37, 4.64it/s] 172it [00:37, 4.66it/s] 173it [00:37, 4.68it/s] 174it [00:37, 4.69it/s] 175it [00:37, 4.70it/s] 176it [00:38, 4.70it/s] 177it [00:38, 4.54it/s] 178it [00:38, 4.60it/s] 179it [00:38, 4.63it/s] 180it [00:38, 4.65it/s] 181it [00:39, 4.67it/s] 182it [00:39, 4.67it/s] 183it [00:39, 4.52it/s] 184it [00:39, 4.58it/s] 185it [00:40, 4.61it/s] 186it [00:40, 4.63it/s] 187it [00:40, 4.66it/s] 188it [00:40, 4.47it/s] 189it [00:40, 4.54it/s] 190it [00:41, 4.60it/s] 191it [00:41, 4.64it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.51it/s] 194it [00:42, 4.58it/s] 195it [00:42, 4.54it/s] 196it [00:42, 4.59it/s] 196it [00:42, 4.61it/s] +2025-05-26 02:33:56,552 - INFO - Epoch: 62, Objective: tensor([1330.0718], device='cuda:0', grad_fn=), Loss: 0.0047620623372495174, KL/n: 22.193544387817383 + 0it [00:00, ?it/s]2025-05-26 02:33:56,949 - INFO - [Epoch 063 | Batch 0000] IWAE-loss 1133.7760 | mean log_px -0.0013 | KL -1085.79 + 1it [00:00, 3.09it/s] 2it [00:00, 3.76it/s] 3it [00:00, 3.97it/s] 4it [00:01, 4.02it/s] 5it [00:01, 4.14it/s] 6it [00:01, 4.28it/s] 7it [00:01, 4.10it/s] 8it [00:01, 4.09it/s] 9it [00:02, 4.27it/s] 10it [00:02, 4.38it/s] 11it [00:02, 4.47it/s] 12it [00:02, 4.42it/s] 13it [00:03, 4.48it/s] 14it [00:03, 4.52it/s] 15it [00:03, 4.57it/s] 16it [00:03, 4.30it/s] 17it [00:03, 4.42it/s] 18it [00:04, 4.33it/s] 19it [00:04, 4.43it/s] 20it [00:04, 4.44it/s] 21it [00:04, 4.42it/s] 22it [00:05, 4.49it/s] 23it [00:05, 4.56it/s] 24it [00:05, 4.54it/s] 25it [00:05, 4.31it/s] 26it [00:06, 4.26it/s] 27it [00:06, 4.24it/s] 28it [00:06, 4.21it/s] 29it [00:06, 4.24it/s] 30it [00:06, 4.24it/s] 31it [00:07, 4.26it/s] 32it [00:07, 4.27it/s] 33it [00:07, 4.17it/s] 34it [00:07, 4.30it/s] 35it [00:08, 4.42it/s] 36it [00:08, 4.32it/s] 37it [00:08, 4.32it/s] 38it [00:08, 4.15it/s] 39it [00:09, 4.18it/s] 40it [00:09, 4.20it/s] 41it [00:09, 4.21it/s] 42it [00:09, 4.22it/s] 43it [00:10, 4.27it/s] 44it [00:10, 4.38it/s] 45it [00:10, 4.47it/s] 46it [00:10, 4.37it/s] 47it [00:10, 4.37it/s] 48it [00:11, 4.21it/s] 49it [00:11, 4.36it/s] 50it [00:11, 4.44it/s]2025-05-26 02:34:08,463 - INFO - [Epoch 063 | Batch 0050] IWAE-loss 1150.0118 | mean log_px -0.0013 | KL -1081.11 + 51it [00:11, 4.51it/s] 52it [00:12, 4.26it/s] 53it [00:12, 4.35it/s] 54it [00:12, 4.41it/s] 55it [00:12, 4.42it/s] 56it [00:13, 4.35it/s] 57it [00:13, 4.31it/s] 58it [00:13, 4.13it/s] 59it [00:13, 4.18it/s] 60it [00:13, 4.28it/s] 61it [00:14, 4.38it/s] 62it [00:14, 4.34it/s] 63it [00:14, 4.32it/s] 64it [00:14, 4.31it/s] 65it [00:15, 4.40it/s] 66it [00:15, 4.38it/s] 67it [00:15, 4.33it/s] 68it [00:15, 4.30it/s] 69it [00:16, 4.20it/s] 70it [00:16, 4.35it/s] 71it [00:16, 4.35it/s] 72it [00:16, 4.32it/s] 73it [00:16, 4.36it/s] 74it [00:17, 4.31it/s] 75it [00:17, 4.29it/s] 76it [00:17, 4.26it/s] 77it [00:18, 3.48it/s] 78it [00:18, 3.76it/s] 79it [00:18, 3.90it/s] 80it [00:18, 4.09it/s] 81it [00:18, 4.26it/s] 82it [00:19, 4.33it/s] 83it [00:19, 4.22it/s] 84it [00:19, 4.25it/s] 85it [00:19, 4.38it/s] 86it [00:20, 4.36it/s] 87it [00:20, 4.48it/s] 88it [00:20, 4.46it/s] 89it [00:20, 4.51it/s] 90it [00:20, 4.49it/s] 91it [00:21, 4.48it/s] 92it [00:21, 4.53it/s] 93it [00:21, 4.53it/s] 94it [00:21, 4.54it/s] 95it [00:22, 4.57it/s] 96it [00:22, 4.58it/s] 97it [00:22, 4.58it/s] 98it [00:22, 4.43it/s] 99it [00:23, 4.27it/s] 100it [00:23, 4.25it/s]2025-05-26 02:34:20,081 - INFO - [Epoch 063 | Batch 0100] IWAE-loss 1351.5203 | mean log_px -0.0092 | KL -1081.81 + 101it [00:23, 4.37it/s] 102it [00:23, 4.31it/s] 103it [00:23, 4.30it/s] 104it [00:24, 4.28it/s] 105it [00:24, 4.28it/s] 106it [00:24, 4.25it/s] 107it [00:24, 4.38it/s] 108it [00:25, 4.47it/s] 109it [00:25, 4.40it/s] 110it [00:25, 4.36it/s] 111it [00:25, 4.35it/s] 112it [00:26, 4.28it/s] 113it [00:26, 4.32it/s] 114it [00:26, 4.25it/s] 115it [00:26, 4.27it/s] 116it [00:26, 4.24it/s] 117it [00:27, 4.28it/s] 118it [00:27, 4.12it/s] 119it [00:27, 4.23it/s] 120it [00:27, 4.34it/s] 121it [00:28, 4.44it/s] 122it [00:28, 4.40it/s] 123it [00:28, 4.46it/s] 124it [00:28, 4.41it/s] 125it [00:29, 4.35it/s] 126it [00:29, 4.44it/s] 127it [00:29, 4.40it/s] 128it [00:29, 4.39it/s] 129it [00:29, 4.36it/s] 130it [00:30, 4.33it/s] 131it [00:30, 4.36it/s] 132it [00:30, 4.44it/s] 133it [00:30, 4.38it/s] 134it [00:31, 4.34it/s] 135it [00:31, 4.33it/s] 136it [00:31, 4.44it/s] 137it [00:31, 4.38it/s] 138it [00:31, 4.45it/s] 139it [00:32, 4.38it/s] 140it [00:32, 4.35it/s] 141it [00:32, 4.37it/s] 142it [00:32, 4.46it/s] 143it [00:33, 4.47it/s] 144it [00:33, 4.52it/s] 145it [00:33, 4.32it/s] 146it [00:33, 4.14it/s] 147it [00:34, 4.18it/s] 148it [00:34, 4.33it/s] 149it [00:34, 4.44it/s] 150it [00:34, 4.51it/s]2025-05-26 02:34:31,539 - INFO - [Epoch 063 | Batch 0150] IWAE-loss 1242.8817 | mean log_px -0.0063 | KL -1077.83 + 151it [00:34, 4.41it/s] 152it [00:35, 4.35it/s] 153it [00:35, 4.46it/s] 154it [00:35, 4.50it/s] 155it [00:35, 4.43it/s] 156it [00:36, 4.28it/s] 157it [00:36, 4.31it/s] 158it [00:36, 4.41it/s] 159it [00:36, 4.36it/s] 160it [00:37, 4.25it/s] 161it [00:37, 4.36it/s] 162it [00:37, 4.46it/s] 163it [00:37, 4.44it/s] 164it [00:37, 4.34it/s] 165it [00:38, 4.29it/s] 166it [00:38, 4.34it/s] 167it [00:38, 4.43it/s] 168it [00:38, 4.31it/s] 169it [00:39, 4.16it/s] 170it [00:39, 4.31it/s] 171it [00:39, 4.29it/s] 172it [00:39, 4.27it/s] 173it [00:40, 4.31it/s] 174it [00:40, 4.33it/s] 175it [00:40, 4.30it/s] 176it [00:40, 4.11it/s] 177it [00:40, 4.29it/s] 178it [00:41, 4.27it/s] 179it [00:41, 4.40it/s] 180it [00:41, 4.33it/s] 181it [00:41, 4.33it/s] 182it [00:42, 4.32it/s] 183it [00:42, 4.31it/s] 184it [00:42, 4.25it/s] 185it [00:42, 4.28it/s] 186it [00:43, 4.24it/s] 187it [00:43, 4.31it/s] 188it [00:43, 4.11it/s] 189it [00:43, 4.16it/s] 190it [00:44, 4.19it/s] 191it [00:44, 4.26it/s] 192it [00:44, 4.28it/s] 193it [00:44, 4.39it/s] 194it [00:44, 4.42it/s] 195it [00:45, 4.15it/s] 196it [00:45, 4.28it/s] 196it [00:45, 4.31it/s] +2025-05-26 02:34:42,155 - INFO - Epoch: 63, Objective: tensor([1271.1880], device='cuda:0', grad_fn=), Loss: 0.0068045128136873245, KL/n: 21.986188888549805 + 0it [00:00, ?it/s]2025-05-26 02:34:42,546 - INFO - [Epoch 064 | Batch 0000] IWAE-loss 1491.5543 | mean log_px -0.0086 | KL -1077.20 + 1it [00:00, 3.14it/s] 2it [00:00, 3.88it/s] 3it [00:00, 4.19it/s] 4it [00:00, 4.34it/s] 5it [00:01, 4.46it/s] 6it [00:01, 4.42it/s] 7it [00:01, 4.51it/s] 8it [00:01, 4.55it/s] 9it [00:02, 4.60it/s] 10it [00:02, 4.62it/s] 11it [00:02, 4.60it/s] 12it [00:02, 4.48it/s] 13it [00:02, 4.50it/s] 14it [00:03, 4.55it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.61it/s] 18it [00:04, 4.64it/s] 19it [00:04, 4.64it/s] 20it [00:04, 4.65it/s] 21it [00:04, 4.66it/s] 22it [00:04, 4.52it/s] 23it [00:05, 4.59it/s] 24it [00:05, 4.62it/s] 25it [00:05, 4.65it/s] 26it [00:05, 4.67it/s] 27it [00:05, 4.58it/s] 28it [00:06, 4.63it/s] 29it [00:06, 4.65it/s] 30it [00:06, 4.66it/s] 31it [00:06, 4.68it/s] 32it [00:07, 4.54it/s] 33it [00:07, 4.61it/s] 34it [00:07, 4.64it/s] 35it [00:07, 4.66it/s] 36it [00:07, 4.68it/s] 37it [00:08, 4.69it/s] 38it [00:08, 4.69it/s] 39it [00:08, 4.70it/s] 40it [00:08, 4.54it/s] 41it [00:08, 4.60it/s] 42it [00:09, 4.62it/s] 43it [00:09, 4.65it/s] 44it [00:09, 4.65it/s] 45it [00:09, 4.67it/s] 46it [00:10, 4.67it/s] 47it [00:10, 4.68it/s] 48it [00:10, 4.69it/s] 49it [00:10, 4.67it/s] 50it [00:10, 4.70it/s]2025-05-26 02:34:53,343 - INFO - [Epoch 064 | Batch 0050] IWAE-loss 1201.7369 | mean log_px -0.0023 | KL -1074.23 + 51it [00:11, 4.69it/s] 52it [00:11, 4.53it/s] 53it [00:11, 4.59it/s] 54it [00:11, 4.62it/s] 55it [00:11, 4.64it/s] 56it [00:12, 4.65it/s] 57it [00:12, 4.67it/s] 58it [00:12, 4.69it/s] 59it [00:12, 4.70it/s] 60it [00:13, 4.70it/s] 61it [00:13, 4.71it/s] 62it [00:13, 4.55it/s] 63it [00:13, 4.62it/s] 64it [00:13, 4.63it/s] 65it [00:14, 4.66it/s] 66it [00:14, 4.61it/s] 67it [00:14, 4.49it/s] 68it [00:14, 4.53it/s] 69it [00:15, 4.57it/s] 70it [00:15, 4.59it/s] 71it [00:15, 4.61it/s] 72it [00:15, 4.46it/s] 73it [00:15, 4.54it/s] 74it [00:16, 4.54it/s] 75it [00:16, 4.59it/s] 76it [00:16, 4.61it/s] 77it [00:16, 4.64it/s] 78it [00:16, 4.66it/s] 79it [00:17, 4.68it/s] 80it [00:17, 4.67it/s] 81it [00:17, 4.70it/s] 82it [00:17, 4.53it/s] 83it [00:18, 4.60it/s] 84it [00:18, 4.63it/s] 85it [00:18, 4.64it/s] 86it [00:18, 4.66it/s] 87it [00:18, 4.62it/s] 88it [00:19, 4.58it/s] 89it [00:19, 4.63it/s] 90it [00:19, 4.65it/s] 91it [00:19, 4.49it/s] 92it [00:20, 4.47it/s] 93it [00:20, 4.53it/s] 94it [00:20, 4.57it/s] 95it [00:20, 4.61it/s] 96it [00:20, 4.63it/s] 97it [00:21, 4.65it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.68it/s] 100it [00:21, 4.69it/s]2025-05-26 02:35:04,185 - INFO - [Epoch 064 | Batch 0100] IWAE-loss 1448.6731 | mean log_px -0.0105 | KL -1068.36 + 101it [00:21, 4.69it/s] 102it [00:22, 4.69it/s] 103it [00:22, 4.70it/s] 104it [00:22, 4.70it/s] 105it [00:22, 4.71it/s] 106it [00:23, 4.71it/s] 107it [00:23, 4.72it/s] 108it [00:23, 4.56it/s] 109it [00:23, 4.62it/s] 110it [00:23, 4.64it/s] 111it [00:24, 4.66it/s] 112it [00:24, 4.67it/s] 113it [00:24, 4.68it/s] 114it [00:24, 4.69it/s] 115it [00:24, 4.70it/s] 116it [00:25, 4.70it/s] 117it [00:25, 4.71it/s] 118it [00:25, 4.70it/s] 119it [00:25, 4.71it/s] 120it [00:26, 4.69it/s] 121it [00:26, 4.70it/s] 122it [00:26, 4.71it/s] 123it [00:26, 4.68it/s] 124it [00:26, 4.54it/s] 125it [00:27, 4.60it/s] 126it [00:27, 4.57it/s] 127it [00:27, 4.58it/s] 128it [00:27, 4.62it/s] 129it [00:27, 4.65it/s] 130it [00:28, 4.65it/s] 131it [00:28, 4.66it/s] 132it [00:28, 4.68it/s] 133it [00:28, 4.69it/s] 134it [00:29, 4.69it/s] 135it [00:29, 4.70it/s] 136it [00:29, 4.70it/s] 137it [00:29, 4.70it/s] 138it [00:29, 4.69it/s] 139it [00:30, 4.70it/s] 140it [00:30, 4.70it/s] 141it [00:30, 4.70it/s] 142it [00:30, 4.68it/s] 143it [00:30, 4.41it/s] 144it [00:31, 4.22it/s] 145it [00:31, 4.22it/s] 146it [00:31, 4.20it/s] 147it [00:31, 4.19it/s] 148it [00:32, 4.31it/s] 149it [00:32, 4.41it/s] 150it [00:32, 4.49it/s]2025-05-26 02:35:15,057 - INFO - [Epoch 064 | Batch 0150] IWAE-loss 1139.3844 | mean log_px -0.0025 | KL -1069.10 + 151it [00:32, 4.54it/s] 152it [00:33, 4.59it/s] 153it [00:33, 4.63it/s] 154it [00:33, 4.64it/s] 155it [00:33, 4.66it/s] 156it [00:33, 4.67it/s] 157it [00:34, 4.68it/s] 158it [00:34, 4.53it/s] 159it [00:34, 4.60it/s] 160it [00:34, 4.63it/s] 161it [00:34, 4.65it/s] 162it [00:35, 4.66it/s] 163it [00:35, 4.67it/s] 164it [00:35, 4.68it/s] 165it [00:35, 4.69it/s] 166it [00:36, 4.69it/s] 167it [00:36, 4.70it/s] 168it [00:36, 4.69it/s] 169it [00:36, 4.69it/s] 170it [00:36, 4.69it/s] 171it [00:37, 4.68it/s] 172it [00:37, 4.68it/s] 173it [00:37, 4.69it/s] 174it [00:37, 4.69it/s] 175it [00:37, 4.70it/s] 176it [00:38, 4.70it/s] 177it [00:38, 4.70it/s] 178it [00:38, 4.69it/s] 179it [00:38, 4.66it/s] 180it [00:39, 4.67it/s] 181it [00:39, 4.68it/s] 182it [00:39, 4.68it/s] 183it [00:39, 4.70it/s] 184it [00:39, 4.69it/s] 185it [00:40, 4.70it/s] 186it [00:40, 4.69it/s] 187it [00:40, 4.58it/s] 188it [00:40, 4.63it/s] 189it [00:40, 4.65it/s] 190it [00:41, 4.65it/s] 191it [00:41, 4.66it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.66it/s] 194it [00:42, 4.66it/s] 195it [00:42, 4.54it/s] 196it [00:42, 4.59it/s] 196it [00:42, 4.61it/s] +2025-05-26 02:35:24,830 - INFO - Epoch: 64, Objective: tensor([1219.0177], device='cuda:0', grad_fn=), Loss: 0.005087015684694052, KL/n: 21.777986526489258 + 0it [00:00, ?it/s]2025-05-26 02:35:25,386 - INFO - [Epoch 065 | Batch 0000] IWAE-loss 1199.1672 | mean log_px -0.0037 | KL -1066.61 + 1it [00:00, 3.12it/s] 2it [00:00, 3.90it/s] 3it [00:00, 4.23it/s] 4it [00:00, 4.26it/s] 5it [00:01, 4.42it/s] 6it [00:01, 4.49it/s] 7it [00:01, 4.56it/s] 8it [00:01, 4.44it/s] 9it [00:02, 4.49it/s] 10it [00:02, 4.54it/s] 11it [00:02, 4.59it/s] 12it [00:02, 4.62it/s] 13it [00:02, 4.64it/s] 14it [00:03, 4.66it/s] 15it [00:03, 4.66it/s] 16it [00:03, 4.67it/s] 17it [00:03, 4.69it/s] 18it [00:03, 4.68it/s] 19it [00:04, 4.69it/s] 20it [00:04, 4.67it/s] 21it [00:04, 4.68it/s] 22it [00:04, 4.68it/s] 23it [00:05, 4.68it/s] 24it [00:05, 4.67it/s] 25it [00:05, 4.68it/s] 26it [00:05, 4.68it/s] 27it [00:05, 4.68it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.69it/s] 30it [00:06, 4.68it/s] 31it [00:06, 4.69it/s] 32it [00:06, 4.68it/s] 33it [00:07, 4.69it/s] 34it [00:07, 4.44it/s] 35it [00:07, 4.51it/s] 36it [00:07, 4.55it/s] 37it [00:08, 4.57it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.62it/s] 40it [00:08, 4.47it/s] 41it [00:08, 4.49it/s] 42it [00:09, 4.53it/s] 43it [00:09, 4.55it/s] 44it [00:09, 4.54it/s] 45it [00:09, 4.57it/s] 46it [00:10, 4.58it/s] 47it [00:10, 4.59it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.61it/s] 50it [00:10, 4.61it/s]2025-05-26 02:35:36,239 - INFO - [Epoch 065 | Batch 0050] IWAE-loss 1212.4058 | mean log_px -0.0064 | KL -1062.44 + 51it [00:11, 4.61it/s] 52it [00:11, 4.61it/s] 53it [00:11, 4.61it/s] 54it [00:11, 4.62it/s] 55it [00:12, 4.48it/s] 56it [00:12, 4.53it/s] 57it [00:12, 4.55it/s] 58it [00:12, 4.58it/s] 59it [00:12, 4.60it/s] 60it [00:13, 4.59it/s] 61it [00:13, 4.51it/s] 62it [00:13, 4.56it/s] 63it [00:13, 4.57it/s] 64it [00:13, 4.59it/s] 65it [00:14, 4.60it/s] 66it [00:14, 4.60it/s] 67it [00:14, 4.61it/s] 68it [00:14, 4.62it/s] 69it [00:15, 4.62it/s] 70it [00:15, 4.61it/s] 71it [00:15, 4.58it/s] 72it [00:15, 4.61it/s] 73it [00:15, 4.64it/s] 74it [00:16, 4.66it/s] 75it [00:16, 4.67it/s] 76it [00:16, 4.68it/s] 77it [00:16, 4.70it/s] 78it [00:17, 4.70it/s] 79it [00:17, 4.70it/s] 80it [00:17, 4.71it/s] 81it [00:17, 4.71it/s] 82it [00:17, 4.71it/s] 83it [00:18, 4.71it/s] 84it [00:18, 4.71it/s] 85it [00:18, 4.71it/s] 86it [00:18, 4.71it/s] 87it [00:18, 4.51it/s] 88it [00:19, 4.59it/s] 89it [00:19, 4.45it/s] 90it [00:19, 4.52it/s] 91it [00:19, 4.58it/s] 92it [00:20, 4.61it/s] 93it [00:20, 4.65it/s] 94it [00:20, 4.66it/s] 95it [00:20, 4.68it/s] 96it [00:20, 4.69it/s] 97it [00:21, 4.70it/s] 98it [00:21, 4.70it/s] 99it [00:21, 4.71it/s] 100it [00:21, 4.71it/s]2025-05-26 02:35:47,036 - INFO - [Epoch 065 | Batch 0100] IWAE-loss 1217.0249 | mean log_px -0.0038 | KL -1067.40 + 101it [00:21, 4.71it/s] 102it [00:22, 4.71it/s] 103it [00:22, 4.70it/s] 104it [00:22, 4.69it/s] 105it [00:22, 4.70it/s] 106it [00:23, 4.70it/s] 107it [00:23, 4.70it/s] 108it [00:23, 4.53it/s] 109it [00:23, 4.59it/s] 110it [00:23, 4.62it/s] 111it [00:24, 4.65it/s] 112it [00:24, 4.68it/s] 113it [00:24, 4.67it/s] 114it [00:24, 4.69it/s] 115it [00:24, 4.70it/s] 116it [00:25, 4.70it/s] 117it [00:25, 4.72it/s] 118it [00:25, 4.71it/s] 119it [00:25, 4.71it/s] 120it [00:26, 4.72it/s] 121it [00:26, 4.72it/s] 122it [00:26, 4.72it/s] 123it [00:26, 4.73it/s] 124it [00:26, 4.72it/s] 125it [00:27, 4.72it/s] 126it [00:27, 4.72it/s] 127it [00:27, 4.56it/s] 128it [00:27, 4.62it/s] 129it [00:27, 4.66it/s] 130it [00:28, 4.67it/s] 131it [00:28, 4.68it/s] 132it [00:28, 4.69it/s] 133it [00:28, 4.56it/s] 134it [00:29, 4.61it/s] 135it [00:29, 4.65it/s] 136it [00:29, 4.62it/s] 137it [00:29, 4.56it/s] 138it [00:29, 4.60it/s] 139it [00:30, 4.47it/s] 140it [00:30, 4.55it/s] 141it [00:30, 4.60it/s] 142it [00:30, 4.62it/s] 143it [00:30, 4.61it/s] 144it [00:31, 4.63it/s] 145it [00:31, 4.66it/s] 146it [00:31, 4.57it/s] 147it [00:31, 4.63it/s] 148it [00:32, 4.66it/s] 149it [00:32, 4.68it/s] 150it [00:32, 4.51it/s]2025-05-26 02:35:57,806 - INFO - [Epoch 065 | Batch 0150] IWAE-loss 1168.8063 | mean log_px -0.0032 | KL -1064.15 + 151it [00:32, 4.58it/s] 152it [00:32, 4.62it/s] 153it [00:33, 4.65it/s] 154it [00:33, 4.67it/s] 155it [00:33, 4.69it/s] 156it [00:33, 4.70it/s] 157it [00:33, 4.71it/s] 158it [00:34, 4.71it/s] 159it [00:34, 4.71it/s] 160it [00:34, 4.57it/s] 161it [00:34, 4.63it/s] 162it [00:35, 4.64it/s] 163it [00:35, 4.67it/s] 164it [00:35, 4.65it/s] 165it [00:35, 4.66it/s] 166it [00:35, 4.67it/s] 167it [00:36, 4.52it/s] 168it [00:36, 4.56it/s] 169it [00:36, 4.61it/s] 170it [00:36, 4.63it/s] 171it [00:37, 4.65it/s] 172it [00:37, 4.67it/s] 173it [00:37, 4.68it/s] 174it [00:37, 4.68it/s] 175it [00:37, 4.69it/s] 176it [00:38, 4.69it/s] 177it [00:38, 4.69it/s] 178it [00:38, 4.68it/s] 179it [00:38, 4.52it/s] 180it [00:38, 4.59it/s] 181it [00:39, 4.63it/s] 182it [00:39, 4.49it/s] 183it [00:39, 4.57it/s] 184it [00:39, 4.60it/s] 185it [00:40, 4.63it/s] 186it [00:40, 4.66it/s] 187it [00:40, 4.67it/s] 188it [00:40, 4.50it/s] 189it [00:40, 4.57it/s] 190it [00:41, 4.61it/s] 191it [00:41, 4.64it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.67it/s] 194it [00:41, 4.68it/s] 195it [00:42, 4.55it/s] 196it [00:42, 4.62it/s] 196it [00:42, 4.61it/s] +2025-05-26 02:36:07,639 - INFO - Epoch: 65, Objective: tensor([1230.9609], device='cuda:0', grad_fn=), Loss: 0.005760730244219303, KL/n: 21.655872344970703 + 0it [00:00, ?it/s]2025-05-26 02:36:08,015 - INFO - [Epoch 066 | Batch 0000] IWAE-loss 1246.0516 | mean log_px -0.0045 | KL -1060.09 + 1it [00:00, 3.10it/s] 2it [00:00, 3.90it/s] 3it [00:00, 4.24it/s] 4it [00:00, 4.39it/s] 5it [00:01, 4.49it/s] 6it [00:01, 4.56it/s] 7it [00:01, 4.62it/s] 8it [00:01, 4.47it/s] 9it [00:02, 4.57it/s] 10it [00:02, 4.61it/s] 11it [00:02, 4.65it/s] 12it [00:02, 4.66it/s] 13it [00:02, 4.52it/s] 14it [00:03, 4.59it/s] 15it [00:03, 4.58it/s] 16it [00:03, 4.62it/s] 17it [00:03, 4.65it/s] 18it [00:03, 4.67it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.59it/s] 21it [00:04, 4.63it/s] 22it [00:04, 4.65it/s] 23it [00:05, 4.67it/s] 24it [00:05, 4.68it/s] 25it [00:05, 4.70it/s] 26it [00:05, 4.70it/s] 27it [00:05, 4.71it/s] 28it [00:06, 4.52it/s] 29it [00:06, 4.59it/s] 30it [00:06, 4.63it/s] 31it [00:06, 4.66it/s] 32it [00:07, 4.67it/s] 33it [00:07, 4.68it/s] 34it [00:07, 4.69it/s] 35it [00:07, 4.70it/s] 36it [00:07, 4.71it/s] 37it [00:08, 4.54it/s] 38it [00:08, 4.38it/s] 39it [00:08, 4.47it/s] 40it [00:08, 4.51it/s] 41it [00:08, 4.56it/s] 42it [00:09, 4.59it/s] 43it [00:09, 4.61it/s] 44it [00:09, 4.63it/s] 45it [00:09, 4.66it/s] 46it [00:10, 4.67it/s] 47it [00:10, 4.69it/s] 48it [00:10, 4.69it/s] 49it [00:10, 4.71it/s] 50it [00:10, 4.71it/s]2025-05-26 02:36:18,834 - INFO - [Epoch 066 | Batch 0050] IWAE-loss 1207.2434 | mean log_px -0.0082 | KL -1055.60 + 51it [00:11, 4.68it/s] 52it [00:11, 3.68it/s] 53it [00:11, 3.95it/s] 54it [00:11, 4.15it/s] 55it [00:12, 4.16it/s] 56it [00:12, 4.33it/s] 57it [00:12, 4.45it/s] 58it [00:12, 4.52it/s] 59it [00:13, 4.58it/s] 60it [00:13, 4.62it/s] 61it [00:13, 4.65it/s] 62it [00:13, 4.67it/s] 63it [00:13, 4.69it/s] 64it [00:14, 4.53it/s] 65it [00:14, 4.60it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.66it/s] 68it [00:14, 4.67it/s] 69it [00:15, 4.68it/s] 70it [00:15, 4.68it/s] 71it [00:15, 4.68it/s] 72it [00:15, 4.67it/s] 73it [00:16, 4.51it/s] 74it [00:16, 4.57it/s] 75it [00:16, 4.61it/s] 76it [00:16, 4.64it/s] 77it [00:16, 4.63it/s] 78it [00:17, 4.65it/s] 79it [00:17, 4.67it/s] 80it [00:17, 4.69it/s] 81it [00:17, 4.70it/s] 82it [00:17, 4.69it/s] 83it [00:18, 4.54it/s] 84it [00:18, 4.60it/s] 85it [00:18, 4.64it/s] 86it [00:18, 4.65it/s] 87it [00:19, 4.68it/s] 88it [00:19, 4.68it/s] 89it [00:19, 4.70it/s] 90it [00:19, 4.70it/s] 91it [00:19, 4.71it/s] 92it [00:20, 4.53it/s] 93it [00:20, 4.60it/s] 94it [00:20, 4.63it/s] 95it [00:20, 4.67it/s] 96it [00:20, 4.68it/s] 97it [00:21, 4.66it/s] 98it [00:21, 4.68it/s] 99it [00:21, 4.69it/s] 100it [00:21, 4.69it/s]2025-05-26 02:36:29,772 - INFO - [Epoch 066 | Batch 0100] IWAE-loss 1485.7710 | mean log_px -0.0174 | KL -1055.98 + 101it [00:22, 4.51it/s] 102it [00:22, 4.55it/s] 103it [00:22, 4.58it/s] 104it [00:22, 4.59it/s] 105it [00:22, 4.61it/s] 106it [00:23, 4.63it/s] 107it [00:23, 4.50it/s] 108it [00:23, 4.57it/s] 109it [00:23, 4.62it/s] 110it [00:24, 4.64it/s] 111it [00:24, 4.66it/s] 112it [00:24, 4.67it/s] 113it [00:24, 4.68it/s] 114it [00:24, 4.68it/s] 115it [00:25, 4.70it/s] 116it [00:25, 4.53it/s] 117it [00:25, 4.61it/s] 118it [00:25, 4.63it/s] 119it [00:25, 4.66it/s] 120it [00:26, 4.67it/s] 121it [00:26, 4.69it/s] 122it [00:26, 4.69it/s] 123it [00:26, 4.70it/s] 124it [00:27, 4.70it/s] 125it [00:27, 4.71it/s] 126it [00:27, 4.71it/s] 127it [00:27, 4.72it/s] 128it [00:27, 4.55it/s] 129it [00:28, 4.61it/s] 130it [00:28, 4.64it/s] 131it [00:28, 4.67it/s] 132it [00:28, 4.68it/s] 133it [00:28, 4.70it/s] 134it [00:29, 4.52it/s] 135it [00:29, 4.58it/s] 136it [00:29, 4.62it/s] 137it [00:29, 4.65it/s] 138it [00:30, 4.66it/s] 139it [00:30, 4.67it/s] 140it [00:30, 4.51it/s] 141it [00:30, 4.59it/s] 142it [00:30, 4.62it/s] 143it [00:31, 4.53it/s] 144it [00:31, 4.59it/s] 145it [00:31, 4.65it/s] 146it [00:31, 4.66it/s] 147it [00:31, 4.68it/s] 148it [00:32, 4.52it/s] 149it [00:32, 4.60it/s] 150it [00:32, 4.63it/s]2025-05-26 02:36:40,588 - INFO - [Epoch 066 | Batch 0150] IWAE-loss 1216.0743 | mean log_px -0.0039 | KL -1054.95 + 151it [00:32, 4.65it/s] 152it [00:33, 4.66it/s] 153it [00:33, 4.68it/s] 154it [00:33, 4.69it/s] 155it [00:33, 4.70it/s] 156it [00:33, 4.51it/s] 157it [00:34, 4.59it/s] 158it [00:34, 4.62it/s] 159it [00:34, 4.66it/s] 160it [00:34, 4.67it/s] 161it [00:35, 4.52it/s] 162it [00:35, 4.59it/s] 163it [00:35, 4.62it/s] 164it [00:35, 4.64it/s] 165it [00:35, 4.66it/s] 166it [00:36, 4.51it/s] 167it [00:36, 4.58it/s] 168it [00:36, 4.61it/s] 169it [00:36, 4.48it/s] 170it [00:37, 4.56it/s] 171it [00:37, 4.62it/s] 172it [00:37, 4.64it/s] 173it [00:37, 4.67it/s] 174it [00:37, 4.68it/s] 175it [00:38, 4.53it/s] 176it [00:38, 4.60it/s] 177it [00:38, 4.63it/s] 178it [00:38, 4.65it/s] 179it [00:38, 4.68it/s] 180it [00:39, 4.69it/s] 181it [00:39, 4.70it/s] 182it [00:39, 4.48it/s] 183it [00:39, 4.52it/s] 184it [00:40, 4.55it/s] 185it [00:40, 4.58it/s] 186it [00:40, 4.59it/s] 187it [00:40, 4.60it/s] 188it [00:40, 4.63it/s] 189it [00:41, 4.49it/s] 190it [00:41, 4.57it/s] 191it [00:41, 4.62it/s] 192it [00:41, 4.65it/s] 193it [00:41, 4.64it/s] 194it [00:42, 4.66it/s] 195it [00:42, 4.59it/s] 196it [00:42, 4.64it/s] 196it [00:42, 4.59it/s] +2025-05-26 02:36:50,479 - INFO - Epoch: 66, Objective: tensor([1588.1846], device='cuda:0', grad_fn=), Loss: 0.013912596739828587, KL/n: 21.540197372436523 + 0it [00:00, ?it/s]2025-05-26 02:36:50,852 - INFO - [Epoch 067 | Batch 0000] IWAE-loss 1198.7195 | mean log_px -0.0020 | KL -1053.46 + 1it [00:00, 3.39it/s] 2it [00:00, 4.07it/s] 3it [00:00, 4.35it/s] 4it [00:00, 4.29it/s] 5it [00:01, 4.46it/s] 6it [00:01, 4.51it/s] 7it [00:01, 4.58it/s] 8it [00:01, 4.62it/s] 9it [00:02, 4.47it/s] 10it [00:02, 4.54it/s] 11it [00:02, 4.57it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.52it/s] 14it [00:03, 4.59it/s] 15it [00:03, 4.63it/s] 16it [00:03, 4.66it/s] 17it [00:03, 4.68it/s] 18it [00:03, 4.69it/s] 19it [00:04, 4.52it/s] 20it [00:04, 4.60it/s] 21it [00:04, 4.64it/s] 22it [00:04, 4.66it/s] 23it [00:05, 4.68it/s] 24it [00:05, 4.53it/s] 25it [00:05, 4.61it/s] 26it [00:05, 4.63it/s] 27it [00:05, 4.67it/s] 28it [00:06, 4.68it/s] 29it [00:06, 4.70it/s] 30it [00:06, 4.71it/s] 31it [00:06, 4.54it/s] 32it [00:07, 4.61it/s] 33it [00:07, 4.65it/s] 34it [00:07, 4.67it/s] 35it [00:07, 4.69it/s] 36it [00:07, 4.70it/s] 37it [00:08, 4.55it/s] 38it [00:08, 4.61it/s] 39it [00:08, 4.66it/s] 40it [00:08, 4.67it/s] 41it [00:08, 4.69it/s] 42it [00:09, 4.70it/s] 43it [00:09, 4.71it/s] 44it [00:09, 4.71it/s] 45it [00:09, 4.54it/s] 46it [00:10, 4.59it/s] 47it [00:10, 4.62it/s] 48it [00:10, 4.64it/s] 49it [00:10, 4.66it/s] 50it [00:10, 4.67it/s]2025-05-26 02:37:01,641 - INFO - [Epoch 067 | Batch 0050] IWAE-loss 1289.7285 | mean log_px -0.0091 | KL -1050.17 + 51it [00:11, 4.52it/s] 52it [00:11, 4.59it/s] 53it [00:11, 4.64it/s] 54it [00:11, 4.67it/s] 55it [00:11, 4.69it/s] 56it [00:12, 4.69it/s] 57it [00:12, 4.71it/s] 58it [00:12, 4.71it/s] 59it [00:12, 4.72it/s] 60it [00:13, 4.71it/s] 61it [00:13, 4.71it/s] 62it [00:13, 4.72it/s] 63it [00:13, 4.71it/s] 64it [00:13, 4.71it/s] 65it [00:14, 4.71it/s] 66it [00:14, 4.72it/s] 67it [00:14, 4.73it/s] 68it [00:14, 4.72it/s] 69it [00:14, 4.74it/s] 70it [00:15, 4.56it/s] 71it [00:15, 4.63it/s] 72it [00:15, 4.65it/s] 73it [00:15, 4.68it/s] 74it [00:16, 4.68it/s] 75it [00:16, 4.70it/s] 76it [00:16, 4.70it/s] 77it [00:16, 4.57it/s] 78it [00:16, 4.63it/s] 79it [00:17, 4.66it/s] 80it [00:17, 4.67it/s] 81it [00:17, 4.70it/s] 82it [00:17, 4.70it/s] 83it [00:17, 4.70it/s] 84it [00:18, 4.71it/s] 85it [00:18, 4.72it/s] 86it [00:18, 4.71it/s] 87it [00:18, 4.59it/s] 88it [00:19, 4.64it/s] 89it [00:19, 4.67it/s] 90it [00:19, 4.68it/s] 91it [00:19, 4.70it/s] 92it [00:19, 4.70it/s] 93it [00:20, 4.72it/s] 94it [00:20, 4.72it/s] 95it [00:20, 4.72it/s] 96it [00:20, 4.71it/s] 97it [00:20, 4.73it/s] 98it [00:21, 4.72it/s] 99it [00:21, 4.71it/s] 100it [00:21, 4.72it/s]2025-05-26 02:37:12,311 - INFO - [Epoch 067 | Batch 0100] IWAE-loss 1387.3746 | mean log_px -0.0188 | KL -1049.04 + 101it [00:21, 4.72it/s] 102it [00:21, 4.56it/s] 103it [00:22, 4.62it/s] 104it [00:22, 4.65it/s] 105it [00:22, 4.68it/s] 106it [00:22, 4.69it/s] 107it [00:23, 4.71it/s] 108it [00:23, 4.71it/s] 109it [00:23, 4.72it/s] 110it [00:23, 4.72it/s] 111it [00:23, 4.72it/s] 112it [00:24, 4.52it/s] 113it [00:24, 4.60it/s] 114it [00:24, 4.63it/s] 115it [00:24, 4.63it/s] 116it [00:24, 4.65it/s] 117it [00:25, 4.61it/s] 118it [00:25, 4.62it/s] 119it [00:25, 4.66it/s] 120it [00:25, 4.66it/s] 121it [00:26, 4.67it/s] 122it [00:26, 4.68it/s] 123it [00:26, 4.53it/s] 124it [00:26, 4.58it/s] 125it [00:26, 4.64it/s] 126it [00:27, 4.65it/s] 127it [00:27, 4.70it/s] 128it [00:27, 4.70it/s] 129it [00:27, 4.72it/s] 130it [00:28, 4.49it/s] 131it [00:28, 4.44it/s] 132it [00:28, 4.52it/s] 133it [00:28, 4.58it/s] 134it [00:28, 4.61it/s] 135it [00:29, 4.65it/s] 136it [00:29, 4.48it/s] 137it [00:29, 4.57it/s] 138it [00:29, 4.62it/s] 139it [00:29, 4.65it/s] 140it [00:30, 4.66it/s] 141it [00:30, 4.69it/s] 142it [00:30, 4.53it/s] 143it [00:30, 4.61it/s] 144it [00:31, 4.65it/s] 145it [00:31, 4.67it/s] 146it [00:31, 4.68it/s] 147it [00:31, 4.70it/s] 148it [00:31, 4.71it/s] 149it [00:32, 4.71it/s] 150it [00:32, 4.70it/s]2025-05-26 02:37:23,099 - INFO - [Epoch 067 | Batch 0150] IWAE-loss 1194.1609 | mean log_px -0.0024 | KL -1048.20 + 151it [00:32, 4.53it/s] 152it [00:32, 4.58it/s] 153it [00:32, 4.63it/s] 154it [00:33, 4.64it/s] 155it [00:33, 4.66it/s] 156it [00:33, 4.67it/s] 157it [00:33, 4.69it/s] 158it [00:34, 4.70it/s] 159it [00:34, 4.55it/s] 160it [00:34, 4.61it/s] 161it [00:34, 4.65it/s] 162it [00:34, 4.67it/s] 163it [00:35, 4.69it/s] 164it [00:35, 4.68it/s] 165it [00:35, 4.71it/s] 166it [00:35, 4.71it/s] 167it [00:36, 4.55it/s] 168it [00:36, 4.61it/s] 169it [00:36, 4.60it/s] 170it [00:36, 4.65it/s] 171it [00:36, 4.67it/s] 172it [00:37, 4.69it/s] 173it [00:37, 4.70it/s] 174it [00:37, 4.52it/s] 175it [00:37, 4.60it/s] 176it [00:37, 4.63it/s] 177it [00:38, 4.66it/s] 178it [00:38, 4.67it/s] 179it [00:38, 4.68it/s] 180it [00:38, 4.70it/s] 181it [00:38, 4.71it/s] 182it [00:39, 4.71it/s] 183it [00:39, 4.73it/s] 184it [00:39, 4.72it/s] 185it [00:39, 4.72it/s] 186it [00:40, 4.56it/s] 187it [00:40, 4.62it/s] 188it [00:40, 4.65it/s] 189it [00:40, 4.68it/s] 190it [00:40, 4.69it/s] 191it [00:41, 4.70it/s] 192it [00:41, 4.53it/s] 193it [00:41, 4.58it/s] 194it [00:41, 4.61it/s] 195it [00:42, 4.54it/s] 196it [00:42, 4.60it/s] 196it [00:42, 4.63it/s] +2025-05-26 02:37:32,921 - INFO - Epoch: 67, Objective: tensor([1625.6294], device='cuda:0', grad_fn=), Loss: 0.012983052060008049, KL/n: 21.431779861450195 + 0it [00:00, ?it/s]2025-05-26 02:37:33,482 - INFO - [Epoch 068 | Batch 0000] IWAE-loss 1262.3419 | mean log_px -0.0057 | KL -1050.64 + 1it [00:00, 3.39it/s] 2it [00:00, 4.05it/s] 3it [00:00, 4.34it/s] 4it [00:00, 4.48it/s] 5it [00:01, 4.39it/s] 6it [00:01, 4.50it/s] 7it [00:01, 4.58it/s] 8it [00:01, 4.62it/s] 9it [00:02, 4.66it/s] 10it [00:02, 4.68it/s] 11it [00:02, 4.53it/s] 12it [00:02, 4.60it/s] 13it [00:02, 4.64it/s] 14it [00:03, 4.67it/s] 15it [00:03, 4.68it/s] 16it [00:03, 4.69it/s] 17it [00:03, 4.71it/s] 18it [00:03, 4.70it/s] 19it [00:04, 4.71it/s] 20it [00:04, 4.71it/s] 21it [00:04, 4.70it/s] 22it [00:04, 4.54it/s] 23it [00:05, 4.61it/s] 24it [00:05, 4.60it/s] 25it [00:05, 4.46it/s] 26it [00:05, 4.55it/s] 27it [00:05, 4.60it/s] 28it [00:06, 4.64it/s] 29it [00:06, 4.67it/s] 30it [00:06, 4.64it/s] 31it [00:06, 4.51it/s] 32it [00:06, 4.59it/s] 33it [00:07, 4.63it/s] 34it [00:07, 4.66it/s] 35it [00:07, 4.69it/s] 36it [00:07, 4.70it/s] 37it [00:08, 4.72it/s] 38it [00:08, 4.56it/s] 39it [00:08, 4.62it/s] 40it [00:08, 4.65it/s] 41it [00:08, 4.67it/s] 42it [00:09, 4.69it/s] 43it [00:09, 4.71it/s] 44it [00:09, 4.70it/s] 45it [00:09, 4.72it/s] 46it [00:09, 4.71it/s] 47it [00:10, 4.73it/s] 48it [00:10, 4.72it/s] 49it [00:10, 4.73it/s] 50it [00:10, 4.72it/s]2025-05-26 02:37:44,218 - INFO - [Epoch 068 | Batch 0050] IWAE-loss 1151.6068 | mean log_px -0.0023 | KL -1047.97 + 51it [00:11, 4.73it/s] 52it [00:11, 4.73it/s] 53it [00:11, 4.73it/s] 54it [00:11, 4.72it/s] 55it [00:11, 4.72it/s] 56it [00:12, 4.70it/s] 57it [00:12, 4.71it/s] 58it [00:12, 4.54it/s] 59it [00:12, 4.59it/s] 60it [00:12, 4.62it/s] 61it [00:13, 4.65it/s] 62it [00:13, 4.65it/s] 63it [00:13, 4.67it/s] 64it [00:13, 4.51it/s] 65it [00:14, 4.59it/s] 66it [00:14, 4.63it/s] 67it [00:14, 4.66it/s] 68it [00:14, 4.68it/s] 69it [00:14, 4.69it/s] 70it [00:15, 4.70it/s] 71it [00:15, 4.72it/s] 72it [00:15, 4.71it/s] 73it [00:15, 4.72it/s] 74it [00:15, 4.71it/s] 75it [00:16, 4.72it/s] 76it [00:16, 4.56it/s] 77it [00:16, 4.60it/s] 78it [00:16, 4.55it/s] 79it [00:17, 4.52it/s] 80it [00:17, 4.57it/s] 81it [00:17, 4.62it/s] 82it [00:17, 4.65it/s] 83it [00:17, 4.68it/s] 84it [00:18, 4.68it/s] 85it [00:18, 4.68it/s] 86it [00:18, 4.56it/s] 87it [00:18, 4.63it/s] 88it [00:18, 4.66it/s] 89it [00:19, 4.69it/s] 90it [00:19, 4.69it/s] 91it [00:19, 4.71it/s] 92it [00:19, 4.71it/s] 93it [00:20, 4.72it/s] 94it [00:20, 4.72it/s] 95it [00:20, 4.72it/s] 96it [00:20, 4.58it/s] 97it [00:20, 4.64it/s] 98it [00:21, 4.66it/s] 99it [00:21, 4.69it/s] 100it [00:21, 4.69it/s]2025-05-26 02:37:54,953 - INFO - [Epoch 068 | Batch 0100] IWAE-loss 1225.7665 | mean log_px -0.0087 | KL -1041.03 + 101it [00:21, 4.71it/s] 102it [00:21, 4.71it/s] 103it [00:22, 4.70it/s] 104it [00:22, 4.71it/s] 105it [00:22, 4.72it/s] 106it [00:22, 4.73it/s] 107it [00:23, 4.73it/s] 108it [00:23, 4.72it/s] 109it [00:23, 4.73it/s] 110it [00:23, 4.73it/s] 111it [00:23, 4.73it/s] 112it [00:24, 4.73it/s] 113it [00:24, 4.73it/s] 114it [00:24, 4.73it/s] 115it [00:24, 4.74it/s] 116it [00:24, 4.73it/s] 117it [00:25, 4.73it/s] 118it [00:25, 4.72it/s] 119it [00:25, 4.73it/s] 120it [00:25, 4.73it/s] 121it [00:25, 4.73it/s] 122it [00:26, 4.69it/s] 123it [00:26, 4.68it/s] 124it [00:26, 4.67it/s] 125it [00:26, 4.69it/s] 126it [00:27, 4.70it/s] 127it [00:27, 4.72it/s] 128it [00:27, 4.72it/s] 129it [00:27, 4.72it/s] 130it [00:27, 4.69it/s] 131it [00:28, 4.73it/s] 132it [00:28, 4.72it/s] 133it [00:28, 4.56it/s] 134it [00:28, 4.62it/s] 135it [00:28, 4.64it/s] 136it [00:29, 4.65it/s] 137it [00:29, 4.66it/s] 138it [00:29, 4.68it/s] 139it [00:29, 4.68it/s] 140it [00:30, 4.69it/s] 141it [00:30, 4.57it/s] 142it [00:30, 4.62it/s] 143it [00:30, 4.66it/s] 144it [00:30, 4.68it/s] 145it [00:31, 4.69it/s] 146it [00:31, 4.53it/s] 147it [00:31, 4.57it/s] 148it [00:31, 4.61it/s] 149it [00:32, 4.65it/s] 150it [00:32, 4.66it/s]2025-05-26 02:38:05,626 - INFO - [Epoch 068 | Batch 0150] IWAE-loss 1264.9144 | mean log_px -0.0035 | KL -1042.59 + 151it [00:32, 4.68it/s] 152it [00:32, 4.70it/s] 153it [00:32, 4.71it/s] 154it [00:33, 4.70it/s] 155it [00:33, 4.57it/s] 156it [00:33, 4.63it/s] 157it [00:33, 4.67it/s] 158it [00:33, 4.51it/s] 159it [00:34, 4.49it/s] 160it [00:34, 4.55it/s] 161it [00:34, 4.60it/s] 162it [00:34, 4.51it/s] 163it [00:35, 4.58it/s] 164it [00:35, 4.61it/s] 165it [00:35, 4.64it/s] 166it [00:35, 4.64it/s] 167it [00:35, 4.66it/s] 168it [00:36, 4.52it/s] 169it [00:36, 4.59it/s] 170it [00:36, 4.62it/s] 171it [00:36, 4.67it/s] 172it [00:36, 4.68it/s] 173it [00:37, 4.70it/s] 174it [00:37, 4.47it/s] 175it [00:37, 4.56it/s] 176it [00:37, 4.60it/s] 177it [00:38, 4.64it/s] 178it [00:38, 4.67it/s] 179it [00:38, 4.52it/s] 180it [00:38, 4.59it/s] 181it [00:38, 4.63it/s] 182it [00:39, 4.66it/s] 183it [00:39, 4.65it/s] 184it [00:39, 4.67it/s] 185it [00:39, 4.69it/s] 186it [00:40, 4.54it/s] 187it [00:40, 4.61it/s] 188it [00:40, 4.64it/s] 189it [00:40, 4.68it/s] 190it [00:40, 4.69it/s] 191it [00:41, 4.70it/s] 192it [00:41, 4.70it/s] 193it [00:41, 4.55it/s] 194it [00:41, 4.62it/s] 195it [00:41, 4.55it/s] 196it [00:42, 4.61it/s] 196it [00:42, 4.64it/s] +2025-05-26 02:38:15,511 - INFO - Epoch: 68, Objective: tensor([1242.0751], device='cuda:0', grad_fn=), Loss: 0.003887968137860298, KL/n: 21.28978157043457 + 0it [00:00, ?it/s]2025-05-26 02:38:15,886 - INFO - [Epoch 069 | Batch 0000] IWAE-loss 1280.5768 | mean log_px -0.0051 | KL -1042.65 + 1it [00:00, 3.38it/s] 2it [00:00, 3.86it/s] 3it [00:00, 4.23it/s] 4it [00:00, 4.38it/s] 5it [00:01, 4.49it/s] 6it [00:01, 4.55it/s] 7it [00:01, 4.43it/s] 8it [00:01, 4.53it/s] 9it [00:02, 4.58it/s] 10it [00:02, 4.61it/s] 11it [00:02, 4.64it/s] 12it [00:02, 4.66it/s] 13it [00:02, 4.69it/s] 14it [00:03, 4.53it/s] 15it [00:03, 4.60it/s] 16it [00:03, 4.63it/s] 17it [00:03, 4.66it/s] 18it [00:03, 4.67it/s] 19it [00:04, 4.69it/s] 20it [00:04, 4.70it/s] 21it [00:04, 4.72it/s] 22it [00:04, 4.71it/s] 23it [00:05, 4.55it/s] 24it [00:05, 4.60it/s] 25it [00:05, 4.65it/s] 26it [00:05, 4.60it/s] 27it [00:06, 3.63it/s] 28it [00:06, 3.91it/s] 29it [00:06, 4.12it/s] 30it [00:06, 4.28it/s] 31it [00:06, 4.38it/s] 32it [00:07, 4.47it/s] 33it [00:07, 4.51it/s] 34it [00:07, 4.56it/s] 35it [00:07, 4.60it/s] 36it [00:08, 4.61it/s] 37it [00:08, 4.62it/s] 38it [00:08, 4.62it/s] 39it [00:08, 4.63it/s] 40it [00:08, 4.65it/s] 41it [00:09, 4.66it/s] 42it [00:09, 4.66it/s] 43it [00:09, 4.67it/s] 44it [00:09, 4.67it/s] 45it [00:09, 4.69it/s] 46it [00:10, 4.68it/s] 47it [00:10, 4.53it/s] 48it [00:10, 4.60it/s] 49it [00:10, 4.64it/s] 50it [00:11, 4.66it/s]2025-05-26 02:38:26,852 - INFO - [Epoch 069 | Batch 0050] IWAE-loss 1204.5205 | mean log_px -0.0046 | KL -1043.10 + 51it [00:11, 4.67it/s] 52it [00:11, 4.52it/s] 53it [00:11, 4.60it/s] 54it [00:11, 4.63it/s] 55it [00:12, 4.66it/s] 56it [00:12, 4.68it/s] 57it [00:12, 4.69it/s] 58it [00:12, 4.71it/s] 59it [00:12, 4.71it/s] 60it [00:13, 4.71it/s] 61it [00:13, 4.59it/s] 62it [00:13, 4.65it/s] 63it [00:13, 4.67it/s] 64it [00:14, 4.60it/s] 65it [00:14, 4.65it/s] 66it [00:14, 4.64it/s] 67it [00:14, 4.68it/s] 68it [00:14, 4.68it/s] 69it [00:15, 4.68it/s] 70it [00:15, 4.68it/s] 71it [00:15, 4.52it/s] 72it [00:15, 4.58it/s] 73it [00:16, 4.63it/s] 74it [00:16, 4.65it/s] 75it [00:16, 4.68it/s] 76it [00:16, 4.69it/s] 77it [00:16, 4.71it/s] 78it [00:17, 4.54it/s] 79it [00:17, 4.59it/s] 80it [00:17, 4.64it/s] 81it [00:17, 4.67it/s] 82it [00:17, 4.68it/s] 83it [00:18, 4.69it/s] 84it [00:18, 4.70it/s] 85it [00:18, 4.71it/s] 86it [00:18, 4.71it/s] 87it [00:18, 4.71it/s] 88it [00:19, 4.55it/s] 89it [00:19, 4.62it/s] 90it [00:19, 4.64it/s] 91it [00:19, 4.62it/s] 92it [00:20, 4.64it/s] 93it [00:20, 4.67it/s] 94it [00:20, 4.69it/s] 95it [00:20, 4.69it/s] 96it [00:20, 4.71it/s] 97it [00:21, 4.71it/s] 98it [00:21, 4.54it/s] 99it [00:21, 4.61it/s] 100it [00:21, 4.64it/s]2025-05-26 02:38:37,607 - INFO - [Epoch 069 | Batch 0100] IWAE-loss 1164.3147 | mean log_px -0.0017 | KL -1040.04 + 101it [00:22, 4.65it/s] 102it [00:22, 4.65it/s] 103it [00:22, 4.67it/s] 104it [00:22, 4.67it/s] 105it [00:22, 4.69it/s] 106it [00:23, 4.69it/s] 107it [00:23, 4.54it/s] 108it [00:23, 4.61it/s] 109it [00:23, 4.64it/s] 110it [00:23, 4.66it/s] 111it [00:24, 4.68it/s] 112it [00:24, 4.53it/s] 113it [00:24, 4.60it/s] 114it [00:24, 4.63it/s] 115it [00:25, 4.66it/s] 116it [00:25, 4.67it/s] 117it [00:25, 4.70it/s] 118it [00:25, 4.71it/s] 119it [00:25, 4.53it/s] 120it [00:26, 4.60it/s] 121it [00:26, 4.64it/s] 122it [00:26, 4.66it/s] 123it [00:26, 4.69it/s] 124it [00:26, 4.70it/s] 125it [00:27, 4.71it/s] 126it [00:27, 4.72it/s] 127it [00:27, 4.72it/s] 128it [00:27, 4.72it/s] 129it [00:28, 4.72it/s] 130it [00:28, 4.55it/s] 131it [00:28, 4.62it/s] 132it [00:28, 4.65it/s] 133it [00:28, 4.68it/s] 134it [00:29, 4.68it/s] 135it [00:29, 4.70it/s] 136it [00:29, 4.70it/s] 137it [00:29, 4.71it/s] 138it [00:29, 4.71it/s] 139it [00:30, 4.72it/s] 140it [00:30, 4.71it/s] 141it [00:30, 4.73it/s] 142it [00:30, 4.72it/s] 143it [00:31, 4.73it/s] 144it [00:31, 4.51it/s] 145it [00:31, 4.59it/s] 146it [00:31, 4.62it/s] 147it [00:31, 4.66it/s] 148it [00:32, 4.67it/s] 149it [00:32, 4.69it/s] 150it [00:32, 4.47it/s]2025-05-26 02:38:48,363 - INFO - [Epoch 069 | Batch 0150] IWAE-loss 1321.3817 | mean log_px -0.0040 | KL -1039.04 + 151it [00:32, 4.55it/s] 152it [00:32, 4.60it/s] 153it [00:33, 4.64it/s] 154it [00:33, 4.66it/s] 155it [00:33, 4.68it/s] 156it [00:33, 4.70it/s] 157it [00:34, 4.71it/s] 158it [00:34, 4.71it/s] 159it [00:34, 4.55it/s] 160it [00:34, 4.62it/s] 161it [00:34, 4.65it/s] 162it [00:35, 4.67it/s] 163it [00:35, 4.69it/s] 164it [00:35, 4.69it/s] 165it [00:35, 4.71it/s] 166it [00:35, 4.71it/s] 167it [00:36, 4.71it/s] 168it [00:36, 4.71it/s] 169it [00:36, 4.72it/s] 170it [00:36, 4.54it/s] 171it [00:37, 4.55it/s] 172it [00:37, 4.48it/s] 173it [00:37, 4.54it/s] 174it [00:37, 4.57it/s] 175it [00:37, 4.60it/s] 176it [00:38, 4.61it/s] 177it [00:38, 4.63it/s] 178it [00:38, 4.50it/s] 179it [00:38, 4.56it/s] 180it [00:39, 4.47it/s] 181it [00:39, 4.52it/s] 182it [00:39, 4.58it/s] 183it [00:39, 4.62it/s] 184it [00:39, 4.65it/s] 185it [00:40, 4.67it/s] 186it [00:40, 4.69it/s] 187it [00:40, 4.70it/s] 188it [00:40, 4.54it/s] 189it [00:40, 4.60it/s] 190it [00:41, 4.62it/s] 191it [00:41, 4.65it/s] 192it [00:41, 4.66it/s] 193it [00:41, 4.51it/s] 194it [00:42, 4.57it/s] 195it [00:42, 4.50it/s] 196it [00:42, 4.55it/s] 196it [00:42, 4.60it/s] +2025-05-26 02:38:58,227 - INFO - Epoch: 69, Objective: tensor([1152.8077], device='cuda:0', grad_fn=), Loss: 0.006191767752170563, KL/n: 21.240211486816406 +2025-05-26 02:38:58,232 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 1it [00:00, 9.81it/s] 4it [00:00, 20.04it/s] 7it [00:00, 24.35it/s] 11it [00:00, 26.31it/s] 14it [00:00, 26.70it/s] 17it [00:00, 27.49it/s] 20it [00:00, 27.48it/s] 23it [00:00, 27.83it/s] 26it [00:00, 27.97it/s] 30it [00:01, 28.32it/s] 33it [00:01, 28.32it/s] 37it [00:01, 28.56it/s] 40it [00:01, 28.14it/s] 43it [00:01, 28.40it/s] 46it [00:01, 28.13it/s] 50it [00:01, 28.59it/s] 54it [00:01, 28.74it/s] 57it [00:02, 28.24it/s] 60it [00:02, 28.32it/s] 64it [00:02, 28.70it/s] 67it [00:02, 28.25it/s] 71it [00:02, 28.45it/s] 75it [00:02, 28.90it/s] 78it [00:02, 28.33it/s] 81it [00:02, 28.45it/s] 85it [00:03, 28.54it/s] 89it [00:03, 28.72it/s] 92it [00:03, 28.46it/s] 95it [00:03, 28.53it/s] 99it [00:03, 28.32it/s] 102it [00:03, 28.57it/s] 105it [00:03, 28.18it/s] 108it [00:03, 27.92it/s] 111it [00:03, 27.99it/s] 114it [00:04, 28.12it/s] 117it [00:04, 28.13it/s] 120it [00:04, 28.43it/s] 123it [00:04, 27.97it/s] 126it [00:04, 28.06it/s] 129it [00:04, 28.20it/s] 132it [00:04, 28.53it/s] 136it [00:04, 28.78it/s] 139it [00:04, 28.10it/s] 142it [00:05, 28.39it/s] 146it [00:05, 28.45it/s] 149it [00:05, 28.46it/s] 152it [00:05, 28.20it/s] 155it [00:05, 28.33it/s] 158it [00:05, 28.72it/s] 161it [00:05, 28.34it/s] 164it [00:05, 28.41it/s] 167it [00:05, 28.47it/s] 170it [00:06, 28.60it/s] 173it [00:06, 28.20it/s] 176it [00:06, 28.26it/s] 180it [00:06, 28.73it/s] 183it [00:06, 28.23it/s] 187it [00:06, 28.55it/s] 190it [00:06, 28.25it/s] 193it [00:06, 28.44it/s] 196it [00:06, 28.44it/s] 199it [00:07, 28.76it/s] 202it [00:07, 28.37it/s] 205it [00:07, 28.70it/s] 209it [00:07, 28.44it/s] 213it [00:07, 28.70it/s] 217it [00:07, 28.50it/s] 221it [00:07, 28.74it/s] 225it [00:07, 28.54it/s] 229it [00:08, 28.62it/s] 233it [00:08, 28.85it/s] 236it [00:08, 28.73it/s] 239it [00:08, 28.04it/s] 243it [00:08, 28.63it/s] 246it [00:08, 28.04it/s] 250it [00:08, 28.17it/s] 254it [00:09, 28.51it/s] 258it [00:09, 28.92it/s] 261it [00:09, 28.46it/s] 264it [00:09, 28.53it/s] 267it [00:09, 28.48it/s] 271it [00:09, 28.93it/s] 274it [00:09, 28.61it/s] 277it [00:09, 28.13it/s] 280it [00:09, 26.35it/s] 280it [00:10, 27.98it/s] +2025-05-26 02:39:08,405 - INFO - Epoch: 0, Objective: 0.014402239583432674, Loss: 0.0063042594119906425, KL/n: 0.008097980171442032 + 0%| | 0/84 [00:00), Loss: 0.43466299772262573, KL/n: 68.75403594970703 + 0it [00:00, ?it/s]2025-05-26 03:14:51,541 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 28074.5488 | mean log_px -0.3577 | KL -3369.96 + 1it [00:00, 5.33it/s] 2it [00:00, 7.26it/s] 3it [00:00, 8.20it/s] 4it [00:00, 8.07it/s] 5it [00:00, 8.56it/s] 6it [00:00, 8.86it/s] 7it [00:00, 9.04it/s] 8it [00:00, 8.73it/s] 9it [00:01, 8.95it/s] 10it [00:01, 9.11it/s] 11it [00:01, 9.24it/s] 12it [00:01, 9.29it/s] 13it [00:01, 9.42it/s] 14it [00:01, 9.44it/s] 15it [00:01, 9.45it/s] 16it [00:01, 9.46it/s] 17it [00:01, 9.49it/s] 18it [00:02, 9.51it/s] 19it [00:02, 9.53it/s] 20it [00:02, 9.50it/s] 21it [00:02, 9.51it/s] 22it [00:02, 9.53it/s] 23it [00:02, 9.53it/s] 24it [00:02, 9.51it/s] 25it [00:02, 9.24it/s] 26it [00:02, 9.38it/s] 27it [00:02, 9.46it/s] 28it [00:03, 9.46it/s] 29it [00:03, 9.47it/s] 30it [00:03, 9.44it/s] 31it [00:03, 9.48it/s] 32it [00:03, 9.48it/s] 33it [00:03, 9.49it/s] 34it [00:03, 9.51it/s] 35it [00:03, 9.57it/s] 36it [00:03, 9.59it/s] 37it [00:04, 9.52it/s] 38it [00:04, 9.56it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.05it/s] 41it [00:04, 9.23it/s] 42it [00:04, 9.32it/s] 43it [00:04, 9.39it/s] 44it [00:04, 9.46it/s] 45it [00:04, 9.49it/s] 46it [00:04, 9.54it/s] 47it [00:05, 9.58it/s] 48it [00:05, 9.56it/s] 49it [00:05, 9.52it/s] 50it [00:05, 9.48it/s]2025-05-26 03:14:56,847 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 26761.6230 | mean log_px -0.3389 | KL -3393.95 + 51it [00:05, 9.55it/s] 52it [00:05, 9.50it/s] 53it [00:05, 9.53it/s] 54it [00:05, 9.53it/s] 55it [00:05, 9.56it/s] 56it [00:06, 9.53it/s] 57it [00:06, 9.53it/s] 58it [00:06, 9.50it/s] 59it [00:06, 9.50it/s] 60it [00:06, 9.50it/s] 61it [00:06, 9.56it/s] 62it [00:06, 9.52it/s] 63it [00:06, 9.52it/s] 64it [00:06, 9.43it/s] 65it [00:06, 9.47it/s] 66it [00:07, 9.49it/s] 67it [00:07, 9.50it/s] 68it [00:07, 9.51it/s] 69it [00:07, 8.96it/s] 70it [00:07, 9.12it/s] 71it [00:07, 9.27it/s] 72it [00:07, 9.35it/s] 73it [00:07, 9.00it/s] 74it [00:07, 9.13it/s] 75it [00:08, 9.16it/s] 76it [00:08, 9.23it/s] 77it [00:08, 9.31it/s] 78it [00:08, 8.93it/s] 79it [00:08, 9.03it/s] 80it [00:08, 9.19it/s] 81it [00:08, 9.31it/s] 82it [00:08, 9.34it/s] 83it [00:08, 9.45it/s] 84it [00:09, 9.45it/s] 85it [00:09, 9.49it/s] 86it [00:09, 9.55it/s] 87it [00:09, 9.61it/s] 88it [00:09, 9.52it/s] 89it [00:09, 9.54it/s] 90it [00:09, 9.48it/s] 91it [00:09, 9.51it/s] 92it [00:09, 9.51it/s] 93it [00:09, 9.47it/s] 94it [00:10, 9.50it/s] 95it [00:10, 9.49it/s] 96it [00:10, 9.50it/s] 97it [00:10, 9.44it/s] 98it [00:10, 8.87it/s] 99it [00:10, 8.92it/s] 100it [00:10, 9.11it/s]2025-05-26 03:15:02,193 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 28285.6133 | mean log_px -0.3769 | KL -3410.21 + 101it [00:10, 9.19it/s] 102it [00:10, 8.77it/s] 103it [00:11, 8.97it/s] 104it [00:11, 9.08it/s] 105it [00:11, 9.05it/s] 106it [00:11, 8.55it/s] 107it [00:11, 8.84it/s] 108it [00:11, 8.99it/s] 109it [00:11, 9.16it/s] 110it [00:11, 8.75it/s] 111it [00:11, 8.93it/s] 112it [00:12, 9.11it/s] 113it [00:12, 9.19it/s] 114it [00:12, 8.79it/s] 115it [00:12, 9.03it/s] 116it [00:12, 9.20it/s] 117it [00:12, 9.27it/s] 118it [00:12, 9.17it/s] 119it [00:12, 8.95it/s] 120it [00:12, 8.94it/s] 121it [00:13, 8.55it/s] 122it [00:13, 8.84it/s] 123it [00:13, 9.05it/s] 124it [00:13, 9.20it/s] 125it [00:13, 8.80it/s] 126it [00:13, 9.01it/s] 127it [00:13, 9.14it/s] 128it [00:13, 9.25it/s] 129it [00:13, 8.83it/s] 130it [00:14, 9.05it/s] 131it [00:14, 9.15it/s] 132it [00:14, 9.22it/s] 133it [00:14, 8.71it/s] 134it [00:14, 8.96it/s] 135it [00:14, 9.09it/s] 136it [00:14, 9.21it/s] 137it [00:14, 8.75it/s] 138it [00:14, 8.93it/s] 139it [00:15, 9.06it/s] 140it [00:15, 9.19it/s] 141it [00:15, 9.28it/s] 142it [00:15, 8.86it/s] 143it [00:15, 9.00it/s] 144it [00:15, 9.14it/s] 145it [00:15, 9.23it/s] 146it [00:15, 8.74it/s] 147it [00:15, 8.95it/s] 148it [00:16, 9.09it/s] 149it [00:16, 9.23it/s] 150it [00:16, 8.79it/s]2025-05-26 03:15:07,756 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 24188.4082 | mean log_px -0.3034 | KL -3424.15 + 151it [00:16, 9.02it/s] 152it [00:16, 9.15it/s] 153it [00:16, 9.27it/s] 154it [00:16, 8.83it/s] 155it [00:16, 9.02it/s] 156it [00:16, 9.14it/s] 157it [00:17, 9.23it/s] 158it [00:17, 8.82it/s] 159it [00:17, 9.07it/s] 160it [00:17, 9.15it/s] 161it [00:17, 9.23it/s] 162it [00:17, 8.78it/s] 163it [00:17, 8.99it/s] 164it [00:17, 8.62it/s] 165it [00:17, 8.86it/s] 166it [00:18, 9.07it/s] 167it [00:18, 9.14it/s] 168it [00:18, 8.69it/s] 169it [00:18, 8.95it/s] 170it [00:18, 9.08it/s] 171it [00:18, 9.20it/s] 172it [00:18, 8.79it/s] 173it [00:18, 8.99it/s] 174it [00:18, 9.17it/s] 175it [00:19, 9.24it/s] 176it [00:19, 8.81it/s] 177it [00:19, 9.03it/s] 178it [00:19, 9.20it/s] 179it [00:19, 9.31it/s] 180it [00:19, 8.88it/s] 181it [00:19, 9.08it/s] 182it [00:19, 9.07it/s] 183it [00:19, 9.15it/s] 184it [00:20, 8.75it/s] 185it [00:20, 8.97it/s] 186it [00:20, 9.15it/s] 187it [00:20, 9.27it/s] 188it [00:20, 8.85it/s] 189it [00:20, 9.02it/s] 190it [00:20, 9.14it/s] 191it [00:20, 9.27it/s] 192it [00:20, 8.87it/s] 193it [00:21, 9.07it/s] 194it [00:21, 9.20it/s] 195it [00:21, 8.76it/s] 196it [00:21, 8.52it/s] 196it [00:21, 9.13it/s] +2025-05-26 03:15:12,870 - INFO - Epoch: 1, Objective: tensor([25134.6309], device='cuda:0', grad_fn=), Loss: 0.3120049238204956, KL/n: 70.07382202148438 + 0it [00:00, ?it/s]2025-05-26 03:15:13,163 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 26034.8926 | mean log_px -0.3319 | KL -3429.36 + 1it [00:00, 4.91it/s] 2it [00:00, 6.83it/s] 3it [00:00, 7.88it/s] 4it [00:00, 8.49it/s] 5it [00:00, 8.90it/s] 6it [00:00, 8.90it/s] 7it [00:00, 9.08it/s] 8it [00:00, 9.19it/s] 9it [00:01, 9.27it/s] 10it [00:01, 9.36it/s] 11it [00:01, 9.40it/s] 12it [00:01, 9.44it/s] 13it [00:01, 9.47it/s] 14it [00:01, 9.47it/s] 15it [00:01, 9.47it/s] 16it [00:01, 9.47it/s] 17it [00:01, 9.50it/s] 18it [00:01, 9.50it/s] 19it [00:02, 9.50it/s] 20it [00:02, 9.51it/s] 21it [00:02, 9.51it/s] 22it [00:02, 9.54it/s] 23it [00:02, 9.53it/s] 24it [00:02, 9.53it/s] 25it [00:02, 9.50it/s] 26it [00:02, 9.43it/s] 27it [00:02, 9.45it/s] 28it [00:03, 9.50it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.50it/s] 31it [00:03, 9.57it/s] 32it [00:03, 9.53it/s] 33it [00:03, 9.52it/s] 34it [00:03, 9.51it/s] 35it [00:03, 9.45it/s] 36it [00:03, 9.44it/s] 37it [00:03, 9.46it/s] 38it [00:04, 9.47it/s] 39it [00:04, 9.50it/s] 40it [00:04, 9.50it/s] 41it [00:04, 9.48it/s] 42it [00:04, 9.53it/s] 43it [00:04, 9.55it/s] 44it [00:04, 9.53it/s] 45it [00:04, 9.54it/s] 46it [00:04, 9.54it/s] 47it [00:05, 9.58it/s] 48it [00:05, 9.54it/s] 49it [00:05, 9.53it/s] 50it [00:05, 9.52it/s]2025-05-26 03:15:18,427 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 24607.2324 | mean log_px -0.3063 | KL -3444.27 + 51it [00:05, 9.52it/s] 52it [00:05, 9.50it/s] 53it [00:05, 9.52it/s] 54it [00:05, 9.50it/s] 55it [00:05, 9.50it/s] 56it [00:05, 9.51it/s] 57it [00:06, 9.48it/s] 58it [00:06, 9.43it/s] 59it [00:06, 9.42it/s] 60it [00:06, 9.42it/s] 61it [00:06, 9.43it/s] 62it [00:06, 9.43it/s] 63it [00:06, 9.26it/s] 64it [00:06, 9.32it/s] 65it [00:06, 9.36it/s] 66it [00:07, 9.35it/s] 67it [00:07, 9.45it/s] 68it [00:07, 9.42it/s] 69it [00:07, 9.43it/s] 70it [00:07, 9.45it/s] 71it [00:07, 9.49it/s] 72it [00:07, 9.51it/s] 73it [00:07, 9.53it/s] 74it [00:07, 9.56it/s] 75it [00:08, 9.58it/s] 76it [00:08, 9.60it/s] 77it [00:08, 9.58it/s] 78it [00:08, 9.59it/s] 79it [00:08, 9.61it/s] 80it [00:08, 9.57it/s] 81it [00:08, 9.60it/s] 82it [00:08, 9.61it/s] 83it [00:08, 9.63it/s] 84it [00:08, 9.62it/s] 85it [00:09, 9.58it/s] 86it [00:09, 9.36it/s] 87it [00:09, 9.39it/s] 88it [00:09, 9.43it/s] 89it [00:09, 9.49it/s] 90it [00:09, 9.41it/s] 91it [00:09, 9.40it/s] 92it [00:09, 9.38it/s] 93it [00:09, 9.36it/s] 94it [00:10, 9.36it/s] 95it [00:10, 9.39it/s] 96it [00:10, 9.39it/s] 97it [00:10, 9.40it/s] 98it [00:10, 9.42it/s] 99it [00:10, 9.45it/s] 100it [00:10, 9.50it/s]2025-05-26 03:15:23,707 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 20464.7461 | mean log_px -0.2492 | KL -3452.10 + 101it [00:10, 9.54it/s] 102it [00:10, 9.53it/s] 103it [00:10, 9.57it/s] 104it [00:11, 9.58it/s] 105it [00:11, 9.59it/s] 106it [00:11, 9.58it/s] 107it [00:11, 6.39it/s] 108it [00:11, 7.06it/s] 109it [00:11, 7.65it/s] 110it [00:11, 8.11it/s] 111it [00:11, 8.53it/s] 112it [00:12, 8.84it/s] 113it [00:12, 9.08it/s] 114it [00:12, 9.18it/s] 115it [00:12, 9.28it/s] 116it [00:12, 9.34it/s] 117it [00:12, 9.37it/s] 118it [00:12, 9.40it/s] 119it [00:12, 9.41it/s] 120it [00:12, 9.45it/s] 121it [00:13, 9.47it/s] 122it [00:13, 9.48it/s] 123it [00:13, 9.50it/s] 124it [00:13, 9.41it/s] 125it [00:13, 9.43it/s] 126it [00:13, 9.46it/s] 127it [00:13, 9.47it/s] 128it [00:13, 9.49it/s] 129it [00:13, 9.49it/s] 130it [00:13, 9.51it/s] 131it [00:14, 9.50it/s] 132it [00:14, 9.56it/s] 133it [00:14, 9.60it/s] 134it [00:14, 9.53it/s] 135it [00:14, 9.51it/s] 136it [00:14, 9.49it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.50it/s] 139it [00:14, 9.51it/s] 140it [00:15, 9.50it/s] 141it [00:15, 9.51it/s] 142it [00:15, 9.42it/s] 143it [00:15, 9.46it/s] 144it [00:15, 9.48it/s] 145it [00:15, 9.47it/s] 146it [00:15, 9.48it/s] 147it [00:15, 9.49it/s] 148it [00:15, 9.45it/s] 149it [00:15, 9.46it/s] 150it [00:16, 9.40it/s]2025-05-26 03:15:29,145 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 18063.8633 | mean log_px -0.2179 | KL -3453.99 + 151it [00:16, 9.37it/s] 152it [00:16, 9.41it/s] 153it [00:16, 9.23it/s] 154it [00:16, 9.04it/s] 155it [00:16, 8.84it/s] 156it [00:16, 9.00it/s] 157it [00:16, 9.18it/s] 158it [00:16, 9.29it/s] 159it [00:17, 9.39it/s] 160it [00:17, 9.41it/s] 161it [00:17, 9.41it/s] 162it [00:17, 9.41it/s] 163it [00:17, 9.43it/s] 164it [00:17, 9.46it/s] 165it [00:17, 9.45it/s] 166it [00:17, 9.50it/s] 167it [00:17, 9.56it/s] 168it [00:18, 9.56it/s] 169it [00:18, 9.21it/s] 170it [00:18, 9.26it/s] 171it [00:18, 9.38it/s] 172it [00:18, 9.42it/s] 173it [00:18, 9.44it/s] 174it [00:18, 9.42it/s] 175it [00:18, 9.44it/s] 176it [00:18, 9.48it/s] 177it [00:18, 9.52it/s] 178it [00:19, 9.54it/s] 179it [00:19, 9.50it/s] 180it [00:19, 9.43it/s] 181it [00:19, 9.42it/s] 182it [00:19, 9.40it/s] 183it [00:19, 9.41it/s] 184it [00:19, 9.39it/s] 185it [00:19, 9.40it/s] 186it [00:19, 9.41it/s] 187it [00:20, 9.40it/s] 188it [00:20, 9.37it/s] 189it [00:20, 9.08it/s] 190it [00:20, 9.17it/s] 191it [00:20, 9.24it/s] 192it [00:20, 9.28it/s] 193it [00:20, 9.33it/s] 194it [00:20, 9.38it/s] 195it [00:20, 8.77it/s] 196it [00:21, 9.06it/s] 196it [00:21, 9.30it/s] +2025-05-26 03:15:34,082 - INFO - Epoch: 2, Objective: tensor([23773.6406], device='cuda:0', grad_fn=), Loss: 0.30370157957077026, KL/n: 70.60922241210938 + 0it [00:00, ?it/s]2025-05-26 03:15:34,369 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 22127.6270 | mean log_px -0.2715 | KL -3458.96 + 1it [00:00, 4.44it/s] 2it [00:00, 6.52it/s] 3it [00:00, 7.66it/s] 4it [00:00, 8.12it/s] 5it [00:00, 8.65it/s] 6it [00:00, 8.43it/s] 7it [00:00, 8.79it/s] 8it [00:00, 8.96it/s] 9it [00:01, 9.14it/s] 10it [00:01, 9.17it/s] 11it [00:01, 9.22it/s] 12it [00:01, 9.21it/s] 13it [00:01, 8.60it/s] 14it [00:01, 8.76it/s] 15it [00:01, 9.00it/s] 16it [00:01, 9.04it/s] 17it [00:01, 9.10it/s] 18it [00:02, 9.18it/s] 19it [00:02, 9.28it/s] 20it [00:02, 9.28it/s] 21it [00:02, 9.36it/s] 22it [00:02, 9.22it/s] 23it [00:02, 9.21it/s] 24it [00:02, 9.27it/s] 25it [00:02, 9.34it/s] 26it [00:02, 9.37it/s] 27it [00:03, 9.42it/s] 28it [00:03, 9.41it/s] 29it [00:03, 9.02it/s] 30it [00:03, 9.14it/s] 31it [00:03, 9.28it/s] 32it [00:03, 9.31it/s] 33it [00:03, 9.39it/s] 34it [00:03, 9.43it/s] 35it [00:03, 9.46it/s] 36it [00:04, 9.51it/s] 37it [00:04, 9.51it/s] 38it [00:04, 9.50it/s] 39it [00:04, 9.55it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.10it/s] 42it [00:04, 9.24it/s] 43it [00:04, 9.32it/s] 44it [00:04, 9.31it/s] 45it [00:04, 9.35it/s] 46it [00:05, 9.39it/s] 47it [00:05, 9.43it/s] 48it [00:05, 9.49it/s] 49it [00:05, 9.52it/s] 50it [00:05, 9.53it/s]2025-05-26 03:15:39,770 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 18690.7363 | mean log_px -0.2205 | KL -3462.40 + 51it [00:05, 9.44it/s] 52it [00:05, 9.45it/s] 53it [00:05, 9.51it/s] 54it [00:05, 9.48it/s] 55it [00:06, 9.51it/s] 56it [00:06, 9.49it/s] 57it [00:06, 9.48it/s] 58it [00:06, 9.45it/s] 59it [00:06, 9.51it/s] 60it [00:06, 9.58it/s] 61it [00:06, 9.58it/s] 62it [00:06, 9.52it/s] 63it [00:06, 9.54it/s] 64it [00:06, 9.54it/s] 65it [00:07, 9.54it/s] 66it [00:07, 9.53it/s] 67it [00:07, 9.55it/s] 68it [00:07, 9.54it/s] 69it [00:07, 9.58it/s] 70it [00:07, 9.52it/s] 71it [00:07, 9.54it/s] 72it [00:07, 9.14it/s] 73it [00:07, 9.24it/s] 74it [00:08, 9.29it/s] 75it [00:08, 9.32it/s] 76it [00:08, 9.41it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.50it/s] 79it [00:08, 9.48it/s] 80it [00:08, 9.45it/s] 81it [00:08, 9.38it/s] 82it [00:08, 9.41it/s] 83it [00:08, 9.42it/s] 84it [00:09, 9.37it/s] 85it [00:09, 9.33it/s] 86it [00:09, 9.37it/s] 87it [00:09, 9.39it/s] 88it [00:09, 9.40it/s] 89it [00:09, 9.44it/s] 90it [00:09, 9.44it/s] 91it [00:09, 9.42it/s] 92it [00:09, 9.26it/s] 93it [00:10, 9.31it/s] 94it [00:10, 9.39it/s] 95it [00:10, 9.44it/s] 96it [00:10, 9.48it/s] 97it [00:10, 9.53it/s] 98it [00:10, 9.55it/s] 99it [00:10, 9.54it/s] 100it [00:10, 9.51it/s]2025-05-26 03:15:45,059 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 22098.5781 | mean log_px -0.2703 | KL -3471.58 + 101it [00:10, 9.54it/s] 102it [00:10, 9.54it/s] 103it [00:11, 9.44it/s] 104it [00:11, 9.42it/s] 105it [00:11, 9.41it/s] 106it [00:11, 9.42it/s] 107it [00:11, 9.43it/s] 108it [00:11, 9.49it/s] 109it [00:11, 9.48it/s] 110it [00:11, 8.96it/s] 111it [00:11, 9.09it/s] 112it [00:12, 9.18it/s] 113it [00:12, 9.25it/s] 114it [00:12, 8.85it/s] 115it [00:12, 9.06it/s] 116it [00:12, 9.17it/s] 117it [00:12, 9.29it/s] 118it [00:12, 8.88it/s] 119it [00:12, 9.06it/s] 120it [00:12, 9.17it/s] 121it [00:13, 9.24it/s] 122it [00:13, 9.33it/s] 123it [00:13, 9.38it/s] 124it [00:13, 9.46it/s] 125it [00:13, 9.47it/s] 126it [00:13, 9.53it/s] 127it [00:13, 9.52it/s] 128it [00:13, 9.47it/s] 129it [00:13, 9.54it/s] 130it [00:14, 9.54it/s] 131it [00:14, 9.57it/s] 132it [00:14, 9.56it/s] 133it [00:14, 9.55it/s] 134it [00:14, 9.51it/s] 135it [00:14, 9.51it/s] 136it [00:14, 9.51it/s] 137it [00:14, 9.51it/s] 138it [00:14, 9.52it/s] 139it [00:14, 9.51it/s] 140it [00:15, 9.48it/s] 141it [00:15, 9.50it/s] 142it [00:15, 9.49it/s] 143it [00:15, 9.50it/s] 144it [00:15, 9.50it/s] 145it [00:15, 9.51it/s] 146it [00:15, 9.55it/s] 147it [00:15, 9.52it/s] 148it [00:15, 9.58it/s] 149it [00:15, 9.63it/s] 150it [00:16, 9.61it/s]2025-05-26 03:15:50,375 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 23228.7480 | mean log_px -0.2856 | KL -3470.63 + 151it [00:16, 9.57it/s] 152it [00:16, 9.59it/s] 153it [00:16, 9.56it/s] 154it [00:16, 9.52it/s] 155it [00:16, 9.51it/s] 156it [00:16, 9.08it/s] 157it [00:16, 9.17it/s] 158it [00:16, 9.22it/s] 159it [00:17, 8.83it/s] 160it [00:17, 9.02it/s] 161it [00:17, 9.14it/s] 162it [00:17, 9.26it/s] 163it [00:17, 9.30it/s] 164it [00:17, 9.34it/s] 165it [00:17, 9.35it/s] 166it [00:17, 9.37it/s] 167it [00:17, 9.38it/s] 168it [00:18, 9.41it/s] 169it [00:18, 9.43it/s] 170it [00:18, 9.44it/s] 171it [00:18, 9.48it/s] 172it [00:18, 9.43it/s] 173it [00:18, 9.47it/s] 174it [00:18, 9.49it/s] 175it [00:18, 9.51it/s] 176it [00:18, 9.52it/s] 177it [00:18, 9.57it/s] 178it [00:19, 9.58it/s] 179it [00:19, 9.53it/s] 180it [00:19, 9.52it/s] 181it [00:19, 9.54it/s] 182it [00:19, 9.03it/s] 183it [00:19, 9.18it/s] 184it [00:19, 9.24it/s] 185it [00:19, 9.33it/s] 186it [00:19, 9.07it/s] 187it [00:20, 9.21it/s] 188it [00:20, 9.30it/s] 189it [00:20, 9.35it/s] 190it [00:20, 8.91it/s] 191it [00:20, 9.06it/s] 192it [00:20, 9.20it/s] 193it [00:20, 9.26it/s] 194it [00:20, 8.85it/s] 195it [00:20, 8.55it/s] 196it [00:21, 8.86it/s] 196it [00:21, 9.28it/s] +2025-05-26 03:15:55,344 - INFO - Epoch: 3, Objective: tensor([23300.8750], device='cuda:0', grad_fn=), Loss: 0.2900332510471344, KL/n: 70.9906005859375 + 0it [00:00, ?it/s]2025-05-26 03:15:55,799 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 12282.2793 | mean log_px -0.1411 | KL -3474.90 + 1it [00:00, 5.34it/s] 2it [00:00, 6.95it/s] 3it [00:00, 7.77it/s] 4it [00:00, 8.42it/s] 5it [00:00, 8.78it/s] 6it [00:00, 9.03it/s] 7it [00:00, 9.21it/s] 8it [00:00, 9.31it/s] 9it [00:01, 9.38it/s] 10it [00:01, 9.36it/s] 11it [00:01, 9.40it/s] 12it [00:01, 9.44it/s] 13it [00:01, 9.47it/s] 14it [00:01, 9.47it/s] 15it [00:01, 9.51it/s] 16it [00:01, 9.54it/s] 17it [00:01, 9.59it/s] 18it [00:01, 9.57it/s] 19it [00:02, 9.64it/s] 20it [00:02, 9.57it/s] 21it [00:02, 9.61it/s] 22it [00:02, 9.55it/s] 23it [00:02, 9.37it/s] 24it [00:02, 8.99it/s] 25it [00:02, 9.22it/s] 26it [00:02, 9.35it/s] 27it [00:02, 8.90it/s] 28it [00:03, 9.11it/s] 29it [00:03, 9.27it/s] 30it [00:03, 9.36it/s] 31it [00:03, 8.88it/s] 32it [00:03, 9.08it/s] 33it [00:03, 9.30it/s] 34it [00:03, 9.42it/s] 35it [00:03, 9.53it/s] 36it [00:03, 9.47it/s] 37it [00:04, 8.91it/s] 38it [00:04, 9.14it/s] 39it [00:04, 9.31it/s] 40it [00:04, 9.44it/s] 41it [00:04, 9.54it/s] 42it [00:04, 9.58it/s] 43it [00:04, 9.64it/s] 44it [00:04, 9.67it/s] 45it [00:04, 9.70it/s] 46it [00:04, 9.72it/s] 47it [00:05, 9.71it/s] 48it [00:05, 9.71it/s] 49it [00:05, 9.73it/s] 50it [00:05, 9.72it/s]2025-05-26 03:16:01,098 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 23196.6523 | mean log_px -0.2816 | KL -3483.42 + 51it [00:05, 9.72it/s] 52it [00:05, 9.75it/s] 53it [00:05, 9.74it/s] 54it [00:05, 9.67it/s] 55it [00:05, 9.71it/s] 56it [00:06, 9.70it/s] 57it [00:06, 9.71it/s] 58it [00:06, 9.16it/s] 59it [00:06, 9.29it/s] 60it [00:06, 9.41it/s] 61it [00:06, 9.49it/s] 62it [00:06, 9.42it/s] 63it [00:06, 9.51it/s] 64it [00:06, 9.59it/s] 65it [00:06, 9.65it/s] 66it [00:07, 9.67it/s] 67it [00:07, 9.72it/s] 68it [00:07, 9.72it/s] 69it [00:07, 9.75it/s] 70it [00:07, 9.75it/s] 71it [00:07, 9.77it/s] 72it [00:07, 9.78it/s] 73it [00:07, 9.76it/s] 74it [00:07, 9.74it/s] 75it [00:07, 9.76it/s] 76it [00:08, 9.76it/s] 77it [00:08, 9.77it/s] 78it [00:08, 9.77it/s] 79it [00:08, 9.78it/s] 80it [00:08, 9.59it/s] 81it [00:08, 9.27it/s] 82it [00:08, 9.40it/s] 83it [00:08, 9.52it/s] 84it [00:08, 9.57it/s] 85it [00:09, 9.09it/s] 86it [00:09, 9.27it/s] 87it [00:09, 9.42it/s] 88it [00:09, 8.97it/s] 89it [00:09, 9.20it/s] 90it [00:09, 9.35it/s] 91it [00:09, 9.47it/s] 92it [00:09, 9.55it/s] 93it [00:09, 9.63it/s] 94it [00:09, 9.66it/s] 95it [00:10, 9.14it/s] 96it [00:10, 9.30it/s] 97it [00:10, 9.45it/s] 98it [00:10, 9.54it/s] 99it [00:10, 9.60it/s] 100it [00:10, 9.64it/s]2025-05-26 03:16:06,337 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 22043.1543 | mean log_px -0.2736 | KL -3483.78 + 101it [00:10, 9.65it/s] 102it [00:10, 9.67it/s] 103it [00:10, 9.71it/s] 104it [00:11, 9.71it/s] 105it [00:11, 9.73it/s] 106it [00:11, 9.73it/s] 107it [00:11, 9.73it/s] 108it [00:11, 9.16it/s] 109it [00:11, 9.08it/s] 110it [00:11, 9.17it/s] 111it [00:11, 9.35it/s] 112it [00:11, 9.45it/s] 113it [00:11, 9.54it/s] 114it [00:12, 9.60it/s] 115it [00:12, 9.66it/s] 116it [00:12, 9.66it/s] 117it [00:12, 9.69it/s] 118it [00:12, 9.71it/s] 119it [00:12, 9.70it/s] 120it [00:12, 9.17it/s] 121it [00:12, 9.30it/s] 122it [00:12, 9.38it/s] 123it [00:13, 9.49it/s] 124it [00:13, 9.48it/s] 125it [00:13, 9.44it/s] 126it [00:13, 9.43it/s] 127it [00:13, 9.51it/s] 128it [00:13, 9.57it/s] 129it [00:13, 9.64it/s] 130it [00:13, 9.66it/s] 131it [00:13, 9.68it/s] 132it [00:13, 9.70it/s] 133it [00:14, 9.71it/s] 134it [00:14, 9.71it/s] 135it [00:14, 9.75it/s] 136it [00:14, 9.74it/s] 137it [00:14, 9.44it/s] 138it [00:14, 9.13it/s] 139it [00:14, 9.31it/s] 140it [00:14, 9.43it/s] 141it [00:14, 8.97it/s] 142it [00:15, 9.04it/s] 143it [00:15, 9.19it/s] 144it [00:15, 9.27it/s] 145it [00:15, 8.83it/s] 146it [00:15, 9.00it/s] 147it [00:15, 9.11it/s] 148it [00:15, 9.26it/s] 149it [00:15, 9.29it/s] 150it [00:15, 9.35it/s]2025-05-26 03:16:11,638 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 22188.4727 | mean log_px -0.2672 | KL -3485.55 + 151it [00:16, 9.40it/s] 152it [00:16, 9.01it/s] 153it [00:16, 9.12it/s] 154it [00:16, 9.20it/s] 155it [00:16, 9.24it/s] 156it [00:16, 8.90it/s] 157it [00:16, 9.03it/s] 158it [00:16, 9.16it/s] 159it [00:16, 9.22it/s] 160it [00:17, 9.30it/s] 161it [00:17, 9.37it/s] 162it [00:17, 9.41it/s] 163it [00:17, 9.45it/s] 164it [00:17, 9.47it/s] 165it [00:17, 9.48it/s] 166it [00:17, 9.53it/s] 167it [00:17, 9.52it/s] 168it [00:17, 9.50it/s] 169it [00:17, 9.53it/s] 170it [00:18, 9.53it/s] 171it [00:18, 9.54it/s] 172it [00:18, 9.58it/s] 173it [00:18, 9.55it/s] 174it [00:18, 9.23it/s] 175it [00:18, 9.31it/s] 176it [00:18, 9.38it/s] 177it [00:18, 9.42it/s] 178it [00:18, 8.92it/s] 179it [00:19, 9.14it/s] 180it [00:19, 9.20it/s] 181it [00:19, 9.33it/s] 182it [00:19, 9.00it/s] 183it [00:19, 9.16it/s] 184it [00:19, 9.32it/s] 185it [00:19, 9.40it/s] 186it [00:19, 9.44it/s] 187it [00:19, 9.51it/s] 188it [00:19, 9.45it/s] 189it [00:20, 8.95it/s] 190it [00:20, 9.06it/s] 191it [00:20, 9.21it/s] 192it [00:20, 9.25it/s] 193it [00:20, 9.41it/s] 194it [00:20, 9.09it/s] 195it [00:20, 8.67it/s] 196it [00:20, 8.95it/s] 196it [00:20, 9.35it/s] +2025-05-26 03:16:16,612 - INFO - Epoch: 4, Objective: tensor([19702.6348], device='cuda:0', grad_fn=), Loss: 0.23782320320606232, KL/n: 71.2601089477539 + 0it [00:00, ?it/s]2025-05-26 03:16:16,889 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 16530.5488 | mean log_px -0.1878 | KL -3492.38 + 1it [00:00, 4.73it/s] 2it [00:00, 6.73it/s] 3it [00:00, 7.74it/s] 4it [00:00, 8.30it/s] 5it [00:00, 8.65it/s] 6it [00:00, 8.80it/s] 7it [00:00, 9.06it/s] 8it [00:00, 9.19it/s] 9it [00:01, 8.74it/s] 10it [00:01, 8.96it/s] 11it [00:01, 9.06it/s] 12it [00:01, 9.15it/s] 13it [00:01, 8.93it/s] 14it [00:01, 8.71it/s] 15it [00:01, 8.93it/s] 16it [00:01, 9.10it/s] 17it [00:01, 9.19it/s] 18it [00:02, 9.23it/s] 19it [00:02, 9.26it/s] 20it [00:02, 9.31it/s] 21it [00:02, 8.81it/s] 22it [00:02, 8.97it/s] 23it [00:02, 9.12it/s] 24it [00:02, 9.20it/s] 25it [00:02, 9.32it/s] 26it [00:02, 8.96it/s] 27it [00:03, 9.15it/s] 28it [00:03, 9.24it/s] 29it [00:03, 8.90it/s] 30it [00:03, 9.07it/s] 31it [00:03, 9.21it/s] 32it [00:03, 8.73it/s] 33it [00:03, 8.94it/s] 34it [00:03, 9.07it/s] 35it [00:03, 9.14it/s] 36it [00:04, 8.75it/s] 37it [00:04, 8.95it/s] 38it [00:04, 9.10it/s] 39it [00:04, 9.21it/s] 40it [00:04, 8.89it/s] 41it [00:04, 9.09it/s] 42it [00:04, 9.17it/s] 43it [00:04, 9.26it/s] 44it [00:04, 9.31it/s] 45it [00:05, 9.42it/s] 46it [00:05, 9.35it/s] 47it [00:05, 8.82it/s] 48it [00:05, 8.76it/s] 49it [00:05, 8.84it/s] 50it [00:05, 9.03it/s]2025-05-26 03:16:22,409 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 17774.5938 | mean log_px -0.2058 | KL -3492.53 + 51it [00:05, 9.17it/s] 52it [00:05, 8.73it/s] 53it [00:05, 8.93it/s] 54it [00:06, 9.05it/s] 55it [00:06, 9.20it/s] 56it [00:06, 9.26it/s] 57it [00:06, 9.38it/s] 58it [00:06, 8.84it/s] 59it [00:06, 9.03it/s] 60it [00:06, 9.14it/s] 61it [00:06, 9.27it/s] 62it [00:06, 9.33it/s] 63it [00:07, 9.39it/s] 64it [00:07, 9.44it/s] 65it [00:07, 9.43it/s] 66it [00:07, 9.43it/s] 67it [00:07, 9.03it/s] 68it [00:07, 9.14it/s] 69it [00:07, 9.23it/s] 70it [00:07, 8.81it/s] 71it [00:07, 8.91it/s] 72it [00:08, 9.01it/s] 73it [00:08, 9.15it/s] 74it [00:08, 9.25it/s] 75it [00:08, 9.36it/s] 76it [00:08, 8.88it/s] 77it [00:08, 9.07it/s] 78it [00:08, 9.21it/s] 79it [00:08, 9.35it/s] 80it [00:08, 9.39it/s] 81it [00:08, 9.39it/s] 82it [00:09, 9.39it/s] 83it [00:09, 9.41it/s] 84it [00:09, 8.91it/s] 85it [00:09, 9.08it/s] 86it [00:09, 9.19it/s] 87it [00:09, 9.26it/s] 88it [00:09, 8.84it/s] 89it [00:09, 9.01it/s] 90it [00:09, 9.14it/s] 91it [00:10, 9.21it/s] 92it [00:10, 8.79it/s] 93it [00:10, 8.93it/s] 94it [00:10, 9.10it/s] 95it [00:10, 8.73it/s] 96it [00:10, 8.94it/s] 97it [00:10, 9.10it/s] 98it [00:10, 9.23it/s] 99it [00:10, 8.81it/s] 100it [00:11, 9.00it/s]2025-05-26 03:16:27,891 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 13819.5430 | mean log_px -0.1567 | KL -3497.92 + 101it [00:11, 9.16it/s] 102it [00:11, 9.26it/s] 103it [00:11, 8.86it/s] 104it [00:11, 9.01it/s] 105it [00:11, 9.18it/s] 106it [00:11, 9.30it/s] 107it [00:11, 9.37it/s] 108it [00:11, 9.44it/s] 109it [00:12, 9.48it/s] 110it [00:12, 9.52it/s] 111it [00:12, 9.51it/s] 112it [00:12, 9.57it/s] 113it [00:12, 9.00it/s] 114it [00:12, 9.20it/s] 115it [00:12, 9.37it/s] 116it [00:12, 9.41it/s] 117it [00:12, 9.48it/s] 118it [00:13, 8.99it/s] 119it [00:13, 9.15it/s] 120it [00:13, 9.24it/s] 121it [00:13, 9.35it/s] 122it [00:13, 9.41it/s] 123it [00:13, 9.48it/s] 124it [00:13, 9.48it/s] 125it [00:13, 9.52it/s] 126it [00:13, 9.58it/s] 127it [00:13, 9.58it/s] 128it [00:14, 9.56it/s] 129it [00:14, 9.60it/s] 130it [00:14, 9.53it/s] 131it [00:14, 9.12it/s] 132it [00:14, 9.22it/s] 133it [00:14, 9.29it/s] 134it [00:14, 9.34it/s] 135it [00:14, 9.43it/s] 136it [00:14, 9.38it/s] 137it [00:15, 9.49it/s] 138it [00:15, 9.56it/s] 139it [00:15, 9.55it/s] 140it [00:15, 9.59it/s] 141it [00:15, 9.16it/s] 142it [00:15, 9.30it/s] 143it [00:15, 9.38it/s] 144it [00:15, 9.41it/s] 145it [00:15, 9.43it/s] 146it [00:15, 9.48it/s] 147it [00:16, 9.52it/s] 148it [00:16, 9.53it/s] 149it [00:16, 9.50it/s] 150it [00:16, 8.97it/s]2025-05-26 03:16:33,232 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 18954.9707 | mean log_px -0.2272 | KL -3503.50 + 151it [00:16, 9.16it/s] 152it [00:16, 9.30it/s] 153it [00:16, 9.34it/s] 154it [00:16, 8.90it/s] 155it [00:16, 9.09it/s] 156it [00:17, 9.14it/s] 157it [00:17, 9.28it/s] 158it [00:17, 8.83it/s] 159it [00:17, 9.05it/s] 160it [00:17, 8.70it/s] 161it [00:17, 8.92it/s] 162it [00:17, 9.14it/s] 163it [00:17, 8.74it/s] 164it [00:17, 8.93it/s] 165it [00:18, 9.12it/s] 166it [00:18, 9.27it/s] 167it [00:18, 8.85it/s] 168it [00:18, 9.07it/s] 169it [00:18, 9.25it/s] 170it [00:18, 9.37it/s] 171it [00:18, 8.91it/s] 172it [00:18, 9.10it/s] 173it [00:18, 9.23it/s] 174it [00:19, 9.27it/s] 175it [00:19, 8.84it/s] 176it [00:19, 9.03it/s] 177it [00:19, 9.19it/s] 178it [00:19, 9.29it/s] 179it [00:19, 8.92it/s] 180it [00:19, 9.11it/s] 181it [00:19, 9.25it/s] 182it [00:19, 9.32it/s] 183it [00:20, 8.87it/s] 184it [00:20, 9.06it/s] 185it [00:20, 9.20it/s] 186it [00:20, 9.29it/s] 187it [00:20, 8.86it/s] 188it [00:20, 9.04it/s] 189it [00:20, 9.18it/s] 190it [00:20, 9.31it/s] 191it [00:20, 8.89it/s] 192it [00:21, 9.07it/s] 193it [00:21, 9.19it/s] 194it [00:21, 9.27it/s] 195it [00:21, 8.29it/s] 196it [00:21, 8.66it/s] 196it [00:21, 9.09it/s] +2025-05-26 03:16:38,299 - INFO - Epoch: 5, Objective: tensor([12165.8643], device='cuda:0', grad_fn=), Loss: 0.1356792002916336, KL/n: 71.50433349609375 + 0it [00:00, ?it/s]2025-05-26 03:16:38,777 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 17046.0859 | mean log_px -0.1989 | KL -3502.32 + 1it [00:00, 4.40it/s] 2it [00:00, 6.40it/s] 3it [00:00, 7.52it/s] 4it [00:00, 7.75it/s] 5it [00:00, 8.28it/s] 6it [00:00, 8.66it/s] 7it [00:00, 8.91it/s] 8it [00:00, 9.08it/s] 9it [00:01, 9.20it/s] 10it [00:01, 8.83it/s] 11it [00:01, 9.04it/s] 12it [00:01, 9.18it/s] 13it [00:01, 9.30it/s] 14it [00:01, 9.35it/s] 15it [00:01, 9.01it/s] 16it [00:01, 9.13it/s] 17it [00:01, 9.22it/s] 18it [00:02, 8.88it/s] 19it [00:02, 9.00it/s] 20it [00:02, 9.13it/s] 21it [00:02, 9.22it/s] 22it [00:02, 9.24it/s] 23it [00:02, 9.29it/s] 24it [00:02, 8.93it/s] 25it [00:02, 9.08it/s] 26it [00:02, 9.14it/s] 27it [00:03, 9.19it/s] 28it [00:03, 9.25it/s] 29it [00:03, 9.33it/s] 30it [00:03, 9.39it/s] 31it [00:03, 9.42it/s] 32it [00:03, 9.43it/s] 33it [00:03, 9.44it/s] 34it [00:03, 9.39it/s] 35it [00:03, 9.47it/s] 36it [00:04, 8.93it/s] 37it [00:04, 9.10it/s] 38it [00:04, 9.20it/s] 39it [00:04, 9.24it/s] 40it [00:04, 9.29it/s] 41it [00:04, 9.28it/s] 42it [00:04, 9.31it/s] 43it [00:04, 9.41it/s] 44it [00:04, 9.42it/s] 45it [00:04, 9.45it/s] 46it [00:05, 9.44it/s] 47it [00:05, 9.42it/s] 48it [00:05, 9.45it/s] 49it [00:05, 9.51it/s] 50it [00:05, 9.49it/s]2025-05-26 03:16:44,196 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 15465.3457 | mean log_px -0.1867 | KL -3503.66 + 51it [00:05, 9.54it/s] 52it [00:05, 9.55it/s] 53it [00:05, 9.53it/s] 54it [00:05, 9.47it/s] 55it [00:06, 8.91it/s] 56it [00:06, 9.04it/s] 57it [00:06, 9.17it/s] 58it [00:06, 9.24it/s] 59it [00:06, 9.26it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.42it/s] 62it [00:06, 9.44it/s] 63it [00:06, 9.48it/s] 64it [00:07, 9.44it/s] 65it [00:07, 8.94it/s] 66it [00:07, 9.05it/s] 67it [00:07, 9.21it/s] 68it [00:07, 9.26it/s] 69it [00:07, 9.32it/s] 70it [00:07, 9.38it/s] 71it [00:07, 9.41it/s] 72it [00:07, 9.41it/s] 73it [00:07, 9.45it/s] 74it [00:08, 9.44it/s] 75it [00:08, 9.50it/s] 76it [00:08, 8.95it/s] 77it [00:08, 9.09it/s] 78it [00:08, 9.16it/s] 79it [00:08, 9.21it/s] 80it [00:08, 9.29it/s] 81it [00:08, 9.37it/s] 82it [00:08, 9.44it/s] 83it [00:09, 9.47it/s] 84it [00:09, 9.50it/s] 85it [00:09, 9.52it/s] 86it [00:09, 9.03it/s] 87it [00:09, 9.17it/s] 88it [00:09, 9.17it/s] 89it [00:09, 9.26it/s] 90it [00:09, 9.36it/s] 91it [00:09, 9.37it/s] 92it [00:10, 9.39it/s] 93it [00:10, 9.39it/s] 94it [00:10, 9.34it/s] 95it [00:10, 8.85it/s] 96it [00:10, 9.05it/s] 97it [00:10, 9.17it/s] 98it [00:10, 9.20it/s] 99it [00:10, 9.25it/s] 100it [00:10, 9.32it/s]2025-05-26 03:16:49,585 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 16232.7539 | mean log_px -0.1872 | KL -3505.36 + 101it [00:11, 9.33it/s] 102it [00:11, 8.78it/s] 103it [00:11, 9.02it/s] 104it [00:11, 9.13it/s] 105it [00:11, 9.22it/s] 106it [00:11, 9.32it/s] 107it [00:11, 9.43it/s] 108it [00:11, 9.44it/s] 109it [00:11, 9.40it/s] 110it [00:12, 8.76it/s] 111it [00:12, 8.82it/s] 112it [00:12, 9.05it/s] 113it [00:12, 9.22it/s] 114it [00:12, 9.29it/s] 115it [00:12, 9.37it/s] 116it [00:12, 9.42it/s] 117it [00:12, 8.91it/s] 118it [00:12, 9.12it/s] 119it [00:12, 9.24it/s] 120it [00:13, 9.35it/s] 121it [00:13, 9.41it/s] 122it [00:13, 9.43it/s] 123it [00:13, 9.46it/s] 124it [00:13, 9.46it/s] 125it [00:13, 9.49it/s] 126it [00:13, 9.49it/s] 127it [00:13, 9.46it/s] 128it [00:13, 9.50it/s] 129it [00:14, 8.94it/s] 130it [00:14, 9.08it/s] 131it [00:14, 9.18it/s] 132it [00:14, 9.30it/s] 133it [00:14, 9.36it/s] 134it [00:14, 9.40it/s] 135it [00:14, 9.43it/s] 136it [00:14, 9.43it/s] 137it [00:14, 9.48it/s] 138it [00:15, 9.47it/s] 139it [00:15, 9.45it/s] 140it [00:15, 9.47it/s] 141it [00:15, 9.46it/s] 142it [00:15, 9.47it/s] 143it [00:15, 9.45it/s] 144it [00:15, 9.46it/s] 145it [00:15, 9.30it/s] 146it [00:15, 9.37it/s] 147it [00:15, 9.37it/s] 148it [00:16, 9.38it/s] 149it [00:16, 9.41it/s] 150it [00:16, 9.39it/s]2025-05-26 03:16:54,957 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 16457.2578 | mean log_px -0.1880 | KL -3506.98 + 151it [00:16, 9.38it/s] 152it [00:16, 9.39it/s] 153it [00:16, 9.40it/s] 154it [00:16, 9.40it/s] 155it [00:16, 9.44it/s] 156it [00:16, 9.46it/s] 157it [00:17, 9.49it/s] 158it [00:17, 9.52it/s] 159it [00:17, 9.52it/s] 160it [00:17, 9.53it/s] 161it [00:17, 9.46it/s] 162it [00:17, 9.48it/s] 163it [00:17, 9.52it/s] 164it [00:17, 9.51it/s] 165it [00:17, 9.49it/s] 166it [00:17, 9.48it/s] 167it [00:18, 9.52it/s] 168it [00:18, 9.51it/s] 169it [00:18, 9.46it/s] 170it [00:18, 9.45it/s] 171it [00:18, 9.49it/s] 172it [00:18, 9.45it/s] 173it [00:18, 9.46it/s] 174it [00:18, 9.46it/s] 175it [00:18, 9.45it/s] 176it [00:19, 9.47it/s] 177it [00:19, 9.29it/s] 178it [00:19, 9.34it/s] 179it [00:19, 9.38it/s] 180it [00:19, 9.42it/s] 181it [00:19, 9.45it/s] 182it [00:19, 9.45it/s] 183it [00:19, 9.51it/s] 184it [00:19, 9.55it/s] 185it [00:19, 9.49it/s] 186it [00:20, 9.50it/s] 187it [00:20, 9.51it/s] 188it [00:20, 9.49it/s] 189it [00:20, 9.25it/s] 190it [00:20, 9.23it/s] 191it [00:20, 9.29it/s] 192it [00:20, 9.38it/s] 193it [00:20, 9.18it/s] 194it [00:20, 9.18it/s] 195it [00:21, 8.73it/s] 196it [00:21, 9.00it/s] 196it [00:21, 9.23it/s] +2025-05-26 03:16:59,860 - INFO - Epoch: 6, Objective: tensor([15376.6016], device='cuda:0', grad_fn=), Loss: 0.17358337342739105, KL/n: 71.75361633300781 + 0it [00:00, ?it/s]2025-05-26 03:17:00,136 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 17575.0977 | mean log_px -0.2084 | KL -3514.32 + 1it [00:00, 4.72it/s] 2it [00:00, 6.68it/s] 3it [00:00, 7.75it/s] 4it [00:00, 8.35it/s] 5it [00:00, 8.78it/s] 6it [00:00, 8.50it/s] 7it [00:00, 8.84it/s] 8it [00:00, 9.09it/s] 9it [00:01, 9.26it/s] 10it [00:01, 8.90it/s] 11it [00:01, 9.06it/s] 12it [00:01, 9.09it/s] 13it [00:01, 8.83it/s] 14it [00:01, 9.02it/s] 15it [00:01, 9.17it/s] 16it [00:01, 9.23it/s] 17it [00:01, 9.36it/s] 18it [00:02, 8.89it/s] 19it [00:02, 9.09it/s] 20it [00:02, 9.15it/s] 21it [00:02, 9.23it/s] 22it [00:02, 9.28it/s] 23it [00:02, 9.31it/s] 24it [00:02, 9.39it/s] 25it [00:02, 9.45it/s] 26it [00:02, 9.07it/s] 27it [00:03, 9.19it/s] 28it [00:03, 9.33it/s] 29it [00:03, 9.41it/s] 30it [00:03, 8.94it/s] 31it [00:03, 9.08it/s] 32it [00:03, 9.19it/s] 33it [00:03, 9.27it/s] 34it [00:03, 8.83it/s] 35it [00:03, 9.02it/s] 36it [00:04, 9.20it/s] 37it [00:04, 9.31it/s] 38it [00:04, 8.95it/s] 39it [00:04, 9.08it/s] 40it [00:04, 9.18it/s] 41it [00:04, 9.33it/s] 42it [00:04, 9.36it/s] 43it [00:04, 9.41it/s] 44it [00:04, 9.48it/s] 45it [00:05, 8.98it/s] 46it [00:05, 9.13it/s] 47it [00:05, 9.27it/s] 48it [00:05, 9.34it/s] 49it [00:05, 8.78it/s] 50it [00:05, 8.97it/s]2025-05-26 03:17:05,608 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 11222.3057 | mean log_px -0.1177 | KL -3518.79 + 51it [00:05, 9.17it/s] 52it [00:05, 9.29it/s] 53it [00:05, 8.74it/s] 54it [00:05, 9.00it/s] 55it [00:06, 9.16it/s] 56it [00:06, 9.23it/s] 57it [00:06, 9.40it/s] 58it [00:06, 9.46it/s] 59it [00:06, 9.51it/s] 60it [00:06, 9.49it/s] 61it [00:06, 9.49it/s] 62it [00:06, 9.53it/s] 63it [00:06, 9.49it/s] 64it [00:07, 8.93it/s] 65it [00:07, 9.04it/s] 66it [00:07, 9.17it/s] 67it [00:07, 9.26it/s] 68it [00:07, 8.91it/s] 69it [00:07, 9.06it/s] 70it [00:07, 9.24it/s] 71it [00:07, 9.36it/s] 72it [00:07, 9.35it/s] 73it [00:08, 9.39it/s] 74it [00:08, 9.39it/s] 75it [00:08, 9.39it/s] 76it [00:08, 9.48it/s] 77it [00:08, 9.53it/s] 78it [00:08, 9.57it/s] 79it [00:08, 8.97it/s] 80it [00:08, 9.08it/s] 81it [00:08, 9.23it/s] 82it [00:08, 9.36it/s] 83it [00:09, 9.40it/s] 84it [00:09, 9.35it/s] 85it [00:09, 9.37it/s] 86it [00:09, 9.48it/s] 87it [00:09, 9.48it/s] 88it [00:09, 9.47it/s] 89it [00:09, 9.45it/s] 90it [00:09, 9.42it/s] 91it [00:09, 8.79it/s] 92it [00:10, 8.65it/s] 93it [00:10, 8.94it/s] 94it [00:10, 9.08it/s] 95it [00:10, 9.23it/s] 96it [00:10, 9.33it/s] 97it [00:10, 9.43it/s] 98it [00:10, 9.51it/s] 99it [00:10, 9.57it/s] 100it [00:10, 9.61it/s]2025-05-26 03:17:10,979 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 15323.3848 | mean log_px -0.1767 | KL -3517.25 + 101it [00:11, 9.55it/s] 102it [00:11, 9.42it/s] 103it [00:11, 9.49it/s] 104it [00:11, 9.50it/s] 105it [00:11, 9.45it/s] 106it [00:11, 9.38it/s] 107it [00:11, 9.50it/s] 108it [00:11, 8.94it/s] 109it [00:11, 9.12it/s] 110it [00:12, 9.21it/s] 111it [00:12, 9.33it/s] 112it [00:12, 9.42it/s] 113it [00:12, 8.97it/s] 114it [00:12, 9.05it/s] 115it [00:12, 9.26it/s] 116it [00:12, 9.27it/s] 117it [00:12, 9.36it/s] 118it [00:12, 9.40it/s] 119it [00:12, 9.47it/s] 120it [00:13, 9.47it/s] 121it [00:13, 9.49it/s] 122it [00:13, 9.57it/s] 123it [00:13, 9.64it/s] 124it [00:13, 9.60it/s] 125it [00:13, 9.59it/s] 126it [00:13, 9.58it/s] 127it [00:13, 9.57it/s] 128it [00:13, 9.56it/s] 129it [00:14, 9.54it/s] 130it [00:14, 9.46it/s] 131it [00:14, 9.48it/s] 132it [00:14, 9.42it/s] 133it [00:14, 9.47it/s] 134it [00:14, 9.36it/s] 135it [00:14, 9.13it/s] 136it [00:14, 9.03it/s] 137it [00:14, 9.22it/s] 138it [00:14, 9.28it/s] 139it [00:15, 9.40it/s] 140it [00:15, 9.49it/s] 141it [00:15, 9.50it/s] 142it [00:15, 9.51it/s] 143it [00:15, 9.41it/s] 144it [00:15, 9.43it/s] 145it [00:15, 9.55it/s] 146it [00:15, 9.64it/s] 147it [00:15, 9.70it/s] 148it [00:16, 9.75it/s] 149it [00:16, 9.80it/s] 150it [00:16, 9.82it/s]2025-05-26 03:17:16,279 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 19223.7129 | mean log_px -0.2297 | KL -3526.62 + 151it [00:16, 9.73it/s] 152it [00:16, 9.78it/s] 153it [00:16, 9.80it/s] 154it [00:16, 9.76it/s] 155it [00:16, 9.62it/s] 156it [00:16, 9.53it/s] 157it [00:16, 9.53it/s] 158it [00:17, 9.51it/s] 159it [00:17, 9.48it/s] 160it [00:17, 9.43it/s] 161it [00:17, 9.43it/s] 162it [00:17, 9.39it/s] 163it [00:17, 9.38it/s] 164it [00:17, 9.32it/s] 165it [00:17, 9.44it/s] 166it [00:17, 9.48it/s] 167it [00:18, 9.55it/s] 168it [00:18, 9.54it/s] 169it [00:18, 9.57it/s] 170it [00:18, 9.60it/s] 171it [00:18, 9.00it/s] 172it [00:18, 9.16it/s] 173it [00:18, 9.26it/s] 174it [00:18, 9.34it/s] 175it [00:18, 9.43it/s] 176it [00:18, 9.46it/s] 177it [00:19, 9.51it/s] 178it [00:19, 9.49it/s] 179it [00:19, 9.48it/s] 180it [00:19, 9.45it/s] 181it [00:19, 9.50it/s] 182it [00:19, 9.42it/s] 183it [00:19, 9.49it/s] 184it [00:19, 9.53it/s] 185it [00:19, 9.61it/s] 186it [00:20, 9.12it/s] 187it [00:20, 9.24it/s] 188it [00:20, 9.37it/s] 189it [00:20, 9.35it/s] 190it [00:20, 9.40it/s] 191it [00:20, 9.45it/s] 192it [00:20, 9.47it/s] 193it [00:20, 9.47it/s] 194it [00:20, 9.45it/s] 195it [00:21, 8.89it/s] 196it [00:21, 9.10it/s] 196it [00:21, 9.26it/s] +2025-05-26 03:17:21,168 - INFO - Epoch: 7, Objective: tensor([11751.9316], device='cuda:0', grad_fn=), Loss: 0.11317390948534012, KL/n: 71.94717407226562 + 0it [00:00, ?it/s]2025-05-26 03:17:21,630 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 14055.2070 | mean log_px -0.1545 | KL -3523.18 + 1it [00:00, 5.24it/s] 2it [00:00, 7.11it/s] 3it [00:00, 8.07it/s] 4it [00:00, 8.62it/s] 5it [00:00, 8.89it/s] 6it [00:00, 9.05it/s] 7it [00:00, 9.23it/s] 8it [00:00, 9.33it/s] 9it [00:01, 9.37it/s] 10it [00:01, 9.34it/s] 11it [00:01, 9.47it/s] 12it [00:01, 9.53it/s] 13it [00:01, 9.55it/s] 14it [00:01, 9.49it/s] 15it [00:01, 9.55it/s] 16it [00:01, 9.52it/s] 17it [00:01, 9.49it/s] 18it [00:01, 9.46it/s] 19it [00:02, 9.48it/s] 20it [00:02, 9.49it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.49it/s] 23it [00:02, 9.49it/s] 24it [00:02, 9.46it/s] 25it [00:02, 9.50it/s] 26it [00:02, 9.50it/s] 27it [00:02, 9.56it/s] 28it [00:03, 9.55it/s] 29it [00:03, 9.59it/s] 30it [00:03, 9.03it/s] 31it [00:03, 9.09it/s] 32it [00:03, 9.19it/s] 33it [00:03, 9.30it/s] 34it [00:03, 8.89it/s] 35it [00:03, 9.07it/s] 36it [00:03, 9.16it/s] 37it [00:04, 9.25it/s] 38it [00:04, 8.85it/s] 39it [00:04, 9.02it/s] 40it [00:04, 9.17it/s] 41it [00:04, 9.31it/s] 42it [00:04, 8.89it/s] 43it [00:04, 9.05it/s] 44it [00:04, 9.18it/s] 45it [00:04, 9.27it/s] 46it [00:05, 8.84it/s] 47it [00:05, 8.97it/s] 48it [00:05, 9.07it/s] 49it [00:05, 9.21it/s] 50it [00:05, 8.80it/s]2025-05-26 03:17:27,014 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 12810.5664 | mean log_px -0.1418 | KL -3528.74 + 51it [00:05, 8.97it/s] 52it [00:05, 9.13it/s] 53it [00:05, 9.25it/s] 54it [00:05, 8.81it/s] 55it [00:06, 8.98it/s] 56it [00:06, 9.13it/s] 57it [00:06, 9.25it/s] 58it [00:06, 8.86it/s] 59it [00:06, 9.03it/s] 60it [00:06, 9.11it/s] 61it [00:06, 9.25it/s] 62it [00:06, 8.85it/s] 63it [00:06, 9.02it/s] 64it [00:07, 9.17it/s] 65it [00:07, 9.29it/s] 66it [00:07, 9.27it/s] 67it [00:07, 8.81it/s] 68it [00:07, 9.03it/s] 69it [00:07, 9.14it/s] 70it [00:07, 8.78it/s] 71it [00:07, 8.92it/s] 72it [00:07, 9.09it/s] 73it [00:07, 9.18it/s] 74it [00:08, 9.28it/s] 75it [00:08, 8.89it/s] 76it [00:08, 9.03it/s] 77it [00:08, 9.15it/s] 78it [00:08, 9.22it/s] 79it [00:08, 9.32it/s] 80it [00:08, 9.43it/s] 81it [00:08, 9.44it/s] 82it [00:08, 9.01it/s] 83it [00:09, 9.17it/s] 84it [00:09, 9.30it/s] 85it [00:09, 9.28it/s] 86it [00:09, 9.33it/s] 87it [00:09, 9.39it/s] 88it [00:09, 9.42it/s] 89it [00:09, 9.45it/s] 90it [00:09, 9.44it/s] 91it [00:09, 9.07it/s] 92it [00:10, 9.18it/s] 93it [00:10, 9.29it/s] 94it [00:10, 8.98it/s] 95it [00:10, 9.10it/s] 96it [00:10, 9.26it/s] 97it [00:10, 9.30it/s] 98it [00:10, 9.34it/s] 99it [00:10, 9.40it/s] 100it [00:10, 9.44it/s]2025-05-26 03:17:32,454 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 9847.4746 | mean log_px -0.0930 | KL -3528.36 + 101it [00:11, 9.50it/s] 102it [00:11, 9.45it/s] 103it [00:11, 9.43it/s] 104it [00:11, 9.41it/s] 105it [00:11, 9.35it/s] 106it [00:11, 9.41it/s] 107it [00:11, 9.42it/s] 108it [00:11, 9.47it/s] 109it [00:11, 9.53it/s] 110it [00:11, 9.52it/s] 111it [00:12, 9.57it/s] 112it [00:12, 9.52it/s] 113it [00:12, 9.53it/s] 114it [00:12, 9.53it/s] 115it [00:12, 9.47it/s] 116it [00:12, 9.46it/s] 117it [00:12, 9.48it/s] 118it [00:12, 9.45it/s] 119it [00:12, 9.48it/s] 120it [00:13, 9.55it/s] 121it [00:13, 9.55it/s] 122it [00:13, 9.54it/s] 123it [00:13, 9.53it/s] 124it [00:13, 9.53it/s] 125it [00:13, 9.51it/s] 126it [00:13, 9.47it/s] 127it [00:13, 9.43it/s] 128it [00:13, 9.46it/s] 129it [00:13, 9.48it/s] 130it [00:14, 9.52it/s] 131it [00:14, 9.51it/s] 132it [00:14, 8.96it/s] 133it [00:14, 9.12it/s] 134it [00:14, 9.21it/s] 135it [00:14, 9.28it/s] 136it [00:14, 9.41it/s] 137it [00:14, 9.44it/s] 138it [00:14, 9.45it/s] 139it [00:15, 9.48it/s] 140it [00:15, 9.48it/s] 141it [00:15, 9.50it/s] 142it [00:15, 9.52it/s] 143it [00:15, 9.57it/s] 144it [00:15, 9.54it/s] 145it [00:15, 9.55it/s] 146it [00:15, 9.53it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.48it/s] 149it [00:16, 9.47it/s] 150it [00:16, 9.50it/s]2025-05-26 03:17:37,739 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 11725.8896 | mean log_px -0.1225 | KL -3532.75 + 151it [00:16, 9.54it/s] 152it [00:16, 9.54it/s] 153it [00:16, 9.54it/s] 154it [00:16, 9.58it/s] 155it [00:16, 9.60it/s] 156it [00:16, 9.55it/s] 157it [00:16, 9.55it/s] 158it [00:17, 9.53it/s] 159it [00:17, 9.50it/s] 160it [00:17, 9.50it/s] 161it [00:17, 9.56it/s] 162it [00:17, 9.55it/s] 163it [00:17, 9.20it/s] 164it [00:17, 9.32it/s] 165it [00:17, 9.44it/s] 166it [00:17, 9.50it/s] 167it [00:17, 9.47it/s] 168it [00:18, 9.41it/s] 169it [00:18, 9.40it/s] 170it [00:18, 9.44it/s] 171it [00:18, 9.12it/s] 172it [00:18, 9.19it/s] 173it [00:18, 9.20it/s] 174it [00:18, 9.33it/s] 175it [00:18, 9.35it/s] 176it [00:18, 9.38it/s] 177it [00:19, 9.45it/s] 178it [00:19, 9.46it/s] 179it [00:19, 9.51it/s] 180it [00:19, 9.49it/s] 181it [00:19, 9.49it/s] 182it [00:19, 9.48it/s] 183it [00:19, 9.43it/s] 184it [00:19, 9.12it/s] 185it [00:19, 8.68it/s] 186it [00:20, 8.73it/s] 187it [00:20, 8.90it/s] 188it [00:20, 9.06it/s] 189it [00:20, 9.15it/s] 190it [00:20, 9.17it/s] 191it [00:20, 9.21it/s] 192it [00:20, 9.19it/s] 193it [00:20, 9.23it/s] 194it [00:20, 9.23it/s] 195it [00:21, 8.63it/s] 196it [00:21, 8.87it/s] 196it [00:21, 9.25it/s] +2025-05-26 03:17:42,681 - INFO - Epoch: 8, Objective: tensor([19531.0215], device='cuda:0', grad_fn=), Loss: 0.22876138985157013, KL/n: 72.13713073730469 + 0it [00:00, ?it/s]2025-05-26 03:17:42,969 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 15139.6064 | mean log_px -0.1711 | KL -3532.32 + 1it [00:00, 5.12it/s] 2it [00:00, 6.99it/s] 3it [00:00, 7.96it/s] 4it [00:00, 8.50it/s] 5it [00:00, 8.86it/s] 6it [00:00, 9.06it/s] 7it [00:00, 9.21it/s] 8it [00:00, 9.33it/s] 9it [00:01, 9.39it/s] 10it [00:01, 9.47it/s] 11it [00:01, 9.50it/s] 12it [00:01, 9.49it/s] 13it [00:01, 9.57it/s] 14it [00:01, 8.96it/s] 15it [00:01, 9.13it/s] 16it [00:01, 9.23it/s] 17it [00:01, 9.31it/s] 18it [00:02, 9.35it/s] 19it [00:02, 9.45it/s] 20it [00:02, 8.96it/s] 21it [00:02, 9.11it/s] 22it [00:02, 9.25it/s] 23it [00:02, 9.37it/s] 24it [00:02, 9.43it/s] 25it [00:02, 9.48it/s] 26it [00:02, 9.48it/s] 27it [00:02, 9.48it/s] 28it [00:03, 9.50it/s] 29it [00:03, 9.51it/s] 30it [00:03, 9.51it/s] 31it [00:03, 9.57it/s] 32it [00:03, 9.39it/s] 33it [00:03, 9.41it/s] 34it [00:03, 9.38it/s] 35it [00:03, 9.45it/s] 36it [00:03, 9.44it/s] 37it [00:04, 9.47it/s] 38it [00:04, 9.46it/s] 39it [00:04, 9.49it/s] 40it [00:04, 9.43it/s] 41it [00:04, 9.46it/s] 42it [00:04, 9.46it/s] 43it [00:04, 9.51it/s] 44it [00:04, 9.56it/s] 45it [00:04, 9.55it/s] 46it [00:04, 9.53it/s] 47it [00:05, 9.54it/s] 48it [00:05, 9.53it/s] 49it [00:05, 9.54it/s] 50it [00:05, 9.55it/s]2025-05-26 03:17:48,265 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 10535.8184 | mean log_px -0.1103 | KL -3535.26 + 51it [00:05, 9.56it/s] 52it [00:05, 9.56it/s] 53it [00:05, 9.56it/s] 54it [00:05, 9.55it/s] 55it [00:05, 9.54it/s] 56it [00:06, 9.53it/s] 57it [00:06, 9.53it/s] 58it [00:06, 9.51it/s] 59it [00:06, 9.29it/s] 60it [00:06, 9.21it/s] 61it [00:06, 9.31it/s] 62it [00:06, 9.36it/s] 63it [00:06, 9.49it/s] 64it [00:06, 9.48it/s] 65it [00:06, 9.51it/s] 66it [00:07, 9.56it/s] 67it [00:07, 9.53it/s] 68it [00:07, 9.51it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.52it/s] 71it [00:07, 9.55it/s] 72it [00:07, 9.54it/s] 73it [00:07, 9.55it/s] 74it [00:07, 9.53it/s] 75it [00:08, 9.52it/s] 76it [00:08, 9.58it/s] 77it [00:08, 9.56it/s] 78it [00:08, 9.48it/s] 79it [00:08, 9.50it/s] 80it [00:08, 9.49it/s] 81it [00:08, 9.43it/s] 82it [00:08, 9.44it/s] 83it [00:08, 9.51it/s] 84it [00:08, 9.50it/s] 85it [00:09, 9.53it/s] 86it [00:09, 9.51it/s] 87it [00:09, 9.53it/s] 88it [00:09, 9.56it/s] 89it [00:09, 9.54it/s] 90it [00:09, 9.53it/s] 91it [00:09, 9.47it/s] 92it [00:09, 9.45it/s] 93it [00:09, 9.48it/s] 94it [00:10, 9.46it/s] 95it [00:10, 9.54it/s] 96it [00:10, 9.51it/s] 97it [00:10, 9.49it/s] 98it [00:10, 9.52it/s] 99it [00:10, 9.42it/s] 100it [00:10, 9.49it/s]2025-05-26 03:17:53,533 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 12649.1650 | mean log_px -0.1434 | KL -3534.93 + 101it [00:10, 9.43it/s] 102it [00:10, 9.44it/s] 103it [00:10, 9.46it/s] 104it [00:11, 9.45it/s] 105it [00:11, 9.48it/s] 106it [00:11, 9.51it/s] 107it [00:11, 9.54it/s] 108it [00:11, 9.56it/s] 109it [00:11, 9.58it/s] 110it [00:11, 9.61it/s] 111it [00:11, 9.65it/s] 112it [00:11, 9.64it/s] 113it [00:12, 9.63it/s] 114it [00:12, 9.57it/s] 115it [00:12, 9.50it/s] 116it [00:12, 9.51it/s] 117it [00:12, 9.53it/s] 118it [00:12, 9.45it/s] 119it [00:12, 9.52it/s] 120it [00:12, 9.56it/s] 121it [00:12, 9.54it/s] 122it [00:12, 9.51it/s] 123it [00:13, 9.50it/s] 124it [00:13, 9.49it/s] 125it [00:13, 9.57it/s] 126it [00:13, 9.53it/s] 127it [00:13, 9.51it/s] 128it [00:13, 9.32it/s] 129it [00:13, 9.01it/s] 130it [00:13, 8.82it/s] 131it [00:13, 8.96it/s] 132it [00:14, 9.13it/s] 133it [00:14, 9.08it/s] 134it [00:14, 9.18it/s] 135it [00:14, 9.33it/s] 136it [00:14, 9.41it/s] 137it [00:14, 9.43it/s] 138it [00:14, 9.46it/s] 139it [00:14, 9.44it/s] 140it [00:14, 9.45it/s] 141it [00:15, 9.44it/s] 142it [00:15, 9.43it/s] 143it [00:15, 9.53it/s] 144it [00:15, 9.51it/s] 145it [00:15, 9.52it/s] 146it [00:15, 9.50it/s] 147it [00:15, 9.51it/s] 148it [00:15, 9.53it/s] 149it [00:15, 9.53it/s] 150it [00:15, 9.54it/s]2025-05-26 03:17:58,825 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 14599.3418 | mean log_px -0.1665 | KL -3540.62 + 151it [00:16, 9.56it/s] 152it [00:16, 9.55it/s] 153it [00:16, 9.54it/s] 154it [00:16, 9.51it/s] 155it [00:16, 9.50it/s] 156it [00:16, 9.35it/s] 157it [00:16, 9.38it/s] 158it [00:16, 9.44it/s] 159it [00:16, 9.46it/s] 160it [00:17, 9.42it/s] 161it [00:17, 9.42it/s] 162it [00:17, 9.41it/s] 163it [00:17, 9.42it/s] 164it [00:17, 9.45it/s] 165it [00:17, 9.44it/s] 166it [00:17, 9.46it/s] 167it [00:17, 9.29it/s] 168it [00:17, 9.32it/s] 169it [00:17, 9.33it/s] 170it [00:18, 9.38it/s] 171it [00:18, 9.43it/s] 172it [00:18, 9.42it/s] 173it [00:18, 9.46it/s] 174it [00:18, 9.36it/s] 175it [00:18, 9.23it/s] 176it [00:18, 9.29it/s] 177it [00:18, 9.35it/s] 178it [00:18, 9.36it/s] 179it [00:19, 9.39it/s] 180it [00:19, 9.40it/s] 181it [00:19, 9.49it/s] 182it [00:19, 9.51it/s] 183it [00:19, 9.44it/s] 184it [00:19, 9.44it/s] 185it [00:19, 9.36it/s] 186it [00:19, 9.40it/s] 187it [00:19, 9.41it/s] 188it [00:19, 9.50it/s] 189it [00:20, 9.48it/s] 190it [00:20, 9.37it/s] 191it [00:20, 9.41it/s] 192it [00:20, 9.43it/s] 193it [00:20, 9.49it/s] 194it [00:20, 9.53it/s] 195it [00:20, 8.96it/s] 196it [00:20, 9.20it/s] 196it [00:20, 9.38it/s] +2025-05-26 03:18:03,722 - INFO - Epoch: 9, Objective: tensor([12982.9697], device='cuda:0', grad_fn=), Loss: 0.14898112416267395, KL/n: 72.30970001220703 + 0it [00:00, ?it/s]2025-05-26 03:18:04,152 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 13698.6484 | mean log_px -0.1451 | KL -3541.10 + 1it [00:00, 6.14it/s] 2it [00:00, 7.76it/s] 3it [00:00, 8.48it/s] 4it [00:00, 8.88it/s] 5it [00:00, 9.06it/s] 6it [00:00, 9.17it/s] 7it [00:00, 9.29it/s] 8it [00:00, 9.36it/s] 9it [00:01, 9.43it/s] 10it [00:01, 9.49it/s] 11it [00:01, 9.48it/s] 12it [00:01, 9.15it/s] 13it [00:01, 9.27it/s] 14it [00:01, 9.36it/s] 15it [00:01, 9.42it/s] 16it [00:01, 9.43it/s] 17it [00:01, 9.46it/s] 18it [00:01, 9.47it/s] 19it [00:02, 9.51it/s] 20it [00:02, 9.54it/s] 21it [00:02, 9.53it/s] 22it [00:02, 9.53it/s] 23it [00:02, 9.51it/s] 24it [00:02, 9.52it/s] 25it [00:02, 9.54it/s] 26it [00:02, 9.53it/s] 27it [00:02, 9.56it/s] 28it [00:03, 9.55it/s] 29it [00:03, 9.52it/s] 30it [00:03, 9.55it/s] 31it [00:03, 9.57it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.50it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.51it/s] 36it [00:03, 9.49it/s] 37it [00:03, 9.54it/s] 38it [00:04, 9.54it/s] 39it [00:04, 9.56it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.51it/s] 42it [00:04, 9.51it/s] 43it [00:04, 9.51it/s] 44it [00:04, 9.49it/s] 45it [00:04, 9.53it/s] 46it [00:04, 9.61it/s] 47it [00:05, 9.54it/s] 48it [00:05, 9.51it/s] 49it [00:05, 9.49it/s] 50it [00:05, 9.50it/s]2025-05-26 03:18:09,425 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 15355.1699 | mean log_px -0.1796 | KL -3543.84 + 51it [00:05, 9.33it/s] 52it [00:05, 9.40it/s] 53it [00:05, 9.45it/s] 54it [00:05, 9.48it/s] 55it [00:05, 9.49it/s] 56it [00:05, 9.51it/s] 57it [00:06, 9.09it/s] 58it [00:06, 9.24it/s] 59it [00:06, 9.32it/s] 60it [00:06, 9.35it/s] 61it [00:06, 9.38it/s] 62it [00:06, 9.46it/s] 63it [00:06, 9.48it/s] 64it [00:06, 9.50it/s] 65it [00:06, 9.47it/s] 66it [00:07, 9.30it/s] 67it [00:07, 9.33it/s] 68it [00:07, 9.39it/s] 69it [00:07, 9.44it/s] 70it [00:07, 9.44it/s] 71it [00:07, 9.47it/s] 72it [00:07, 9.44it/s] 73it [00:07, 9.44it/s] 74it [00:07, 9.45it/s] 75it [00:07, 9.51it/s] 76it [00:08, 9.45it/s] 77it [00:08, 9.46it/s] 78it [00:08, 9.47it/s] 79it [00:08, 9.44it/s] 80it [00:08, 9.46it/s] 81it [00:08, 9.50it/s] 82it [00:08, 9.39it/s] 83it [00:08, 9.31it/s] 84it [00:08, 9.18it/s] 85it [00:09, 9.25it/s] 86it [00:09, 9.32it/s] 87it [00:09, 9.32it/s] 88it [00:09, 9.32it/s] 89it [00:09, 9.36it/s] 90it [00:09, 9.34it/s] 91it [00:09, 9.39it/s] 92it [00:09, 9.36it/s] 93it [00:09, 9.36it/s] 94it [00:10, 9.35it/s] 95it [00:10, 9.34it/s] 96it [00:10, 9.37it/s] 97it [00:10, 9.38it/s] 98it [00:10, 9.28it/s] 99it [00:10, 9.31it/s] 100it [00:10, 9.27it/s]2025-05-26 03:18:14,756 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 10181.3457 | mean log_px -0.1026 | KL -3547.27 + 101it [00:10, 9.27it/s] 102it [00:10, 9.24it/s] 103it [00:10, 9.21it/s] 104it [00:11, 9.20it/s] 105it [00:11, 9.22it/s] 106it [00:11, 9.18it/s] 107it [00:11, 9.16it/s] 108it [00:11, 8.86it/s] 109it [00:11, 8.97it/s] 110it [00:11, 8.58it/s] 111it [00:11, 8.69it/s] 112it [00:12, 8.74it/s] 113it [00:12, 8.89it/s] 114it [00:12, 8.96it/s] 115it [00:12, 8.96it/s] 116it [00:12, 8.96it/s] 117it [00:12, 8.98it/s] 118it [00:12, 9.09it/s] 119it [00:12, 8.66it/s] 120it [00:12, 8.77it/s] 121it [00:13, 8.90it/s] 122it [00:13, 9.05it/s] 123it [00:13, 9.08it/s] 124it [00:13, 9.11it/s] 125it [00:13, 9.09it/s] 126it [00:13, 9.13it/s] 127it [00:13, 9.14it/s] 128it [00:13, 8.72it/s] 129it [00:13, 8.99it/s] 130it [00:13, 9.09it/s] 131it [00:14, 9.14it/s] 132it [00:14, 9.17it/s] 133it [00:14, 9.18it/s] 134it [00:14, 9.22it/s] 135it [00:14, 9.26it/s] 136it [00:14, 9.28it/s] 137it [00:14, 9.26it/s] 138it [00:14, 9.15it/s] 139it [00:14, 9.15it/s] 140it [00:15, 9.12it/s] 141it [00:15, 9.07it/s] 142it [00:15, 8.69it/s] 143it [00:15, 8.85it/s] 144it [00:15, 8.88it/s] 145it [00:15, 8.96it/s] 146it [00:15, 8.54it/s] 147it [00:15, 8.79it/s] 148it [00:15, 9.00it/s] 149it [00:16, 9.12it/s] 150it [00:16, 9.21it/s]2025-05-26 03:18:20,302 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 12556.6738 | mean log_px -0.1344 | KL -3543.33 + 151it [00:16, 9.21it/s] 152it [00:16, 9.16it/s] 153it [00:16, 9.22it/s] 154it [00:16, 9.19it/s] 155it [00:16, 9.23it/s] 156it [00:16, 9.26it/s] 157it [00:16, 9.27it/s] 158it [00:17, 9.27it/s] 159it [00:17, 9.25it/s] 160it [00:17, 9.28it/s] 161it [00:17, 9.28it/s] 162it [00:17, 9.29it/s] 163it [00:17, 9.36it/s] 164it [00:17, 9.39it/s] 165it [00:17, 9.47it/s] 166it [00:17, 9.43it/s] 167it [00:18, 9.39it/s] 168it [00:18, 9.25it/s] 169it [00:18, 9.34it/s] 170it [00:18, 8.74it/s] 171it [00:18, 8.88it/s] 172it [00:18, 8.98it/s] 173it [00:18, 9.06it/s] 174it [00:18, 9.09it/s] 175it [00:18, 9.21it/s] 176it [00:19, 9.28it/s] 177it [00:19, 9.28it/s] 178it [00:19, 8.69it/s] 179it [00:19, 8.78it/s] 180it [00:19, 8.97it/s] 181it [00:19, 9.15it/s] 182it [00:19, 9.23it/s] 183it [00:19, 9.32it/s] 184it [00:19, 8.85it/s] 185it [00:20, 9.02it/s] 186it [00:20, 9.15it/s] 187it [00:20, 9.29it/s] 188it [00:20, 8.95it/s] 189it [00:20, 9.14it/s] 190it [00:20, 9.26it/s] 191it [00:20, 8.84it/s] 192it [00:20, 9.01it/s] 193it [00:20, 9.11it/s] 194it [00:21, 9.19it/s] 195it [00:21, 8.74it/s] 196it [00:21, 8.88it/s] 196it [00:21, 9.20it/s] +2025-05-26 03:18:25,345 - INFO - Epoch: 10, Objective: tensor([15107.3916], device='cuda:0', grad_fn=), Loss: 0.16303861141204834, KL/n: 72.43524169921875 + 0it [00:00, ?it/s]2025-05-26 03:18:25,619 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 10246.0049 | mean log_px -0.1013 | KL -3548.55 + 1it [00:00, 4.92it/s] 2it [00:00, 6.77it/s] 3it [00:00, 7.67it/s] 4it [00:00, 8.17it/s] 5it [00:00, 8.50it/s] 6it [00:00, 8.64it/s] 7it [00:00, 8.80it/s] 8it [00:00, 8.91it/s] 9it [00:01, 9.06it/s] 10it [00:01, 9.15it/s] 11it [00:01, 9.04it/s] 12it [00:01, 9.07it/s] 13it [00:01, 9.14it/s] 14it [00:01, 9.05it/s] 15it [00:01, 9.07it/s] 16it [00:01, 8.56it/s] 17it [00:01, 8.75it/s] 18it [00:02, 8.88it/s] 19it [00:02, 9.07it/s] 20it [00:02, 9.16it/s] 21it [00:02, 9.21it/s] 22it [00:02, 9.21it/s] 23it [00:02, 9.28it/s] 24it [00:02, 9.31it/s] 25it [00:02, 9.19it/s] 26it [00:02, 9.16it/s] 27it [00:03, 9.11it/s] 28it [00:03, 9.11it/s] 29it [00:03, 9.15it/s] 30it [00:03, 9.18it/s] 31it [00:03, 9.21it/s] 32it [00:03, 9.22it/s] 33it [00:03, 9.20it/s] 34it [00:03, 9.30it/s] 35it [00:03, 9.25it/s] 36it [00:04, 9.28it/s] 37it [00:04, 9.20it/s] 38it [00:04, 9.07it/s] 39it [00:04, 9.09it/s] 40it [00:04, 9.01it/s] 41it [00:04, 9.03it/s] 42it [00:04, 9.05it/s] 43it [00:04, 9.16it/s] 44it [00:04, 9.27it/s] 45it [00:05, 9.41it/s] 46it [00:05, 9.44it/s] 47it [00:05, 9.28it/s] 48it [00:05, 9.27it/s] 49it [00:05, 8.77it/s] 50it [00:05, 8.81it/s]2025-05-26 03:18:31,126 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 13919.8701 | mean log_px -0.1529 | KL -3551.17 + 51it [00:05, 8.93it/s] 52it [00:05, 9.03it/s] 53it [00:05, 9.14it/s] 54it [00:06, 9.24it/s] 55it [00:06, 9.30it/s] 56it [00:06, 9.37it/s] 57it [00:06, 9.46it/s] 58it [00:06, 9.45it/s] 59it [00:06, 9.46it/s] 60it [00:06, 9.45it/s] 61it [00:06, 9.46it/s] 62it [00:06, 9.01it/s] 63it [00:06, 9.14it/s] 64it [00:07, 9.25it/s] 65it [00:07, 9.34it/s] 66it [00:07, 9.05it/s] 67it [00:07, 9.22it/s] 68it [00:07, 9.31it/s] 69it [00:07, 9.41it/s] 70it [00:07, 9.10it/s] 71it [00:07, 9.20it/s] 72it [00:07, 9.27it/s] 73it [00:08, 9.32it/s] 74it [00:08, 9.35it/s] 75it [00:08, 9.46it/s] 76it [00:08, 9.44it/s] 77it [00:08, 9.52it/s] 78it [00:08, 9.53it/s] 79it [00:08, 9.23it/s] 80it [00:08, 9.27it/s] 81it [00:08, 9.37it/s] 82it [00:09, 9.43it/s] 83it [00:09, 9.46it/s] 84it [00:09, 9.47it/s] 85it [00:09, 9.50it/s] 86it [00:09, 9.48it/s] 87it [00:09, 9.48it/s] 88it [00:09, 9.47it/s] 89it [00:09, 9.47it/s] 90it [00:09, 9.45it/s] 91it [00:09, 9.49it/s] 92it [00:10, 9.46it/s] 93it [00:10, 9.50it/s] 94it [00:10, 9.05it/s] 95it [00:10, 9.20it/s] 96it [00:10, 9.26it/s] 97it [00:10, 9.29it/s] 98it [00:10, 9.30it/s] 99it [00:10, 8.88it/s] 100it [00:10, 9.07it/s]2025-05-26 03:18:36,485 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 11395.6230 | mean log_px -0.1321 | KL -3551.43 + 101it [00:11, 9.18it/s] 102it [00:11, 9.27it/s] 103it [00:11, 9.30it/s] 104it [00:11, 9.36it/s] 105it [00:11, 9.43it/s] 106it [00:11, 9.40it/s] 107it [00:11, 9.43it/s] 108it [00:11, 9.46it/s] 109it [00:11, 8.81it/s] 110it [00:12, 8.98it/s] 111it [00:12, 9.16it/s] 112it [00:12, 9.23it/s] 113it [00:12, 9.22it/s] 114it [00:12, 9.27it/s] 115it [00:12, 9.34it/s] 116it [00:12, 9.33it/s] 117it [00:12, 9.34it/s] 118it [00:12, 9.37it/s] 119it [00:12, 9.44it/s] 120it [00:13, 9.49it/s] 121it [00:13, 9.54it/s] 122it [00:13, 9.53it/s] 123it [00:13, 9.55it/s] 124it [00:13, 9.04it/s] 125it [00:13, 9.14it/s] 126it [00:13, 9.07it/s] 127it [00:13, 9.19it/s] 128it [00:13, 9.28it/s] 129it [00:14, 9.36it/s] 130it [00:14, 9.41it/s] 131it [00:14, 9.47it/s] 132it [00:14, 9.50it/s] 133it [00:14, 9.52it/s] 134it [00:14, 9.54it/s] 135it [00:14, 9.49it/s] 136it [00:14, 9.53it/s] 137it [00:14, 9.02it/s] 138it [00:15, 9.11it/s] 139it [00:15, 9.24it/s] 140it [00:15, 9.34it/s] 141it [00:15, 9.35it/s] 142it [00:15, 9.37it/s] 143it [00:15, 9.41it/s] 144it [00:15, 9.44it/s] 145it [00:15, 9.49it/s] 146it [00:15, 9.54it/s] 147it [00:15, 9.47it/s] 148it [00:16, 9.46it/s] 149it [00:16, 9.49it/s] 150it [00:16, 9.45it/s]2025-05-26 03:18:41,826 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 14350.5879 | mean log_px -0.1595 | KL -3548.78 + 151it [00:16, 9.47it/s] 152it [00:16, 9.47it/s] 153it [00:16, 9.49it/s] 154it [00:16, 9.51it/s] 155it [00:16, 9.54it/s] 156it [00:16, 9.58it/s] 157it [00:17, 9.58it/s] 158it [00:17, 9.54it/s] 159it [00:17, 9.53it/s] 160it [00:17, 9.46it/s] 161it [00:17, 9.47it/s] 162it [00:17, 9.44it/s] 163it [00:17, 9.44it/s] 164it [00:17, 9.44it/s] 165it [00:17, 9.48it/s] 166it [00:17, 9.48it/s] 167it [00:18, 9.48it/s] 168it [00:18, 9.47it/s] 169it [00:18, 9.45it/s] 170it [00:18, 9.47it/s] 171it [00:18, 9.47it/s] 172it [00:18, 9.26it/s] 173it [00:18, 8.79it/s] 174it [00:18, 8.90it/s] 175it [00:18, 9.06it/s] 176it [00:19, 9.15it/s] 177it [00:19, 8.71it/s] 178it [00:19, 8.87it/s] 179it [00:19, 8.99it/s] 180it [00:19, 9.09it/s] 181it [00:19, 9.15it/s] 182it [00:19, 9.22it/s] 183it [00:19, 8.71it/s] 184it [00:19, 8.90it/s] 185it [00:20, 9.08it/s] 186it [00:20, 9.08it/s] 187it [00:20, 9.16it/s] 188it [00:20, 9.16it/s] 189it [00:20, 9.26it/s] 190it [00:20, 9.37it/s] 191it [00:20, 9.47it/s] 192it [00:20, 9.52it/s] 193it [00:20, 9.09it/s] 194it [00:21, 9.26it/s] 195it [00:21, 8.79it/s] 196it [00:21, 8.56it/s] 196it [00:21, 9.18it/s] +2025-05-26 03:18:46,822 - INFO - Epoch: 11, Objective: tensor([10451.8135], device='cuda:0', grad_fn=), Loss: 0.1001165509223938, KL/n: 72.5517807006836 + 0it [00:00, ?it/s]2025-05-26 03:18:47,270 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 8402.5049 | mean log_px -0.0712 | KL -3554.51 + 1it [00:00, 5.48it/s] 2it [00:00, 7.21it/s] 3it [00:00, 8.11it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.91it/s] 6it [00:00, 8.53it/s] 7it [00:00, 8.86it/s] 8it [00:00, 9.03it/s] 9it [00:01, 9.21it/s] 10it [00:01, 9.29it/s] 11it [00:01, 9.37it/s] 12it [00:01, 9.40it/s] 13it [00:01, 9.46it/s] 14it [00:01, 9.24it/s] 15it [00:01, 9.29it/s] 16it [00:01, 9.34it/s] 17it [00:01, 9.44it/s] 18it [00:02, 9.43it/s] 19it [00:02, 9.44it/s] 20it [00:02, 9.47it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.50it/s] 23it [00:02, 9.51it/s] 24it [00:02, 9.48it/s] 25it [00:02, 9.52it/s] 26it [00:02, 9.57it/s] 27it [00:02, 9.59it/s] 28it [00:03, 9.58it/s] 29it [00:03, 9.56it/s] 30it [00:03, 9.51it/s] 31it [00:03, 9.53it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.54it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.49it/s] 36it [00:03, 9.48it/s] 37it [00:03, 9.48it/s] 38it [00:04, 9.50it/s] 39it [00:04, 9.50it/s] 40it [00:04, 9.54it/s] 41it [00:04, 9.59it/s] 42it [00:04, 9.50it/s] 43it [00:04, 9.56it/s] 44it [00:04, 9.51it/s] 45it [00:04, 9.46it/s] 46it [00:04, 9.44it/s] 47it [00:05, 8.97it/s] 48it [00:05, 9.15it/s] 49it [00:05, 9.32it/s] 50it [00:05, 9.39it/s]2025-05-26 03:18:52,576 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 10922.4316 | mean log_px -0.1087 | KL -3553.06 + 51it [00:05, 9.48it/s] 52it [00:05, 9.50it/s] 53it [00:05, 9.55it/s] 54it [00:05, 9.02it/s] 55it [00:05, 9.20it/s] 56it [00:06, 9.26it/s] 57it [00:06, 9.31it/s] 58it [00:06, 9.35it/s] 59it [00:06, 9.32it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.39it/s] 62it [00:06, 9.42it/s] 63it [00:06, 9.47it/s] 64it [00:06, 9.48it/s] 65it [00:06, 9.51it/s] 66it [00:07, 9.47it/s] 67it [00:07, 9.49it/s] 68it [00:07, 9.51it/s] 69it [00:07, 9.45it/s] 70it [00:07, 9.34it/s] 71it [00:07, 9.41it/s] 72it [00:07, 9.44it/s] 73it [00:07, 9.44it/s] 74it [00:07, 9.45it/s] 75it [00:08, 9.46it/s] 76it [00:08, 9.46it/s] 77it [00:08, 9.51it/s] 78it [00:08, 9.57it/s] 79it [00:08, 9.60it/s] 80it [00:08, 9.55it/s] 81it [00:08, 9.54it/s] 82it [00:08, 9.53it/s] 83it [00:08, 9.53it/s] 84it [00:08, 9.53it/s] 85it [00:09, 9.53it/s] 86it [00:09, 9.55it/s] 87it [00:09, 9.51it/s] 88it [00:09, 9.53it/s] 89it [00:09, 9.53it/s] 90it [00:09, 9.58it/s] 91it [00:09, 9.55it/s] 92it [00:09, 9.54it/s] 93it [00:09, 9.51it/s] 94it [00:10, 9.16it/s] 95it [00:10, 9.25it/s] 96it [00:10, 9.31it/s] 97it [00:10, 9.01it/s] 98it [00:10, 9.10it/s] 99it [00:10, 9.21it/s] 100it [00:10, 8.97it/s]2025-05-26 03:18:57,900 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 11670.1055 | mean log_px -0.1183 | KL -3560.71 + 101it [00:10, 9.14it/s] 102it [00:10, 9.20it/s] 103it [00:11, 8.85it/s] 104it [00:11, 9.01it/s] 105it [00:11, 9.21it/s] 106it [00:11, 9.27it/s] 107it [00:11, 8.89it/s] 108it [00:11, 9.03it/s] 109it [00:11, 9.16it/s] 110it [00:11, 9.28it/s] 111it [00:11, 8.85it/s] 112it [00:12, 9.04it/s] 113it [00:12, 8.75it/s] 114it [00:12, 8.98it/s] 115it [00:12, 9.11it/s] 116it [00:12, 9.13it/s] 117it [00:12, 9.27it/s] 118it [00:12, 9.36it/s] 119it [00:12, 9.43it/s] 120it [00:12, 9.36it/s] 121it [00:12, 9.44it/s] 122it [00:13, 9.44it/s] 123it [00:13, 9.46it/s] 124it [00:13, 9.45it/s] 125it [00:13, 9.47it/s] 126it [00:13, 9.47it/s] 127it [00:13, 9.49it/s] 128it [00:13, 9.47it/s] 129it [00:13, 9.53it/s] 130it [00:13, 9.46it/s] 131it [00:14, 9.45it/s] 132it [00:14, 9.45it/s] 133it [00:14, 9.48it/s] 134it [00:14, 9.48it/s] 135it [00:14, 9.52it/s] 136it [00:14, 9.48it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.49it/s] 139it [00:14, 9.53it/s] 140it [00:14, 9.51it/s] 141it [00:15, 9.56it/s] 142it [00:15, 9.50it/s] 143it [00:15, 9.53it/s] 144it [00:15, 9.49it/s] 145it [00:15, 9.48it/s] 146it [00:15, 9.50it/s] 147it [00:15, 9.52it/s] 148it [00:15, 9.53it/s] 149it [00:15, 9.51it/s] 150it [00:16, 9.51it/s]2025-05-26 03:19:03,241 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 9823.7705 | mean log_px -0.0984 | KL -3558.63 + 151it [00:16, 9.53it/s] 152it [00:16, 9.57it/s] 153it [00:16, 9.57it/s] 154it [00:16, 9.57it/s] 155it [00:16, 9.60it/s] 156it [00:16, 9.56it/s] 157it [00:16, 9.57it/s] 158it [00:16, 9.55it/s] 159it [00:16, 9.55it/s] 160it [00:17, 9.56it/s] 161it [00:17, 9.58it/s] 162it [00:17, 9.61it/s] 163it [00:17, 9.63it/s] 164it [00:17, 9.59it/s] 165it [00:17, 9.53it/s] 166it [00:17, 9.54it/s] 167it [00:17, 9.55it/s] 168it [00:17, 9.54it/s] 169it [00:18, 9.51it/s] 170it [00:18, 9.53it/s] 171it [00:18, 9.49it/s] 172it [00:18, 9.47it/s] 173it [00:18, 9.50it/s] 174it [00:18, 9.48it/s] 175it [00:18, 9.54it/s] 176it [00:18, 9.50it/s] 177it [00:18, 9.51it/s] 178it [00:18, 9.49it/s] 179it [00:19, 9.49it/s] 180it [00:19, 9.47it/s] 181it [00:19, 9.47it/s] 182it [00:19, 9.49it/s] 183it [00:19, 9.51it/s] 184it [00:19, 9.46it/s] 185it [00:19, 9.48it/s] 186it [00:19, 9.52it/s] 187it [00:19, 9.49it/s] 188it [00:20, 9.49it/s] 189it [00:20, 9.46it/s] 190it [00:20, 9.47it/s] 191it [00:20, 9.50it/s] 192it [00:20, 9.49it/s] 193it [00:20, 9.48it/s] 194it [00:20, 9.51it/s] 195it [00:20, 8.95it/s] 196it [00:20, 9.16it/s] 196it [00:20, 9.36it/s] +2025-05-26 03:19:08,082 - INFO - Epoch: 12, Objective: tensor([11959.2480], device='cuda:0', grad_fn=), Loss: 0.12528853118419647, KL/n: 72.63204193115234 + 0it [00:00, ?it/s]2025-05-26 03:19:08,364 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 10673.3086 | mean log_px -0.1125 | KL -3559.28 + 1it [00:00, 4.58it/s] 2it [00:00, 6.56it/s] 3it [00:00, 7.68it/s] 4it [00:00, 8.32it/s] 5it [00:00, 8.72it/s] 6it [00:00, 8.95it/s] 7it [00:00, 9.19it/s] 8it [00:00, 9.20it/s] 9it [00:01, 8.78it/s] 10it [00:01, 9.02it/s] 11it [00:01, 9.14it/s] 12it [00:01, 9.23it/s] 13it [00:01, 8.77it/s] 14it [00:01, 8.96it/s] 15it [00:01, 9.14it/s] 16it [00:01, 9.29it/s] 17it [00:01, 8.93it/s] 18it [00:02, 9.13it/s] 19it [00:02, 9.23it/s] 20it [00:02, 9.32it/s] 21it [00:02, 9.38it/s] 22it [00:02, 9.42it/s] 23it [00:02, 9.47it/s] 24it [00:02, 9.49it/s] 25it [00:02, 9.51it/s] 26it [00:02, 9.53it/s] 27it [00:03, 8.94it/s] 28it [00:03, 9.14it/s] 29it [00:03, 9.19it/s] 30it [00:03, 9.25it/s] 31it [00:03, 8.83it/s] 32it [00:03, 9.01it/s] 33it [00:03, 9.13it/s] 34it [00:03, 9.26it/s] 35it [00:03, 9.35it/s] 36it [00:03, 9.39it/s] 37it [00:04, 9.45it/s] 38it [00:04, 9.46it/s] 39it [00:04, 9.50it/s] 40it [00:04, 9.52it/s] 41it [00:04, 9.51it/s] 42it [00:04, 9.50it/s] 43it [00:04, 9.52it/s] 44it [00:04, 9.52it/s] 45it [00:04, 9.57it/s] 46it [00:05, 9.12it/s] 47it [00:05, 9.23it/s] 48it [00:05, 9.31it/s] 49it [00:05, 9.34it/s] 50it [00:05, 9.36it/s]2025-05-26 03:19:13,764 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 14811.1055 | mean log_px -0.1740 | KL -3564.73 + 51it [00:05, 9.39it/s] 52it [00:05, 9.49it/s] 53it [00:05, 9.55it/s] 54it [00:05, 9.50it/s] 55it [00:06, 9.53it/s] 56it [00:06, 9.50it/s] 57it [00:06, 9.14it/s] 58it [00:06, 9.27it/s] 59it [00:06, 9.30it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.25it/s] 62it [00:06, 9.33it/s] 63it [00:06, 8.87it/s] 64it [00:06, 9.07it/s] 65it [00:07, 9.16it/s] 66it [00:07, 9.10it/s] 67it [00:07, 9.04it/s] 68it [00:07, 9.17it/s] 69it [00:07, 9.23it/s] 70it [00:07, 9.26it/s] 71it [00:07, 9.28it/s] 72it [00:07, 9.30it/s] 73it [00:07, 9.32it/s] 74it [00:08, 9.32it/s] 75it [00:08, 9.36it/s] 76it [00:08, 9.36it/s] 77it [00:08, 8.83it/s] 78it [00:08, 8.97it/s] 79it [00:08, 8.99it/s] 80it [00:08, 8.76it/s] 81it [00:08, 8.47it/s] 82it [00:08, 8.76it/s] 83it [00:09, 8.99it/s] 84it [00:09, 9.13it/s] 85it [00:09, 9.26it/s] 86it [00:09, 8.84it/s] 87it [00:09, 9.05it/s] 88it [00:09, 9.20it/s] 89it [00:09, 9.31it/s] 90it [00:09, 8.85it/s] 91it [00:09, 9.03it/s] 92it [00:10, 9.10it/s] 93it [00:10, 9.27it/s] 94it [00:10, 9.39it/s] 95it [00:10, 8.94it/s] 96it [00:10, 9.14it/s] 97it [00:10, 9.33it/s] 98it [00:10, 9.45it/s] 99it [00:10, 9.54it/s] 100it [00:10, 9.03it/s]2025-05-26 03:19:19,222 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 11084.1914 | mean log_px -0.1101 | KL -3557.34 + 101it [00:11, 9.23it/s] 102it [00:11, 9.37it/s] 103it [00:11, 9.48it/s] 104it [00:11, 9.56it/s] 105it [00:11, 9.45it/s] 106it [00:11, 8.89it/s] 107it [00:11, 9.14it/s] 108it [00:11, 9.32it/s] 109it [00:11, 9.45it/s] 110it [00:12, 9.54it/s] 111it [00:12, 9.60it/s] 112it [00:12, 9.64it/s] 113it [00:12, 9.68it/s] 114it [00:12, 9.31it/s] 115it [00:12, 9.44it/s] 116it [00:12, 9.54it/s] 117it [00:12, 9.62it/s] 118it [00:12, 9.66it/s] 119it [00:12, 9.70it/s] 120it [00:13, 9.14it/s] 121it [00:13, 9.32it/s] 122it [00:13, 9.44it/s] 123it [00:13, 9.54it/s] 124it [00:13, 9.61it/s] 125it [00:13, 9.66it/s] 126it [00:13, 9.68it/s] 127it [00:13, 9.71it/s] 128it [00:13, 9.71it/s] 129it [00:13, 9.32it/s] 130it [00:14, 9.44it/s] 131it [00:14, 9.53it/s] 132it [00:14, 9.60it/s] 133it [00:14, 9.65it/s] 134it [00:14, 9.66it/s] 135it [00:14, 9.63it/s] 136it [00:14, 9.42it/s] 137it [00:14, 9.40it/s] 138it [00:14, 9.29it/s] 139it [00:15, 9.32it/s] 140it [00:15, 9.32it/s] 141it [00:15, 9.33it/s] 142it [00:15, 9.33it/s] 143it [00:15, 9.31it/s] 144it [00:15, 9.38it/s] 145it [00:15, 9.35it/s] 146it [00:15, 9.32it/s] 147it [00:15, 9.30it/s] 148it [00:16, 9.40it/s] 149it [00:16, 9.35it/s] 150it [00:16, 9.24it/s]2025-05-26 03:19:24,517 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 8056.9863 | mean log_px -0.0642 | KL -3562.25 + 151it [00:16, 9.18it/s] 152it [00:16, 8.63it/s] 153it [00:16, 8.77it/s] 154it [00:16, 8.98it/s] 155it [00:16, 9.01it/s] 156it [00:16, 8.54it/s] 157it [00:17, 8.91it/s] 158it [00:17, 9.09it/s] 159it [00:17, 9.33it/s] 160it [00:17, 9.49it/s] 161it [00:17, 9.63it/s] 162it [00:17, 9.70it/s] 163it [00:17, 9.28it/s] 164it [00:17, 9.42it/s] 165it [00:17, 9.51it/s] 166it [00:17, 9.63it/s] 167it [00:18, 9.73it/s] 168it [00:18, 9.77it/s] 169it [00:18, 9.82it/s] 170it [00:18, 9.82it/s] 171it [00:18, 9.87it/s] 172it [00:18, 9.88it/s] 173it [00:18, 9.91it/s] 174it [00:18, 9.88it/s] 175it [00:18, 9.82it/s] 176it [00:18, 9.83it/s] 177it [00:19, 9.80it/s] 178it [00:19, 9.76it/s] 179it [00:19, 9.82it/s] 180it [00:19, 9.86it/s] 181it [00:19, 9.88it/s] 182it [00:19, 9.85it/s] 183it [00:19, 9.89it/s] 184it [00:19, 9.86it/s] 185it [00:19, 9.87it/s] 186it [00:19, 9.88it/s] 187it [00:20, 9.81it/s] 188it [00:20, 9.82it/s] 189it [00:20, 9.86it/s] 190it [00:20, 9.85it/s] 191it [00:20, 9.89it/s] 192it [00:20, 9.32it/s] 193it [00:20, 9.43it/s] 194it [00:20, 9.49it/s] 195it [00:20, 9.04it/s] 196it [00:21, 9.28it/s] +2025-05-26 03:19:29,327 - INFO - Epoch: 13, Objective: tensor([13255.1807], device='cuda:0', grad_fn=), Loss: 0.15383651852607727, KL/n: 72.70011138916016 + 0it [00:00, ?it/s]2025-05-26 03:19:29,787 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 11022.1055 | mean log_px -0.1185 | KL -3559.76 + 1it [00:00, 4.57it/s] 2it [00:00, 6.58it/s] 4it [00:00, 8.40it/s] 6it [00:00, 9.06it/s] 7it [00:00, 9.27it/s] 8it [00:00, 9.43it/s] 9it [00:01, 9.58it/s] 10it [00:01, 9.09it/s] 11it [00:01, 9.19it/s] 12it [00:01, 9.30it/s] 13it [00:01, 9.48it/s] 14it [00:01, 9.59it/s] 15it [00:01, 9.70it/s] 16it [00:01, 9.74it/s] 17it [00:01, 9.80it/s] 18it [00:01, 9.82it/s] 19it [00:02, 9.86it/s] 20it [00:02, 9.86it/s] 21it [00:02, 9.88it/s] 22it [00:02, 9.89it/s] 24it [00:02, 9.93it/s] 25it [00:02, 9.92it/s] 26it [00:02, 9.91it/s] 27it [00:02, 9.92it/s] 28it [00:02, 9.91it/s] 29it [00:03, 9.92it/s] 30it [00:03, 9.90it/s] 31it [00:03, 9.92it/s] 32it [00:03, 9.89it/s] 33it [00:03, 9.92it/s] 34it [00:03, 9.91it/s] 35it [00:03, 9.91it/s] 36it [00:03, 9.89it/s] 37it [00:03, 9.91it/s] 38it [00:03, 9.91it/s] 39it [00:04, 9.92it/s] 40it [00:04, 9.91it/s] 41it [00:04, 9.92it/s] 42it [00:04, 9.91it/s] 43it [00:04, 9.91it/s] 44it [00:04, 9.88it/s] 45it [00:04, 9.80it/s] 46it [00:04, 9.21it/s] 47it [00:04, 9.42it/s] 48it [00:05, 9.55it/s] 49it [00:05, 9.66it/s] 50it [00:05, 9.75it/s]2025-05-26 03:19:34,917 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 8267.6357 | mean log_px -0.0700 | KL -3559.77 + 51it [00:05, 9.77it/s] 52it [00:05, 9.80it/s] 53it [00:05, 9.24it/s] 54it [00:05, 9.42it/s] 55it [00:05, 9.58it/s] 56it [00:05, 9.64it/s] 58it [00:06, 9.32it/s] 59it [00:06, 9.46it/s] 60it [00:06, 9.56it/s] 61it [00:06, 9.58it/s] 62it [00:06, 9.66it/s] 63it [00:06, 9.74it/s] 64it [00:06, 9.75it/s] 65it [00:06, 9.81it/s] 66it [00:06, 9.84it/s] 67it [00:07, 9.28it/s] 68it [00:07, 9.47it/s] 69it [00:07, 9.59it/s] 70it [00:07, 9.63it/s] 71it [00:07, 9.72it/s] 72it [00:07, 9.77it/s] 73it [00:07, 9.83it/s] 74it [00:07, 9.86it/s] 75it [00:07, 9.90it/s] 76it [00:07, 9.91it/s] 77it [00:08, 9.92it/s] 78it [00:08, 9.25it/s] 79it [00:08, 9.41it/s] 80it [00:08, 9.54it/s] 81it [00:08, 9.65it/s] 82it [00:08, 9.72it/s] 83it [00:08, 9.78it/s] 84it [00:08, 9.81it/s] 85it [00:08, 9.86it/s] 86it [00:08, 9.87it/s] 87it [00:09, 9.90it/s] 88it [00:09, 9.90it/s] 89it [00:09, 9.91it/s] 90it [00:09, 9.92it/s] 91it [00:09, 9.91it/s] 92it [00:09, 9.89it/s] 93it [00:09, 9.90it/s] 94it [00:09, 9.91it/s] 95it [00:09, 9.92it/s] 96it [00:09, 9.90it/s] 97it [00:10, 9.93it/s] 98it [00:10, 9.28it/s] 99it [00:10, 9.47it/s] 100it [00:10, 9.61it/s]2025-05-26 03:19:40,080 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 13712.4199 | mean log_px -0.1565 | KL -3561.90 + 101it [00:10, 9.70it/s] 102it [00:10, 9.73it/s] 103it [00:10, 9.74it/s] 104it [00:10, 9.18it/s] 105it [00:10, 9.40it/s] 106it [00:11, 9.55it/s] 107it [00:11, 9.67it/s] 108it [00:11, 9.74it/s] 109it [00:11, 9.81it/s] 110it [00:11, 9.83it/s] 111it [00:11, 9.28it/s] 112it [00:11, 9.45it/s] 113it [00:11, 9.51it/s] 114it [00:11, 9.63it/s] 115it [00:11, 9.73it/s] 116it [00:12, 9.77it/s] 118it [00:12, 9.88it/s] 119it [00:12, 9.90it/s] 120it [00:12, 9.46it/s] 121it [00:12, 9.53it/s] 122it [00:12, 9.63it/s] 124it [00:12, 9.78it/s] 125it [00:12, 9.80it/s] 126it [00:13, 9.30it/s] 127it [00:13, 9.48it/s] 128it [00:13, 9.60it/s] 130it [00:13, 9.77it/s] 131it [00:13, 9.82it/s] 132it [00:13, 9.85it/s] 133it [00:13, 9.88it/s] 134it [00:13, 9.89it/s] 135it [00:13, 9.89it/s] 136it [00:14, 9.90it/s] 137it [00:14, 9.93it/s] 138it [00:14, 9.93it/s] 139it [00:14, 9.91it/s] 140it [00:14, 9.57it/s] 141it [00:14, 9.68it/s] 142it [00:14, 9.75it/s] 143it [00:14, 9.81it/s] 144it [00:14, 9.83it/s] 145it [00:15, 9.84it/s] 146it [00:15, 9.12it/s] 147it [00:15, 9.34it/s] 148it [00:15, 9.50it/s] 149it [00:15, 9.62it/s] 150it [00:15, 9.70it/s]2025-05-26 03:19:45,247 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 13030.7373 | mean log_px -0.1424 | KL -3557.82 + 151it [00:15, 9.77it/s] 152it [00:15, 9.77it/s] 153it [00:15, 9.83it/s] 154it [00:15, 9.63it/s] 155it [00:16, 9.11it/s] 156it [00:16, 9.32it/s] 157it [00:16, 9.52it/s] 159it [00:16, 9.74it/s] 160it [00:16, 9.79it/s] 161it [00:16, 9.84it/s] 162it [00:16, 9.86it/s] 164it [00:16, 9.93it/s] 165it [00:17, 9.95it/s] 166it [00:17, 9.96it/s] 167it [00:17, 9.95it/s] 168it [00:17, 9.95it/s] 170it [00:17, 9.97it/s] 171it [00:17, 9.97it/s] 172it [00:17, 9.96it/s] 173it [00:17, 9.46it/s] 174it [00:18, 9.57it/s] 175it [00:18, 9.66it/s] 176it [00:18, 9.09it/s] 177it [00:18, 9.33it/s] 178it [00:18, 9.52it/s] 179it [00:18, 9.58it/s] 180it [00:18, 8.92it/s] 181it [00:18, 8.94it/s] 182it [00:18, 9.19it/s] 183it [00:18, 9.39it/s] 184it [00:19, 9.45it/s] 185it [00:19, 9.59it/s] 186it [00:19, 9.68it/s] 187it [00:19, 9.76it/s] 188it [00:19, 9.79it/s] 189it [00:19, 9.83it/s] 190it [00:19, 9.85it/s] 191it [00:19, 9.83it/s] 192it [00:19, 9.20it/s] 193it [00:20, 9.40it/s] 194it [00:20, 9.56it/s] 195it [00:20, 9.25it/s] 196it [00:20, 9.61it/s] +2025-05-26 03:19:50,041 - INFO - Epoch: 14, Objective: tensor([11565.9922], device='cuda:0', grad_fn=), Loss: 0.11370649188756943, KL/n: 72.74580383300781 + 0it [00:00, ?it/s]2025-05-26 03:19:50,316 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 10721.7217 | mean log_px -0.1022 | KL -3567.32 + 1it [00:00, 4.66it/s] 2it [00:00, 6.75it/s] 4it [00:00, 8.48it/s] 6it [00:00, 9.14it/s] 8it [00:00, 9.47it/s] 9it [00:01, 9.59it/s] 10it [00:01, 9.66it/s] 11it [00:01, 9.74it/s] 12it [00:01, 9.78it/s] 14it [00:01, 9.41it/s] 16it [00:01, 9.63it/s] 18it [00:01, 9.76it/s] 20it [00:02, 9.84it/s] 21it [00:02, 9.87it/s] 22it [00:02, 9.88it/s] 23it [00:02, 9.90it/s] 24it [00:02, 9.91it/s] 26it [00:02, 9.95it/s] 27it [00:02, 9.95it/s] 28it [00:02, 9.90it/s] 30it [00:03, 9.40it/s] 31it [00:03, 9.38it/s] 32it [00:03, 9.36it/s] 33it [00:03, 9.05it/s] 34it [00:03, 9.21it/s] 35it [00:03, 9.33it/s] 36it [00:03, 9.43it/s] 37it [00:03, 9.53it/s] 38it [00:04, 9.61it/s] 39it [00:04, 9.65it/s] 40it [00:04, 9.67it/s] 41it [00:04, 9.71it/s] 42it [00:04, 9.71it/s] 43it [00:04, 9.13it/s] 44it [00:04, 9.25it/s] 45it [00:04, 9.40it/s] 46it [00:04, 9.49it/s] 47it [00:04, 9.14it/s] 48it [00:05, 9.18it/s] 49it [00:05, 9.34it/s] 50it [00:05, 9.45it/s]2025-05-26 03:19:55,533 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 11714.7119 | mean log_px -0.1263 | KL -3566.29 + 51it [00:05, 9.53it/s] 52it [00:05, 9.56it/s] 53it [00:05, 9.64it/s] 54it [00:05, 9.65it/s] 55it [00:05, 9.68it/s] 56it [00:05, 9.67it/s] 57it [00:06, 9.08it/s] 58it [00:06, 9.19it/s] 59it [00:06, 9.34it/s] 60it [00:06, 9.43it/s] 61it [00:06, 9.49it/s] 62it [00:06, 9.54it/s] 63it [00:06, 9.52it/s] 64it [00:06, 8.87it/s] 65it [00:06, 9.06it/s] 66it [00:07, 9.21it/s] 67it [00:07, 9.35it/s] 68it [00:07, 9.47it/s] 69it [00:07, 9.36it/s] 70it [00:07, 8.87it/s] 71it [00:07, 9.04it/s] 72it [00:07, 9.19it/s] 73it [00:07, 9.26it/s] 74it [00:07, 9.30it/s] 75it [00:07, 9.36it/s] 76it [00:08, 9.38it/s] 77it [00:08, 8.83it/s] 78it [00:08, 9.00it/s] 79it [00:08, 9.22it/s] 80it [00:08, 9.36it/s] 81it [00:08, 9.48it/s] 82it [00:08, 9.56it/s] 83it [00:08, 9.03it/s] 84it [00:08, 9.12it/s] 85it [00:09, 9.29it/s] 86it [00:09, 8.83it/s] 87it [00:09, 9.02it/s] 88it [00:09, 9.16it/s] 89it [00:09, 9.22it/s] 90it [00:09, 8.75it/s] 91it [00:09, 8.93it/s] 92it [00:09, 9.15it/s] 93it [00:09, 9.28it/s] 94it [00:10, 9.40it/s] 95it [00:10, 8.89it/s] 96it [00:10, 9.08it/s] 97it [00:10, 9.19it/s] 98it [00:10, 9.31it/s] 99it [00:10, 8.84it/s] 100it [00:10, 9.08it/s]2025-05-26 03:20:00,957 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 10056.2070 | mean log_px -0.1000 | KL -3566.32 + 101it [00:10, 9.25it/s] 102it [00:10, 9.34it/s] 103it [00:11, 8.84it/s] 104it [00:11, 8.91it/s] 105it [00:11, 8.85it/s] 106it [00:11, 9.00it/s] 107it [00:11, 8.77it/s] 108it [00:11, 8.99it/s] 109it [00:11, 9.20it/s] 110it [00:11, 9.31it/s] 111it [00:11, 9.41it/s] 112it [00:12, 9.25it/s] 113it [00:12, 8.65it/s] 114it [00:12, 8.81it/s] 115it [00:12, 8.95it/s] 116it [00:12, 9.08it/s] 117it [00:12, 9.20it/s] 118it [00:12, 9.24it/s] 119it [00:12, 8.79it/s] 120it [00:12, 8.91it/s] 121it [00:13, 8.93it/s] 122it [00:13, 8.98it/s] 123it [00:13, 8.50it/s] 124it [00:13, 8.85it/s] 125it [00:13, 9.16it/s] 126it [00:13, 9.38it/s] 127it [00:13, 9.52it/s] 128it [00:13, 9.66it/s] 130it [00:14, 9.28it/s] 132it [00:14, 9.54it/s] 133it [00:14, 9.64it/s] 134it [00:14, 9.23it/s] 135it [00:14, 9.41it/s] 136it [00:14, 9.50it/s] 137it [00:14, 9.61it/s] 138it [00:14, 9.66it/s] 139it [00:14, 9.71it/s] 140it [00:15, 9.71it/s] 141it [00:15, 9.76it/s] 142it [00:15, 9.58it/s] 143it [00:15, 8.93it/s] 145it [00:15, 9.44it/s] 147it [00:15, 9.70it/s] 149it [00:15, 9.85it/s]2025-05-26 03:20:06,323 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 9198.8525 | mean log_px -0.0873 | KL -3561.38 + 151it [00:16, 9.55it/s] 153it [00:16, 9.73it/s] 155it [00:16, 9.83it/s] 157it [00:16, 9.53it/s] 158it [00:16, 9.60it/s] 160it [00:17, 9.72it/s] 162it [00:17, 9.51it/s] 164it [00:17, 9.70it/s] 166it [00:17, 9.82it/s] 168it [00:17, 9.91it/s] 170it [00:18, 9.89it/s] 171it [00:18, 9.53it/s] 173it [00:18, 9.71it/s] 175it [00:18, 9.85it/s] 177it [00:18, 9.93it/s] 178it [00:18, 9.74it/s] 179it [00:19, 9.46it/s] 181it [00:19, 9.71it/s] 182it [00:19, 9.67it/s] 184it [00:19, 9.53it/s] 186it [00:19, 9.74it/s] 188it [00:20, 9.51it/s] 190it [00:20, 9.71it/s] 192it [00:20, 9.85it/s] 194it [00:20, 9.94it/s] 195it [00:20, 9.68it/s] 196it [00:20, 9.38it/s] +2025-05-26 03:20:11,065 - INFO - Epoch: 15, Objective: tensor([12319.4551], device='cuda:0', grad_fn=), Loss: 0.13309964537620544, KL/n: 72.79181671142578 + 0it [00:00, ?it/s]2025-05-26 03:20:11,337 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 7340.2905 | mean log_px -0.0581 | KL -3566.00 + 1it [00:00, 5.43it/s] 2it [00:00, 7.36it/s] 4it [00:00, 8.90it/s] 6it [00:00, 8.98it/s] 8it [00:00, 9.41it/s] 10it [00:01, 7.05it/s] 12it [00:01, 7.87it/s] 13it [00:01, 7.99it/s] 15it [00:01, 8.64it/s] 17it [00:02, 8.84it/s] 19it [00:02, 9.21it/s] 21it [00:02, 9.48it/s] 23it [00:02, 9.67it/s] 24it [00:02, 9.35it/s] 26it [00:02, 9.52it/s] 27it [00:03, 9.31it/s] 29it [00:03, 9.59it/s] 31it [00:03, 9.74it/s] 33it [00:03, 9.86it/s] 35it [00:03, 9.94it/s] 37it [00:04, 9.99it/s] 39it [00:04, 10.03it/s] 41it [00:04, 10.06it/s] 43it [00:04, 9.75it/s] 45it [00:04, 9.86it/s] 47it [00:05, 9.93it/s] 49it [00:05, 9.98it/s]2025-05-26 03:20:16,625 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 9277.7939 | mean log_px -0.0837 | KL -3565.87 + 51it [00:05, 9.68it/s] 52it [00:05, 9.73it/s] 54it [00:05, 9.86it/s] 56it [00:05, 9.94it/s] 58it [00:06, 9.97it/s] 59it [00:06, 9.97it/s] 61it [00:06, 10.02it/s] 63it [00:06, 10.04it/s] 65it [00:06, 10.07it/s] 67it [00:07, 10.08it/s] 69it [00:07, 10.08it/s] 71it [00:07, 10.06it/s] 73it [00:07, 9.80it/s] 75it [00:07, 9.89it/s] 76it [00:07, 9.90it/s] 78it [00:08, 9.99it/s] 79it [00:08, 9.59it/s] 80it [00:08, 9.67it/s] 81it [00:08, 9.63it/s] 82it [00:08, 9.54it/s] 83it [00:08, 9.07it/s] 84it [00:08, 9.06it/s] 85it [00:08, 9.19it/s] 86it [00:09, 9.38it/s] 87it [00:09, 9.55it/s] 88it [00:09, 9.18it/s] 89it [00:09, 9.35it/s] 90it [00:09, 9.51it/s] 91it [00:09, 9.63it/s] 92it [00:09, 9.72it/s] 93it [00:09, 9.18it/s] 94it [00:09, 9.38it/s] 95it [00:10, 9.54it/s] 96it [00:10, 9.67it/s] 98it [00:10, 9.87it/s] 100it [00:10, 9.98it/s]2025-05-26 03:20:21,763 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 11751.0801 | mean log_px -0.1212 | KL -3566.18 + 101it [00:10, 9.53it/s] 103it [00:10, 9.74it/s] 105it [00:11, 9.88it/s] 107it [00:11, 9.96it/s] 109it [00:11, 10.01it/s] 111it [00:11, 10.05it/s] 113it [00:11, 10.05it/s] 115it [00:12, 10.07it/s] 117it [00:12, 10.09it/s] 119it [00:12, 10.10it/s] 121it [00:12, 10.12it/s] 123it [00:12, 9.79it/s] 125it [00:13, 9.87it/s] 127it [00:13, 9.95it/s] 129it [00:13, 9.99it/s] 131it [00:13, 9.70it/s] 133it [00:13, 9.82it/s] 134it [00:13, 9.48it/s] 136it [00:14, 9.68it/s] 138it [00:14, 9.83it/s] 140it [00:14, 9.93it/s] 141it [00:14, 9.56it/s] 143it [00:14, 9.77it/s] 144it [00:14, 9.41it/s] 146it [00:15, 9.66it/s] 148it [00:15, 9.81it/s] 150it [00:15, 9.91it/s]2025-05-26 03:20:26,841 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 10209.6055 | mean log_px -0.0996 | KL -3564.47 + 151it [00:15, 9.52it/s] 153it [00:15, 9.72it/s] 155it [00:16, 9.84it/s] 157it [00:16, 9.94it/s] 159it [00:16, 10.00it/s] 161it [00:16, 9.70it/s] 163it [00:16, 9.83it/s] 165it [00:17, 9.92it/s] 167it [00:17, 9.99it/s] 169it [00:17, 10.03it/s] 171it [00:17, 10.06it/s] 173it [00:17, 10.07it/s] 175it [00:18, 10.07it/s] 177it [00:18, 10.09it/s] 179it [00:18, 9.83it/s] 181it [00:18, 9.91it/s] 183it [00:18, 9.98it/s] 185it [00:19, 10.03it/s] 187it [00:19, 10.06it/s] 189it [00:19, 10.09it/s] 191it [00:19, 10.09it/s] 193it [00:19, 9.66it/s] 194it [00:20, 9.72it/s] 195it [00:20, 9.48it/s] 196it [00:20, 9.29it/s] 196it [00:20, 9.64it/s] +2025-05-26 03:20:31,519 - INFO - Epoch: 16, Objective: tensor([10027.8145], device='cuda:0', grad_fn=), Loss: 0.09540171176195145, KL/n: 72.8223648071289 + 0it [00:00, ?it/s]2025-05-26 03:20:31,795 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 10231.7510 | mean log_px -0.0985 | KL -3565.85 + 1it [00:00, 5.37it/s] 2it [00:00, 6.75it/s] 4it [00:00, 8.51it/s] 6it [00:00, 9.15it/s] 7it [00:00, 8.96it/s] 8it [00:00, 9.20it/s] 10it [00:01, 9.51it/s] 12it [00:01, 9.69it/s] 13it [00:01, 9.75it/s] 14it [00:01, 9.79it/s] 15it [00:01, 9.31it/s] 16it [00:01, 9.44it/s] 17it [00:01, 9.54it/s] 18it [00:01, 9.66it/s] 19it [00:02, 9.76it/s] 20it [00:02, 9.83it/s] 21it [00:02, 9.28it/s] 22it [00:02, 9.46it/s] 23it [00:02, 9.60it/s] 24it [00:02, 9.70it/s] 25it [00:02, 9.17it/s] 26it [00:02, 9.38it/s] 27it [00:02, 9.53it/s] 28it [00:03, 9.52it/s] 29it [00:03, 9.09it/s] 30it [00:03, 9.31it/s] 31it [00:03, 9.50it/s] 32it [00:03, 9.63it/s] 33it [00:03, 9.25it/s] 34it [00:03, 9.44it/s] 35it [00:03, 9.59it/s] 36it [00:03, 9.10it/s] 37it [00:03, 9.31it/s] 38it [00:04, 9.46it/s] 39it [00:04, 9.61it/s] 40it [00:04, 9.10it/s] 41it [00:04, 9.34it/s] 42it [00:04, 9.49it/s] 44it [00:04, 9.27it/s] 45it [00:04, 9.44it/s] 46it [00:04, 9.55it/s] 47it [00:05, 9.13it/s] 48it [00:05, 9.35it/s] 50it [00:05, 9.20it/s]2025-05-26 03:20:37,082 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 8144.4380 | mean log_px -0.0670 | KL -3562.43 + 51it [00:05, 9.36it/s] 52it [00:05, 9.50it/s] 53it [00:05, 9.11it/s] 54it [00:05, 9.31it/s] 56it [00:05, 9.60it/s] 57it [00:06, 9.22it/s] 58it [00:06, 9.39it/s] 59it [00:06, 9.52it/s] 60it [00:06, 9.10it/s] 62it [00:06, 9.48it/s] 64it [00:06, 9.31it/s] 65it [00:06, 9.44it/s] 66it [00:07, 9.54it/s] 68it [00:07, 9.34it/s] 69it [00:07, 9.47it/s] 70it [00:07, 9.55it/s] 71it [00:07, 9.15it/s] 72it [00:07, 9.34it/s] 73it [00:07, 9.49it/s] 74it [00:07, 9.59it/s] 75it [00:08, 9.12it/s] 76it [00:08, 9.34it/s] 77it [00:08, 9.48it/s] 78it [00:08, 9.62it/s] 79it [00:08, 9.13it/s] 80it [00:08, 9.33it/s] 81it [00:08, 9.51it/s] 82it [00:08, 9.63it/s] 83it [00:08, 9.13it/s] 84it [00:08, 9.37it/s] 85it [00:09, 9.54it/s] 86it [00:09, 9.65it/s] 87it [00:09, 9.12it/s] 88it [00:09, 9.30it/s] 89it [00:09, 9.48it/s] 90it [00:09, 9.61it/s] 91it [00:09, 9.12it/s] 92it [00:09, 9.33it/s] 93it [00:09, 9.51it/s] 94it [00:10, 9.03it/s] 95it [00:10, 9.27it/s] 96it [00:10, 9.45it/s] 97it [00:10, 9.60it/s] 98it [00:10, 9.10it/s] 99it [00:10, 9.26it/s] 100it [00:10, 9.40it/s]2025-05-26 03:20:42,409 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 8396.8623 | mean log_px -0.0690 | KL -3563.99 + 101it [00:10, 9.54it/s] 102it [00:10, 9.08it/s] 103it [00:11, 9.30it/s] 104it [00:11, 9.49it/s] 105it [00:11, 9.07it/s] 106it [00:11, 9.32it/s] 108it [00:11, 9.63it/s] 109it [00:11, 9.21it/s] 110it [00:11, 9.38it/s] 111it [00:11, 9.52it/s] 112it [00:11, 9.62it/s] 113it [00:12, 9.15it/s] 114it [00:12, 9.36it/s] 115it [00:12, 9.51it/s] 116it [00:12, 9.61it/s] 117it [00:12, 9.12it/s] 119it [00:12, 9.50it/s] 120it [00:12, 9.12it/s] 121it [00:12, 9.32it/s] 122it [00:13, 9.46it/s] 123it [00:13, 9.59it/s] 124it [00:13, 9.10it/s] 125it [00:13, 9.33it/s] 126it [00:13, 9.49it/s] 127it [00:13, 9.63it/s] 128it [00:13, 9.14it/s] 129it [00:13, 9.36it/s] 130it [00:13, 9.50it/s] 131it [00:13, 9.64it/s] 132it [00:14, 9.12it/s] 133it [00:14, 9.34it/s] 134it [00:14, 9.52it/s] 135it [00:14, 9.64it/s] 136it [00:14, 9.13it/s] 137it [00:14, 9.36it/s] 138it [00:14, 9.53it/s] 139it [00:14, 9.04it/s] 140it [00:14, 9.28it/s] 141it [00:15, 9.46it/s] 142it [00:15, 9.60it/s] 143it [00:15, 9.09it/s] 144it [00:15, 9.29it/s] 145it [00:15, 9.48it/s] 146it [00:15, 9.59it/s] 147it [00:15, 9.10it/s] 148it [00:15, 9.32it/s] 149it [00:15, 9.50it/s] 150it [00:16, 9.62it/s]2025-05-26 03:20:47,737 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 9258.7881 | mean log_px -0.0835 | KL -3569.38 + 151it [00:16, 9.11it/s] 152it [00:16, 9.33it/s] 153it [00:16, 9.49it/s] 154it [00:16, 9.58it/s] 155it [00:16, 9.09it/s] 156it [00:16, 9.34it/s] 157it [00:16, 9.48it/s] 159it [00:16, 9.74it/s] 160it [00:17, 9.80it/s] 161it [00:17, 9.84it/s] 162it [00:17, 9.87it/s] 163it [00:17, 9.90it/s] 164it [00:17, 9.30it/s] 166it [00:17, 9.56it/s] 168it [00:17, 9.73it/s] 170it [00:18, 9.83it/s] 171it [00:18, 9.86it/s] 172it [00:18, 9.87it/s] 174it [00:18, 9.93it/s] 175it [00:18, 9.45it/s] 176it [00:18, 9.53it/s] 178it [00:18, 9.72it/s] 179it [00:19, 9.30it/s] 180it [00:19, 9.10it/s] 181it [00:19, 9.12it/s] 182it [00:19, 9.14it/s] 183it [00:19, 9.21it/s] 184it [00:19, 9.29it/s] 185it [00:19, 8.72it/s] 186it [00:19, 8.71it/s] 187it [00:19, 8.90it/s] 188it [00:20, 9.09it/s] 189it [00:20, 9.25it/s] 190it [00:20, 9.35it/s] 191it [00:20, 9.43it/s] 192it [00:20, 9.48it/s] 193it [00:20, 9.54it/s] 194it [00:20, 9.56it/s] 195it [00:20, 9.05it/s] 196it [00:20, 8.83it/s] 196it [00:20, 9.34it/s] +2025-05-26 03:20:52,637 - INFO - Epoch: 17, Objective: tensor([9598.7822], device='cuda:0', grad_fn=), Loss: 0.08933060616254807, KL/n: 72.83203125 + 0it [00:00, ?it/s]2025-05-26 03:20:53,097 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 12348.8164 | mean log_px -0.1254 | KL -3569.31 + 1it [00:00, 5.27it/s] 2it [00:00, 6.61it/s] 3it [00:00, 7.66it/s] 4it [00:00, 8.30it/s] 5it [00:00, 8.67it/s] 6it [00:00, 8.93it/s] 7it [00:00, 8.68it/s] 8it [00:00, 8.98it/s] 9it [00:01, 9.16it/s] 10it [00:01, 9.29it/s] 11it [00:01, 9.40it/s] 12it [00:01, 9.48it/s] 13it [00:01, 8.92it/s] 14it [00:01, 9.07it/s] 15it [00:01, 9.24it/s] 16it [00:01, 9.31it/s] 17it [00:01, 9.36it/s] 18it [00:02, 9.38it/s] 19it [00:02, 9.44it/s] 20it [00:02, 9.44it/s] 21it [00:02, 9.48it/s] 22it [00:02, 9.51it/s] 23it [00:02, 9.51it/s] 24it [00:02, 9.49it/s] 25it [00:02, 9.48it/s] 26it [00:02, 9.48it/s] 27it [00:02, 9.44it/s] 28it [00:03, 8.73it/s] 29it [00:03, 8.83it/s] 30it [00:03, 9.00it/s] 31it [00:03, 9.17it/s] 32it [00:03, 9.24it/s] 33it [00:03, 8.92it/s] 34it [00:03, 9.05it/s] 35it [00:03, 9.16it/s] 36it [00:04, 8.74it/s] 37it [00:04, 8.94it/s] 38it [00:04, 9.08it/s] 39it [00:04, 8.70it/s] 40it [00:04, 8.95it/s] 41it [00:04, 9.10it/s] 42it [00:04, 9.20it/s] 43it [00:04, 8.80it/s] 44it [00:04, 8.98it/s] 45it [00:04, 9.13it/s] 46it [00:05, 9.24it/s] 47it [00:05, 8.81it/s] 48it [00:05, 9.02it/s] 49it [00:05, 9.16it/s] 50it [00:05, 9.31it/s]2025-05-26 03:20:58,549 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 8044.7241 | mean log_px -0.0678 | KL -3567.06 + 51it [00:05, 8.85it/s] 52it [00:05, 9.02it/s] 53it [00:05, 9.19it/s] 54it [00:05, 9.30it/s] 55it [00:06, 8.83it/s] 56it [00:06, 8.97it/s] 57it [00:06, 8.66it/s] 58it [00:06, 8.85it/s] 59it [00:06, 9.04it/s] 60it [00:06, 9.08it/s] 61it [00:06, 9.18it/s] 62it [00:06, 8.79it/s] 63it [00:06, 9.05it/s] 64it [00:07, 9.20it/s] 65it [00:07, 9.34it/s] 66it [00:07, 8.86it/s] 67it [00:07, 9.07it/s] 68it [00:07, 9.19it/s] 69it [00:07, 9.32it/s] 70it [00:07, 8.88it/s] 71it [00:07, 9.12it/s] 72it [00:07, 9.30it/s] 73it [00:08, 9.36it/s] 74it [00:08, 8.91it/s] 75it [00:08, 9.11it/s] 76it [00:08, 9.26it/s] 77it [00:08, 9.37it/s] 78it [00:08, 8.87it/s] 79it [00:08, 9.08it/s] 80it [00:08, 9.20it/s] 81it [00:08, 9.10it/s] 82it [00:09, 8.99it/s] 83it [00:09, 8.50it/s] 84it [00:09, 8.82it/s] 85it [00:09, 9.06it/s] 86it [00:09, 9.23it/s] 87it [00:09, 8.83it/s] 88it [00:09, 9.07it/s] 89it [00:09, 9.22it/s] 90it [00:09, 9.35it/s] 91it [00:10, 8.89it/s] 92it [00:10, 9.05it/s] 93it [00:10, 9.23it/s] 94it [00:10, 9.32it/s] 95it [00:10, 8.88it/s] 96it [00:10, 9.02it/s] 97it [00:10, 9.19it/s] 98it [00:10, 9.28it/s] 99it [00:10, 8.87it/s] 100it [00:11, 9.07it/s]2025-05-26 03:21:04,073 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 8123.0947 | mean log_px -0.0684 | KL -3570.99 + 101it [00:11, 9.24it/s] 102it [00:11, 9.29it/s] 103it [00:11, 8.84it/s] 104it [00:11, 9.02it/s] 105it [00:11, 9.16it/s] 106it [00:11, 9.23it/s] 107it [00:11, 8.84it/s] 108it [00:11, 9.00it/s] 109it [00:12, 9.08it/s] 110it [00:12, 9.23it/s] 111it [00:12, 8.83it/s] 112it [00:12, 9.02it/s] 113it [00:12, 9.15it/s] 114it [00:12, 9.16it/s] 115it [00:12, 8.79it/s] 116it [00:12, 8.99it/s] 117it [00:12, 9.11it/s] 118it [00:13, 9.23it/s] 119it [00:13, 8.81it/s] 120it [00:13, 9.01it/s] 121it [00:13, 9.17it/s] 122it [00:13, 9.27it/s] 123it [00:13, 8.86it/s] 124it [00:13, 9.01it/s] 125it [00:13, 9.18it/s] 126it [00:13, 9.25it/s] 127it [00:14, 8.85it/s] 128it [00:14, 9.04it/s] 129it [00:14, 9.20it/s] 130it [00:14, 9.27it/s] 131it [00:14, 8.89it/s] 132it [00:14, 9.06it/s] 133it [00:14, 9.18it/s] 134it [00:14, 9.26it/s] 135it [00:14, 8.89it/s] 136it [00:15, 8.96it/s] 137it [00:15, 9.08it/s] 138it [00:15, 8.77it/s] 139it [00:15, 9.06it/s] 140it [00:15, 9.22it/s] 141it [00:15, 8.89it/s] 142it [00:15, 9.12it/s] 143it [00:15, 9.30it/s] 144it [00:15, 8.93it/s] 145it [00:16, 9.16it/s] 146it [00:16, 9.33it/s] 147it [00:16, 8.93it/s] 148it [00:16, 9.18it/s] 149it [00:16, 9.35it/s] 150it [00:16, 8.97it/s]2025-05-26 03:21:09,589 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 6793.8252 | mean log_px -0.0610 | KL -3563.42 + 151it [00:16, 9.15it/s] 152it [00:16, 9.33it/s] 153it [00:16, 8.93it/s] 154it [00:17, 9.15it/s] 155it [00:17, 9.34it/s] 156it [00:17, 8.93it/s] 157it [00:17, 9.18it/s] 158it [00:17, 9.26it/s] 159it [00:17, 8.88it/s] 160it [00:17, 9.12it/s] 161it [00:17, 9.32it/s] 162it [00:17, 8.94it/s] 163it [00:17, 9.18it/s] 164it [00:18, 9.35it/s] 165it [00:18, 8.98it/s] 166it [00:18, 9.18it/s] 167it [00:18, 9.35it/s] 168it [00:18, 8.96it/s] 169it [00:18, 9.19it/s] 170it [00:18, 9.36it/s] 171it [00:18, 8.99it/s] 172it [00:18, 9.19it/s] 173it [00:19, 9.36it/s] 174it [00:19, 8.95it/s] 175it [00:19, 9.20it/s] 176it [00:19, 9.36it/s] 177it [00:19, 8.91it/s] 178it [00:19, 9.14it/s] 179it [00:19, 9.32it/s] 180it [00:19, 8.94it/s] 181it [00:19, 9.18it/s] 182it [00:20, 9.33it/s] 183it [00:20, 8.95it/s] 184it [00:20, 9.17it/s] 185it [00:20, 9.25it/s] 186it [00:20, 8.83it/s] 187it [00:20, 9.08it/s] 188it [00:20, 9.26it/s] 189it [00:20, 8.87it/s] 190it [00:20, 9.04it/s] 191it [00:21, 9.19it/s] 192it [00:21, 8.86it/s] 193it [00:21, 9.12it/s] 194it [00:21, 9.31it/s] 195it [00:21, 8.88it/s] 196it [00:21, 8.84it/s] 196it [00:21, 9.04it/s] +2025-05-26 03:21:14,643 - INFO - Epoch: 18, Objective: tensor([8188.5557], device='cuda:0', grad_fn=), Loss: 0.07669003307819366, KL/n: 72.82756805419922 + 0it [00:00, ?it/s]2025-05-26 03:21:14,929 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 6962.9434 | mean log_px -0.0530 | KL -3566.80 + 1it [00:00, 5.21it/s] 2it [00:00, 7.20it/s] 3it [00:00, 7.76it/s] 4it [00:00, 8.46it/s] 5it [00:00, 8.91it/s] 6it [00:00, 9.16it/s] 7it [00:00, 9.21it/s] 8it [00:00, 9.32it/s] 9it [00:01, 9.49it/s] 10it [00:01, 9.56it/s] 11it [00:01, 9.64it/s] 12it [00:01, 9.67it/s] 13it [00:01, 9.68it/s] 14it [00:01, 9.61it/s] 15it [00:01, 9.65it/s] 16it [00:01, 9.71it/s] 17it [00:01, 9.74it/s] 18it [00:01, 9.76it/s] 19it [00:02, 9.77it/s] 20it [00:02, 9.78it/s] 21it [00:02, 9.76it/s] 22it [00:02, 9.77it/s] 23it [00:02, 9.77it/s] 24it [00:02, 9.79it/s] 25it [00:02, 9.81it/s] 26it [00:02, 9.83it/s] 27it [00:02, 9.86it/s] 28it [00:02, 9.86it/s] 29it [00:03, 9.88it/s] 30it [00:03, 9.86it/s] 31it [00:03, 9.83it/s] 32it [00:03, 9.79it/s] 33it [00:03, 9.81it/s] 34it [00:03, 9.81it/s] 35it [00:03, 9.81it/s] 36it [00:03, 9.82it/s] 37it [00:03, 9.84it/s] 38it [00:03, 9.82it/s] 39it [00:04, 9.81it/s] 40it [00:04, 9.81it/s] 41it [00:04, 9.83it/s] 42it [00:04, 9.79it/s] 43it [00:04, 9.82it/s] 44it [00:04, 9.82it/s] 45it [00:04, 9.82it/s] 46it [00:04, 9.79it/s] 47it [00:04, 9.82it/s] 48it [00:05, 9.81it/s] 49it [00:05, 9.81it/s] 50it [00:05, 9.79it/s]2025-05-26 03:21:20,056 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 11381.5762 | mean log_px -0.1166 | KL -3569.48 + 51it [00:05, 9.77it/s] 52it [00:05, 9.62it/s] 53it [00:05, 9.63it/s] 54it [00:05, 9.64it/s] 55it [00:05, 9.68it/s] 56it [00:05, 9.71it/s] 57it [00:05, 9.72it/s] 58it [00:06, 9.72it/s] 59it [00:06, 9.71it/s] 60it [00:06, 9.72it/s] 61it [00:06, 9.74it/s] 62it [00:06, 9.76it/s] 63it [00:06, 9.79it/s] 64it [00:06, 9.79it/s] 65it [00:06, 9.81it/s] 66it [00:06, 9.27it/s] 67it [00:06, 9.44it/s] 68it [00:07, 9.54it/s] 69it [00:07, 9.64it/s] 70it [00:07, 9.67it/s] 71it [00:07, 9.70it/s] 72it [00:07, 9.76it/s] 73it [00:07, 9.79it/s] 74it [00:07, 9.75it/s] 75it [00:07, 9.80it/s] 76it [00:07, 9.76it/s] 77it [00:08, 9.69it/s] 78it [00:08, 9.29it/s] 79it [00:08, 9.27it/s] 80it [00:08, 9.41it/s] 81it [00:08, 9.50it/s] 82it [00:08, 9.55it/s] 83it [00:08, 9.60it/s] 84it [00:08, 9.60it/s] 85it [00:08, 9.67it/s] 86it [00:08, 9.67it/s] 87it [00:09, 9.69it/s] 88it [00:09, 9.70it/s] 89it [00:09, 9.69it/s] 90it [00:09, 9.66it/s] 91it [00:09, 9.67it/s] 92it [00:09, 9.70it/s] 93it [00:09, 9.75it/s] 94it [00:09, 9.78it/s] 95it [00:09, 9.69it/s] 96it [00:09, 9.71it/s] 97it [00:10, 9.75it/s] 98it [00:10, 9.74it/s] 99it [00:10, 9.75it/s] 100it [00:10, 9.76it/s]2025-05-26 03:21:25,232 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 8565.3213 | mean log_px -0.0776 | KL -3569.59 + 101it [00:10, 9.74it/s] 102it [00:10, 9.76it/s] 103it [00:10, 9.76it/s] 104it [00:10, 9.79it/s] 105it [00:10, 9.80it/s] 106it [00:11, 9.78it/s] 107it [00:11, 9.77it/s] 108it [00:11, 9.66it/s] 109it [00:11, 9.70it/s] 110it [00:11, 9.74it/s] 111it [00:11, 9.68it/s] 112it [00:11, 9.74it/s] 113it [00:11, 9.77it/s] 114it [00:11, 9.69it/s] 115it [00:11, 9.73it/s] 116it [00:12, 9.73it/s] 117it [00:12, 9.78it/s] 118it [00:12, 9.76it/s] 119it [00:12, 9.80it/s] 120it [00:12, 9.82it/s] 121it [00:12, 9.82it/s] 122it [00:12, 9.76it/s] 123it [00:12, 9.78it/s] 124it [00:12, 9.78it/s] 125it [00:12, 9.57it/s] 126it [00:13, 9.40it/s] 127it [00:13, 9.44it/s] 128it [00:13, 9.52it/s] 129it [00:13, 9.47it/s] 130it [00:13, 9.58it/s] 131it [00:13, 9.64it/s] 132it [00:13, 9.67it/s] 133it [00:13, 9.69it/s] 134it [00:13, 9.71it/s] 135it [00:13, 9.76it/s] 136it [00:14, 9.72it/s] 137it [00:14, 9.71it/s] 138it [00:14, 9.74it/s] 139it [00:14, 9.73it/s] 140it [00:14, 9.76it/s] 141it [00:14, 9.77it/s] 142it [00:14, 9.77it/s] 143it [00:14, 9.71it/s] 144it [00:14, 9.71it/s] 145it [00:15, 9.76it/s] 146it [00:15, 9.79it/s] 147it [00:15, 9.81it/s] 148it [00:15, 9.79it/s] 149it [00:15, 9.82it/s] 150it [00:15, 9.83it/s]2025-05-26 03:21:30,373 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 7441.7295 | mean log_px -0.0628 | KL -3567.16 + 151it [00:15, 9.83it/s] 152it [00:15, 9.81it/s] 153it [00:15, 9.84it/s] 154it [00:15, 9.81it/s] 155it [00:16, 9.84it/s] 156it [00:16, 9.81it/s] 157it [00:16, 9.82it/s] 158it [00:16, 9.83it/s] 159it [00:16, 9.81it/s] 160it [00:16, 9.81it/s] 161it [00:16, 9.81it/s] 162it [00:16, 9.80it/s] 163it [00:16, 9.59it/s] 164it [00:16, 9.63it/s] 165it [00:17, 9.68it/s] 166it [00:17, 9.69it/s] 167it [00:17, 9.73it/s] 168it [00:17, 9.74it/s] 169it [00:17, 9.76it/s] 170it [00:17, 9.78it/s] 171it [00:17, 9.80it/s] 172it [00:17, 9.76it/s] 173it [00:17, 9.78it/s] 174it [00:17, 9.80it/s] 175it [00:18, 9.83it/s] 176it [00:18, 9.82it/s] 177it [00:18, 9.72it/s] 178it [00:18, 9.52it/s] 179it [00:18, 9.60it/s] 180it [00:18, 9.63it/s] 181it [00:18, 9.56it/s] 182it [00:18, 9.31it/s] 183it [00:18, 8.76it/s] 184it [00:19, 8.70it/s] 185it [00:19, 8.82it/s] 186it [00:19, 8.99it/s] 187it [00:19, 9.21it/s] 188it [00:19, 9.35it/s] 189it [00:19, 9.50it/s] 190it [00:19, 9.23it/s] 191it [00:19, 9.40it/s] 192it [00:19, 9.52it/s] 193it [00:20, 9.62it/s] 194it [00:20, 9.69it/s] 195it [00:20, 9.17it/s] 196it [00:20, 9.60it/s] +2025-05-26 03:21:35,186 - INFO - Epoch: 19, Objective: tensor([7893.3765], device='cuda:0', grad_fn=), Loss: 0.061493679881095886, KL/n: 72.83820343017578 + 0it [00:00, ?it/s]2025-05-26 03:21:35,609 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 6628.0117 | mean log_px -0.0495 | KL -3568.11 + 1it [00:00, 6.35it/s] 2it [00:00, 7.96it/s] 3it [00:00, 8.74it/s] 4it [00:00, 9.12it/s] 5it [00:00, 9.26it/s] 6it [00:00, 9.41it/s] 7it [00:00, 9.56it/s] 8it [00:00, 9.64it/s] 9it [00:00, 9.66it/s] 10it [00:01, 9.56it/s] 11it [00:01, 9.63it/s] 12it [00:01, 9.60it/s] 13it [00:01, 9.69it/s] 14it [00:01, 9.71it/s] 15it [00:01, 9.73it/s] 16it [00:01, 9.73it/s] 17it [00:01, 9.75it/s] 18it [00:01, 9.75it/s] 19it [00:02, 9.57it/s] 20it [00:02, 9.62it/s] 21it [00:02, 9.71it/s] 22it [00:02, 9.73it/s] 23it [00:02, 9.75it/s] 24it [00:02, 9.76it/s] 25it [00:02, 9.78it/s] 26it [00:02, 9.78it/s] 27it [00:02, 9.75it/s] 28it [00:02, 9.76it/s] 29it [00:03, 9.78it/s] 30it [00:03, 9.80it/s] 31it [00:03, 9.82it/s] 32it [00:03, 9.22it/s] 33it [00:03, 9.36it/s] 34it [00:03, 9.46it/s] 35it [00:03, 9.31it/s] 36it [00:03, 9.44it/s] 37it [00:03, 9.56it/s] 38it [00:03, 9.58it/s] 39it [00:04, 9.62it/s] 40it [00:04, 9.68it/s] 41it [00:04, 9.69it/s] 42it [00:04, 9.71it/s] 43it [00:04, 9.73it/s] 44it [00:04, 9.71it/s] 45it [00:04, 9.71it/s] 46it [00:04, 9.73it/s] 47it [00:04, 9.73it/s] 48it [00:05, 9.74it/s] 49it [00:05, 9.77it/s] 50it [00:05, 9.77it/s]2025-05-26 03:21:40,774 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 7019.3750 | mean log_px -0.0534 | KL -3567.79 + 51it [00:05, 9.73it/s] 52it [00:05, 9.72it/s] 53it [00:05, 9.75it/s] 54it [00:05, 9.75it/s] 55it [00:05, 9.75it/s] 56it [00:05, 9.77it/s] 57it [00:05, 9.73it/s] 58it [00:06, 9.73it/s] 59it [00:06, 9.67it/s] 60it [00:06, 9.69it/s] 61it [00:06, 9.62it/s] 62it [00:06, 9.67it/s] 63it [00:06, 9.68it/s] 64it [00:06, 9.71it/s] 65it [00:06, 9.74it/s] 66it [00:06, 9.74it/s] 67it [00:06, 9.74it/s] 68it [00:07, 9.71it/s] 69it [00:07, 9.65it/s] 70it [00:07, 9.65it/s] 71it [00:07, 9.66it/s] 72it [00:07, 9.59it/s] 73it [00:07, 9.65it/s] 74it [00:07, 9.67it/s] 75it [00:07, 9.71it/s] 76it [00:07, 9.68it/s] 77it [00:08, 9.69it/s] 78it [00:08, 9.70it/s] 79it [00:08, 9.70it/s] 80it [00:08, 9.73it/s] 81it [00:08, 9.74it/s] 82it [00:08, 9.72it/s] 83it [00:08, 9.70it/s] 84it [00:08, 9.21it/s] 85it [00:08, 9.35it/s] 86it [00:08, 9.43it/s] 87it [00:09, 9.50it/s] 88it [00:09, 9.47it/s] 89it [00:09, 9.57it/s] 90it [00:09, 9.53it/s] 91it [00:09, 9.57it/s] 92it [00:09, 9.62it/s] 93it [00:09, 9.64it/s] 94it [00:09, 9.67it/s] 95it [00:09, 9.74it/s] 96it [00:09, 9.73it/s] 97it [00:10, 9.76it/s] 98it [00:10, 9.75it/s] 99it [00:10, 9.74it/s] 100it [00:10, 9.72it/s]2025-05-26 03:21:45,950 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 9756.4814 | mean log_px -0.0918 | KL -3565.89 + 101it [00:10, 9.71it/s] 102it [00:10, 9.71it/s] 103it [00:10, 9.70it/s] 104it [00:10, 9.69it/s] 105it [00:10, 9.73it/s] 106it [00:11, 9.75it/s] 107it [00:11, 9.74it/s] 108it [00:11, 9.71it/s] 109it [00:11, 9.72it/s] 110it [00:11, 9.73it/s] 111it [00:11, 9.71it/s] 112it [00:11, 9.63it/s] 113it [00:11, 9.69it/s] 114it [00:11, 9.68it/s] 115it [00:11, 9.71it/s] 116it [00:12, 9.71it/s] 117it [00:12, 9.73it/s] 118it [00:12, 9.74it/s] 119it [00:12, 9.67it/s] 120it [00:12, 9.66it/s] 121it [00:12, 9.64it/s] 122it [00:12, 9.64it/s] 123it [00:12, 9.60it/s] 124it [00:12, 9.62it/s] 125it [00:12, 9.61it/s] 126it [00:13, 9.63it/s] 127it [00:13, 9.65it/s] 128it [00:13, 9.68it/s] 129it [00:13, 9.68it/s] 130it [00:13, 9.69it/s] 131it [00:13, 9.71it/s] 132it [00:13, 9.69it/s] 133it [00:13, 9.73it/s] 134it [00:13, 9.72it/s] 135it [00:14, 9.77it/s] 136it [00:14, 9.50it/s] 137it [00:14, 9.46it/s] 138it [00:14, 9.56it/s] 139it [00:14, 9.63it/s] 140it [00:14, 9.66it/s] 141it [00:14, 9.71it/s] 142it [00:14, 9.71it/s] 143it [00:14, 9.50it/s] 144it [00:14, 9.54it/s] 145it [00:15, 9.60it/s] 146it [00:15, 9.45it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.43it/s] 149it [00:15, 9.40it/s] 150it [00:15, 9.50it/s]2025-05-26 03:21:51,142 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 6741.2627 | mean log_px -0.0465 | KL -3565.47 + 151it [00:15, 9.50it/s] 152it [00:15, 9.54it/s] 153it [00:15, 9.49it/s] 154it [00:16, 9.53it/s] 155it [00:16, 9.62it/s] 156it [00:16, 9.67it/s] 157it [00:16, 9.71it/s] 158it [00:16, 9.74it/s] 159it [00:16, 9.75it/s] 160it [00:16, 9.73it/s] 161it [00:16, 9.73it/s] 162it [00:16, 9.53it/s] 163it [00:16, 9.60it/s] 164it [00:17, 9.64it/s] 165it [00:17, 9.71it/s] 166it [00:17, 9.72it/s] 167it [00:17, 9.73it/s] 168it [00:17, 9.71it/s] 169it [00:17, 9.70it/s] 170it [00:17, 9.67it/s] 171it [00:17, 9.63it/s] 172it [00:17, 9.65it/s] 173it [00:17, 9.65it/s] 174it [00:18, 9.62it/s] 175it [00:18, 9.64it/s] 176it [00:18, 9.68it/s] 177it [00:18, 9.72it/s] 178it [00:18, 9.70it/s] 179it [00:18, 9.71it/s] 180it [00:18, 9.65it/s] 181it [00:18, 9.44it/s] 182it [00:18, 9.21it/s] 183it [00:19, 9.15it/s] 184it [00:19, 9.27it/s] 185it [00:19, 9.37it/s] 186it [00:19, 9.41it/s] 187it [00:19, 9.45it/s] 188it [00:19, 9.47it/s] 189it [00:19, 9.24it/s] 190it [00:19, 9.36it/s] 191it [00:19, 9.43it/s] 192it [00:19, 9.43it/s] 193it [00:20, 9.46it/s] 194it [00:20, 9.48it/s] 195it [00:20, 9.04it/s] 196it [00:20, 9.57it/s] +2025-05-26 03:21:55,969 - INFO - Epoch: 20, Objective: tensor([5954.1396], device='cuda:0', grad_fn=), Loss: 0.034850478172302246, KL/n: 72.82156372070312 + 0it [00:00, ?it/s]2025-05-26 03:21:56,215 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 7638.6367 | mean log_px -0.0598 | KL -3567.85 + 1it [00:00, 6.23it/s] 2it [00:00, 7.87it/s] 3it [00:00, 8.63it/s] 4it [00:00, 9.08it/s] 5it [00:00, 9.29it/s] 6it [00:00, 9.44it/s] 7it [00:00, 9.55it/s] 8it [00:00, 9.64it/s] 9it [00:00, 9.68it/s] 10it [00:01, 9.73it/s] 11it [00:01, 9.77it/s] 12it [00:01, 9.75it/s] 13it [00:01, 9.76it/s] 14it [00:01, 9.76it/s] 15it [00:01, 9.78it/s] 16it [00:01, 9.76it/s] 17it [00:01, 9.76it/s] 18it [00:01, 9.75it/s] 19it [00:02, 9.77it/s] 20it [00:02, 9.76it/s] 21it [00:02, 9.76it/s] 22it [00:02, 9.77it/s] 23it [00:02, 9.77it/s] 24it [00:02, 9.78it/s] 25it [00:02, 9.77it/s] 26it [00:02, 9.76it/s] 27it [00:02, 9.77it/s] 28it [00:02, 9.75it/s] 29it [00:03, 9.69it/s] 30it [00:03, 9.72it/s] 31it [00:03, 9.75it/s] 32it [00:03, 9.77it/s] 33it [00:03, 9.79it/s] 34it [00:03, 9.72it/s] 35it [00:03, 9.73it/s] 36it [00:03, 9.73it/s] 37it [00:03, 9.74it/s] 38it [00:03, 9.76it/s] 39it [00:04, 9.78it/s] 40it [00:04, 9.78it/s] 41it [00:04, 9.78it/s] 42it [00:04, 9.76it/s] 43it [00:04, 9.75it/s] 44it [00:04, 9.76it/s] 45it [00:04, 9.80it/s] 46it [00:04, 9.81it/s] 47it [00:04, 9.78it/s] 48it [00:04, 9.79it/s] 49it [00:05, 9.82it/s] 50it [00:05, 9.79it/s]2025-05-26 03:22:01,337 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 12824.7617 | mean log_px -0.1392 | KL -3568.71 + 51it [00:05, 9.76it/s] 52it [00:05, 9.75it/s] 53it [00:05, 9.67it/s] 54it [00:05, 9.72it/s] 55it [00:05, 9.75it/s] 56it [00:05, 9.71it/s] 57it [00:05, 9.71it/s] 58it [00:06, 9.74it/s] 59it [00:06, 9.78it/s] 60it [00:06, 9.54it/s] 61it [00:06, 9.62it/s] 62it [00:06, 9.68it/s] 63it [00:06, 9.75it/s] 64it [00:06, 9.78it/s] 65it [00:06, 9.78it/s] 66it [00:06, 9.75it/s] 67it [00:06, 9.76it/s] 68it [00:07, 9.75it/s] 69it [00:07, 9.74it/s] 70it [00:07, 9.75it/s] 71it [00:07, 9.79it/s] 72it [00:07, 9.77it/s] 73it [00:07, 9.76it/s] 74it [00:07, 9.79it/s] 75it [00:07, 9.77it/s] 76it [00:07, 9.75it/s] 77it [00:07, 9.74it/s] 78it [00:08, 9.71it/s] 79it [00:08, 9.73it/s] 80it [00:08, 9.72it/s] 81it [00:08, 9.75it/s] 82it [00:08, 9.74it/s] 83it [00:08, 9.53it/s] 84it [00:08, 9.61it/s] 85it [00:08, 9.67it/s] 86it [00:08, 9.67it/s] 87it [00:08, 9.70it/s] 88it [00:09, 9.71it/s] 89it [00:09, 9.73it/s] 90it [00:09, 9.76it/s] 91it [00:09, 9.77it/s] 92it [00:09, 9.74it/s] 93it [00:09, 9.76it/s] 94it [00:09, 9.77it/s] 95it [00:09, 9.79it/s] 96it [00:09, 9.75it/s] 97it [00:10, 9.75it/s] 98it [00:10, 9.52it/s] 99it [00:10, 9.60it/s] 100it [00:10, 9.66it/s]2025-05-26 03:22:06,483 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 9816.6523 | mean log_px -0.1053 | KL -3570.17 + 101it [00:10, 9.73it/s] 102it [00:10, 9.74it/s] 103it [00:10, 9.76it/s] 104it [00:10, 9.77it/s] 105it [00:10, 9.81it/s] 106it [00:10, 9.77it/s] 107it [00:11, 9.78it/s] 108it [00:11, 9.78it/s] 109it [00:11, 9.76it/s] 110it [00:11, 9.76it/s] 111it [00:11, 9.76it/s] 112it [00:11, 9.73it/s] 113it [00:11, 9.74it/s] 114it [00:11, 9.77it/s] 115it [00:11, 9.78it/s] 116it [00:11, 9.78it/s] 117it [00:12, 9.78it/s] 118it [00:12, 9.78it/s] 119it [00:12, 9.58it/s] 120it [00:12, 9.62it/s] 121it [00:12, 9.68it/s] 122it [00:12, 9.72it/s] 123it [00:12, 9.46it/s] 124it [00:12, 8.71it/s] 125it [00:12, 8.90it/s] 126it [00:13, 9.03it/s] 127it [00:13, 9.16it/s] 128it [00:13, 9.25it/s] 129it [00:13, 9.33it/s] 130it [00:13, 9.34it/s] 131it [00:13, 9.39it/s] 132it [00:13, 9.39it/s] 133it [00:13, 9.42it/s] 134it [00:13, 9.34it/s] 135it [00:13, 9.34it/s] 136it [00:14, 9.28it/s] 137it [00:14, 9.41it/s] 138it [00:14, 9.52it/s] 139it [00:14, 9.60it/s] 140it [00:14, 9.61it/s] 141it [00:14, 9.64it/s] 142it [00:14, 9.64it/s] 143it [00:14, 9.68it/s] 144it [00:14, 9.63it/s] 145it [00:15, 9.55it/s] 146it [00:15, 9.04it/s] 147it [00:15, 9.21it/s] 148it [00:15, 9.35it/s] 149it [00:15, 9.45it/s] 150it [00:15, 9.50it/s]2025-05-26 03:22:11,739 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 6365.2271 | mean log_px -0.0422 | KL -3569.45 + 151it [00:15, 9.02it/s] 152it [00:15, 9.19it/s] 153it [00:15, 9.24it/s] 154it [00:16, 9.39it/s] 155it [00:16, 9.49it/s] 156it [00:16, 9.51it/s] 157it [00:16, 9.57it/s] 158it [00:16, 9.61it/s] 159it [00:16, 9.12it/s] 160it [00:16, 9.30it/s] 161it [00:16, 9.42it/s] 162it [00:16, 8.91it/s] 164it [00:17, 9.38it/s] 165it [00:17, 9.44it/s] 166it [00:17, 9.21it/s] 167it [00:17, 9.38it/s] 169it [00:17, 9.68it/s] 171it [00:17, 9.84it/s] 173it [00:17, 9.93it/s] 174it [00:18, 9.51it/s] 176it [00:18, 9.72it/s] 177it [00:18, 9.35it/s] 178it [00:18, 9.45it/s] 179it [00:18, 9.48it/s] 181it [00:18, 9.73it/s] 183it [00:19, 9.84it/s] 185it [00:19, 9.94it/s] 187it [00:19, 10.00it/s] 189it [00:19, 10.05it/s] 191it [00:19, 10.08it/s] 193it [00:20, 10.09it/s] 195it [00:20, 9.79it/s] 196it [00:20, 9.60it/s] +2025-05-26 03:22:16,504 - INFO - Epoch: 21, Objective: tensor([6160.0498], device='cuda:0', grad_fn=), Loss: 0.040021877735853195, KL/n: 72.79065704345703 + 0it [00:00, ?it/s]2025-05-26 03:22:16,966 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 9817.3037 | mean log_px -0.0940 | KL -3564.62 + 1it [00:00, 5.37it/s] 2it [00:00, 7.32it/s] 4it [00:00, 8.79it/s] 6it [00:00, 9.33it/s] 8it [00:00, 9.25it/s] 10it [00:01, 9.51it/s] 12it [00:01, 9.69it/s] 14it [00:01, 9.73it/s] 15it [00:01, 9.43it/s] 16it [00:01, 9.53it/s] 18it [00:01, 9.32it/s] 19it [00:02, 9.45it/s] 20it [00:02, 9.56it/s] 21it [00:02, 9.67it/s] 22it [00:02, 9.72it/s] 23it [00:02, 9.23it/s] 24it [00:02, 9.43it/s] 26it [00:02, 9.68it/s] 28it [00:02, 9.80it/s] 30it [00:03, 9.89it/s] 32it [00:03, 9.94it/s] 33it [00:03, 9.95it/s] 34it [00:03, 9.95it/s] 36it [00:03, 9.98it/s] 38it [00:03, 10.00it/s] 40it [00:04, 10.01it/s] 42it [00:04, 10.02it/s] 44it [00:04, 10.02it/s] 46it [00:04, 10.01it/s] 48it [00:04, 10.02it/s] 50it [00:05, 10.02it/s]2025-05-26 03:22:22,054 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 8459.5879 | mean log_px -0.0763 | KL -3567.08 + 52it [00:05, 10.01it/s] 54it [00:05, 9.74it/s] 56it [00:05, 9.83it/s] 57it [00:05, 9.53it/s] 59it [00:06, 9.69it/s] 60it [00:06, 9.75it/s] 61it [00:06, 9.80it/s] 62it [00:06, 9.33it/s] 64it [00:06, 9.55it/s] 66it [00:06, 9.71it/s] 68it [00:07, 9.82it/s] 70it [00:07, 9.90it/s] 71it [00:07, 9.80it/s] 72it [00:07, 9.49it/s] 74it [00:07, 9.69it/s] 75it [00:07, 9.69it/s] 76it [00:07, 9.72it/s] 78it [00:08, 9.84it/s] 80it [00:08, 9.91it/s] 81it [00:08, 9.90it/s] 82it [00:08, 9.88it/s] 83it [00:08, 9.90it/s] 84it [00:08, 9.93it/s] 86it [00:08, 9.34it/s] 87it [00:09, 9.26it/s] 88it [00:09, 9.33it/s] 89it [00:09, 9.48it/s] 90it [00:09, 9.61it/s] 91it [00:09, 9.71it/s] 92it [00:09, 9.77it/s] 93it [00:09, 9.35it/s] 95it [00:09, 9.65it/s] 96it [00:09, 9.72it/s] 98it [00:10, 9.81it/s] 100it [00:10, 9.89it/s]2025-05-26 03:22:27,213 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 9265.9893 | mean log_px -0.0819 | KL -3570.15 + 101it [00:10, 9.45it/s] 102it [00:10, 9.50it/s] 103it [00:10, 9.60it/s] 104it [00:10, 9.69it/s] 105it [00:10, 9.75it/s] 106it [00:10, 9.34it/s] 108it [00:11, 9.63it/s] 109it [00:11, 9.72it/s] 110it [00:11, 9.78it/s] 111it [00:11, 9.82it/s] 112it [00:11, 9.86it/s] 114it [00:11, 9.94it/s] 115it [00:11, 9.53it/s] 116it [00:12, 9.56it/s] 117it [00:12, 9.59it/s] 118it [00:12, 9.09it/s] 119it [00:12, 8.97it/s] 120it [00:12, 9.22it/s] 121it [00:12, 9.43it/s] 122it [00:12, 9.58it/s] 123it [00:12, 9.66it/s] 124it [00:12, 9.74it/s] 125it [00:12, 9.46it/s] 126it [00:13, 9.54it/s] 127it [00:13, 9.21it/s] 128it [00:13, 9.42it/s] 130it [00:13, 9.67it/s] 131it [00:13, 9.22it/s] 132it [00:13, 9.39it/s] 134it [00:13, 9.64it/s] 136it [00:14, 9.79it/s] 138it [00:14, 9.88it/s] 140it [00:14, 9.92it/s] 141it [00:14, 9.93it/s] 142it [00:14, 9.93it/s] 144it [00:14, 9.97it/s] 146it [00:15, 9.99it/s] 148it [00:15, 10.01it/s] 149it [00:15, 10.00it/s] 150it [00:15, 10.00it/s]2025-05-26 03:22:32,387 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 8519.6299 | mean log_px -0.0768 | KL -3566.00 + 151it [00:15, 9.47it/s] 152it [00:15, 9.59it/s] 153it [00:15, 9.65it/s] 155it [00:16, 9.81it/s] 156it [00:16, 9.82it/s] 158it [00:16, 9.89it/s] 159it [00:16, 9.87it/s] 160it [00:16, 9.90it/s] 161it [00:16, 9.88it/s] 162it [00:16, 9.83it/s] 163it [00:16, 9.82it/s] 164it [00:16, 9.85it/s] 165it [00:17, 9.85it/s] 166it [00:17, 9.88it/s] 168it [00:17, 9.93it/s] 170it [00:17, 9.97it/s] 171it [00:17, 9.94it/s] 173it [00:17, 9.97it/s] 174it [00:17, 9.92it/s] 176it [00:18, 9.96it/s] 177it [00:18, 9.92it/s] 178it [00:18, 9.94it/s] 180it [00:18, 9.97it/s] 181it [00:18, 9.92it/s] 182it [00:18, 9.92it/s] 183it [00:18, 9.39it/s] 185it [00:19, 9.65it/s] 186it [00:19, 9.50it/s] 187it [00:19, 9.59it/s] 188it [00:19, 9.68it/s] 189it [00:19, 9.76it/s] 190it [00:19, 9.82it/s] 191it [00:19, 9.87it/s] 192it [00:19, 9.89it/s] 193it [00:19, 9.90it/s] 195it [00:20, 9.62it/s] 196it [00:20, 9.36it/s] 196it [00:20, 9.66it/s] +2025-05-26 03:22:37,105 - INFO - Epoch: 22, Objective: tensor([8000.1289], device='cuda:0', grad_fn=), Loss: 0.06485095620155334, KL/n: 72.75353240966797 + 0it [00:00, ?it/s]2025-05-26 03:22:37,382 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 10706.0791 | mean log_px -0.1055 | KL -3565.08 + 1it [00:00, 5.23it/s] 2it [00:00, 6.72it/s] 4it [00:00, 8.49it/s] 6it [00:00, 9.16it/s] 8it [00:00, 9.51it/s] 10it [00:01, 9.70it/s] 12it [00:01, 9.78it/s] 14it [00:01, 9.87it/s] 16it [00:01, 9.93it/s] 18it [00:01, 9.78it/s] 19it [00:02, 9.46it/s] 20it [00:02, 9.55it/s] 21it [00:02, 9.64it/s] 22it [00:02, 9.65it/s] 23it [00:02, 9.05it/s] 24it [00:02, 9.27it/s] 25it [00:02, 9.41it/s] 26it [00:02, 9.56it/s] 28it [00:02, 9.75it/s] 29it [00:03, 9.81it/s] 30it [00:03, 9.85it/s] 32it [00:03, 9.47it/s] 33it [00:03, 9.54it/s] 34it [00:03, 9.62it/s] 35it [00:03, 9.70it/s] 36it [00:03, 9.32it/s] 37it [00:03, 9.47it/s] 38it [00:04, 9.61it/s] 40it [00:04, 9.82it/s] 42it [00:04, 9.56it/s] 44it [00:04, 9.72it/s] 46it [00:04, 9.82it/s] 48it [00:05, 9.86it/s] 50it [00:05, 9.92it/s]2025-05-26 03:22:42,531 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 6445.8760 | mean log_px -0.0427 | KL -3562.69 + 51it [00:05, 9.53it/s] 52it [00:05, 9.62it/s] 54it [00:05, 9.78it/s] 55it [00:05, 9.82it/s] 56it [00:05, 9.85it/s] 57it [00:05, 9.88it/s] 58it [00:06, 9.88it/s] 59it [00:06, 9.91it/s] 61it [00:06, 9.96it/s] 62it [00:06, 9.54it/s] 64it [00:06, 9.74it/s] 65it [00:06, 9.80it/s] 66it [00:06, 9.84it/s] 67it [00:06, 9.87it/s] 68it [00:07, 9.90it/s] 70it [00:07, 9.48it/s] 71it [00:07, 9.60it/s] 73it [00:07, 9.34it/s] 74it [00:07, 9.46it/s] 76it [00:07, 9.68it/s] 78it [00:08, 9.80it/s] 80it [00:08, 9.88it/s] 82it [00:08, 9.94it/s] 84it [00:08, 9.96it/s] 86it [00:08, 9.99it/s] 88it [00:09, 10.00it/s] 90it [00:09, 9.68it/s] 92it [00:09, 9.80it/s] 94it [00:09, 9.87it/s] 95it [00:09, 9.59it/s] 96it [00:09, 9.66it/s] 97it [00:10, 9.65it/s] 98it [00:10, 9.72it/s] 99it [00:10, 9.79it/s]2025-05-26 03:22:47,656 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 9278.5117 | mean log_px -0.0849 | KL -3567.39 + 101it [00:10, 9.39it/s] 102it [00:10, 9.50it/s] 104it [00:10, 9.72it/s] 106it [00:10, 9.86it/s] 108it [00:11, 9.91it/s] 109it [00:11, 9.49it/s] 110it [00:11, 9.59it/s] 111it [00:11, 9.68it/s] 112it [00:11, 9.69it/s] 113it [00:11, 9.77it/s] 114it [00:11, 9.76it/s] 115it [00:11, 9.21it/s] 116it [00:12, 9.41it/s] 118it [00:12, 9.69it/s] 119it [00:12, 9.76it/s] 120it [00:12, 9.38it/s] 122it [00:12, 9.66it/s] 124it [00:12, 9.80it/s] 126it [00:13, 9.88it/s] 128it [00:13, 9.58it/s] 129it [00:13, 9.65it/s] 130it [00:13, 9.71it/s] 131it [00:13, 9.29it/s] 132it [00:13, 9.46it/s] 134it [00:13, 9.67it/s] 135it [00:14, 9.73it/s] 137it [00:14, 9.86it/s] 139it [00:14, 9.94it/s] 141it [00:14, 9.99it/s] 143it [00:14, 10.02it/s] 144it [00:14, 10.01it/s] 146it [00:15, 10.02it/s] 148it [00:15, 9.72it/s] 150it [00:15, 9.83it/s]2025-05-26 03:22:52,805 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 9398.9590 | mean log_px -0.0833 | KL -3566.49 + 151it [00:15, 9.45it/s] 152it [00:15, 9.55it/s] 154it [00:15, 9.74it/s] 156it [00:16, 9.86it/s] 158it [00:16, 9.55it/s] 160it [00:16, 9.71it/s] 162it [00:16, 9.83it/s] 164it [00:16, 9.89it/s] 166it [00:17, 9.93it/s] 167it [00:17, 9.55it/s] 168it [00:17, 9.64it/s] 169it [00:17, 9.70it/s] 170it [00:17, 9.77it/s] 172it [00:17, 9.86it/s] 174it [00:17, 9.93it/s] 175it [00:18, 9.93it/s] 176it [00:18, 9.45it/s] 177it [00:18, 9.57it/s] 178it [00:18, 9.66it/s] 179it [00:18, 9.75it/s] 180it [00:18, 9.82it/s] 181it [00:18, 9.23it/s] 182it [00:18, 9.43it/s] 184it [00:19, 9.68it/s] 185it [00:19, 9.76it/s] 186it [00:19, 9.30it/s] 187it [00:19, 9.47it/s] 188it [00:19, 9.59it/s] 190it [00:19, 9.77it/s] 191it [00:19, 9.26it/s] 192it [00:19, 9.13it/s] 193it [00:19, 9.17it/s] 194it [00:20, 9.31it/s] 195it [00:20, 8.63it/s] 196it [00:20, 9.61it/s] +2025-05-26 03:22:57,623 - INFO - Epoch: 23, Objective: tensor([7036.1016], device='cuda:0', grad_fn=), Loss: 0.05605386570096016, KL/n: 72.70604705810547 + 0it [00:00, ?it/s]2025-05-26 03:22:58,074 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 10053.7881 | mean log_px -0.0965 | KL -3562.36 + 1it [00:00, 5.49it/s] 2it [00:00, 7.38it/s] 3it [00:00, 8.38it/s] 5it [00:00, 9.30it/s] 6it [00:00, 9.49it/s] 7it [00:00, 9.55it/s] 8it [00:00, 9.68it/s] 9it [00:00, 9.76it/s] 10it [00:01, 9.82it/s] 11it [00:01, 9.88it/s] 12it [00:01, 9.22it/s] 13it [00:01, 9.40it/s] 14it [00:01, 9.55it/s] 15it [00:01, 9.66it/s] 16it [00:01, 9.72it/s] 17it [00:01, 9.79it/s] 18it [00:01, 9.84it/s] 19it [00:02, 9.88it/s] 20it [00:02, 9.90it/s] 21it [00:02, 9.27it/s] 22it [00:02, 9.45it/s] 23it [00:02, 9.60it/s] 24it [00:02, 9.07it/s] 25it [00:02, 9.32it/s] 26it [00:02, 9.37it/s] 27it [00:02, 9.31it/s] 28it [00:02, 9.25it/s] 29it [00:03, 8.70it/s] 30it [00:03, 9.01it/s] 32it [00:03, 9.43it/s] 33it [00:03, 9.55it/s] 34it [00:03, 9.63it/s] 35it [00:03, 9.71it/s] 36it [00:03, 9.75it/s] 37it [00:03, 9.81it/s] 38it [00:04, 9.84it/s] 39it [00:04, 9.86it/s] 40it [00:04, 9.67it/s] 41it [00:04, 9.35it/s] 42it [00:04, 9.48it/s] 43it [00:04, 9.48it/s] 44it [00:04, 9.47it/s] 45it [00:04, 9.49it/s] 46it [00:04, 9.11it/s] 47it [00:04, 9.25it/s] 48it [00:05, 9.28it/s] 49it [00:05, 9.40it/s] 50it [00:05, 9.40it/s]2025-05-26 03:23:03,311 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 7944.3613 | mean log_px -0.0672 | KL -3565.10 + 51it [00:05, 9.46it/s] 52it [00:05, 9.49it/s] 53it [00:05, 9.09it/s] 54it [00:05, 9.20it/s] 55it [00:05, 9.31it/s] 56it [00:05, 9.37it/s] 57it [00:06, 9.41it/s] 58it [00:06, 9.50it/s] 59it [00:06, 8.97it/s] 60it [00:06, 9.11it/s] 61it [00:06, 9.24it/s] 62it [00:06, 9.28it/s] 63it [00:06, 9.18it/s] 64it [00:06, 9.24it/s] 65it [00:06, 9.24it/s] 66it [00:07, 8.76it/s] 67it [00:07, 9.00it/s] 68it [00:07, 9.17it/s] 69it [00:07, 9.30it/s] 70it [00:07, 9.41it/s] 71it [00:07, 9.47it/s] 72it [00:07, 9.47it/s] 73it [00:07, 9.49it/s] 74it [00:07, 9.46it/s] 75it [00:08, 9.55it/s] 76it [00:08, 9.62it/s] 77it [00:08, 9.63it/s] 78it [00:08, 9.62it/s] 79it [00:08, 9.12it/s] 80it [00:08, 9.22it/s] 81it [00:08, 9.31it/s] 82it [00:08, 9.35it/s] 83it [00:08, 9.42it/s] 84it [00:08, 9.46it/s] 85it [00:09, 9.51it/s] 86it [00:09, 9.50it/s] 87it [00:09, 9.52it/s] 88it [00:09, 9.50it/s] 89it [00:09, 9.57it/s] 90it [00:09, 9.56it/s] 91it [00:09, 9.56it/s] 92it [00:09, 9.55it/s] 93it [00:09, 9.54it/s] 94it [00:10, 9.55it/s] 95it [00:10, 9.59it/s] 96it [00:10, 9.56it/s] 97it [00:10, 9.56it/s] 98it [00:10, 9.54it/s] 99it [00:10, 9.53it/s] 100it [00:10, 9.54it/s]2025-05-26 03:23:08,633 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 6554.0537 | mean log_px -0.0452 | KL -3559.28 + 101it [00:10, 9.55it/s] 102it [00:10, 9.53it/s] 103it [00:10, 9.54it/s] 104it [00:11, 9.01it/s] 105it [00:11, 9.14it/s] 106it [00:11, 9.22it/s] 107it [00:11, 9.37it/s] 108it [00:11, 9.41it/s] 109it [00:11, 9.48it/s] 110it [00:11, 9.48it/s] 111it [00:11, 9.46it/s] 112it [00:11, 9.53it/s] 113it [00:12, 9.03it/s] 114it [00:12, 9.14it/s] 115it [00:12, 9.27it/s] 116it [00:12, 9.32it/s] 117it [00:12, 9.35it/s] 118it [00:12, 9.34it/s] 119it [00:12, 9.15it/s] 120it [00:12, 8.75it/s] 121it [00:12, 8.95it/s] 122it [00:13, 9.07it/s] 123it [00:13, 8.74it/s] 124it [00:13, 8.87it/s] 125it [00:13, 9.07it/s] 126it [00:13, 9.15it/s] 127it [00:13, 8.78it/s] 128it [00:13, 8.97it/s] 129it [00:13, 9.07it/s] 130it [00:13, 9.17it/s] 131it [00:14, 8.81it/s] 132it [00:14, 8.99it/s] 133it [00:14, 9.15it/s] 134it [00:14, 9.24it/s] 135it [00:14, 8.84it/s] 136it [00:14, 8.94it/s] 137it [00:14, 9.10it/s] 138it [00:14, 9.22it/s] 139it [00:14, 8.83it/s] 140it [00:15, 9.06it/s] 141it [00:15, 9.16it/s] 142it [00:15, 9.26it/s] 143it [00:15, 8.85it/s] 144it [00:15, 9.07it/s] 145it [00:15, 9.22it/s] 146it [00:15, 8.83it/s] 147it [00:15, 9.03it/s] 148it [00:15, 9.13it/s] 149it [00:16, 9.27it/s] 150it [00:16, 8.82it/s]2025-05-26 03:23:14,131 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 11166.3877 | mean log_px -0.1161 | KL -3563.05 + 151it [00:16, 9.01it/s] 152it [00:16, 8.71it/s] 153it [00:16, 8.91it/s] 154it [00:16, 9.06it/s] 155it [00:16, 9.11it/s] 156it [00:16, 8.74it/s] 157it [00:16, 8.95it/s] 158it [00:17, 9.09it/s] 159it [00:17, 9.22it/s] 160it [00:17, 8.84it/s] 161it [00:17, 8.99it/s] 162it [00:17, 9.10it/s] 163it [00:17, 9.23it/s] 164it [00:17, 8.82it/s] 165it [00:17, 9.04it/s] 166it [00:17, 9.14it/s] 167it [00:18, 9.22it/s] 168it [00:18, 8.85it/s] 169it [00:18, 9.06it/s] 170it [00:18, 9.18it/s] 171it [00:18, 9.30it/s] 172it [00:18, 8.86it/s] 173it [00:18, 9.03it/s] 174it [00:18, 9.19it/s] 175it [00:18, 9.29it/s] 176it [00:19, 8.90it/s] 177it [00:19, 9.03it/s] 178it [00:19, 9.17it/s] 179it [00:19, 9.17it/s] 180it [00:19, 8.81it/s] 181it [00:19, 8.98it/s] 182it [00:19, 9.15it/s] 183it [00:19, 9.19it/s] 184it [00:19, 8.82it/s] 185it [00:20, 9.01it/s] 186it [00:20, 9.10it/s] 187it [00:20, 8.76it/s] 188it [00:20, 8.92it/s] 189it [00:20, 9.08it/s] 190it [00:20, 9.24it/s] 191it [00:20, 8.86it/s] 192it [00:20, 9.04it/s] 193it [00:20, 9.17it/s] 194it [00:20, 9.29it/s] 195it [00:21, 8.80it/s] 196it [00:21, 8.67it/s] 196it [00:21, 9.21it/s] +2025-05-26 03:23:19,223 - INFO - Epoch: 24, Objective: tensor([7781.2070], device='cuda:0', grad_fn=), Loss: 0.06895510107278824, KL/n: 72.64373779296875 + 0it [00:00, ?it/s]2025-05-26 03:23:19,501 - INFO - [Epoch 025 | Batch 0000] IWAE-loss 5908.9863 | mean log_px -0.0345 | KL -3553.46 + 1it [00:00, 5.41it/s] 2it [00:00, 7.17it/s] 3it [00:00, 8.13it/s] 4it [00:00, 8.62it/s] 5it [00:00, 8.93it/s] 6it [00:00, 9.16it/s] 7it [00:00, 9.26it/s] 8it [00:00, 9.34it/s] 9it [00:01, 9.42it/s] 10it [00:01, 9.44it/s] 11it [00:01, 9.47it/s] 12it [00:01, 9.43it/s] 13it [00:01, 9.45it/s] 14it [00:01, 9.44it/s] 15it [00:01, 9.44it/s] 16it [00:01, 9.44it/s] 17it [00:01, 9.49it/s] 18it [00:01, 9.47it/s] 19it [00:02, 9.48it/s] 20it [00:02, 9.22it/s] 21it [00:02, 9.24it/s] 22it [00:02, 9.29it/s] 23it [00:02, 8.85it/s] 24it [00:02, 9.05it/s] 25it [00:02, 9.16it/s] 26it [00:02, 9.26it/s] 27it [00:02, 9.29it/s] 28it [00:03, 9.39it/s] 29it [00:03, 9.47it/s] 30it [00:03, 8.95it/s] 31it [00:03, 9.11it/s] 32it [00:03, 9.18it/s] 33it [00:03, 9.30it/s] 34it [00:03, 9.31it/s] 35it [00:03, 8.86it/s] 36it [00:03, 9.05it/s] 37it [00:04, 9.19it/s] 38it [00:04, 9.29it/s] 39it [00:04, 9.36it/s] 40it [00:04, 9.37it/s] 41it [00:04, 9.39it/s] 42it [00:04, 9.39it/s] 43it [00:04, 9.45it/s] 44it [00:04, 9.40it/s] 45it [00:04, 9.48it/s] 46it [00:04, 9.49it/s] 47it [00:05, 9.48it/s] 48it [00:05, 9.48it/s] 49it [00:05, 8.94it/s] 50it [00:05, 9.11it/s]2025-05-26 03:23:24,866 - INFO - [Epoch 025 | Batch 0050] IWAE-loss 5141.8364 | mean log_px -0.0226 | KL -3558.55 + 51it [00:05, 9.18it/s] 52it [00:05, 9.27it/s] 53it [00:05, 9.34it/s] 54it [00:05, 9.30it/s] 55it [00:05, 8.84it/s] 56it [00:06, 9.03it/s] 57it [00:06, 9.20it/s] 58it [00:06, 9.27it/s] 59it [00:06, 9.40it/s] 60it [00:06, 9.49it/s] 61it [00:06, 9.57it/s] 62it [00:06, 9.60it/s] 63it [00:06, 9.64it/s] 64it [00:06, 9.64it/s] 65it [00:07, 9.68it/s] 66it [00:07, 9.65it/s] 67it [00:07, 9.59it/s] 68it [00:07, 9.58it/s] 69it [00:07, 9.63it/s] 70it [00:07, 9.66it/s] 71it [00:07, 9.67it/s] 72it [00:07, 9.67it/s] 73it [00:07, 9.67it/s] 74it [00:07, 9.67it/s] 75it [00:08, 9.68it/s] 76it [00:08, 9.69it/s] 77it [00:08, 9.72it/s] 78it [00:08, 9.71it/s] 79it [00:08, 9.71it/s] 80it [00:08, 9.71it/s] 81it [00:08, 9.71it/s] 82it [00:08, 9.70it/s] 83it [00:08, 9.71it/s] 84it [00:08, 9.60it/s] 85it [00:09, 9.41it/s] 86it [00:09, 9.30it/s] 87it [00:09, 9.38it/s] 88it [00:09, 9.44it/s] 89it [00:09, 9.53it/s] 90it [00:09, 9.54it/s] 91it [00:09, 9.58it/s] 92it [00:09, 9.55it/s] 93it [00:09, 9.56it/s] 94it [00:10, 9.63it/s] 95it [00:10, 9.69it/s] 96it [00:10, 9.68it/s] 97it [00:10, 9.72it/s] 98it [00:10, 9.69it/s] 99it [00:10, 9.74it/s] 100it [00:10, 9.66it/s]2025-05-26 03:23:30,090 - INFO - [Epoch 025 | Batch 0100] IWAE-loss 6209.9375 | mean log_px -0.0399 | KL -3555.98 + 101it [00:10, 9.62it/s] 102it [00:10, 9.59it/s] 103it [00:10, 9.58it/s] 104it [00:11, 9.53it/s] 105it [00:11, 9.54it/s] 106it [00:11, 9.50it/s] 107it [00:11, 9.50it/s] 108it [00:11, 9.52it/s] 109it [00:11, 9.55it/s] 110it [00:11, 9.53it/s] 111it [00:11, 9.55it/s] 112it [00:11, 9.52it/s] 113it [00:12, 9.51it/s] 114it [00:12, 9.49it/s] 115it [00:12, 9.46it/s] 116it [00:12, 9.47it/s] 117it [00:12, 9.48it/s] 118it [00:12, 9.48it/s] 119it [00:12, 9.49it/s] 120it [00:12, 9.50it/s] 121it [00:12, 9.54it/s] 122it [00:12, 9.51it/s] 123it [00:13, 9.51it/s] 124it [00:13, 9.50it/s] 125it [00:13, 9.53it/s] 126it [00:13, 9.52it/s] 127it [00:13, 9.45it/s] 128it [00:13, 9.49it/s] 129it [00:13, 9.57it/s] 130it [00:13, 9.37it/s] 131it [00:13, 9.43it/s] 132it [00:14, 9.47it/s] 133it [00:14, 9.50it/s] 134it [00:14, 9.51it/s] 135it [00:14, 9.53it/s] 136it [00:14, 9.55it/s] 137it [00:14, 9.61it/s] 138it [00:14, 9.60it/s] 139it [00:14, 9.55it/s] 140it [00:14, 9.55it/s] 141it [00:14, 9.53it/s] 142it [00:15, 9.54it/s] 143it [00:15, 9.55it/s] 144it [00:15, 9.55it/s] 145it [00:15, 9.54it/s] 146it [00:15, 9.51it/s] 147it [00:15, 9.58it/s] 148it [00:15, 9.62it/s] 149it [00:15, 9.53it/s] 150it [00:15, 9.53it/s]2025-05-26 03:23:35,343 - INFO - [Epoch 025 | Batch 0150] IWAE-loss 8218.2256 | mean log_px -0.0712 | KL -3553.84 + 151it [00:16, 9.56it/s] 152it [00:16, 9.53it/s] 153it [00:16, 9.55it/s] 154it [00:16, 9.55it/s] 155it [00:16, 9.60it/s] 156it [00:16, 9.55it/s] 157it [00:16, 9.56it/s] 158it [00:16, 9.55it/s] 159it [00:16, 9.55it/s] 160it [00:16, 9.58it/s] 161it [00:17, 9.60it/s] 162it [00:17, 9.60it/s] 163it [00:17, 9.63it/s] 164it [00:17, 9.55it/s] 165it [00:17, 9.53it/s] 166it [00:17, 9.55it/s] 167it [00:17, 9.49it/s] 168it [00:17, 9.52it/s] 169it [00:17, 9.51it/s] 170it [00:18, 9.49it/s] 171it [00:18, 9.51it/s] 172it [00:18, 9.54it/s] 173it [00:18, 9.59it/s] 174it [00:18, 9.62it/s] 175it [00:18, 9.63it/s] 176it [00:18, 9.62it/s] 177it [00:18, 9.63it/s] 178it [00:18, 9.59it/s] 179it [00:18, 9.57it/s] 180it [00:19, 9.57it/s] 181it [00:19, 9.61it/s] 182it [00:19, 9.57it/s] 183it [00:19, 9.59it/s] 184it [00:19, 9.58it/s] 185it [00:19, 9.58it/s] 186it [00:19, 9.60it/s] 187it [00:19, 9.63it/s] 188it [00:19, 9.57it/s] 189it [00:19, 9.58it/s] 190it [00:20, 9.59it/s] 191it [00:20, 9.58it/s] 192it [00:20, 9.55it/s] 193it [00:20, 9.53it/s] 194it [00:20, 9.55it/s] 195it [00:20, 8.97it/s] 196it [00:20, 9.18it/s] 196it [00:20, 9.42it/s] +2025-05-26 03:23:40,167 - INFO - Epoch: 25, Objective: tensor([8688.2051], device='cuda:0', grad_fn=), Loss: 0.08251015841960907, KL/n: 72.58772277832031 + 0it [00:00, ?it/s]2025-05-26 03:23:40,630 - INFO - [Epoch 026 | Batch 0000] IWAE-loss 7151.1875 | mean log_px -0.0637 | KL -3554.05 + 1it [00:00, 5.20it/s] 2it [00:00, 6.40it/s] 3it [00:00, 7.52it/s] 4it [00:00, 8.13it/s] 5it [00:00, 8.59it/s] 6it [00:00, 8.79it/s] 7it [00:00, 9.01it/s] 8it [00:00, 9.18it/s] 9it [00:01, 9.28it/s] 10it [00:01, 9.32it/s] 11it [00:01, 8.97it/s] 12it [00:01, 9.12it/s] 13it [00:01, 9.22it/s] 14it [00:01, 9.31it/s] 15it [00:01, 9.37it/s] 16it [00:01, 9.40it/s] 17it [00:01, 9.46it/s] 18it [00:02, 9.44it/s] 19it [00:02, 9.44it/s] 20it [00:02, 9.46it/s] 21it [00:02, 9.47it/s] 22it [00:02, 9.47it/s] 23it [00:02, 9.47it/s] 24it [00:02, 9.45it/s] 25it [00:02, 9.50it/s] 26it [00:02, 9.45it/s] 27it [00:02, 9.44it/s] 28it [00:03, 9.45it/s] 29it [00:03, 9.45it/s] 30it [00:03, 9.46it/s] 31it [00:03, 9.52it/s] 32it [00:03, 9.48it/s] 33it [00:03, 9.48it/s] 34it [00:03, 9.45it/s] 35it [00:03, 8.88it/s] 36it [00:03, 9.06it/s] 37it [00:04, 9.17it/s] 38it [00:04, 9.20it/s] 39it [00:04, 9.23it/s] 40it [00:04, 9.27it/s] 41it [00:04, 9.31it/s] 42it [00:04, 9.32it/s] 43it [00:04, 9.34it/s] 44it [00:04, 9.37it/s] 45it [00:04, 8.97it/s] 46it [00:05, 9.07it/s] 47it [00:05, 9.19it/s] 48it [00:05, 9.27it/s] 49it [00:05, 9.34it/s] 50it [00:05, 9.33it/s]2025-05-26 03:23:46,015 - INFO - [Epoch 026 | Batch 0050] IWAE-loss 8084.2090 | mean log_px -0.0655 | KL -3553.26 + 51it [00:05, 9.05it/s] 52it [00:05, 8.92it/s] 53it [00:05, 9.06it/s] 54it [00:05, 9.15it/s] 55it [00:06, 9.25it/s] 56it [00:06, 9.33it/s] 57it [00:06, 9.31it/s] 58it [00:06, 9.31it/s] 59it [00:06, 9.34it/s] 60it [00:06, 9.39it/s] 61it [00:06, 9.36it/s] 62it [00:06, 9.23it/s] 63it [00:06, 9.30it/s] 64it [00:06, 9.36it/s] 65it [00:07, 9.40it/s] 66it [00:07, 9.41it/s] 67it [00:07, 9.45it/s] 68it [00:07, 9.44it/s] 69it [00:07, 9.44it/s] 70it [00:07, 9.42it/s] 71it [00:07, 9.44it/s] 72it [00:07, 9.44it/s] 73it [00:07, 9.43it/s] 74it [00:08, 9.41it/s] 75it [00:08, 8.89it/s] 76it [00:08, 9.05it/s] 77it [00:08, 9.18it/s] 78it [00:08, 9.23it/s] 79it [00:08, 9.30it/s] 80it [00:08, 9.31it/s] 81it [00:08, 8.96it/s] 82it [00:08, 9.06it/s] 83it [00:09, 9.21it/s] 84it [00:09, 9.27it/s] 85it [00:09, 9.36it/s] 86it [00:09, 9.35it/s] 87it [00:09, 8.86it/s] 88it [00:09, 8.99it/s] 89it [00:09, 9.11it/s] 90it [00:09, 9.22it/s] 91it [00:09, 9.29it/s] 92it [00:09, 9.38it/s] 93it [00:10, 9.48it/s] 94it [00:10, 9.46it/s] 95it [00:10, 9.47it/s] 96it [00:10, 9.45it/s] 97it [00:10, 9.49it/s] 98it [00:10, 9.48it/s] 99it [00:10, 9.48it/s] 100it [00:10, 9.47it/s]2025-05-26 03:23:51,385 - INFO - [Epoch 026 | Batch 0100] IWAE-loss 6382.7183 | mean log_px -0.0501 | KL -3556.70 + 101it [00:10, 9.49it/s] 102it [00:11, 9.46it/s] 103it [00:11, 9.49it/s] 104it [00:11, 9.50it/s] 105it [00:11, 8.99it/s] 106it [00:11, 9.13it/s] 107it [00:11, 9.23it/s] 108it [00:11, 9.28it/s] 109it [00:11, 9.36it/s] 110it [00:11, 8.86it/s] 111it [00:12, 9.02it/s] 112it [00:12, 9.20it/s] 113it [00:12, 9.29it/s] 114it [00:12, 9.36it/s] 115it [00:12, 9.42it/s] 116it [00:12, 9.45it/s] 117it [00:12, 9.05it/s] 118it [00:12, 9.16it/s] 119it [00:12, 9.22it/s] 120it [00:13, 9.28it/s] 121it [00:13, 9.34it/s] 122it [00:13, 9.35it/s] 123it [00:13, 9.41it/s] 124it [00:13, 9.43it/s] 125it [00:13, 9.49it/s] 126it [00:13, 8.96it/s] 127it [00:13, 9.10it/s] 128it [00:13, 9.11it/s] 129it [00:13, 9.20it/s] 130it [00:14, 9.25it/s] 131it [00:14, 8.71it/s] 132it [00:14, 8.86it/s] 133it [00:14, 9.09it/s] 134it [00:14, 9.16it/s] 135it [00:14, 8.74it/s] 136it [00:14, 8.93it/s] 137it [00:14, 9.12it/s] 138it [00:14, 9.18it/s] 139it [00:15, 9.28it/s] 140it [00:15, 9.20it/s] 141it [00:15, 9.33it/s] 142it [00:15, 9.35it/s] 143it [00:15, 9.38it/s] 144it [00:15, 9.41it/s] 145it [00:15, 9.41it/s] 146it [00:15, 9.44it/s] 147it [00:15, 9.43it/s] 148it [00:16, 9.45it/s] 149it [00:16, 9.51it/s] 150it [00:16, 9.49it/s]2025-05-26 03:23:56,795 - INFO - [Epoch 026 | Batch 0150] IWAE-loss 8474.0977 | mean log_px -0.0783 | KL -3551.70 + 151it [00:16, 8.89it/s] 152it [00:16, 9.05it/s] 153it [00:16, 9.18it/s] 154it [00:16, 9.24it/s] 155it [00:16, 9.31it/s] 156it [00:16, 9.34it/s] 157it [00:17, 9.36it/s] 158it [00:17, 9.33it/s] 159it [00:17, 9.39it/s] 160it [00:17, 9.42it/s] 161it [00:17, 9.40it/s] 162it [00:17, 9.44it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.52it/s] 165it [00:17, 9.49it/s] 166it [00:17, 9.43it/s] 167it [00:18, 9.45it/s] 168it [00:18, 9.49it/s] 169it [00:18, 9.43it/s] 170it [00:18, 9.40it/s] 171it [00:18, 9.43it/s] 172it [00:18, 9.43it/s] 173it [00:18, 9.41it/s] 174it [00:18, 9.36it/s] 175it [00:18, 8.87it/s] 176it [00:19, 9.00it/s] 177it [00:19, 9.09it/s] 178it [00:19, 9.02it/s] 179it [00:19, 8.93it/s] 180it [00:19, 8.53it/s] 181it [00:19, 8.75it/s] 182it [00:19, 8.93it/s] 183it [00:19, 9.11it/s] 184it [00:19, 9.15it/s] 185it [00:20, 9.22it/s] 186it [00:20, 9.24it/s] 187it [00:20, 9.35it/s] 188it [00:20, 9.35it/s] 189it [00:20, 9.38it/s] 190it [00:20, 8.96it/s] 191it [00:20, 9.11it/s] 192it [00:20, 9.23it/s] 193it [00:20, 9.30it/s] 194it [00:21, 9.36it/s] 195it [00:21, 8.79it/s] 196it [00:21, 9.06it/s] 196it [00:21, 9.19it/s] +2025-05-26 03:24:01,798 - INFO - Epoch: 26, Objective: tensor([10124.8457], device='cuda:0', grad_fn=), Loss: 0.10262526571750641, KL/n: 72.52192687988281 + 0it [00:00, ?it/s]2025-05-26 03:24:02,056 - INFO - [Epoch 027 | Batch 0000] IWAE-loss 5660.2915 | mean log_px -0.0403 | KL -3550.19 + 1it [00:00, 6.06it/s] 2it [00:00, 7.61it/s] 3it [00:00, 8.37it/s] 4it [00:00, 8.78it/s] 5it [00:00, 9.03it/s] 6it [00:00, 9.24it/s] 7it [00:00, 9.29it/s] 8it [00:00, 9.34it/s] 9it [00:01, 9.37it/s] 10it [00:01, 9.40it/s] 11it [00:01, 9.39it/s] 12it [00:01, 9.41it/s] 13it [00:01, 9.42it/s] 14it [00:01, 9.45it/s] 15it [00:01, 9.48it/s] 16it [00:01, 9.39it/s] 17it [00:01, 9.39it/s] 18it [00:01, 9.43it/s] 19it [00:02, 9.47it/s] 20it [00:02, 9.44it/s] 21it [00:02, 9.40it/s] 22it [00:02, 9.43it/s] 23it [00:02, 9.43it/s] 24it [00:02, 9.44it/s] 25it [00:02, 9.50it/s] 26it [00:02, 9.45it/s] 27it [00:02, 9.39it/s] 28it [00:03, 9.37it/s] 29it [00:03, 9.42it/s] 30it [00:03, 9.39it/s] 31it [00:03, 8.93it/s] 32it [00:03, 9.09it/s] 33it [00:03, 9.25it/s] 34it [00:03, 9.30it/s] 35it [00:03, 9.24it/s] 36it [00:03, 9.28it/s] 37it [00:03, 9.35it/s] 38it [00:04, 9.36it/s] 39it [00:04, 9.36it/s] 40it [00:04, 9.38it/s] 41it [00:04, 9.44it/s] 42it [00:04, 9.42it/s] 43it [00:04, 9.44it/s] 44it [00:04, 9.43it/s] 45it [00:04, 8.97it/s] 46it [00:04, 9.11it/s] 47it [00:05, 9.08it/s] 48it [00:05, 9.22it/s] 49it [00:05, 9.35it/s] 50it [00:05, 9.32it/s]2025-05-26 03:24:07,395 - INFO - [Epoch 027 | Batch 0050] IWAE-loss 7041.8789 | mean log_px -0.0514 | KL -3547.65 + 51it [00:05, 8.89it/s] 52it [00:05, 9.03it/s] 53it [00:05, 9.16it/s] 54it [00:05, 9.25it/s] 55it [00:05, 9.30it/s] 56it [00:06, 9.31it/s] 57it [00:06, 9.42it/s] 58it [00:06, 9.44it/s] 59it [00:06, 9.44it/s] 60it [00:06, 9.46it/s] 61it [00:06, 9.50it/s] 62it [00:06, 9.46it/s] 63it [00:06, 9.48it/s] 64it [00:06, 9.44it/s] 65it [00:07, 9.42it/s] 66it [00:07, 9.42it/s] 67it [00:07, 8.99it/s] 68it [00:07, 9.08it/s] 69it [00:07, 9.20it/s] 70it [00:07, 9.26it/s] 71it [00:07, 9.34it/s] 72it [00:07, 9.38it/s] 73it [00:07, 9.43it/s] 74it [00:07, 9.50it/s] 75it [00:08, 9.52it/s] 76it [00:08, 9.50it/s] 77it [00:08, 9.50it/s] 78it [00:08, 9.49it/s] 79it [00:08, 9.50it/s] 80it [00:08, 9.50it/s] 81it [00:08, 9.50it/s] 82it [00:08, 9.49it/s] 83it [00:08, 9.43it/s] 84it [00:09, 9.41it/s] 85it [00:09, 9.46it/s] 86it [00:09, 9.51it/s] 87it [00:09, 9.48it/s] 88it [00:09, 9.45it/s] 89it [00:09, 9.42it/s] 90it [00:09, 9.40it/s] 91it [00:09, 9.44it/s] 92it [00:09, 9.44it/s] 93it [00:09, 9.45it/s] 94it [00:10, 9.44it/s] 95it [00:10, 9.46it/s] 96it [00:10, 9.42it/s] 97it [00:10, 9.44it/s] 98it [00:10, 9.42it/s] 99it [00:10, 9.43it/s] 100it [00:10, 9.45it/s]2025-05-26 03:24:12,720 - INFO - [Epoch 027 | Batch 0100] IWAE-loss 7957.1924 | mean log_px -0.0696 | KL -3551.78 + 101it [00:10, 9.41it/s] 102it [00:10, 9.43it/s] 103it [00:11, 9.42it/s] 104it [00:11, 9.41it/s] 105it [00:11, 9.46it/s] 106it [00:11, 9.46it/s] 107it [00:11, 9.49it/s] 108it [00:11, 9.13it/s] 109it [00:11, 9.27it/s] 110it [00:11, 9.32it/s] 111it [00:11, 9.36it/s] 112it [00:12, 9.39it/s] 113it [00:12, 9.42it/s] 114it [00:12, 9.14it/s] 115it [00:12, 9.26it/s] 116it [00:12, 9.33it/s] 117it [00:12, 8.90it/s] 118it [00:12, 9.03it/s] 119it [00:12, 9.19it/s] 120it [00:12, 9.25it/s] 121it [00:12, 9.33it/s] 122it [00:13, 9.38it/s] 123it [00:13, 9.43it/s] 124it [00:13, 9.44it/s] 125it [00:13, 8.95it/s] 126it [00:13, 9.12it/s] 127it [00:13, 9.27it/s] 128it [00:13, 8.86it/s] 129it [00:13, 9.07it/s] 130it [00:13, 9.16it/s] 131it [00:14, 9.24it/s] 132it [00:14, 9.32it/s] 133it [00:14, 9.37it/s] 134it [00:14, 9.40it/s] 135it [00:14, 9.40it/s] 136it [00:14, 9.43it/s] 137it [00:14, 9.37it/s] 138it [00:14, 9.39it/s] 139it [00:14, 9.43it/s] 140it [00:15, 9.45it/s] 141it [00:15, 9.46it/s] 142it [00:15, 9.45it/s] 143it [00:15, 9.46it/s] 144it [00:15, 9.44it/s] 145it [00:15, 9.41it/s] 146it [00:15, 9.41it/s] 147it [00:15, 9.46it/s] 148it [00:15, 9.57it/s] 149it [00:15, 9.66it/s] 150it [00:16, 9.69it/s]2025-05-26 03:24:18,068 - INFO - [Epoch 027 | Batch 0150] IWAE-loss 7002.5981 | mean log_px -0.0568 | KL -3547.20 + 151it [00:16, 9.71it/s] 152it [00:16, 9.73it/s] 153it [00:16, 9.77it/s] 154it [00:16, 9.65it/s] 155it [00:16, 9.69it/s] 156it [00:16, 9.73it/s] 157it [00:16, 9.78it/s] 158it [00:16, 9.81it/s] 159it [00:16, 9.84it/s] 160it [00:17, 9.84it/s] 161it [00:17, 9.85it/s] 162it [00:17, 9.83it/s] 163it [00:17, 9.83it/s] 164it [00:17, 9.83it/s] 165it [00:17, 9.85it/s] 166it [00:17, 9.30it/s] 167it [00:17, 9.27it/s] 168it [00:17, 9.38it/s] 169it [00:18, 9.52it/s] 170it [00:18, 9.61it/s] 171it [00:18, 9.11it/s] 172it [00:18, 9.31it/s] 173it [00:18, 9.49it/s] 174it [00:18, 9.60it/s] 175it [00:18, 9.68it/s] 176it [00:18, 9.74it/s] 177it [00:18, 9.77it/s] 178it [00:18, 9.79it/s] 179it [00:19, 9.81it/s] 180it [00:19, 9.82it/s] 181it [00:19, 9.83it/s] 182it [00:19, 9.80it/s] 183it [00:19, 9.79it/s] 184it [00:19, 9.81it/s] 185it [00:19, 9.83it/s] 186it [00:19, 9.83it/s] 187it [00:19, 9.84it/s] 188it [00:19, 9.84it/s] 189it [00:20, 9.85it/s] 190it [00:20, 9.83it/s] 191it [00:20, 9.84it/s] 192it [00:20, 9.85it/s] 193it [00:20, 9.87it/s] 194it [00:20, 9.85it/s] 195it [00:20, 9.25it/s] 196it [00:20, 9.39it/s] +2025-05-26 03:24:22,812 - INFO - Epoch: 27, Objective: tensor([5026.2368], device='cuda:0', grad_fn=), Loss: 0.021482713520526886, KL/n: 72.46076965332031 + 0it [00:00, ?it/s]2025-05-26 03:24:23,269 - INFO - [Epoch 028 | Batch 0000] IWAE-loss 6144.6147 | mean log_px -0.0405 | KL -3548.91 + 1it [00:00, 2.72it/s] 2it [00:00, 4.70it/s] 3it [00:00, 6.19it/s] 4it [00:00, 7.25it/s] 5it [00:00, 8.03it/s] 6it [00:00, 8.57it/s] 7it [00:00, 8.96it/s] 8it [00:01, 9.22it/s] 9it [00:01, 9.43it/s] 10it [00:01, 8.93it/s] 11it [00:01, 9.19it/s] 12it [00:01, 9.38it/s] 13it [00:01, 9.54it/s] 14it [00:01, 9.62it/s] 15it [00:01, 9.67it/s] 16it [00:01, 9.23it/s] 17it [00:02, 9.41it/s] 18it [00:02, 9.50it/s] 19it [00:02, 9.60it/s] 20it [00:02, 9.65it/s] 21it [00:02, 9.72it/s] 22it [00:02, 9.75it/s] 23it [00:02, 9.80it/s] 24it [00:02, 9.21it/s] 25it [00:02, 9.41it/s] 26it [00:02, 9.53it/s] 27it [00:03, 9.60it/s] 28it [00:03, 9.66it/s] 29it [00:03, 9.72it/s] 30it [00:03, 9.76it/s] 31it [00:03, 9.80it/s] 32it [00:03, 9.81it/s] 33it [00:03, 9.84it/s] 34it [00:03, 9.82it/s] 35it [00:03, 9.83it/s] 36it [00:03, 9.83it/s] 37it [00:04, 9.85it/s] 38it [00:04, 9.85it/s] 39it [00:04, 9.84it/s] 40it [00:04, 9.83it/s] 41it [00:04, 9.85it/s] 42it [00:04, 9.84it/s] 43it [00:04, 9.24it/s] 44it [00:04, 9.37it/s] 45it [00:04, 9.52it/s] 46it [00:05, 9.60it/s] 47it [00:05, 9.68it/s] 48it [00:05, 9.71it/s] 49it [00:05, 9.72it/s] 50it [00:05, 9.73it/s]2025-05-26 03:24:28,440 - INFO - [Epoch 028 | Batch 0050] IWAE-loss 7022.5996 | mean log_px -0.0538 | KL -3548.01 + 51it [00:05, 9.75it/s] 52it [00:05, 9.77it/s] 53it [00:05, 9.79it/s] 54it [00:05, 9.79it/s] 55it [00:05, 9.81it/s] 56it [00:06, 9.79it/s] 57it [00:06, 9.81it/s] 58it [00:06, 9.77it/s] 59it [00:06, 9.82it/s] 60it [00:06, 9.39it/s] 61it [00:06, 9.53it/s] 62it [00:06, 9.61it/s] 63it [00:06, 9.54it/s] 64it [00:06, 9.60it/s] 65it [00:06, 9.67it/s] 66it [00:07, 9.71it/s] 67it [00:07, 9.70it/s] 68it [00:07, 9.61it/s] 69it [00:07, 9.67it/s] 70it [00:07, 9.73it/s] 71it [00:07, 9.77it/s] 72it [00:07, 9.79it/s] 73it [00:07, 9.81it/s] 74it [00:07, 9.82it/s] 75it [00:08, 9.83it/s] 76it [00:08, 9.06it/s] 77it [00:08, 9.03it/s] 78it [00:08, 9.09it/s] 79it [00:08, 9.19it/s] 80it [00:08, 9.19it/s] 81it [00:08, 9.32it/s] 82it [00:08, 9.38it/s] 83it [00:08, 9.45it/s] 84it [00:08, 9.49it/s] 85it [00:09, 9.54it/s] 86it [00:09, 9.55it/s] 87it [00:09, 9.60it/s] 88it [00:09, 9.58it/s] 89it [00:09, 9.60it/s] 90it [00:09, 9.00it/s] 91it [00:09, 9.23it/s] 92it [00:09, 9.38it/s] 93it [00:09, 9.51it/s] 94it [00:10, 9.59it/s] 95it [00:10, 9.65it/s] 96it [00:10, 9.69it/s] 97it [00:10, 9.14it/s] 98it [00:10, 9.33it/s] 99it [00:10, 9.49it/s] 100it [00:10, 9.56it/s]2025-05-26 03:24:33,683 - INFO - [Epoch 028 | Batch 0100] IWAE-loss 7795.5220 | mean log_px -0.0668 | KL -3546.89 + 101it [00:10, 9.57it/s] 102it [00:10, 9.64it/s] 103it [00:10, 9.71it/s] 104it [00:11, 9.68it/s] 105it [00:11, 9.74it/s] 106it [00:11, 9.75it/s] 107it [00:11, 9.78it/s] 108it [00:11, 9.16it/s] 109it [00:11, 9.36it/s] 110it [00:11, 9.49it/s] 111it [00:11, 9.61it/s] 112it [00:11, 9.07it/s] 113it [00:12, 9.30it/s] 114it [00:12, 9.44it/s] 115it [00:12, 9.50it/s] 116it [00:12, 9.50it/s] 117it [00:12, 9.13it/s] 118it [00:12, 9.33it/s] 119it [00:12, 9.46it/s] 120it [00:12, 8.99it/s] 121it [00:12, 9.24it/s] 122it [00:13, 9.40it/s] 123it [00:13, 9.52it/s] 124it [00:13, 9.01it/s] 125it [00:13, 9.20it/s] 126it [00:13, 9.38it/s] 127it [00:13, 9.52it/s] 128it [00:13, 9.61it/s] 129it [00:13, 9.07it/s] 130it [00:13, 9.11it/s] 131it [00:13, 9.29it/s] 132it [00:14, 9.38it/s] 133it [00:14, 9.51it/s] 134it [00:14, 9.59it/s] 135it [00:14, 9.67it/s] 136it [00:14, 9.71it/s] 137it [00:14, 9.75it/s] 138it [00:14, 9.77it/s] 139it [00:14, 9.19it/s] 140it [00:14, 9.24it/s] 141it [00:15, 9.28it/s] 142it [00:15, 9.31it/s] 143it [00:15, 9.27it/s] 144it [00:15, 9.24it/s] 145it [00:15, 9.41it/s] 146it [00:15, 9.53it/s] 147it [00:15, 9.62it/s] 148it [00:15, 9.65it/s] 149it [00:15, 9.07it/s] 150it [00:16, 9.19it/s]2025-05-26 03:24:39,005 - INFO - [Epoch 028 | Batch 0150] IWAE-loss 6129.2549 | mean log_px -0.0445 | KL -3552.00 + 151it [00:16, 9.34it/s] 152it [00:16, 9.05it/s] 153it [00:16, 9.26it/s] 154it [00:16, 9.41it/s] 155it [00:16, 8.94it/s] 156it [00:16, 9.16it/s] 157it [00:16, 9.34it/s] 158it [00:16, 9.44it/s] 159it [00:16, 8.98it/s] 160it [00:17, 9.20it/s] 161it [00:17, 9.36it/s] 162it [00:17, 9.47it/s] 163it [00:17, 9.09it/s] 164it [00:17, 9.30it/s] 165it [00:17, 9.47it/s] 166it [00:17, 9.56it/s] 167it [00:17, 9.65it/s] 168it [00:17, 9.72it/s] 169it [00:18, 9.15it/s] 170it [00:18, 9.35it/s] 171it [00:18, 9.51it/s] 172it [00:18, 9.61it/s] 173it [00:18, 9.69it/s] 174it [00:18, 9.73it/s] 175it [00:18, 9.79it/s] 176it [00:18, 9.68it/s] 177it [00:18, 9.77it/s] 178it [00:18, 9.16it/s] 179it [00:19, 9.35it/s] 180it [00:19, 9.46it/s] 181it [00:19, 9.57it/s] 182it [00:19, 9.05it/s] 183it [00:19, 9.29it/s] 184it [00:19, 9.43it/s] 185it [00:19, 9.54it/s] 186it [00:19, 9.64it/s] 187it [00:19, 9.22it/s] 188it [00:20, 9.40it/s] 189it [00:20, 9.55it/s] 190it [00:20, 9.63it/s] 191it [00:20, 9.66it/s] 192it [00:20, 9.70it/s] 193it [00:20, 9.74it/s] 194it [00:20, 9.76it/s] 195it [00:20, 8.73it/s] 196it [00:20, 9.35it/s] +2025-05-26 03:24:43,903 - INFO - Epoch: 28, Objective: tensor([7316.0479], device='cuda:0', grad_fn=), Loss: 0.06041298806667328, KL/n: 72.37413787841797 + 0it [00:00, ?it/s]2025-05-26 03:24:44,190 - INFO - [Epoch 029 | Batch 0000] IWAE-loss 5790.9482 | mean log_px -0.0366 | KL -3544.11 + 1it [00:00, 5.02it/s] 2it [00:00, 6.45it/s] 3it [00:00, 7.61it/s] 4it [00:00, 8.17it/s] 5it [00:00, 8.62it/s] 6it [00:00, 8.40it/s] 7it [00:00, 8.76it/s] 8it [00:00, 9.07it/s] 9it [00:01, 9.29it/s] 10it [00:01, 8.84it/s] 11it [00:01, 9.10it/s] 12it [00:01, 9.28it/s] 13it [00:01, 9.41it/s] 14it [00:01, 8.97it/s] 15it [00:01, 9.24it/s] 16it [00:01, 9.41it/s] 17it [00:01, 9.54it/s] 18it [00:02, 8.98it/s] 19it [00:02, 9.23it/s] 20it [00:02, 9.39it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.56it/s] 23it [00:02, 9.65it/s] 24it [00:02, 9.71it/s] 25it [00:02, 9.76it/s] 26it [00:02, 9.76it/s] 27it [00:02, 9.79it/s] 28it [00:03, 9.81it/s] 29it [00:03, 9.82it/s] 30it [00:03, 9.84it/s] 31it [00:03, 9.86it/s] 32it [00:03, 9.85it/s] 33it [00:03, 9.87it/s] 34it [00:03, 9.86it/s] 35it [00:03, 9.87it/s] 36it [00:03, 9.84it/s] 37it [00:03, 9.87it/s] 38it [00:04, 9.86it/s] 39it [00:04, 9.86it/s] 40it [00:04, 9.85it/s] 41it [00:04, 9.86it/s] 42it [00:04, 9.87it/s] 43it [00:04, 9.88it/s] 44it [00:04, 9.87it/s] 45it [00:04, 9.85it/s] 46it [00:04, 9.85it/s] 47it [00:05, 9.83it/s] 48it [00:05, 9.80it/s] 49it [00:05, 9.81it/s] 50it [00:05, 9.82it/s]2025-05-26 03:24:49,408 - INFO - [Epoch 029 | Batch 0050] IWAE-loss 8045.6401 | mean log_px -0.0730 | KL -3546.79 + 51it [00:05, 9.81it/s] 52it [00:05, 9.83it/s] 53it [00:05, 9.85it/s] 54it [00:05, 9.85it/s] 55it [00:05, 9.85it/s] 56it [00:05, 9.84it/s] 57it [00:06, 9.84it/s] 58it [00:06, 9.83it/s] 59it [00:06, 9.85it/s] 60it [00:06, 9.84it/s] 61it [00:06, 9.86it/s] 62it [00:06, 9.85it/s] 63it [00:06, 9.86it/s] 64it [00:06, 9.83it/s] 65it [00:06, 9.84it/s] 66it [00:06, 9.84it/s] 67it [00:07, 9.86it/s] 68it [00:07, 9.80it/s] 69it [00:07, 9.81it/s] 70it [00:07, 9.81it/s] 71it [00:07, 9.82it/s] 72it [00:07, 9.81it/s] 73it [00:07, 9.78it/s] 74it [00:07, 9.81it/s] 75it [00:07, 9.82it/s] 76it [00:07, 9.82it/s] 77it [00:08, 9.85it/s] 78it [00:08, 9.84it/s] 79it [00:08, 9.85it/s] 80it [00:08, 9.84it/s] 81it [00:08, 9.81it/s] 82it [00:08, 9.82it/s] 83it [00:08, 9.82it/s] 84it [00:08, 9.83it/s] 85it [00:08, 9.84it/s] 86it [00:08, 9.70it/s] 87it [00:09, 9.75it/s] 88it [00:09, 9.74it/s] 89it [00:09, 9.78it/s] 90it [00:09, 9.80it/s] 91it [00:09, 9.83it/s] 92it [00:09, 9.84it/s] 93it [00:09, 9.86it/s] 94it [00:09, 9.86it/s] 95it [00:09, 9.88it/s] 96it [00:09, 9.88it/s] 97it [00:10, 9.90it/s] 98it [00:10, 9.87it/s] 99it [00:10, 9.65it/s] 100it [00:10, 9.72it/s]2025-05-26 03:24:54,501 - INFO - [Epoch 029 | Batch 0100] IWAE-loss 7717.3555 | mean log_px -0.0658 | KL -3546.15 + 101it [00:10, 9.74it/s] 102it [00:10, 9.78it/s] 103it [00:10, 9.82it/s] 104it [00:10, 9.84it/s] 105it [00:10, 9.85it/s] 106it [00:11, 9.86it/s] 107it [00:11, 9.87it/s] 108it [00:11, 9.86it/s] 109it [00:11, 9.87it/s] 110it [00:11, 9.86it/s] 111it [00:11, 9.87it/s] 112it [00:11, 9.85it/s] 113it [00:11, 9.86it/s] 114it [00:11, 9.85it/s] 115it [00:11, 9.61it/s] 116it [00:12, 9.58it/s] 117it [00:12, 9.55it/s] 118it [00:12, 9.53it/s] 119it [00:12, 9.51it/s] 120it [00:12, 9.49it/s] 121it [00:12, 9.48it/s] 122it [00:12, 9.45it/s] 123it [00:12, 9.44it/s] 124it [00:12, 9.44it/s] 125it [00:12, 9.45it/s] 126it [00:13, 9.43it/s] 127it [00:13, 9.50it/s] 128it [00:13, 9.50it/s] 129it [00:13, 9.50it/s] 130it [00:13, 9.46it/s] 131it [00:13, 9.49it/s] 132it [00:13, 9.50it/s] 133it [00:13, 9.48it/s] 134it [00:13, 9.49it/s] 135it [00:14, 9.48it/s] 136it [00:14, 9.50it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.51it/s] 139it [00:14, 9.51it/s] 140it [00:14, 9.48it/s] 141it [00:14, 9.47it/s] 142it [00:14, 9.47it/s] 143it [00:14, 9.54it/s] 144it [00:14, 9.46it/s] 145it [00:15, 9.41it/s] 146it [00:15, 9.53it/s] 147it [00:15, 9.61it/s] 148it [00:15, 9.67it/s] 149it [00:15, 9.74it/s] 150it [00:15, 9.73it/s]2025-05-26 03:24:59,708 - INFO - [Epoch 029 | Batch 0150] IWAE-loss 9115.5293 | mean log_px -0.0874 | KL -3541.34 + 151it [00:15, 9.74it/s] 152it [00:15, 9.76it/s] 153it [00:15, 9.79it/s] 154it [00:16, 9.77it/s] 155it [00:16, 9.81it/s] 156it [00:16, 9.80it/s] 157it [00:16, 9.82it/s] 158it [00:16, 9.83it/s] 159it [00:16, 9.84it/s] 160it [00:16, 9.62it/s] 161it [00:16, 9.67it/s] 162it [00:16, 9.72it/s] 163it [00:16, 9.77it/s] 164it [00:17, 9.78it/s] 165it [00:17, 9.83it/s] 166it [00:17, 9.83it/s] 167it [00:17, 9.84it/s] 168it [00:17, 9.84it/s] 169it [00:17, 9.78it/s] 170it [00:17, 9.78it/s] 171it [00:17, 9.63it/s] 172it [00:17, 9.64it/s] 173it [00:17, 9.69it/s] 174it [00:18, 9.52it/s] 175it [00:18, 9.27it/s] 176it [00:18, 9.39it/s] 177it [00:18, 9.54it/s] 178it [00:18, 9.09it/s] 179it [00:18, 9.16it/s] 180it [00:18, 9.34it/s] 181it [00:18, 9.47it/s] 182it [00:18, 9.58it/s] 183it [00:19, 9.66it/s] 184it [00:19, 9.73it/s] 185it [00:19, 9.71it/s] 186it [00:19, 9.75it/s] 187it [00:19, 9.71it/s] 188it [00:19, 9.60it/s] 189it [00:19, 8.89it/s] 190it [00:19, 9.15it/s] 191it [00:19, 9.37it/s] 192it [00:19, 9.51it/s] 193it [00:20, 9.61it/s] 194it [00:20, 9.69it/s] 195it [00:20, 9.16it/s] 196it [00:20, 9.58it/s] +2025-05-26 03:25:04,503 - INFO - Epoch: 29, Objective: tensor([7595.7744], device='cuda:0', grad_fn=), Loss: 0.06281988322734833, KL/n: 72.2783432006836 + 0it [00:00, ?it/s]2025-05-26 03:25:04,757 - INFO - [Epoch 030 | Batch 0000] IWAE-loss 7184.0381 | mean log_px -0.0520 | KL -3540.00 + 1it [00:00, 5.18it/s] 2it [00:00, 7.16it/s] 3it [00:00, 8.21it/s] 4it [00:00, 8.76it/s] 5it [00:00, 9.04it/s] 6it [00:00, 9.29it/s] 7it [00:00, 9.47it/s] 8it [00:00, 9.60it/s] 9it [00:01, 9.69it/s] 10it [00:01, 9.76it/s] 11it [00:01, 9.79it/s] 12it [00:01, 9.79it/s] 13it [00:01, 9.31it/s] 14it [00:01, 9.46it/s] 15it [00:01, 9.51it/s] 16it [00:01, 9.61it/s] 17it [00:01, 9.69it/s] 18it [00:01, 9.72it/s] 19it [00:02, 9.20it/s] 20it [00:02, 6.19it/s] 21it [00:02, 6.94it/s] 22it [00:02, 7.59it/s] 23it [00:02, 8.15it/s] 24it [00:02, 8.12it/s] 25it [00:02, 8.57it/s] 26it [00:02, 8.87it/s] 27it [00:03, 9.15it/s] 28it [00:03, 8.78it/s] 29it [00:03, 9.08it/s] 30it [00:03, 9.29it/s] 31it [00:03, 9.47it/s] 32it [00:03, 9.15it/s] 33it [00:03, 9.36it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.62it/s] 36it [00:04, 9.69it/s] 37it [00:04, 9.75it/s] 38it [00:04, 9.76it/s] 39it [00:04, 9.81it/s] 40it [00:04, 9.83it/s] 41it [00:04, 9.34it/s] 42it [00:04, 9.48it/s] 43it [00:04, 9.60it/s] 44it [00:04, 9.68it/s] 45it [00:04, 9.08it/s] 46it [00:05, 9.29it/s] 47it [00:05, 9.44it/s] 48it [00:05, 9.57it/s] 49it [00:05, 9.64it/s] 50it [00:05, 9.70it/s]2025-05-26 03:25:10,198 - INFO - [Epoch 030 | Batch 0050] IWAE-loss 5986.0142 | mean log_px -0.0354 | KL -3537.95 + 51it [00:05, 9.74it/s] 52it [00:05, 9.76it/s] 53it [00:05, 9.81it/s] 54it [00:05, 9.81it/s] 55it [00:06, 9.56it/s] 56it [00:06, 9.36it/s] 57it [00:06, 8.93it/s] 58it [00:06, 9.09it/s] 59it [00:06, 9.32it/s] 60it [00:06, 9.48it/s] 61it [00:06, 9.59it/s] 62it [00:06, 9.67it/s] 63it [00:06, 9.74it/s] 64it [00:06, 9.78it/s] 65it [00:07, 9.82it/s] 66it [00:07, 9.82it/s] 67it [00:07, 9.83it/s] 68it [00:07, 9.86it/s] 69it [00:07, 9.87it/s] 70it [00:07, 9.86it/s] 71it [00:07, 9.86it/s] 72it [00:07, 9.86it/s] 73it [00:07, 9.24it/s] 74it [00:08, 9.42it/s] 75it [00:08, 9.57it/s] 76it [00:08, 9.64it/s] 77it [00:08, 9.71it/s] 78it [00:08, 9.73it/s] 79it [00:08, 9.74it/s] 80it [00:08, 9.11it/s] 81it [00:08, 9.08it/s] 82it [00:08, 9.22it/s] 83it [00:08, 8.83it/s] 84it [00:09, 9.09it/s] 85it [00:09, 9.31it/s] 86it [00:09, 9.45it/s] 87it [00:09, 8.97it/s] 88it [00:09, 9.22it/s] 89it [00:09, 9.42it/s] 90it [00:09, 9.55it/s] 91it [00:09, 9.56it/s] 92it [00:09, 9.33it/s] 93it [00:10, 8.90it/s] 94it [00:10, 9.16it/s] 95it [00:10, 9.27it/s] 96it [00:10, 9.44it/s] 97it [00:10, 9.57it/s] 98it [00:10, 9.65it/s] 99it [00:10, 9.73it/s] 100it [00:10, 9.76it/s]2025-05-26 03:25:15,463 - INFO - [Epoch 030 | Batch 0100] IWAE-loss 5398.5059 | mean log_px -0.0280 | KL -3539.20 + 101it [00:10, 9.79it/s] 102it [00:10, 9.81it/s] 103it [00:11, 9.36it/s] 104it [00:11, 9.50it/s] 105it [00:11, 9.59it/s] 106it [00:11, 9.08it/s] 107it [00:11, 9.32it/s] 108it [00:11, 9.48it/s] 109it [00:11, 9.57it/s] 110it [00:11, 9.57it/s] 111it [00:11, 9.53it/s] 112it [00:12, 9.57it/s] 113it [00:12, 9.68it/s] 114it [00:12, 9.74it/s] 115it [00:12, 9.29it/s] 116it [00:12, 9.46it/s] 117it [00:12, 9.59it/s] 118it [00:12, 9.68it/s] 119it [00:12, 9.74it/s] 120it [00:12, 9.78it/s] 121it [00:12, 9.83it/s] 122it [00:13, 9.84it/s] 123it [00:13, 9.86it/s] 124it [00:13, 9.86it/s] 125it [00:13, 9.88it/s] 126it [00:13, 9.88it/s] 127it [00:13, 9.89it/s] 128it [00:13, 9.88it/s] 129it [00:13, 9.88it/s] 130it [00:13, 9.86it/s] 131it [00:13, 9.38it/s] 132it [00:14, 9.52it/s] 133it [00:14, 9.62it/s] 134it [00:14, 9.68it/s] 135it [00:14, 9.75it/s] 136it [00:14, 9.77it/s] 137it [00:14, 9.80it/s] 138it [00:14, 9.82it/s] 139it [00:14, 9.85it/s] 140it [00:14, 9.86it/s] 141it [00:15, 9.88it/s] 142it [00:15, 9.87it/s] 143it [00:15, 9.84it/s] 144it [00:15, 9.35it/s] 145it [00:15, 9.50it/s] 146it [00:15, 9.59it/s] 147it [00:15, 9.17it/s] 148it [00:15, 9.35it/s] 149it [00:15, 9.49it/s] 150it [00:15, 9.59it/s]2025-05-26 03:25:20,651 - INFO - [Epoch 030 | Batch 0150] IWAE-loss 8095.3145 | mean log_px -0.0698 | KL -3535.73 + 151it [00:16, 9.66it/s] 152it [00:16, 9.22it/s] 153it [00:16, 9.40it/s] 154it [00:16, 9.51it/s] 155it [00:16, 9.58it/s] 156it [00:16, 9.64it/s] 157it [00:16, 9.69it/s] 158it [00:16, 9.74it/s] 159it [00:16, 9.77it/s] 160it [00:17, 9.15it/s] 161it [00:17, 9.35it/s] 162it [00:17, 9.50it/s] 163it [00:17, 9.61it/s] 164it [00:17, 9.68it/s] 165it [00:17, 9.73it/s] 166it [00:17, 9.77it/s] 167it [00:17, 9.81it/s] 168it [00:17, 9.81it/s] 169it [00:17, 9.85it/s] 170it [00:18, 9.83it/s] 171it [00:18, 9.85it/s] 172it [00:18, 9.86it/s] 173it [00:18, 9.88it/s] 174it [00:18, 9.86it/s] 175it [00:18, 9.80it/s] 176it [00:18, 9.81it/s] 177it [00:18, 9.84it/s] 178it [00:18, 9.84it/s] 179it [00:18, 9.86it/s] 180it [00:19, 9.86it/s] 181it [00:19, 9.87it/s] 182it [00:19, 9.88it/s] 183it [00:19, 9.87it/s] 184it [00:19, 9.87it/s] 185it [00:19, 9.27it/s] 186it [00:19, 9.44it/s] 187it [00:19, 9.58it/s] 188it [00:19, 9.67it/s] 189it [00:19, 9.72it/s] 190it [00:20, 9.66it/s] 191it [00:20, 9.72it/s] 192it [00:20, 9.77it/s] 193it [00:20, 9.81it/s] 194it [00:20, 9.83it/s] 195it [00:20, 9.26it/s] 196it [00:20, 9.43it/s] +2025-05-26 03:25:25,413 - INFO - Epoch: 30, Objective: tensor([8346.3223], device='cuda:0', grad_fn=), Loss: 0.08652433753013611, KL/n: 72.18109130859375 + 0it [00:00, ?it/s]2025-05-26 03:25:25,689 - INFO - [Epoch 031 | Batch 0000] IWAE-loss 7981.7705 | mean log_px -0.0697 | KL -3537.61 + 1it [00:00, 4.81it/s] 2it [00:00, 6.81it/s] 3it [00:00, 7.95it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.59it/s] 6it [00:00, 8.98it/s] 7it [00:00, 9.26it/s] 8it [00:00, 9.42it/s] 9it [00:01, 9.51it/s] 10it [00:01, 9.60it/s] 11it [00:01, 9.69it/s] 12it [00:01, 9.73it/s] 13it [00:01, 9.78it/s] 14it [00:01, 9.79it/s] 15it [00:01, 9.20it/s] 16it [00:01, 9.39it/s] 17it [00:01, 9.53it/s] 18it [00:01, 9.62it/s] 19it [00:02, 9.08it/s] 20it [00:02, 9.28it/s] 21it [00:02, 9.46it/s] 22it [00:02, 9.46it/s] 23it [00:02, 9.52it/s] 24it [00:02, 9.57it/s] 25it [00:02, 9.67it/s] 26it [00:02, 9.72it/s] 27it [00:02, 9.76it/s] 28it [00:03, 9.79it/s] 29it [00:03, 9.82it/s] 30it [00:03, 9.83it/s] 31it [00:03, 9.84it/s] 32it [00:03, 9.84it/s] 33it [00:03, 9.85it/s] 34it [00:03, 9.43it/s] 35it [00:03, 9.56it/s] 36it [00:03, 9.64it/s] 37it [00:03, 9.72it/s] 38it [00:04, 9.73it/s] 39it [00:04, 9.27it/s] 40it [00:04, 9.42it/s] 41it [00:04, 9.54it/s] 42it [00:04, 9.63it/s] 43it [00:04, 9.70it/s] 44it [00:04, 9.75it/s] 45it [00:04, 9.79it/s] 46it [00:04, 9.78it/s] 47it [00:04, 9.80it/s] 48it [00:05, 9.81it/s] 49it [00:05, 9.82it/s] 50it [00:05, 9.82it/s]2025-05-26 03:25:30,894 - INFO - [Epoch 031 | Batch 0050] IWAE-loss 7131.4248 | mean log_px -0.0549 | KL -3539.47 + 51it [00:05, 9.80it/s] 52it [00:05, 9.69it/s] 53it [00:05, 9.75it/s] 54it [00:05, 9.77it/s] 55it [00:05, 9.57it/s] 56it [00:05, 9.18it/s] 57it [00:06, 9.38it/s] 58it [00:06, 9.50it/s] 59it [00:06, 9.61it/s] 60it [00:06, 9.68it/s] 61it [00:06, 9.74it/s] 62it [00:06, 9.76it/s] 63it [00:06, 9.80it/s] 64it [00:06, 9.81it/s] 65it [00:06, 9.81it/s] 66it [00:06, 9.82it/s] 67it [00:07, 9.84it/s] 68it [00:07, 9.85it/s] 69it [00:07, 9.86it/s] 70it [00:07, 9.85it/s] 71it [00:07, 9.87it/s] 72it [00:07, 9.85it/s] 73it [00:07, 9.87it/s] 74it [00:07, 9.85it/s] 75it [00:07, 9.87it/s] 76it [00:07, 9.86it/s] 77it [00:08, 9.86it/s] 78it [00:08, 9.36it/s] 79it [00:08, 9.48it/s] 80it [00:08, 9.59it/s] 81it [00:08, 9.69it/s] 82it [00:08, 9.74it/s] 83it [00:08, 9.27it/s] 84it [00:08, 9.36it/s] 85it [00:08, 9.51it/s] 86it [00:09, 9.15it/s] 87it [00:09, 9.09it/s] 88it [00:09, 9.17it/s] 89it [00:09, 9.14it/s] 90it [00:09, 9.01it/s] 91it [00:09, 8.58it/s] 92it [00:09, 8.82it/s] 93it [00:09, 9.04it/s] 94it [00:09, 9.18it/s] 95it [00:10, 9.31it/s] 96it [00:10, 9.40it/s] 97it [00:10, 8.90it/s] 98it [00:10, 9.07it/s] 99it [00:10, 9.23it/s] 100it [00:10, 9.32it/s]2025-05-26 03:25:36,174 - INFO - [Epoch 031 | Batch 0100] IWAE-loss 6414.5449 | mean log_px -0.0424 | KL -3538.34 + 101it [00:10, 9.36it/s] 102it [00:10, 9.44it/s] 103it [00:10, 9.54it/s] 104it [00:10, 9.61it/s] 105it [00:11, 9.68it/s] 106it [00:11, 9.72it/s] 107it [00:11, 9.75it/s] 108it [00:11, 9.77it/s] 109it [00:11, 9.76it/s] 110it [00:11, 9.75it/s] 111it [00:11, 9.77it/s] 112it [00:11, 9.77it/s] 113it [00:11, 9.80it/s] 114it [00:12, 9.79it/s] 115it [00:12, 9.74it/s] 116it [00:12, 9.75it/s] 117it [00:12, 9.74it/s] 118it [00:12, 9.63it/s] 119it [00:12, 9.67it/s] 120it [00:12, 9.60it/s] 121it [00:12, 9.55it/s] 122it [00:12, 9.51it/s] 123it [00:12, 9.53it/s] 124it [00:13, 9.51it/s] 125it [00:13, 9.51it/s] 126it [00:13, 9.52it/s] 127it [00:13, 9.55it/s] 128it [00:13, 9.53it/s] 129it [00:13, 9.51it/s] 130it [00:13, 9.54it/s] 131it [00:13, 9.54it/s] 132it [00:13, 9.47it/s] 133it [00:13, 9.54it/s] 134it [00:14, 9.49it/s] 135it [00:14, 9.55it/s] 136it [00:14, 9.55it/s] 137it [00:14, 9.58it/s] 138it [00:14, 9.58it/s] 139it [00:14, 9.58it/s] 140it [00:14, 9.52it/s] 141it [00:14, 9.57it/s] 142it [00:14, 9.59it/s] 143it [00:15, 9.54it/s] 144it [00:15, 8.85it/s] 145it [00:15, 9.01it/s] 146it [00:15, 9.22it/s] 147it [00:15, 9.39it/s] 148it [00:15, 9.52it/s] 149it [00:15, 9.57it/s] 150it [00:15, 9.55it/s]2025-05-26 03:25:41,398 - INFO - [Epoch 031 | Batch 0150] IWAE-loss 7563.3599 | mean log_px -0.0640 | KL -3531.75 + 151it [00:15, 9.01it/s] 152it [00:16, 9.21it/s] 153it [00:16, 9.38it/s] 154it [00:16, 9.47it/s] 155it [00:16, 9.57it/s] 156it [00:16, 9.61it/s] 157it [00:16, 9.20it/s] 158it [00:16, 9.35it/s] 159it [00:16, 9.50it/s] 160it [00:16, 9.56it/s] 161it [00:16, 9.62it/s] 162it [00:17, 9.66it/s] 163it [00:17, 9.71it/s] 164it [00:17, 9.74it/s] 165it [00:17, 9.78it/s] 166it [00:17, 9.79it/s] 167it [00:17, 9.80it/s] 168it [00:17, 9.80it/s] 169it [00:17, 9.82it/s] 170it [00:17, 9.80it/s] 171it [00:17, 9.82it/s] 172it [00:18, 9.80it/s] 173it [00:18, 9.80it/s] 174it [00:18, 9.78it/s] 175it [00:18, 9.81it/s] 176it [00:18, 9.64it/s] 177it [00:18, 9.45it/s] 178it [00:18, 9.06it/s] 179it [00:18, 9.24it/s] 180it [00:18, 9.29it/s] 181it [00:19, 9.39it/s] 182it [00:19, 9.42it/s] 183it [00:19, 9.04it/s] 184it [00:19, 9.17it/s] 185it [00:19, 9.26it/s] 186it [00:19, 9.34it/s] 187it [00:19, 9.35it/s] 188it [00:19, 9.34it/s] 189it [00:19, 9.40it/s] 190it [00:20, 9.36it/s] 191it [00:20, 8.82it/s] 192it [00:20, 9.01it/s] 193it [00:20, 9.15it/s] 194it [00:20, 9.24it/s] 195it [00:20, 8.74it/s] 196it [00:20, 9.00it/s] 196it [00:20, 9.45it/s] +2025-05-26 03:25:46,288 - INFO - Epoch: 31, Objective: tensor([6049.7988], device='cuda:0', grad_fn=), Loss: 0.03925026208162308, KL/n: 72.08685302734375 + 0it [00:00, ?it/s]2025-05-26 03:25:46,583 - INFO - [Epoch 032 | Batch 0000] IWAE-loss 5750.3301 | mean log_px -0.0349 | KL -3535.57 + 1it [00:00, 4.81it/s] 2it [00:00, 6.73it/s] 3it [00:00, 7.82it/s] 4it [00:00, 8.40it/s] 5it [00:00, 8.78it/s] 6it [00:00, 8.59it/s] 7it [00:00, 8.88it/s] 8it [00:00, 8.97it/s] 9it [00:01, 9.23it/s] 10it [00:01, 5.86it/s] 11it [00:01, 6.68it/s] 12it [00:01, 7.34it/s] 13it [00:01, 7.96it/s] 14it [00:01, 8.43it/s] 15it [00:01, 8.81it/s] 16it [00:01, 9.10it/s] 17it [00:02, 9.31it/s] 18it [00:02, 9.47it/s] 19it [00:02, 9.59it/s] 20it [00:02, 9.64it/s] 21it [00:02, 9.69it/s] 22it [00:02, 9.12it/s] 23it [00:02, 9.30it/s] 24it [00:02, 9.35it/s] 25it [00:02, 9.46it/s] 26it [00:03, 9.55it/s] 27it [00:03, 9.64it/s] 28it [00:03, 9.69it/s] 29it [00:03, 9.75it/s] 30it [00:03, 9.76it/s] 31it [00:03, 9.61it/s] 32it [00:03, 9.63it/s] 33it [00:03, 9.59it/s] 34it [00:03, 9.56it/s] 35it [00:03, 9.56it/s] 36it [00:04, 9.59it/s] 37it [00:04, 9.65it/s] 38it [00:04, 9.67it/s] 39it [00:04, 9.58it/s] 40it [00:04, 9.41it/s] 41it [00:04, 9.48it/s] 42it [00:04, 9.47it/s] 43it [00:04, 9.47it/s] 44it [00:04, 9.48it/s] 45it [00:05, 9.56it/s] 46it [00:05, 9.54it/s] 47it [00:05, 9.58it/s] 48it [00:05, 9.53it/s] 49it [00:05, 9.59it/s] 50it [00:05, 9.56it/s]2025-05-26 03:25:52,023 - INFO - [Epoch 032 | Batch 0050] IWAE-loss 5072.8218 | mean log_px -0.0260 | KL -3529.07 + 51it [00:05, 9.52it/s] 52it [00:05, 9.42it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.45it/s] 55it [00:06, 9.42it/s] 56it [00:06, 8.90it/s] 57it [00:06, 9.07it/s] 58it [00:06, 9.18it/s] 59it [00:06, 9.28it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.45it/s] 62it [00:06, 9.50it/s] 63it [00:06, 9.48it/s] 64it [00:07, 9.45it/s] 65it [00:07, 9.46it/s] 66it [00:07, 9.48it/s] 67it [00:07, 9.50it/s] 68it [00:07, 9.51it/s] 69it [00:07, 9.46it/s] 70it [00:07, 9.50it/s] 71it [00:07, 8.98it/s] 72it [00:07, 8.85it/s] 73it [00:08, 9.12it/s] 74it [00:08, 8.82it/s] 75it [00:08, 9.10it/s] 76it [00:08, 9.31it/s] 77it [00:08, 9.48it/s] 78it [00:08, 9.57it/s] 79it [00:08, 9.59it/s] 80it [00:08, 9.65it/s] 81it [00:08, 9.68it/s] 82it [00:08, 9.73it/s] 83it [00:09, 9.77it/s] 84it [00:09, 9.80it/s] 85it [00:09, 9.81it/s] 86it [00:09, 9.83it/s] 87it [00:09, 9.83it/s] 88it [00:09, 9.82it/s] 89it [00:09, 9.82it/s] 90it [00:09, 9.81it/s] 91it [00:09, 9.83it/s] 92it [00:09, 9.83it/s] 93it [00:10, 9.84it/s] 94it [00:10, 9.83it/s] 95it [00:10, 9.84it/s] 96it [00:10, 9.84it/s] 97it [00:10, 9.86it/s] 98it [00:10, 9.84it/s] 99it [00:10, 9.85it/s] 100it [00:10, 9.85it/s]2025-05-26 03:25:57,264 - INFO - [Epoch 032 | Batch 0100] IWAE-loss 6324.5918 | mean log_px -0.0521 | KL -3526.06 + 101it [00:10, 9.83it/s] 102it [00:10, 9.82it/s] 103it [00:11, 9.84it/s] 104it [00:11, 9.84it/s] 105it [00:11, 9.86it/s] 106it [00:11, 9.32it/s] 107it [00:11, 9.47it/s] 108it [00:11, 9.59it/s] 109it [00:11, 9.70it/s] 110it [00:11, 9.74it/s] 111it [00:11, 9.77it/s] 112it [00:12, 9.78it/s] 113it [00:12, 9.81it/s] 114it [00:12, 9.77it/s] 115it [00:12, 9.75it/s] 116it [00:12, 9.78it/s] 117it [00:12, 9.80it/s] 118it [00:12, 9.78it/s] 119it [00:12, 9.79it/s] 120it [00:12, 9.80it/s] 121it [00:12, 9.82it/s] 122it [00:13, 9.81it/s] 123it [00:13, 9.82it/s] 124it [00:13, 9.80it/s] 125it [00:13, 9.69it/s] 126it [00:13, 9.68it/s] 127it [00:13, 9.71it/s] 128it [00:13, 9.74it/s] 129it [00:13, 9.78it/s] 130it [00:13, 9.78it/s] 131it [00:13, 9.80it/s] 132it [00:14, 9.80it/s] 133it [00:14, 9.81it/s] 134it [00:14, 9.80it/s] 135it [00:14, 9.81it/s] 136it [00:14, 9.82it/s] 137it [00:14, 9.85it/s] 138it [00:14, 9.82it/s] 139it [00:14, 9.84it/s] 140it [00:14, 9.83it/s] 141it [00:14, 9.85it/s] 142it [00:15, 9.82it/s] 143it [00:15, 9.84it/s] 144it [00:15, 9.84it/s] 145it [00:15, 9.85it/s] 146it [00:15, 9.82it/s] 147it [00:15, 9.82it/s] 148it [00:15, 9.76it/s] 149it [00:15, 9.73it/s] 150it [00:15, 9.77it/s]2025-05-26 03:26:02,381 - INFO - [Epoch 032 | Batch 0150] IWAE-loss 7815.7627 | mean log_px -0.0678 | KL -3526.52 + 151it [00:16, 9.78it/s] 152it [00:16, 9.81it/s] 153it [00:16, 9.83it/s] 154it [00:16, 9.83it/s] 155it [00:16, 9.84it/s] 156it [00:16, 9.85it/s] 157it [00:16, 9.86it/s] 158it [00:16, 9.86it/s] 159it [00:16, 9.87it/s] 160it [00:16, 9.86it/s] 161it [00:17, 9.86it/s] 162it [00:17, 9.85it/s] 163it [00:17, 9.86it/s] 164it [00:17, 9.86it/s] 165it [00:17, 9.86it/s] 166it [00:17, 9.85it/s] 167it [00:17, 9.85it/s] 168it [00:17, 9.84it/s] 169it [00:17, 9.83it/s] 170it [00:17, 9.85it/s] 171it [00:18, 9.86it/s] 172it [00:18, 9.85it/s] 173it [00:18, 9.86it/s] 174it [00:18, 9.85it/s] 175it [00:18, 9.86it/s] 176it [00:18, 9.85it/s] 177it [00:18, 9.85it/s] 178it [00:18, 9.82it/s] 179it [00:18, 9.83it/s] 180it [00:18, 9.82it/s] 181it [00:19, 9.84it/s] 182it [00:19, 9.82it/s] 183it [00:19, 9.83it/s] 184it [00:19, 9.83it/s] 185it [00:19, 9.83it/s] 186it [00:19, 9.83it/s] 187it [00:19, 9.84it/s] 188it [00:19, 9.39it/s] 189it [00:19, 9.24it/s] 190it [00:19, 9.22it/s] 191it [00:20, 9.31it/s] 192it [00:20, 9.39it/s] 193it [00:20, 9.47it/s] 194it [00:20, 9.51it/s] 195it [00:20, 9.00it/s] 196it [00:20, 9.25it/s] 196it [00:20, 9.46it/s] +2025-05-26 03:26:07,127 - INFO - Epoch: 32, Objective: tensor([5291.6196], device='cuda:0', grad_fn=), Loss: 0.03124961443245411, KL/n: 71.98877716064453 + 0it [00:00, ?it/s]2025-05-26 03:26:07,389 - INFO - [Epoch 033 | Batch 0000] IWAE-loss 5486.5654 | mean log_px -0.0308 | KL -3528.38 + 1it [00:00, 5.38it/s] 2it [00:00, 7.18it/s] 3it [00:00, 8.22it/s] 4it [00:00, 8.78it/s] 5it [00:00, 9.17it/s] 6it [00:00, 9.38it/s] 7it [00:00, 9.55it/s] 8it [00:00, 9.00it/s] 9it [00:01, 9.27it/s] 10it [00:01, 9.44it/s] 11it [00:01, 9.58it/s] 12it [00:01, 9.18it/s] 13it [00:01, 9.39it/s] 14it [00:01, 9.53it/s] 15it [00:01, 9.64it/s] 16it [00:01, 9.70it/s] 17it [00:01, 9.76it/s] 18it [00:01, 9.76it/s] 19it [00:02, 9.81it/s] 20it [00:02, 9.19it/s] 21it [00:02, 9.39it/s] 22it [00:02, 9.49it/s] 23it [00:02, 9.61it/s] 24it [00:02, 9.66it/s] 25it [00:02, 9.73it/s] 26it [00:02, 9.75it/s] 27it [00:02, 9.37it/s] 28it [00:03, 9.50it/s] 29it [00:03, 9.53it/s] 30it [00:03, 9.58it/s] 31it [00:03, 9.67it/s] 32it [00:03, 9.72it/s] 33it [00:03, 9.78it/s] 34it [00:03, 9.82it/s] 35it [00:03, 9.83it/s] 36it [00:03, 9.76it/s] 37it [00:03, 9.79it/s] 38it [00:04, 9.30it/s] 39it [00:04, 9.46it/s] 40it [00:04, 9.58it/s] 41it [00:04, 9.68it/s] 42it [00:04, 9.73it/s] 43it [00:04, 9.79it/s] 44it [00:04, 9.81it/s] 45it [00:04, 9.84it/s] 46it [00:04, 9.84it/s] 47it [00:04, 9.86it/s] 48it [00:05, 9.86it/s] 49it [00:05, 9.88it/s] 50it [00:05, 9.88it/s]2025-05-26 03:26:12,587 - INFO - [Epoch 033 | Batch 0050] IWAE-loss 5826.6826 | mean log_px -0.0356 | KL -3525.49 + 51it [00:05, 9.86it/s] 52it [00:05, 9.84it/s] 53it [00:05, 9.85it/s] 54it [00:05, 9.85it/s] 55it [00:05, 9.86it/s] 56it [00:05, 9.83it/s] 57it [00:05, 9.85it/s] 58it [00:06, 9.86it/s] 59it [00:06, 9.86it/s] 60it [00:06, 9.85it/s] 61it [00:06, 9.68it/s] 62it [00:06, 9.59it/s] 63it [00:06, 9.69it/s] 64it [00:06, 9.74it/s] 65it [00:06, 9.25it/s] 66it [00:06, 9.40it/s] 67it [00:07, 9.55it/s] 68it [00:07, 9.64it/s] 69it [00:07, 9.72it/s] 70it [00:07, 9.77it/s] 71it [00:07, 9.19it/s] 72it [00:07, 9.37it/s] 73it [00:07, 9.52it/s] 74it [00:07, 9.62it/s] 75it [00:07, 9.70it/s] 76it [00:07, 9.75it/s] 77it [00:08, 9.78it/s] 78it [00:08, 9.80it/s] 79it [00:08, 9.85it/s] 80it [00:08, 9.86it/s] 81it [00:08, 9.87it/s] 82it [00:08, 9.88it/s] 83it [00:08, 9.89it/s] 84it [00:08, 9.88it/s] 85it [00:08, 9.89it/s] 86it [00:08, 9.87it/s] 87it [00:09, 9.48it/s] 88it [00:09, 9.59it/s] 89it [00:09, 9.69it/s] 90it [00:09, 9.75it/s] 91it [00:09, 9.80it/s] 92it [00:09, 9.19it/s] 93it [00:09, 9.39it/s] 94it [00:09, 9.51it/s] 95it [00:09, 9.63it/s] 96it [00:10, 9.68it/s] 97it [00:10, 9.71it/s] 98it [00:10, 9.07it/s] 99it [00:10, 9.31it/s] 100it [00:10, 9.48it/s]2025-05-26 03:26:17,770 - INFO - [Epoch 033 | Batch 0100] IWAE-loss 7603.5825 | mean log_px -0.0618 | KL -3521.97 + 101it [00:10, 9.58it/s] 102it [00:10, 9.65it/s] 103it [00:10, 9.72it/s] 104it [00:10, 9.77it/s] 105it [00:10, 9.80it/s] 106it [00:11, 9.81it/s] 107it [00:11, 9.19it/s] 108it [00:11, 9.38it/s] 109it [00:11, 9.50it/s] 110it [00:11, 9.60it/s] 111it [00:11, 9.68it/s] 112it [00:11, 9.73it/s] 113it [00:11, 9.76it/s] 114it [00:11, 9.24it/s] 115it [00:12, 9.40it/s] 116it [00:12, 9.54it/s] 117it [00:12, 9.64it/s] 118it [00:12, 9.71it/s] 119it [00:12, 9.16it/s] 120it [00:12, 9.36it/s] 121it [00:12, 9.51it/s] 122it [00:12, 9.61it/s] 123it [00:12, 9.69it/s] 124it [00:12, 9.73it/s] 125it [00:13, 9.78it/s] 126it [00:13, 9.80it/s] 127it [00:13, 9.84it/s] 128it [00:13, 9.84it/s] 129it [00:13, 9.87it/s] 130it [00:13, 9.85it/s] 131it [00:13, 9.87it/s] 132it [00:13, 9.87it/s] 133it [00:13, 9.88it/s] 134it [00:13, 9.87it/s] 135it [00:14, 9.88it/s] 136it [00:14, 9.89it/s] 137it [00:14, 9.88it/s] 138it [00:14, 9.88it/s] 139it [00:14, 9.90it/s] 140it [00:14, 9.89it/s] 141it [00:14, 9.91it/s] 142it [00:14, 9.89it/s] 143it [00:14, 9.90it/s] 144it [00:14, 9.90it/s] 145it [00:15, 9.90it/s] 146it [00:15, 9.89it/s] 147it [00:15, 9.78it/s] 148it [00:15, 9.70it/s] 149it [00:15, 9.70it/s] 150it [00:15, 9.20it/s]2025-05-26 03:26:22,933 - INFO - [Epoch 033 | Batch 0150] IWAE-loss 5245.3364 | mean log_px -0.0273 | KL -3525.40 + 151it [00:15, 9.24it/s] 152it [00:15, 9.30it/s] 153it [00:15, 8.94it/s] 154it [00:16, 9.10it/s] 155it [00:16, 9.14it/s] 156it [00:16, 9.23it/s] 157it [00:16, 9.32it/s] 158it [00:16, 9.35it/s] 159it [00:16, 9.41it/s] 160it [00:16, 9.36it/s] 161it [00:16, 9.43it/s] 162it [00:16, 9.42it/s] 163it [00:16, 9.43it/s] 164it [00:17, 9.45it/s] 165it [00:17, 9.45it/s] 166it [00:17, 8.70it/s] 167it [00:17, 8.74it/s] 168it [00:17, 8.94it/s] 169it [00:17, 9.20it/s] 170it [00:17, 9.32it/s] 171it [00:17, 9.38it/s] 172it [00:17, 9.42it/s] 173it [00:18, 9.06it/s] 174it [00:18, 9.21it/s] 175it [00:18, 9.35it/s] 176it [00:18, 8.92it/s] 177it [00:18, 9.18it/s] 178it [00:18, 9.37it/s] 179it [00:18, 9.51it/s] 180it [00:18, 9.07it/s] 181it [00:18, 9.25it/s] 182it [00:19, 9.42it/s] 183it [00:19, 9.54it/s] 184it [00:19, 9.02it/s] 185it [00:19, 9.24it/s] 186it [00:19, 9.42it/s] 187it [00:19, 9.54it/s] 188it [00:19, 9.61it/s] 189it [00:19, 9.66it/s] 190it [00:19, 9.23it/s] 191it [00:20, 9.40it/s] 192it [00:20, 9.52it/s] 193it [00:20, 9.61it/s] 194it [00:20, 9.67it/s] 195it [00:20, 9.13it/s] 196it [00:20, 9.37it/s] 196it [00:20, 9.51it/s] +2025-05-26 03:26:27,865 - INFO - Epoch: 33, Objective: tensor([9180.2832], device='cuda:0', grad_fn=), Loss: 0.08810441941022873, KL/n: 71.89595794677734 + 0it [00:00, ?it/s]2025-05-26 03:26:28,324 - INFO - [Epoch 034 | Batch 0000] IWAE-loss 7107.1201 | mean log_px -0.0598 | KL -3525.40 + 1it [00:00, 4.71it/s] 2it [00:00, 6.81it/s] 3it [00:00, 7.93it/s] 4it [00:00, 8.57it/s] 5it [00:00, 8.98it/s] 6it [00:00, 9.26it/s] 7it [00:00, 9.43it/s] 8it [00:00, 9.52it/s] 9it [00:01, 9.59it/s] 10it [00:01, 9.67it/s] 11it [00:01, 9.72it/s] 12it [00:01, 9.76it/s] 13it [00:01, 9.79it/s] 14it [00:01, 9.28it/s] 15it [00:01, 9.46it/s] 16it [00:01, 9.57it/s] 17it [00:01, 9.66it/s] 18it [00:01, 9.71it/s] 19it [00:02, 9.15it/s] 20it [00:02, 9.24it/s] 21it [00:02, 9.42it/s] 22it [00:02, 9.55it/s] 23it [00:02, 9.63it/s] 24it [00:02, 9.70it/s] 25it [00:02, 9.76it/s] 26it [00:02, 9.17it/s] 27it [00:02, 9.35it/s] 28it [00:03, 9.50it/s] 29it [00:03, 9.57it/s] 30it [00:03, 9.62it/s] 31it [00:03, 9.70it/s] 32it [00:03, 9.75it/s] 33it [00:03, 9.80it/s] 34it [00:03, 9.81it/s] 35it [00:03, 9.84it/s] 36it [00:03, 9.85it/s] 37it [00:03, 9.82it/s] 38it [00:04, 9.82it/s] 39it [00:04, 9.85it/s] 40it [00:04, 9.86it/s] 41it [00:04, 9.87it/s] 42it [00:04, 9.86it/s] 43it [00:04, 9.87it/s] 44it [00:04, 9.23it/s] 45it [00:04, 9.42it/s] 46it [00:04, 9.54it/s] 47it [00:04, 9.64it/s] 48it [00:05, 9.70it/s] 49it [00:05, 9.71it/s] 50it [00:05, 9.75it/s]2025-05-26 03:26:33,524 - INFO - [Epoch 034 | Batch 0050] IWAE-loss 5209.7563 | mean log_px -0.0287 | KL -3518.90 + 51it [00:05, 9.77it/s] 52it [00:05, 9.78it/s] 53it [00:05, 9.81it/s] 54it [00:05, 9.80it/s] 55it [00:05, 9.81it/s] 56it [00:05, 9.82it/s] 57it [00:06, 9.51it/s] 58it [00:06, 9.61it/s] 59it [00:06, 9.70it/s] 60it [00:06, 9.74it/s] 61it [00:06, 9.78it/s] 62it [00:06, 9.19it/s] 63it [00:06, 9.40it/s] 64it [00:06, 9.53it/s] 65it [00:06, 9.64it/s] 66it [00:06, 9.70it/s] 67it [00:07, 9.77it/s] 68it [00:07, 9.18it/s] 69it [00:07, 9.37it/s] 70it [00:07, 9.52it/s] 71it [00:07, 9.60it/s] 72it [00:07, 9.68it/s] 73it [00:07, 9.76it/s] 74it [00:07, 9.80it/s] 75it [00:07, 9.81it/s] 76it [00:07, 9.83it/s] 77it [00:08, 9.86it/s] 78it [00:08, 9.87it/s] 79it [00:08, 9.88it/s] 80it [00:08, 9.76it/s] 81it [00:08, 9.80it/s] 82it [00:08, 9.82it/s] 83it [00:08, 9.84it/s] 84it [00:08, 9.84it/s] 85it [00:08, 9.85it/s] 86it [00:08, 9.85it/s] 87it [00:09, 9.86it/s] 88it [00:09, 9.85it/s] 89it [00:09, 9.86it/s] 90it [00:09, 9.72it/s] 91it [00:09, 9.00it/s] 92it [00:09, 8.89it/s] 93it [00:09, 9.03it/s] 94it [00:09, 9.17it/s] 95it [00:09, 9.29it/s] 96it [00:10, 9.38it/s] 97it [00:10, 9.43it/s] 98it [00:10, 9.03it/s] 99it [00:10, 9.18it/s] 100it [00:10, 9.29it/s]2025-05-26 03:26:38,748 - INFO - [Epoch 034 | Batch 0100] IWAE-loss 6808.0835 | mean log_px -0.0500 | KL -3514.93 + 101it [00:10, 9.38it/s] 102it [00:10, 8.93it/s] 103it [00:10, 9.13it/s] 104it [00:10, 9.34it/s] 105it [00:11, 9.49it/s] 106it [00:11, 9.57it/s] 107it [00:11, 9.68it/s] 108it [00:11, 9.74it/s] 109it [00:11, 9.80it/s] 110it [00:11, 9.82it/s] 111it [00:11, 9.84it/s] 112it [00:11, 9.85it/s] 113it [00:11, 9.86it/s] 114it [00:11, 9.86it/s] 115it [00:12, 9.87it/s] 116it [00:12, 9.86it/s] 117it [00:12, 9.87it/s] 118it [00:12, 9.87it/s] 119it [00:12, 9.87it/s] 120it [00:12, 9.87it/s] 121it [00:12, 9.20it/s] 122it [00:12, 9.39it/s] 123it [00:12, 9.54it/s] 124it [00:12, 9.63it/s] 125it [00:13, 9.71it/s] 126it [00:13, 9.75it/s] 127it [00:13, 9.77it/s] 128it [00:13, 9.80it/s] 129it [00:13, 9.84it/s] 130it [00:13, 9.85it/s] 131it [00:13, 9.88it/s] 132it [00:13, 9.88it/s] 133it [00:13, 9.89it/s] 134it [00:13, 9.89it/s] 135it [00:14, 9.90it/s] 136it [00:14, 9.89it/s] 137it [00:14, 9.75it/s] 138it [00:14, 9.78it/s] 139it [00:14, 9.81it/s] 140it [00:14, 9.84it/s] 141it [00:14, 9.86it/s] 142it [00:14, 9.86it/s] 143it [00:14, 9.18it/s] 144it [00:15, 9.37it/s] 145it [00:15, 9.53it/s] 146it [00:15, 9.63it/s] 147it [00:15, 9.72it/s] 148it [00:15, 9.76it/s] 149it [00:15, 9.81it/s] 150it [00:15, 9.82it/s]2025-05-26 03:26:43,889 - INFO - [Epoch 034 | Batch 0150] IWAE-loss 7905.4756 | mean log_px -0.0700 | KL -3521.38 + 151it [00:15, 9.83it/s] 152it [00:15, 9.83it/s] 153it [00:15, 9.84it/s] 154it [00:16, 9.34it/s] 155it [00:16, 9.50it/s] 156it [00:16, 9.60it/s] 157it [00:16, 9.68it/s] 158it [00:16, 9.33it/s] 159it [00:16, 9.48it/s] 160it [00:16, 9.58it/s] 161it [00:16, 9.28it/s] 162it [00:16, 9.45it/s] 163it [00:17, 9.10it/s] 164it [00:17, 9.24it/s] 165it [00:17, 9.44it/s] 166it [00:17, 9.56it/s] 167it [00:17, 9.66it/s] 168it [00:17, 9.10it/s] 169it [00:17, 9.34it/s] 170it [00:17, 9.49it/s] 171it [00:17, 9.60it/s] 172it [00:17, 9.68it/s] 173it [00:18, 9.75it/s] 174it [00:18, 9.32it/s] 175it [00:18, 9.45it/s] 176it [00:18, 9.47it/s] 177it [00:18, 9.59it/s] 178it [00:18, 9.66it/s] 179it [00:18, 9.73it/s] 180it [00:18, 9.78it/s] 181it [00:18, 9.82it/s] 182it [00:19, 9.35it/s] 183it [00:19, 9.46it/s] 184it [00:19, 9.55it/s] 185it [00:19, 9.07it/s] 186it [00:19, 9.30it/s] 187it [00:19, 9.47it/s] 188it [00:19, 9.58it/s] 189it [00:19, 9.48it/s] 190it [00:19, 9.57it/s] 191it [00:19, 9.68it/s] 192it [00:20, 9.73it/s] 193it [00:20, 9.79it/s] 194it [00:20, 9.78it/s] 195it [00:20, 9.22it/s] 196it [00:20, 9.43it/s] 196it [00:20, 9.53it/s] +2025-05-26 03:26:48,737 - INFO - Epoch: 34, Objective: tensor([7032.6973], device='cuda:0', grad_fn=), Loss: 0.05743390694260597, KL/n: 71.76044464111328 + 0it [00:00, ?it/s]2025-05-26 03:26:49,021 - INFO - [Epoch 035 | Batch 0000] IWAE-loss 5518.7554 | mean log_px -0.0321 | KL -3518.21 + 1it [00:00, 5.32it/s] 2it [00:00, 7.04it/s] 3it [00:00, 7.73it/s] 4it [00:00, 8.45it/s] 5it [00:00, 8.93it/s] 6it [00:00, 8.59it/s] 7it [00:00, 8.97it/s] 8it [00:00, 9.24it/s] 9it [00:01, 9.46it/s] 10it [00:01, 9.59it/s] 11it [00:01, 9.70it/s] 12it [00:01, 9.75it/s] 13it [00:01, 9.82it/s] 14it [00:01, 9.83it/s] 15it [00:01, 9.86it/s] 16it [00:01, 9.86it/s] 17it [00:01, 9.89it/s] 18it [00:01, 9.89it/s] 19it [00:02, 9.92it/s] 20it [00:02, 9.90it/s] 21it [00:02, 9.92it/s] 22it [00:02, 9.91it/s] 23it [00:02, 9.90it/s] 24it [00:02, 9.86it/s] 25it [00:02, 9.83it/s] 26it [00:02, 9.84it/s] 27it [00:02, 9.83it/s] 28it [00:02, 9.80it/s] 29it [00:03, 9.81it/s] 30it [00:03, 9.82it/s] 31it [00:03, 9.84it/s] 32it [00:03, 9.85it/s] 33it [00:03, 9.86it/s] 34it [00:03, 9.86it/s] 35it [00:03, 9.86it/s] 36it [00:03, 9.87it/s] 37it [00:03, 9.88it/s] 38it [00:03, 9.87it/s] 39it [00:04, 9.87it/s] 40it [00:04, 9.88it/s] 41it [00:04, 9.89it/s] 42it [00:04, 9.89it/s] 43it [00:04, 9.88it/s] 44it [00:04, 9.87it/s] 45it [00:04, 9.89it/s] 46it [00:04, 9.86it/s] 47it [00:04, 9.52it/s] 48it [00:05, 9.58it/s] 49it [00:05, 9.65it/s] 50it [00:05, 9.65it/s]2025-05-26 03:26:54,149 - INFO - [Epoch 035 | Batch 0050] IWAE-loss 10205.3838 | mean log_px -0.0955 | KL -3515.78 + 51it [00:05, 9.10it/s] 52it [00:05, 9.31it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.58it/s] 55it [00:05, 9.68it/s] 56it [00:05, 9.14it/s] 57it [00:05, 9.35it/s] 58it [00:06, 9.49it/s] 59it [00:06, 9.62it/s] 60it [00:06, 9.69it/s] 61it [00:06, 9.76it/s] 62it [00:06, 9.78it/s] 63it [00:06, 9.81it/s] 64it [00:06, 9.80it/s] 65it [00:06, 9.82it/s] 66it [00:06, 9.84it/s] 67it [00:06, 9.86it/s] 68it [00:07, 9.87it/s] 69it [00:07, 9.88it/s] 70it [00:07, 9.90it/s] 71it [00:07, 9.90it/s] 72it [00:07, 9.90it/s] 73it [00:07, 9.39it/s] 74it [00:07, 9.52it/s] 75it [00:07, 9.62it/s] 76it [00:07, 9.70it/s] 77it [00:08, 9.75it/s] 78it [00:08, 9.78it/s] 79it [00:08, 9.80it/s] 80it [00:08, 9.83it/s] 81it [00:08, 9.22it/s] 82it [00:08, 9.39it/s] 83it [00:08, 9.54it/s] 84it [00:08, 9.63it/s] 85it [00:08, 9.11it/s] 86it [00:08, 9.31it/s] 87it [00:09, 9.47it/s] 88it [00:09, 9.60it/s] 89it [00:09, 9.68it/s] 90it [00:09, 9.73it/s] 91it [00:09, 9.77it/s] 92it [00:09, 9.79it/s] 93it [00:09, 9.82it/s] 94it [00:09, 9.82it/s] 95it [00:09, 9.85it/s] 96it [00:09, 9.85it/s] 97it [00:10, 9.86it/s] 98it [00:10, 9.75it/s] 99it [00:10, 9.77it/s] 100it [00:10, 9.68it/s]2025-05-26 03:26:59,330 - INFO - [Epoch 035 | Batch 0100] IWAE-loss 7475.6548 | mean log_px -0.0570 | KL -3514.94 + 101it [00:10, 9.70it/s] 102it [00:10, 9.13it/s] 103it [00:10, 9.33it/s] 104it [00:10, 9.47it/s] 105it [00:10, 9.57it/s] 106it [00:11, 9.06it/s] 107it [00:11, 9.30it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.58it/s] 110it [00:11, 9.65it/s] 111it [00:11, 9.72it/s] 112it [00:11, 9.77it/s] 113it [00:11, 9.80it/s] 114it [00:11, 9.81it/s] 115it [00:11, 9.82it/s] 116it [00:12, 9.84it/s] 117it [00:12, 9.85it/s] 118it [00:12, 9.86it/s] 119it [00:12, 9.86it/s] 120it [00:12, 9.74it/s] 121it [00:12, 9.79it/s] 122it [00:12, 9.80it/s] 123it [00:12, 9.82it/s] 124it [00:12, 9.83it/s] 125it [00:12, 9.83it/s] 126it [00:13, 9.79it/s] 127it [00:13, 9.33it/s] 128it [00:13, 9.46it/s] 129it [00:13, 9.59it/s] 130it [00:13, 9.20it/s] 131it [00:13, 9.34it/s] 132it [00:13, 9.33it/s] 133it [00:13, 9.40it/s] 134it [00:13, 9.51it/s] 135it [00:14, 9.61it/s] 136it [00:14, 9.69it/s] 137it [00:14, 9.71it/s] 138it [00:14, 9.75it/s] 139it [00:14, 9.76it/s] 140it [00:14, 9.78it/s] 141it [00:14, 9.79it/s] 142it [00:14, 9.81it/s] 143it [00:14, 9.80it/s] 144it [00:14, 9.31it/s] 145it [00:15, 9.45it/s] 146it [00:15, 9.55it/s] 147it [00:15, 9.61it/s] 148it [00:15, 9.68it/s] 149it [00:15, 9.73it/s] 150it [00:15, 9.75it/s]2025-05-26 03:27:04,527 - INFO - [Epoch 035 | Batch 0150] IWAE-loss 5995.6523 | mean log_px -0.0361 | KL -3514.44 + 151it [00:15, 9.77it/s] 152it [00:15, 9.76it/s] 153it [00:15, 9.79it/s] 154it [00:15, 9.80it/s] 155it [00:16, 9.81it/s] 156it [00:16, 9.82it/s] 157it [00:16, 9.83it/s] 158it [00:16, 9.84it/s] 159it [00:16, 9.20it/s] 160it [00:16, 9.37it/s] 161it [00:16, 9.46it/s] 162it [00:16, 9.55it/s] 163it [00:16, 9.63it/s] 164it [00:17, 9.68it/s] 165it [00:17, 9.73it/s] 166it [00:17, 9.75it/s] 167it [00:17, 9.79it/s] 168it [00:17, 9.79it/s] 169it [00:17, 9.81it/s] 170it [00:17, 9.81it/s] 171it [00:17, 9.80it/s] 172it [00:17, 9.81it/s] 173it [00:17, 9.83it/s] 174it [00:18, 9.81it/s] 175it [00:18, 9.83it/s] 176it [00:18, 9.22it/s] 177it [00:18, 9.39it/s] 178it [00:18, 9.52it/s] 179it [00:18, 9.61it/s] 180it [00:18, 9.19it/s] 181it [00:18, 9.37it/s] 182it [00:18, 9.50it/s] 183it [00:19, 9.59it/s] 184it [00:19, 9.64it/s] 185it [00:19, 9.70it/s] 186it [00:19, 9.72it/s] 187it [00:19, 9.76it/s] 188it [00:19, 9.76it/s] 189it [00:19, 9.79it/s] 190it [00:19, 9.76it/s] 191it [00:19, 9.80it/s] 192it [00:19, 9.79it/s] 193it [00:20, 9.80it/s] 194it [00:20, 9.06it/s] 195it [00:20, 8.48it/s] 196it [00:20, 8.84it/s] 196it [00:20, 9.58it/s] +2025-05-26 03:27:09,338 - INFO - Epoch: 35, Objective: tensor([5837.2930], device='cuda:0', grad_fn=), Loss: 0.03758452087640762, KL/n: 71.64217376708984 + 0it [00:00, ?it/s]2025-05-26 03:27:09,796 - INFO - [Epoch 036 | Batch 0000] IWAE-loss 5874.6455 | mean log_px -0.0372 | KL -3509.21 + 1it [00:00, 4.72it/s] 2it [00:00, 6.79it/s] 3it [00:00, 7.92it/s] 4it [00:00, 8.58it/s] 5it [00:00, 8.53it/s] 6it [00:00, 8.86it/s] 7it [00:00, 9.14it/s] 8it [00:00, 9.31it/s] 9it [00:01, 9.35it/s] 10it [00:01, 8.89it/s] 11it [00:01, 9.15it/s] 12it [00:01, 9.34it/s] 13it [00:01, 9.47it/s] 14it [00:01, 9.57it/s] 15it [00:01, 9.62it/s] 16it [00:01, 9.67it/s] 17it [00:01, 9.69it/s] 18it [00:01, 9.72it/s] 19it [00:02, 9.71it/s] 20it [00:02, 9.72it/s] 21it [00:02, 9.74it/s] 22it [00:02, 9.75it/s] 23it [00:02, 9.41it/s] 24it [00:02, 9.47it/s] 25it [00:02, 9.58it/s] 26it [00:02, 9.63it/s] 27it [00:02, 9.65it/s] 28it [00:03, 9.66it/s] 29it [00:03, 9.65it/s] 30it [00:03, 9.69it/s] 31it [00:03, 9.12it/s] 32it [00:03, 9.31it/s] 33it [00:03, 9.46it/s] 34it [00:03, 8.98it/s] 35it [00:03, 9.21it/s] 36it [00:03, 9.37it/s] 37it [00:03, 9.50it/s] 38it [00:04, 9.59it/s] 39it [00:04, 9.67it/s] 40it [00:04, 9.71it/s] 41it [00:04, 9.73it/s] 42it [00:04, 9.73it/s] 43it [00:04, 9.78it/s] 44it [00:04, 9.77it/s] 45it [00:04, 9.78it/s] 46it [00:04, 9.69it/s] 47it [00:05, 9.52it/s] 48it [00:05, 9.56it/s] 49it [00:05, 9.59it/s] 50it [00:05, 9.66it/s]2025-05-26 03:27:15,056 - INFO - [Epoch 036 | Batch 0050] IWAE-loss 5224.4829 | mean log_px -0.0283 | KL -3501.39 + 51it [00:05, 9.41it/s] 52it [00:05, 9.51it/s] 53it [00:05, 9.59it/s] 54it [00:05, 9.11it/s] 55it [00:05, 9.26it/s] 56it [00:05, 9.38it/s] 57it [00:06, 9.52it/s] 58it [00:06, 9.60it/s] 59it [00:06, 9.69it/s] 60it [00:06, 9.14it/s] 61it [00:06, 9.27it/s] 62it [00:06, 9.35it/s] 63it [00:06, 9.45it/s] 64it [00:06, 9.54it/s] 65it [00:06, 9.59it/s] 66it [00:07, 9.52it/s] 67it [00:07, 9.58it/s] 68it [00:07, 9.00it/s] 69it [00:07, 9.17it/s] 70it [00:07, 9.35it/s] 71it [00:07, 9.51it/s] 72it [00:07, 9.61it/s] 73it [00:07, 9.68it/s] 74it [00:07, 9.74it/s] 75it [00:07, 9.79it/s] 76it [00:08, 9.80it/s] 77it [00:08, 9.83it/s] 78it [00:08, 9.83it/s] 79it [00:08, 9.86it/s] 80it [00:08, 9.86it/s] 81it [00:08, 9.86it/s] 82it [00:08, 9.86it/s] 83it [00:08, 9.86it/s] 84it [00:08, 9.85it/s] 85it [00:08, 9.87it/s] 86it [00:09, 9.87it/s] 87it [00:09, 9.89it/s] 88it [00:09, 9.86it/s] 89it [00:09, 9.86it/s] 90it [00:09, 9.25it/s] 91it [00:09, 9.43it/s] 92it [00:09, 9.55it/s] 93it [00:09, 9.65it/s] 94it [00:09, 9.72it/s] 95it [00:10, 9.77it/s] 96it [00:10, 9.43it/s] 97it [00:10, 9.56it/s] 98it [00:10, 9.65it/s] 99it [00:10, 9.71it/s] 100it [00:10, 9.76it/s]2025-05-26 03:27:20,264 - INFO - [Epoch 036 | Batch 0100] IWAE-loss 8589.2041 | mean log_px -0.0804 | KL -3509.35 + 101it [00:10, 9.79it/s] 102it [00:10, 9.81it/s] 103it [00:10, 9.84it/s] 104it [00:10, 9.84it/s] 105it [00:11, 9.86it/s] 106it [00:11, 9.86it/s] 107it [00:11, 9.86it/s] 108it [00:11, 9.85it/s] 109it [00:11, 9.86it/s] 110it [00:11, 9.85it/s] 111it [00:11, 9.85it/s] 112it [00:11, 9.84it/s] 113it [00:11, 9.86it/s] 114it [00:11, 9.84it/s] 115it [00:12, 9.86it/s] 116it [00:12, 9.85it/s] 117it [00:12, 9.78it/s] 118it [00:12, 9.76it/s] 119it [00:12, 9.79it/s] 120it [00:12, 9.80it/s] 121it [00:12, 9.83it/s] 122it [00:12, 9.84it/s] 123it [00:12, 9.86it/s] 124it [00:12, 9.84it/s] 125it [00:13, 9.83it/s] 126it [00:13, 9.81it/s] 127it [00:13, 9.82it/s] 128it [00:13, 9.83it/s] 129it [00:13, 9.57it/s] 130it [00:13, 9.09it/s] 131it [00:13, 9.30it/s] 132it [00:13, 9.39it/s] 133it [00:13, 9.54it/s] 134it [00:14, 9.06it/s] 135it [00:14, 9.27it/s] 136it [00:14, 9.44it/s] 137it [00:14, 9.56it/s] 138it [00:14, 9.24it/s] 139it [00:14, 9.38it/s] 140it [00:14, 8.92it/s] 141it [00:14, 9.17it/s] 142it [00:14, 9.36it/s] 143it [00:15, 9.52it/s] 144it [00:15, 9.61it/s] 145it [00:15, 9.69it/s] 146it [00:15, 9.74it/s] 147it [00:15, 9.79it/s] 148it [00:15, 9.79it/s] 149it [00:15, 9.82it/s] 150it [00:15, 9.83it/s]2025-05-26 03:27:25,437 - INFO - [Epoch 036 | Batch 0150] IWAE-loss 5136.7231 | mean log_px -0.0261 | KL -3499.86 + 151it [00:15, 9.81it/s] 152it [00:15, 9.83it/s] 153it [00:16, 9.86it/s] 154it [00:16, 9.85it/s] 155it [00:16, 9.87it/s] 156it [00:16, 9.86it/s] 157it [00:16, 9.85it/s] 158it [00:16, 9.62it/s] 159it [00:16, 9.62it/s] 160it [00:16, 9.66it/s] 161it [00:16, 9.73it/s] 162it [00:16, 9.77it/s] 163it [00:17, 9.80it/s] 164it [00:17, 9.82it/s] 165it [00:17, 9.69it/s] 166it [00:17, 9.69it/s] 167it [00:17, 9.63it/s] 168it [00:17, 9.62it/s] 169it [00:17, 9.56it/s] 170it [00:17, 9.56it/s] 171it [00:17, 9.59it/s] 172it [00:17, 9.64it/s] 173it [00:18, 9.58it/s] 174it [00:18, 9.50it/s] 175it [00:18, 9.55it/s] 176it [00:18, 9.57it/s] 177it [00:18, 9.23it/s] 178it [00:18, 9.27it/s] 179it [00:18, 9.33it/s] 180it [00:18, 9.37it/s] 181it [00:18, 9.39it/s] 182it [00:19, 9.47it/s] 183it [00:19, 9.52it/s] 184it [00:19, 9.50it/s] 185it [00:19, 9.54it/s] 186it [00:19, 9.50it/s] 187it [00:19, 8.91it/s] 188it [00:19, 9.03it/s] 189it [00:19, 9.14it/s] 190it [00:19, 9.27it/s] 191it [00:20, 9.32it/s] 192it [00:20, 9.36it/s] 193it [00:20, 9.37it/s] 194it [00:20, 9.36it/s] 195it [00:20, 8.84it/s] 196it [00:20, 9.07it/s] 196it [00:20, 9.49it/s] +2025-05-26 03:27:30,297 - INFO - Epoch: 36, Objective: tensor([6148.1465], device='cuda:0', grad_fn=), Loss: 0.04331137239933014, KL/n: 71.53656005859375 + 0it [00:00, ?it/s]2025-05-26 03:27:30,569 - INFO - [Epoch 037 | Batch 0000] IWAE-loss 5157.5024 | mean log_px -0.0263 | KL -3506.90 + 1it [00:00, 5.40it/s] 2it [00:00, 7.20it/s] 3it [00:00, 8.04it/s] 4it [00:00, 8.67it/s] 5it [00:00, 8.94it/s] 6it [00:00, 9.16it/s] 7it [00:00, 9.34it/s] 8it [00:00, 9.45it/s] 9it [00:01, 9.17it/s] 10it [00:01, 9.30it/s] 11it [00:01, 9.45it/s] 12it [00:01, 9.52it/s] 13it [00:01, 8.94it/s] 14it [00:01, 9.14it/s] 15it [00:01, 9.31it/s] 16it [00:01, 9.38it/s] 17it [00:01, 9.49it/s] 18it [00:01, 9.53it/s] 19it [00:02, 9.59it/s] 20it [00:02, 9.48it/s] 21it [00:02, 9.55it/s] 22it [00:02, 9.55it/s] 23it [00:02, 9.44it/s] 24it [00:02, 9.47it/s] 25it [00:02, 9.44it/s] 26it [00:02, 9.33it/s] 27it [00:02, 9.44it/s] 28it [00:03, 9.50it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.53it/s] 31it [00:03, 9.49it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.50it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.51it/s] 36it [00:03, 9.53it/s] 37it [00:03, 9.57it/s] 38it [00:04, 9.58it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.55it/s] 41it [00:04, 9.54it/s] 42it [00:04, 9.57it/s] 43it [00:04, 9.53it/s] 44it [00:04, 9.51it/s] 45it [00:04, 9.52it/s] 46it [00:04, 9.51it/s] 47it [00:05, 9.51it/s] 48it [00:05, 9.51it/s] 49it [00:05, 9.08it/s] 50it [00:05, 9.19it/s]2025-05-26 03:27:35,858 - INFO - [Epoch 037 | Batch 0050] IWAE-loss 6418.6987 | mean log_px -0.0469 | KL -3502.43 + 51it [00:05, 9.24it/s] 52it [00:05, 9.10it/s] 53it [00:05, 9.11it/s] 54it [00:05, 9.24it/s] 55it [00:05, 9.37it/s] 56it [00:06, 9.50it/s] 57it [00:06, 9.62it/s] 58it [00:06, 9.65it/s] 59it [00:06, 9.64it/s] 60it [00:06, 9.66it/s] 61it [00:06, 9.69it/s] 62it [00:06, 9.68it/s] 63it [00:06, 9.06it/s] 64it [00:06, 9.22it/s] 65it [00:06, 9.34it/s] 66it [00:07, 9.43it/s] 67it [00:07, 9.57it/s] 68it [00:07, 9.63it/s] 69it [00:07, 9.70it/s] 70it [00:07, 9.73it/s] 71it [00:07, 9.74it/s] 72it [00:07, 9.73it/s] 73it [00:07, 9.77it/s] 74it [00:07, 9.79it/s] 75it [00:07, 9.76it/s] 76it [00:08, 9.77it/s] 77it [00:08, 9.77it/s] 78it [00:08, 9.72it/s] 79it [00:08, 9.73it/s] 80it [00:08, 9.69it/s] 81it [00:08, 9.70it/s] 82it [00:08, 9.69it/s] 83it [00:08, 9.20it/s] 84it [00:08, 9.31it/s] 85it [00:09, 9.45it/s] 86it [00:09, 9.54it/s] 87it [00:09, 9.04it/s] 88it [00:09, 9.21it/s] 89it [00:09, 9.36it/s] 90it [00:09, 9.47it/s] 91it [00:09, 9.56it/s] 92it [00:09, 9.64it/s] 93it [00:09, 9.65it/s] 94it [00:09, 9.50it/s] 95it [00:10, 8.85it/s] 96it [00:10, 9.09it/s] 97it [00:10, 9.32it/s] 98it [00:10, 9.45it/s] 99it [00:10, 9.55it/s] 100it [00:10, 9.62it/s]2025-05-26 03:27:41,115 - INFO - [Epoch 037 | Batch 0100] IWAE-loss 5038.2764 | mean log_px -0.0247 | KL -3498.83 + 101it [00:10, 9.64it/s] 102it [00:10, 9.69it/s] 103it [00:10, 9.26it/s] 104it [00:11, 9.43it/s] 105it [00:11, 9.55it/s] 106it [00:11, 9.64it/s] 107it [00:11, 9.69it/s] 108it [00:11, 9.74it/s] 109it [00:11, 9.77it/s] 110it [00:11, 9.80it/s] 111it [00:11, 9.81it/s] 112it [00:11, 9.82it/s] 113it [00:11, 9.83it/s] 114it [00:12, 9.83it/s] 115it [00:12, 9.86it/s] 116it [00:12, 9.85it/s] 117it [00:12, 9.86it/s] 118it [00:12, 9.86it/s] 119it [00:12, 9.87it/s] 120it [00:12, 9.86it/s] 121it [00:12, 9.85it/s] 122it [00:12, 9.86it/s] 123it [00:12, 9.79it/s] 124it [00:13, 9.80it/s] 125it [00:13, 9.84it/s] 126it [00:13, 9.84it/s] 127it [00:13, 9.86it/s] 128it [00:13, 9.86it/s] 129it [00:13, 9.87it/s] 130it [00:13, 9.87it/s] 131it [00:13, 9.85it/s] 132it [00:13, 9.87it/s] 133it [00:14, 9.60it/s] 134it [00:14, 9.20it/s] 135it [00:14, 9.28it/s] 136it [00:14, 9.45it/s] 137it [00:14, 9.58it/s] 138it [00:14, 9.64it/s] 139it [00:14, 9.71it/s] 140it [00:14, 9.74it/s] 141it [00:14, 9.77it/s] 142it [00:14, 9.79it/s] 143it [00:15, 9.33it/s] 144it [00:15, 9.48it/s] 145it [00:15, 9.58it/s] 146it [00:15, 9.65it/s] 147it [00:15, 9.71it/s] 148it [00:15, 9.75it/s] 149it [00:15, 9.18it/s] 150it [00:15, 9.36it/s]2025-05-26 03:27:46,281 - INFO - [Epoch 037 | Batch 0150] IWAE-loss 6093.8408 | mean log_px -0.0371 | KL -3496.12 + 151it [00:15, 9.49it/s] 152it [00:15, 9.59it/s] 153it [00:16, 9.68it/s] 154it [00:16, 9.74it/s] 155it [00:16, 9.80it/s] 156it [00:16, 9.83it/s] 157it [00:16, 9.85it/s] 158it [00:16, 9.72it/s] 159it [00:16, 9.77it/s] 160it [00:16, 9.80it/s] 161it [00:16, 9.83it/s] 162it [00:17, 9.83it/s] 163it [00:17, 9.85it/s] 164it [00:17, 9.86it/s] 165it [00:17, 9.88it/s] 166it [00:17, 9.88it/s] 167it [00:17, 9.87it/s] 168it [00:17, 9.85it/s] 169it [00:17, 9.85it/s] 170it [00:17, 9.81it/s] 171it [00:17, 9.81it/s] 172it [00:18, 9.82it/s] 173it [00:18, 9.75it/s] 174it [00:18, 9.72it/s] 175it [00:18, 9.69it/s] 176it [00:18, 9.73it/s] 177it [00:18, 9.79it/s] 178it [00:18, 9.81it/s] 179it [00:18, 9.81it/s] 180it [00:18, 9.84it/s] 181it [00:18, 9.85it/s] 182it [00:19, 9.84it/s] 183it [00:19, 9.87it/s] 184it [00:19, 9.89it/s] 185it [00:19, 9.90it/s] 186it [00:19, 9.90it/s] 187it [00:19, 9.91it/s] 188it [00:19, 9.90it/s] 189it [00:19, 9.89it/s] 190it [00:19, 9.89it/s] 191it [00:19, 9.89it/s] 192it [00:20, 9.78it/s] 193it [00:20, 9.80it/s] 194it [00:20, 9.81it/s] 195it [00:20, 9.23it/s] 196it [00:20, 9.54it/s] +2025-05-26 03:27:50,974 - INFO - Epoch: 37, Objective: tensor([7495.4062], device='cuda:0', grad_fn=), Loss: 0.06337570399045944, KL/n: 71.414794921875 + 0it [00:00, ?it/s]2025-05-26 03:27:51,428 - INFO - [Epoch 038 | Batch 0000] IWAE-loss 8049.1758 | mean log_px -0.0730 | KL -3499.70 + 1it [00:00, 5.36it/s] 2it [00:00, 7.29it/s] 3it [00:00, 8.30it/s] 4it [00:00, 8.86it/s] 5it [00:00, 9.23it/s] 6it [00:00, 9.43it/s] 7it [00:00, 8.95it/s] 8it [00:00, 9.21it/s] 9it [00:01, 9.41it/s] 10it [00:01, 9.54it/s] 11it [00:01, 9.26it/s] 12it [00:01, 9.41it/s] 13it [00:01, 9.57it/s] 14it [00:01, 9.63it/s] 15it [00:01, 9.68it/s] 16it [00:01, 9.72it/s] 17it [00:01, 9.39it/s] 18it [00:01, 9.51it/s] 19it [00:02, 9.62it/s] 20it [00:02, 9.68it/s] 21it [00:02, 9.23it/s] 22it [00:02, 9.33it/s] 23it [00:02, 9.48it/s] 24it [00:02, 9.60it/s] 25it [00:02, 9.30it/s] 26it [00:02, 9.46it/s] 27it [00:02, 9.58it/s] 28it [00:03, 9.65it/s] 29it [00:03, 9.72it/s] 30it [00:03, 9.77it/s] 31it [00:03, 9.80it/s] 32it [00:03, 9.26it/s] 33it [00:03, 9.45it/s] 34it [00:03, 9.59it/s] 35it [00:03, 9.69it/s] 36it [00:03, 9.75it/s] 37it [00:03, 9.80it/s] 38it [00:04, 9.78it/s] 39it [00:04, 9.01it/s] 40it [00:04, 8.97it/s] 41it [00:04, 9.15it/s] 42it [00:04, 9.36it/s] 43it [00:04, 9.52it/s] 44it [00:04, 9.62it/s] 45it [00:04, 9.70it/s] 46it [00:04, 9.74it/s] 47it [00:04, 9.79it/s] 48it [00:05, 9.82it/s] 49it [00:05, 9.84it/s] 50it [00:05, 9.85it/s]2025-05-26 03:27:56,653 - INFO - [Epoch 038 | Batch 0050] IWAE-loss 5952.2158 | mean log_px -0.0410 | KL -3503.08 + 51it [00:05, 9.71it/s] 52it [00:05, 9.26it/s] 53it [00:05, 9.33it/s] 54it [00:05, 9.43it/s] 55it [00:05, 9.58it/s] 56it [00:05, 9.65it/s] 57it [00:06, 9.73it/s] 58it [00:06, 9.77it/s] 59it [00:06, 9.81it/s] 60it [00:06, 9.83it/s] 61it [00:06, 9.86it/s] 62it [00:06, 9.86it/s] 63it [00:06, 9.88it/s] 64it [00:06, 9.86it/s] 65it [00:06, 9.87it/s] 66it [00:06, 9.86it/s] 67it [00:07, 9.88it/s] 68it [00:07, 9.88it/s] 69it [00:07, 9.88it/s] 70it [00:07, 9.88it/s] 71it [00:07, 9.87it/s] 72it [00:07, 9.86it/s] 73it [00:07, 9.87it/s] 74it [00:07, 9.84it/s] 75it [00:07, 9.83it/s] 76it [00:07, 9.83it/s] 77it [00:08, 9.86it/s] 78it [00:08, 9.85it/s] 79it [00:08, 9.85it/s] 80it [00:08, 9.84it/s] 81it [00:08, 9.35it/s] 82it [00:08, 9.48it/s] 83it [00:08, 9.60it/s] 84it [00:08, 9.63it/s] 85it [00:08, 9.71it/s] 86it [00:09, 9.74it/s] 87it [00:09, 9.79it/s] 88it [00:09, 9.79it/s] 89it [00:09, 9.81it/s] 90it [00:09, 9.82it/s] 91it [00:09, 9.19it/s] 92it [00:09, 9.34it/s] 93it [00:09, 9.50it/s] 94it [00:09, 9.60it/s] 95it [00:09, 9.66it/s] 96it [00:10, 9.72it/s] 97it [00:10, 9.78it/s] 98it [00:10, 9.81it/s] 99it [00:10, 9.82it/s] 100it [00:10, 9.81it/s]2025-05-26 03:28:01,792 - INFO - [Epoch 038 | Batch 0100] IWAE-loss 7382.7646 | mean log_px -0.0584 | KL -3494.08 + 101it [00:10, 9.19it/s] 102it [00:10, 9.24it/s] 103it [00:10, 9.41it/s] 104it [00:10, 9.52it/s] 105it [00:10, 9.62it/s] 106it [00:11, 9.19it/s] 107it [00:11, 9.31it/s] 108it [00:11, 9.46it/s] 109it [00:11, 9.56it/s] 110it [00:11, 9.63it/s] 111it [00:11, 9.67it/s] 112it [00:11, 9.72it/s] 113it [00:11, 9.66it/s] 114it [00:11, 9.71it/s] 115it [00:12, 9.73it/s] 116it [00:12, 9.74it/s] 117it [00:12, 9.77it/s] 118it [00:12, 9.78it/s] 119it [00:12, 9.81it/s] 120it [00:12, 9.79it/s] 121it [00:12, 9.81it/s] 122it [00:12, 9.78it/s] 123it [00:12, 9.80it/s] 124it [00:12, 9.79it/s] 125it [00:13, 9.80it/s] 126it [00:13, 9.82it/s] 127it [00:13, 9.84it/s] 128it [00:13, 9.83it/s] 129it [00:13, 9.07it/s] 130it [00:13, 9.23it/s] 131it [00:13, 9.40it/s] 132it [00:13, 9.53it/s] 133it [00:13, 9.58it/s] 134it [00:14, 9.26it/s] 135it [00:14, 9.40it/s] 136it [00:14, 9.07it/s] 137it [00:14, 9.27it/s] 138it [00:14, 9.40it/s] 139it [00:14, 9.53it/s] 140it [00:14, 9.62it/s] 141it [00:14, 9.17it/s] 142it [00:14, 9.35it/s] 143it [00:14, 9.51it/s] 144it [00:15, 9.11it/s] 145it [00:15, 9.26it/s] 146it [00:15, 9.42it/s] 147it [00:15, 9.49it/s] 148it [00:15, 9.56it/s] 149it [00:15, 9.67it/s] 150it [00:15, 9.22it/s]2025-05-26 03:28:07,061 - INFO - [Epoch 038 | Batch 0150] IWAE-loss 5241.9893 | mean log_px -0.0268 | KL -3495.52 + 151it [00:15, 9.39it/s] 152it [00:15, 9.53it/s] 153it [00:16, 9.62it/s] 154it [00:16, 9.64it/s] 155it [00:16, 9.70it/s] 156it [00:16, 9.73it/s] 157it [00:16, 9.77it/s] 158it [00:16, 9.81it/s] 159it [00:16, 9.82it/s] 160it [00:16, 9.79it/s] 161it [00:16, 9.71it/s] 162it [00:16, 9.63it/s] 163it [00:17, 9.70it/s] 164it [00:17, 9.74it/s] 165it [00:17, 9.78it/s] 166it [00:17, 9.79it/s] 167it [00:17, 9.80it/s] 168it [00:17, 9.80it/s] 169it [00:17, 9.83it/s] 170it [00:17, 9.83it/s] 171it [00:17, 9.83it/s] 172it [00:17, 9.82it/s] 173it [00:18, 9.84it/s] 174it [00:18, 9.83it/s] 175it [00:18, 9.85it/s] 176it [00:18, 9.86it/s] 177it [00:18, 9.88it/s] 178it [00:18, 9.86it/s] 179it [00:18, 9.83it/s] 180it [00:18, 9.72it/s] 181it [00:18, 9.70it/s] 182it [00:18, 9.73it/s] 183it [00:19, 9.79it/s] 184it [00:19, 9.82it/s] 185it [00:19, 9.84it/s] 186it [00:19, 9.85it/s] 187it [00:19, 9.85it/s] 188it [00:19, 9.86it/s] 189it [00:19, 9.67it/s] 190it [00:19, 9.74it/s] 191it [00:19, 9.79it/s] 192it [00:20, 9.82it/s] 193it [00:20, 9.84it/s] 194it [00:20, 9.83it/s] 195it [00:20, 9.26it/s] 196it [00:20, 9.56it/s] +2025-05-26 03:28:11,776 - INFO - Epoch: 38, Objective: tensor([6876.5137], device='cuda:0', grad_fn=), Loss: 0.05297667905688286, KL/n: 71.28185272216797 + 0it [00:00, ?it/s]2025-05-26 03:28:12,061 - INFO - [Epoch 039 | Batch 0000] IWAE-loss 6343.7041 | mean log_px -0.0524 | KL -3491.50 + 1it [00:00, 4.52it/s] 2it [00:00, 6.58it/s] 3it [00:00, 7.78it/s] 4it [00:00, 8.49it/s] 5it [00:00, 8.94it/s] 6it [00:00, 9.22it/s] 7it [00:00, 8.90it/s] 8it [00:00, 9.17it/s] 9it [00:01, 9.38it/s] 10it [00:01, 9.46it/s] 11it [00:01, 9.57it/s] 12it [00:01, 9.04it/s] 13it [00:01, 9.28it/s] 14it [00:01, 9.43it/s] 15it [00:01, 9.56it/s] 16it [00:01, 9.65it/s] 17it [00:01, 9.70it/s] 18it [00:01, 9.74it/s] 19it [00:02, 9.76it/s] 20it [00:02, 9.75it/s] 21it [00:02, 9.20it/s] 22it [00:02, 9.39it/s] 23it [00:02, 9.51it/s] 24it [00:02, 9.59it/s] 25it [00:02, 9.19it/s] 26it [00:02, 9.36it/s] 27it [00:02, 9.51it/s] 28it [00:03, 9.13it/s] 29it [00:03, 9.35it/s] 30it [00:03, 9.48it/s] 31it [00:03, 9.59it/s] 32it [00:03, 9.04it/s] 33it [00:03, 9.27it/s] 34it [00:03, 9.42it/s] 35it [00:03, 9.54it/s] 36it [00:03, 9.63it/s] 37it [00:04, 9.70it/s] 38it [00:04, 9.74it/s] 39it [00:04, 9.77it/s] 40it [00:04, 9.78it/s] 41it [00:04, 9.81it/s] 42it [00:04, 9.82it/s] 43it [00:04, 9.83it/s] 44it [00:04, 9.82it/s] 45it [00:04, 9.85it/s] 46it [00:04, 9.81it/s] 47it [00:05, 9.85it/s] 48it [00:05, 9.84it/s] 49it [00:05, 9.85it/s] 50it [00:05, 9.86it/s]2025-05-26 03:28:17,298 - INFO - [Epoch 039 | Batch 0050] IWAE-loss 5679.2578 | mean log_px -0.0351 | KL -3490.73 + 51it [00:05, 9.84it/s] 52it [00:05, 9.85it/s] 53it [00:05, 9.86it/s] 54it [00:05, 9.84it/s] 55it [00:05, 9.87it/s] 56it [00:05, 9.86it/s] 57it [00:06, 9.87it/s] 58it [00:06, 9.86it/s] 59it [00:06, 9.84it/s] 60it [00:06, 9.83it/s] 61it [00:06, 9.84it/s] 62it [00:06, 9.84it/s] 63it [00:06, 9.85it/s] 64it [00:06, 9.85it/s] 65it [00:06, 9.85it/s] 66it [00:06, 9.85it/s] 67it [00:07, 9.85it/s] 68it [00:07, 9.72it/s] 69it [00:07, 9.73it/s] 70it [00:07, 9.77it/s] 71it [00:07, 9.81it/s] 72it [00:07, 9.76it/s] 73it [00:07, 9.71it/s] 74it [00:07, 9.74it/s] 75it [00:07, 9.16it/s] 76it [00:08, 9.29it/s] 77it [00:08, 9.27it/s] 78it [00:08, 9.30it/s] 79it [00:08, 9.42it/s] 80it [00:08, 9.50it/s] 81it [00:08, 9.59it/s] 82it [00:08, 9.64it/s] 83it [00:08, 9.47it/s] 84it [00:08, 9.53it/s] 85it [00:08, 9.08it/s] 86it [00:09, 9.27it/s] 87it [00:09, 9.43it/s] 88it [00:09, 9.53it/s] 89it [00:09, 9.01it/s] 90it [00:09, 9.21it/s] 91it [00:09, 9.37it/s] 92it [00:09, 9.49it/s] 93it [00:09, 9.59it/s] 94it [00:09, 9.19it/s] 95it [00:10, 9.37it/s] 96it [00:10, 9.48it/s] 97it [00:10, 9.57it/s] 98it [00:10, 9.64it/s] 99it [00:10, 9.69it/s] 100it [00:10, 9.72it/s]2025-05-26 03:28:22,507 - INFO - [Epoch 039 | Batch 0100] IWAE-loss 5635.9746 | mean log_px -0.0364 | KL -3484.96 + 101it [00:10, 9.74it/s] 102it [00:10, 9.75it/s] 103it [00:10, 9.78it/s] 104it [00:10, 9.80it/s] 105it [00:11, 9.81it/s] 106it [00:11, 9.80it/s] 107it [00:11, 9.82it/s] 108it [00:11, 9.80it/s] 109it [00:11, 9.80it/s] 110it [00:11, 9.78it/s] 111it [00:11, 9.78it/s] 112it [00:11, 9.77it/s] 113it [00:11, 9.80it/s] 114it [00:11, 9.80it/s] 115it [00:12, 9.81it/s] 116it [00:12, 9.80it/s] 117it [00:12, 9.79it/s] 118it [00:12, 9.80it/s] 119it [00:12, 9.82it/s] 120it [00:12, 9.80it/s] 121it [00:12, 9.82it/s] 122it [00:12, 9.80it/s] 123it [00:12, 9.70it/s] 124it [00:12, 9.74it/s] 125it [00:13, 9.77it/s] 126it [00:13, 9.78it/s] 127it [00:13, 9.80it/s] 128it [00:13, 9.78it/s] 129it [00:13, 9.79it/s] 130it [00:13, 9.18it/s] 131it [00:13, 9.32it/s] 132it [00:13, 9.45it/s] 133it [00:13, 9.56it/s] 134it [00:14, 9.04it/s] 135it [00:14, 9.24it/s] 136it [00:14, 9.37it/s] 137it [00:14, 9.47it/s] 138it [00:14, 9.57it/s] 139it [00:14, 9.65it/s] 140it [00:14, 9.70it/s] 141it [00:14, 9.74it/s] 142it [00:14, 9.77it/s] 143it [00:14, 9.79it/s] 144it [00:15, 9.78it/s] 145it [00:15, 9.80it/s] 146it [00:15, 9.78it/s] 147it [00:15, 9.80it/s] 148it [00:15, 9.80it/s] 149it [00:15, 9.81it/s] 150it [00:15, 9.82it/s]2025-05-26 03:28:27,659 - INFO - [Epoch 039 | Batch 0150] IWAE-loss 6551.1885 | mean log_px -0.0438 | KL -3480.69 + 151it [00:15, 9.81it/s] 152it [00:15, 9.81it/s] 153it [00:15, 9.81it/s] 154it [00:16, 9.81it/s] 155it [00:16, 9.82it/s] 156it [00:16, 9.77it/s] 157it [00:16, 9.80it/s] 158it [00:16, 9.18it/s] 159it [00:16, 9.34it/s] 160it [00:16, 9.44it/s] 161it [00:16, 9.53it/s] 162it [00:16, 9.56it/s] 163it [00:17, 9.63it/s] 164it [00:17, 9.65it/s] 165it [00:17, 9.09it/s] 166it [00:17, 9.31it/s] 167it [00:17, 9.47it/s] 168it [00:17, 8.98it/s] 169it [00:17, 9.09it/s] 170it [00:17, 9.23it/s] 171it [00:17, 9.36it/s] 172it [00:18, 9.48it/s] 173it [00:18, 9.60it/s] 174it [00:18, 9.65it/s] 175it [00:18, 9.72it/s] 176it [00:18, 9.74it/s] 177it [00:18, 9.77it/s] 178it [00:18, 9.79it/s] 179it [00:18, 9.81it/s] 180it [00:18, 9.82it/s] 181it [00:18, 9.68it/s] 182it [00:19, 9.71it/s] 183it [00:19, 9.74it/s] 184it [00:19, 9.76it/s] 185it [00:19, 9.79it/s] 186it [00:19, 9.71it/s] 187it [00:19, 9.74it/s] 188it [00:19, 9.77it/s] 189it [00:19, 9.79it/s] 190it [00:19, 9.80it/s] 191it [00:19, 9.83it/s] 192it [00:20, 9.83it/s] 193it [00:20, 9.84it/s] 194it [00:20, 9.81it/s] 195it [00:20, 9.24it/s] 196it [00:20, 9.06it/s] 196it [00:20, 9.53it/s] +2025-05-26 03:28:32,468 - INFO - Epoch: 39, Objective: tensor([6474.6235], device='cuda:0', grad_fn=), Loss: 0.045537568628787994, KL/n: 71.1382827758789 + 0it [00:00, ?it/s]2025-05-26 03:28:32,930 - INFO - [Epoch 040 | Batch 0000] IWAE-loss 7672.9946 | mean log_px -0.0628 | KL -3483.29 + 1it [00:00, 5.36it/s] 2it [00:00, 7.26it/s] 3it [00:00, 8.25it/s] 4it [00:00, 8.82it/s] 5it [00:00, 9.19it/s] 6it [00:00, 9.40it/s] 7it [00:00, 9.53it/s] 8it [00:00, 9.60it/s] 9it [00:01, 9.69it/s] 10it [00:01, 9.73it/s] 11it [00:01, 9.77it/s] 12it [00:01, 9.78it/s] 13it [00:01, 9.80it/s] 14it [00:01, 9.79it/s] 15it [00:01, 9.81it/s] 16it [00:01, 9.82it/s] 17it [00:01, 9.84it/s] 18it [00:01, 9.83it/s] 19it [00:02, 9.85it/s] 20it [00:02, 9.84it/s] 21it [00:02, 9.84it/s] 22it [00:02, 9.79it/s] 23it [00:02, 9.82it/s] 24it [00:02, 9.82it/s] 25it [00:02, 9.83it/s] 26it [00:02, 9.81it/s] 27it [00:02, 9.82it/s] 28it [00:02, 9.81it/s] 29it [00:03, 9.82it/s] 30it [00:03, 9.82it/s] 31it [00:03, 9.80it/s] 32it [00:03, 9.80it/s] 33it [00:03, 9.81it/s] 34it [00:03, 9.82it/s] 35it [00:03, 9.82it/s] 36it [00:03, 9.78it/s] 37it [00:03, 9.80it/s] 38it [00:03, 9.79it/s] 39it [00:04, 9.18it/s] 40it [00:04, 9.35it/s] 41it [00:04, 9.50it/s] 42it [00:04, 9.58it/s] 43it [00:04, 9.64it/s] 44it [00:04, 9.69it/s] 45it [00:04, 9.74it/s] 46it [00:04, 9.77it/s] 47it [00:04, 9.80it/s] 48it [00:04, 9.81it/s] 49it [00:05, 9.83it/s] 50it [00:05, 9.82it/s]2025-05-26 03:28:38,047 - INFO - [Epoch 040 | Batch 0050] IWAE-loss 5287.8018 | mean log_px -0.0307 | KL -3482.75 + 51it [00:05, 9.82it/s] 52it [00:05, 9.82it/s] 53it [00:05, 9.83it/s] 54it [00:05, 9.81it/s] 55it [00:05, 9.32it/s] 56it [00:05, 9.28it/s] 57it [00:05, 9.06it/s] 58it [00:06, 9.18it/s] 59it [00:06, 9.37it/s] 60it [00:06, 9.50it/s] 61it [00:06, 9.04it/s] 62it [00:06, 9.26it/s] 63it [00:06, 9.41it/s] 64it [00:06, 8.99it/s] 65it [00:06, 9.22it/s] 66it [00:06, 9.39it/s] 67it [00:07, 9.53it/s] 68it [00:07, 9.62it/s] 69it [00:07, 9.69it/s] 70it [00:07, 9.11it/s] 71it [00:07, 9.31it/s] 72it [00:07, 9.46it/s] 73it [00:07, 9.58it/s] 74it [00:07, 9.66it/s] 75it [00:07, 9.71it/s] 76it [00:07, 9.76it/s] 77it [00:08, 9.05it/s] 78it [00:08, 9.11it/s] 79it [00:08, 9.21it/s] 80it [00:08, 9.33it/s] 81it [00:08, 9.37it/s] 82it [00:08, 9.41it/s] 83it [00:08, 9.39it/s] 84it [00:08, 9.42it/s] 85it [00:08, 8.96it/s] 86it [00:09, 9.17it/s] 87it [00:09, 9.28it/s] 88it [00:09, 9.32it/s] 89it [00:09, 9.39it/s] 90it [00:09, 9.37it/s] 91it [00:09, 9.31it/s] 92it [00:09, 9.30it/s] 93it [00:09, 9.26it/s] 94it [00:09, 9.33it/s] 95it [00:10, 9.33it/s] 96it [00:10, 9.37it/s] 97it [00:10, 9.43it/s] 98it [00:10, 9.45it/s] 99it [00:10, 8.80it/s] 100it [00:10, 8.80it/s]2025-05-26 03:28:43,428 - INFO - [Epoch 040 | Batch 0100] IWAE-loss 6247.6255 | mean log_px -0.0492 | KL -3478.28 + 101it [00:10, 8.92it/s] 102it [00:10, 9.09it/s] 103it [00:10, 9.23it/s] 104it [00:10, 9.31it/s] 105it [00:11, 9.42it/s] 106it [00:11, 9.42it/s] 107it [00:11, 9.48it/s] 108it [00:11, 9.44it/s] 109it [00:11, 9.43it/s] 110it [00:11, 8.73it/s] 111it [00:11, 8.85it/s] 112it [00:11, 8.92it/s] 113it [00:12, 8.64it/s] 114it [00:12, 8.95it/s] 115it [00:12, 9.19it/s] 116it [00:12, 9.31it/s] 117it [00:12, 9.48it/s] 118it [00:12, 9.58it/s] 119it [00:12, 9.66it/s] 120it [00:12, 9.72it/s] 121it [00:12, 9.77it/s] 122it [00:12, 9.81it/s] 123it [00:13, 9.82it/s] 124it [00:13, 9.81it/s] 125it [00:13, 9.19it/s] 126it [00:13, 9.37it/s] 127it [00:13, 9.52it/s] 128it [00:13, 9.59it/s] 129it [00:13, 9.67it/s] 130it [00:13, 9.71it/s] 131it [00:13, 9.75it/s] 132it [00:13, 9.78it/s] 133it [00:14, 9.81it/s] 134it [00:14, 9.82it/s] 135it [00:14, 9.83it/s] 136it [00:14, 9.82it/s] 137it [00:14, 9.83it/s] 138it [00:14, 9.83it/s] 139it [00:14, 9.83it/s] 140it [00:14, 9.81it/s] 141it [00:14, 9.78it/s] 142it [00:15, 8.86it/s] 143it [00:15, 8.65it/s] 144it [00:15, 8.69it/s] 145it [00:15, 8.99it/s] 146it [00:15, 9.23it/s] 147it [00:15, 9.41it/s] 148it [00:15, 9.53it/s] 149it [00:15, 9.62it/s] 150it [00:15, 9.69it/s]2025-05-26 03:28:48,708 - INFO - [Epoch 040 | Batch 0150] IWAE-loss 6392.1655 | mean log_px -0.0420 | KL -3472.99 + 151it [00:15, 9.70it/s] 152it [00:16, 9.74it/s] 153it [00:16, 9.77it/s] 154it [00:16, 9.75it/s] 155it [00:16, 9.24it/s] 156it [00:16, 9.40it/s] 157it [00:16, 9.55it/s] 158it [00:16, 9.60it/s] 159it [00:16, 9.67it/s] 160it [00:16, 9.71it/s] 161it [00:17, 9.31it/s] 162it [00:17, 9.46it/s] 163it [00:17, 9.59it/s] 164it [00:17, 9.65it/s] 165it [00:17, 9.71it/s] 166it [00:17, 9.13it/s] 167it [00:17, 9.34it/s] 168it [00:17, 9.48it/s] 169it [00:17, 9.55it/s] 170it [00:17, 9.63it/s] 171it [00:18, 9.71it/s] 172it [00:18, 9.77it/s] 173it [00:18, 9.78it/s] 174it [00:18, 9.80it/s] 175it [00:18, 9.83it/s] 176it [00:18, 9.84it/s] 177it [00:18, 9.85it/s] 178it [00:18, 8.94it/s] 179it [00:18, 9.21it/s] 180it [00:19, 9.39it/s] 181it [00:19, 9.52it/s] 182it [00:19, 9.00it/s] 183it [00:19, 9.25it/s] 184it [00:19, 9.42it/s] 185it [00:19, 9.51it/s] 186it [00:19, 9.01it/s] 187it [00:19, 9.26it/s] 188it [00:19, 9.45it/s] 189it [00:19, 9.57it/s] 190it [00:20, 9.04it/s] 191it [00:20, 9.27it/s] 192it [00:20, 9.34it/s] 193it [00:20, 9.50it/s] 194it [00:20, 9.62it/s] 195it [00:20, 9.12it/s] 196it [00:20, 9.43it/s] +2025-05-26 03:28:53,572 - INFO - Epoch: 40, Objective: tensor([5746.3809], device='cuda:0', grad_fn=), Loss: 0.034290388226509094, KL/n: 70.98202514648438 + 0it [00:00, ?it/s]2025-05-26 03:28:53,852 - INFO - [Epoch 041 | Batch 0000] IWAE-loss 5749.5537 | mean log_px -0.0346 | KL -3479.12 + 1it [00:00, 5.22it/s] 2it [00:00, 7.07it/s] 3it [00:00, 8.15it/s] 4it [00:00, 8.73it/s] 5it [00:00, 9.12it/s] 6it [00:00, 8.84it/s] 7it [00:00, 9.11it/s] 8it [00:00, 9.22it/s] 9it [00:01, 9.41it/s] 10it [00:01, 9.54it/s] 11it [00:01, 9.64it/s] 12it [00:01, 9.71it/s] 13it [00:01, 9.76it/s] 14it [00:01, 9.78it/s] 15it [00:01, 9.82it/s] 16it [00:01, 9.82it/s] 17it [00:01, 9.85it/s] 18it [00:01, 9.82it/s] 19it [00:02, 9.35it/s] 20it [00:02, 9.50it/s] 21it [00:02, 9.62it/s] 22it [00:02, 9.65it/s] 23it [00:02, 9.72it/s] 24it [00:02, 9.76it/s] 25it [00:02, 9.79it/s] 26it [00:02, 9.82it/s] 27it [00:02, 9.85it/s] 28it [00:02, 9.86it/s] 29it [00:03, 9.88it/s] 30it [00:03, 9.89it/s] 31it [00:03, 9.89it/s] 32it [00:03, 9.89it/s] 33it [00:03, 9.89it/s] 34it [00:03, 9.88it/s] 35it [00:03, 9.89it/s] 36it [00:03, 9.88it/s] 37it [00:03, 9.89it/s] 38it [00:03, 9.89it/s] 39it [00:04, 9.91it/s] 40it [00:04, 9.89it/s] 41it [00:04, 9.89it/s] 42it [00:04, 9.87it/s] 43it [00:04, 9.88it/s] 44it [00:04, 9.23it/s] 45it [00:04, 9.41it/s] 46it [00:04, 9.53it/s] 47it [00:04, 9.62it/s] 48it [00:05, 9.10it/s] 49it [00:05, 9.31it/s] 50it [00:05, 9.47it/s]2025-05-26 03:28:59,015 - INFO - [Epoch 041 | Batch 0050] IWAE-loss 5837.0518 | mean log_px -0.0380 | KL -3473.68 + 51it [00:05, 9.54it/s] 52it [00:05, 9.03it/s] 53it [00:05, 9.27it/s] 54it [00:05, 9.42it/s] 55it [00:05, 8.99it/s] 56it [00:05, 9.18it/s] 57it [00:06, 9.39it/s] 58it [00:06, 9.52it/s] 59it [00:06, 9.61it/s] 60it [00:06, 9.69it/s] 61it [00:06, 9.74it/s] 62it [00:06, 9.27it/s] 63it [00:06, 9.45it/s] 64it [00:06, 9.57it/s] 65it [00:06, 9.64it/s] 66it [00:06, 9.69it/s] 67it [00:07, 9.75it/s] 68it [00:07, 9.77it/s] 69it [00:07, 9.81it/s] 70it [00:07, 9.81it/s] 71it [00:07, 9.84it/s] 72it [00:07, 9.85it/s] 73it [00:07, 9.85it/s] 74it [00:07, 9.83it/s] 75it [00:07, 9.84it/s] 76it [00:07, 9.84it/s] 77it [00:08, 9.77it/s] 78it [00:08, 9.78it/s] 79it [00:08, 9.82it/s] 80it [00:08, 9.82it/s] 81it [00:08, 9.84it/s] 82it [00:08, 9.85it/s] 83it [00:08, 9.24it/s] 84it [00:08, 9.41it/s] 85it [00:08, 9.55it/s] 86it [00:09, 9.43it/s] 87it [00:09, 9.42it/s] 88it [00:09, 9.46it/s] 89it [00:09, 9.53it/s] 90it [00:09, 9.53it/s] 91it [00:09, 8.99it/s] 92it [00:09, 9.12it/s] 93it [00:09, 9.23it/s] 94it [00:09, 9.31it/s] 95it [00:09, 9.34it/s] 96it [00:10, 9.29it/s] 97it [00:10, 9.35it/s] 98it [00:10, 9.36it/s] 99it [00:10, 9.39it/s] 100it [00:10, 9.38it/s]2025-05-26 03:29:04,270 - INFO - [Epoch 041 | Batch 0100] IWAE-loss 5281.2070 | mean log_px -0.0259 | KL -3478.21 + 101it [00:10, 8.87it/s] 102it [00:10, 9.07it/s] 103it [00:10, 9.21it/s] 104it [00:10, 9.29it/s] 105it [00:11, 9.34it/s] 106it [00:11, 9.39it/s] 107it [00:11, 9.39it/s] 108it [00:11, 9.32it/s] 109it [00:11, 9.35it/s] 110it [00:11, 9.39it/s] 111it [00:11, 9.41it/s] 112it [00:11, 9.47it/s] 113it [00:11, 9.48it/s] 114it [00:12, 9.44it/s] 115it [00:12, 8.93it/s] 116it [00:12, 9.05it/s] 117it [00:12, 9.20it/s] 118it [00:12, 9.29it/s] 119it [00:12, 9.35it/s] 120it [00:12, 9.38it/s] 121it [00:12, 9.42it/s] 122it [00:12, 9.44it/s] 123it [00:12, 9.42it/s] 124it [00:13, 9.27it/s] 125it [00:13, 9.33it/s] 126it [00:13, 9.32it/s] 127it [00:13, 8.58it/s] 128it [00:13, 8.87it/s] 129it [00:13, 9.08it/s] 130it [00:13, 9.21it/s] 131it [00:13, 9.32it/s] 132it [00:13, 9.29it/s] 133it [00:14, 8.86it/s] 134it [00:14, 9.04it/s] 135it [00:14, 9.16it/s] 136it [00:14, 9.21it/s] 137it [00:14, 9.32it/s] 138it [00:14, 9.34it/s] 139it [00:14, 9.33it/s] 140it [00:14, 8.84it/s] 141it [00:14, 9.04it/s] 142it [00:15, 9.17it/s] 143it [00:15, 9.19it/s] 144it [00:15, 9.29it/s] 145it [00:15, 9.35it/s] 146it [00:15, 9.32it/s] 147it [00:15, 9.33it/s] 148it [00:15, 9.37it/s] 149it [00:15, 9.42it/s] 150it [00:15, 9.47it/s]2025-05-26 03:29:09,680 - INFO - [Epoch 041 | Batch 0150] IWAE-loss 5604.3018 | mean log_px -0.0409 | KL -3472.15 + 151it [00:16, 9.50it/s] 152it [00:16, 9.49it/s] 153it [00:16, 9.54it/s] 154it [00:16, 9.50it/s] 155it [00:16, 9.01it/s] 156it [00:16, 9.15it/s] 157it [00:16, 9.27it/s] 158it [00:16, 9.32it/s] 159it [00:16, 9.37it/s] 160it [00:16, 9.46it/s] 161it [00:17, 9.46it/s] 162it [00:17, 9.44it/s] 163it [00:17, 9.47it/s] 164it [00:17, 9.46it/s] 165it [00:17, 9.47it/s] 166it [00:17, 9.47it/s] 167it [00:17, 9.46it/s] 168it [00:17, 9.44it/s] 169it [00:17, 9.40it/s] 170it [00:18, 9.43it/s] 171it [00:18, 9.47it/s] 172it [00:18, 9.48it/s] 173it [00:18, 9.48it/s] 174it [00:18, 8.97it/s] 175it [00:18, 9.11it/s] 176it [00:18, 9.19it/s] 177it [00:18, 9.28it/s] 178it [00:18, 9.33it/s] 179it [00:19, 9.36it/s] 180it [00:19, 9.38it/s] 181it [00:19, 9.45it/s] 182it [00:19, 9.43it/s] 183it [00:19, 9.46it/s] 184it [00:19, 9.42it/s] 185it [00:19, 9.42it/s] 186it [00:19, 9.42it/s] 187it [00:19, 9.48it/s] 188it [00:19, 9.48it/s] 189it [00:20, 9.46it/s] 190it [00:20, 9.47it/s] 191it [00:20, 9.40it/s] 192it [00:20, 9.41it/s] 193it [00:20, 8.91it/s] 194it [00:20, 9.03it/s] 195it [00:20, 8.60it/s] 196it [00:20, 8.63it/s] 196it [00:20, 9.37it/s] +2025-05-26 03:29:14,622 - INFO - Epoch: 41, Objective: tensor([4431.4009], device='cuda:0', grad_fn=), Loss: 0.017086666077375412, KL/n: 70.84024810791016 + 0it [00:00, ?it/s]2025-05-26 03:29:15,099 - INFO - [Epoch 042 | Batch 0000] IWAE-loss 7730.5332 | mean log_px -0.0675 | KL -3471.14 + 1it [00:00, 2.57it/s] 2it [00:00, 4.31it/s] 3it [00:00, 5.75it/s] 4it [00:00, 6.75it/s] 5it [00:00, 7.48it/s] 6it [00:00, 8.05it/s] 7it [00:01, 8.40it/s] 8it [00:01, 8.73it/s] 9it [00:01, 8.99it/s] 10it [00:01, 9.12it/s] 11it [00:01, 8.86it/s] 12it [00:01, 8.96it/s] 13it [00:01, 8.99it/s] 14it [00:01, 9.07it/s] 15it [00:01, 9.25it/s] 16it [00:02, 9.25it/s] 17it [00:02, 9.34it/s] 18it [00:02, 9.38it/s] 19it [00:02, 9.09it/s] 20it [00:02, 9.20it/s] 21it [00:02, 9.27it/s] 22it [00:02, 9.31it/s] 23it [00:02, 9.32it/s] 24it [00:02, 9.34it/s] 25it [00:02, 9.37it/s] 26it [00:03, 9.45it/s] 27it [00:03, 9.49it/s] 28it [00:03, 9.46it/s] 29it [00:03, 9.44it/s] 30it [00:03, 9.43it/s] 31it [00:03, 9.47it/s] 32it [00:03, 9.43it/s] 33it [00:03, 9.44it/s] 34it [00:03, 9.45it/s] 35it [00:04, 9.49it/s] 36it [00:04, 9.48it/s] 37it [00:04, 9.48it/s] 38it [00:04, 9.46it/s] 39it [00:04, 9.41it/s] 40it [00:04, 9.45it/s] 41it [00:04, 9.47it/s] 42it [00:04, 9.45it/s] 43it [00:04, 8.90it/s] 44it [00:05, 9.02it/s] 45it [00:05, 9.19it/s] 46it [00:05, 9.30it/s] 47it [00:05, 9.40it/s] 48it [00:05, 9.40it/s] 49it [00:05, 9.43it/s] 50it [00:05, 9.43it/s]2025-05-26 03:29:20,478 - INFO - [Epoch 042 | Batch 0050] IWAE-loss 6543.3037 | mean log_px -0.0493 | KL -3464.77 + 51it [00:05, 9.37it/s] 52it [00:05, 9.39it/s] 53it [00:05, 9.40it/s] 54it [00:06, 9.37it/s] 55it [00:06, 9.35it/s] 56it [00:06, 9.37it/s] 57it [00:06, 8.86it/s] 58it [00:06, 9.03it/s] 59it [00:06, 9.15it/s] 60it [00:06, 9.26it/s] 61it [00:06, 9.34it/s] 62it [00:06, 9.39it/s] 63it [00:07, 9.39it/s] 64it [00:07, 9.43it/s] 65it [00:07, 9.45it/s] 66it [00:07, 9.45it/s] 67it [00:07, 9.45it/s] 68it [00:07, 9.45it/s] 69it [00:07, 9.50it/s] 70it [00:07, 9.47it/s] 71it [00:07, 9.48it/s] 72it [00:07, 9.42it/s] 73it [00:08, 9.45it/s] 74it [00:08, 9.42it/s] 75it [00:08, 8.97it/s] 76it [00:08, 9.14it/s] 77it [00:08, 9.21it/s] 78it [00:08, 9.26it/s] 79it [00:08, 9.30it/s] 80it [00:08, 9.32it/s] 81it [00:08, 9.39it/s] 82it [00:09, 9.40it/s] 83it [00:09, 9.46it/s] 84it [00:09, 9.09it/s] 85it [00:09, 9.21it/s] 86it [00:09, 9.26it/s] 87it [00:09, 9.34it/s] 88it [00:09, 9.35it/s] 89it [00:09, 9.19it/s] 90it [00:09, 8.61it/s] 91it [00:10, 8.75it/s] 92it [00:10, 8.87it/s] 93it [00:10, 9.00it/s] 94it [00:10, 9.08it/s] 95it [00:10, 9.14it/s] 96it [00:10, 9.21it/s] 97it [00:10, 9.26it/s] 98it [00:10, 9.24it/s] 99it [00:10, 8.79it/s] 100it [00:11, 8.95it/s]2025-05-26 03:29:25,901 - INFO - [Epoch 042 | Batch 0100] IWAE-loss 4768.8535 | mean log_px -0.0224 | KL -3467.10 + 101it [00:11, 9.03it/s] 102it [00:11, 9.14it/s] 103it [00:11, 8.74it/s] 104it [00:11, 8.98it/s] 105it [00:11, 9.10it/s] 106it [00:11, 9.20it/s] 107it [00:11, 9.23it/s] 108it [00:11, 9.27it/s] 109it [00:12, 9.32it/s] 110it [00:12, 9.38it/s] 111it [00:12, 9.42it/s] 112it [00:12, 9.39it/s] 113it [00:12, 9.40it/s] 114it [00:12, 9.40it/s] 115it [00:12, 9.36it/s] 116it [00:12, 9.39it/s] 117it [00:12, 9.41it/s] 118it [00:13, 9.36it/s] 119it [00:13, 9.39it/s] 120it [00:13, 9.45it/s] 121it [00:13, 9.50it/s] 122it [00:13, 9.53it/s] 123it [00:13, 9.56it/s] 124it [00:13, 9.55it/s] 125it [00:13, 9.59it/s] 126it [00:13, 9.58it/s] 127it [00:13, 9.59it/s] 128it [00:14, 9.53it/s] 129it [00:14, 9.57it/s] 130it [00:14, 9.51it/s] 131it [00:14, 9.48it/s] 132it [00:14, 9.52it/s] 133it [00:14, 9.51it/s] 134it [00:14, 9.45it/s] 135it [00:14, 9.39it/s] 136it [00:14, 9.08it/s] 137it [00:15, 9.21it/s] 138it [00:15, 9.26it/s] 139it [00:15, 9.32it/s] 140it [00:15, 9.35it/s] 141it [00:15, 9.40it/s] 142it [00:15, 9.41it/s] 143it [00:15, 9.16it/s] 144it [00:15, 9.22it/s] 145it [00:15, 9.26it/s] 146it [00:15, 9.23it/s] 147it [00:16, 8.98it/s] 148it [00:16, 9.09it/s] 149it [00:16, 9.08it/s] 150it [00:16, 9.25it/s]2025-05-26 03:29:31,251 - INFO - [Epoch 042 | Batch 0150] IWAE-loss 5339.9580 | mean log_px -0.0337 | KL -3464.08 + 151it [00:16, 9.37it/s] 152it [00:16, 9.45it/s] 153it [00:16, 9.55it/s] 154it [00:16, 9.63it/s] 155it [00:16, 9.65it/s] 156it [00:17, 9.70it/s] 157it [00:17, 9.75it/s] 158it [00:17, 9.76it/s] 159it [00:17, 9.76it/s] 160it [00:17, 9.77it/s] 161it [00:17, 9.80it/s] 162it [00:17, 9.75it/s] 163it [00:17, 9.75it/s] 164it [00:17, 9.73it/s] 165it [00:17, 9.73it/s] 166it [00:18, 9.74it/s] 167it [00:18, 9.75it/s] 168it [00:18, 9.75it/s] 169it [00:18, 9.76it/s] 170it [00:18, 9.77it/s] 171it [00:18, 9.80it/s] 172it [00:18, 9.65it/s] 173it [00:18, 9.51it/s] 174it [00:18, 9.43it/s] 175it [00:19, 9.05it/s] 176it [00:19, 9.25it/s] 177it [00:19, 9.42it/s] 178it [00:19, 9.53it/s] 179it [00:19, 9.61it/s] 180it [00:19, 9.61it/s] 181it [00:19, 9.68it/s] 182it [00:19, 9.71it/s] 183it [00:19, 9.77it/s] 184it [00:19, 9.79it/s] 185it [00:20, 9.81it/s] 186it [00:20, 9.82it/s] 187it [00:20, 9.86it/s] 188it [00:20, 9.85it/s] 189it [00:20, 9.86it/s] 190it [00:20, 9.85it/s] 191it [00:20, 9.85it/s] 192it [00:20, 9.84it/s] 193it [00:20, 9.86it/s] 194it [00:20, 9.84it/s] 195it [00:21, 9.30it/s] 196it [00:21, 9.23it/s] +2025-05-26 03:29:36,008 - INFO - Epoch: 42, Objective: tensor([5298.1240], device='cuda:0', grad_fn=), Loss: 0.0280563123524189, KL/n: 70.67806243896484 + 0it [00:00, ?it/s]2025-05-26 03:29:36,272 - INFO - [Epoch 043 | Batch 0000] IWAE-loss 4510.7559 | mean log_px -0.0216 | KL -3460.82 + 1it [00:00, 5.64it/s] 2it [00:00, 7.43it/s] 3it [00:00, 8.36it/s] 4it [00:00, 8.80it/s] 5it [00:00, 9.09it/s] 6it [00:00, 9.27it/s] 7it [00:00, 9.42it/s] 8it [00:00, 9.52it/s] 9it [00:01, 9.60it/s] 10it [00:01, 9.65it/s] 11it [00:01, 9.63it/s] 12it [00:01, 9.61it/s] 13it [00:01, 9.44it/s] 14it [00:01, 9.52it/s] 15it [00:01, 9.33it/s] 16it [00:01, 9.43it/s] 17it [00:01, 9.54it/s] 18it [00:01, 9.60it/s] 19it [00:02, 9.64it/s] 20it [00:02, 9.67it/s] 21it [00:02, 9.72it/s] 22it [00:02, 9.73it/s] 23it [00:02, 9.76it/s] 24it [00:02, 9.77it/s] 25it [00:02, 9.78it/s] 26it [00:02, 9.77it/s] 27it [00:02, 9.78it/s] 28it [00:02, 9.77it/s] 29it [00:03, 9.53it/s] 30it [00:03, 9.58it/s] 31it [00:03, 9.54it/s] 32it [00:03, 9.56it/s] 33it [00:03, 9.61it/s] 34it [00:03, 9.64it/s] 35it [00:03, 9.66it/s] 36it [00:03, 9.68it/s] 37it [00:03, 9.70it/s] 38it [00:04, 9.71it/s] 39it [00:04, 9.74it/s] 40it [00:04, 9.80it/s] 42it [00:04, 9.90it/s] 44it [00:04, 9.96it/s] 46it [00:04, 9.99it/s] 48it [00:05, 10.01it/s] 50it [00:05, 10.02it/s]2025-05-26 03:29:41,409 - INFO - [Epoch 043 | Batch 0050] IWAE-loss 4645.6123 | mean log_px -0.0196 | KL -3460.41 + 52it [00:05, 10.03it/s] 54it [00:05, 10.02it/s] 56it [00:05, 10.02it/s] 58it [00:06, 9.90it/s] 59it [00:06, 9.61it/s] 60it [00:06, 9.67it/s] 62it [00:06, 9.81it/s] 64it [00:06, 9.89it/s] 66it [00:06, 9.93it/s] 68it [00:07, 9.61it/s] 70it [00:07, 9.73it/s] 71it [00:07, 9.78it/s] 72it [00:07, 9.81it/s] 73it [00:07, 9.84it/s] 74it [00:07, 9.86it/s] 75it [00:07, 9.88it/s] 76it [00:07, 9.44it/s] 77it [00:07, 9.57it/s] 78it [00:08, 9.58it/s] 79it [00:08, 9.64it/s] 80it [00:08, 9.66it/s] 81it [00:08, 9.71it/s] 82it [00:08, 9.58it/s] 83it [00:08, 9.48it/s] 84it [00:08, 9.54it/s] 85it [00:08, 9.61it/s] 86it [00:08, 9.59it/s] 87it [00:09, 9.04it/s] 88it [00:09, 9.21it/s] 89it [00:09, 9.37it/s] 90it [00:09, 9.49it/s] 91it [00:09, 9.62it/s] 92it [00:09, 8.96it/s] 93it [00:09, 8.87it/s] 94it [00:09, 8.93it/s] 95it [00:09, 8.73it/s] 96it [00:10, 8.95it/s] 98it [00:10, 9.40it/s] 99it [00:10, 9.52it/s] 100it [00:10, 9.60it/s]2025-05-26 03:29:46,632 - INFO - [Epoch 043 | Batch 0100] IWAE-loss 7542.3433 | mean log_px -0.0583 | KL -3461.22 + 101it [00:10, 9.68it/s] 102it [00:10, 9.74it/s] 104it [00:10, 9.87it/s] 106it [00:11, 9.49it/s] 108it [00:11, 9.66it/s] 110it [00:11, 9.79it/s] 112it [00:11, 9.87it/s] 114it [00:11, 9.91it/s] 116it [00:12, 9.94it/s] 118it [00:12, 9.96it/s] 120it [00:12, 9.98it/s] 122it [00:12, 10.00it/s] 124it [00:12, 10.01it/s] 126it [00:13, 9.75it/s] 127it [00:13, 9.76it/s] 128it [00:13, 9.80it/s] 129it [00:13, 9.84it/s] 131it [00:13, 9.92it/s] 132it [00:13, 9.94it/s] 134it [00:13, 9.98it/s] 136it [00:14, 10.00it/s] 138it [00:14, 10.02it/s] 140it [00:14, 9.92it/s] 142it [00:14, 9.94it/s] 143it [00:14, 9.95it/s] 145it [00:14, 9.99it/s] 146it [00:15, 9.99it/s] 147it [00:15, 9.98it/s] 148it [00:15, 9.98it/s] 149it [00:15, 9.98it/s] 150it [00:15, 9.98it/s]2025-05-26 03:29:51,675 - INFO - [Epoch 043 | Batch 0150] IWAE-loss 4443.6572 | mean log_px -0.0191 | KL -3451.98 + 151it [00:15, 9.97it/s] 152it [00:15, 9.93it/s] 153it [00:15, 9.94it/s] 155it [00:15, 9.98it/s] 156it [00:16, 9.97it/s] 158it [00:16, 9.62it/s] 159it [00:16, 9.64it/s] 160it [00:16, 9.69it/s] 161it [00:16, 9.75it/s] 162it [00:16, 9.78it/s] 164it [00:16, 9.83it/s] 165it [00:17, 9.84it/s] 166it [00:17, 9.83it/s] 167it [00:17, 9.86it/s] 168it [00:17, 9.30it/s] 170it [00:17, 9.62it/s] 172it [00:17, 9.78it/s] 174it [00:17, 9.86it/s] 176it [00:18, 9.92it/s] 178it [00:18, 9.95it/s] 180it [00:18, 9.98it/s] 181it [00:18, 9.97it/s] 182it [00:18, 9.97it/s] 184it [00:18, 9.99it/s] 186it [00:19, 10.01it/s] 187it [00:19, 9.99it/s] 188it [00:19, 9.98it/s] 190it [00:19, 9.99it/s] 191it [00:19, 9.62it/s] 192it [00:19, 9.70it/s] 193it [00:19, 9.75it/s] 195it [00:20, 9.55it/s] 196it [00:20, 9.69it/s] +2025-05-26 03:29:56,360 - INFO - Epoch: 43, Objective: tensor([4990.5254], device='cuda:0', grad_fn=), Loss: 0.022801268845796585, KL/n: 70.53202056884766 + 0it [00:00, ?it/s]2025-05-26 03:29:56,633 - INFO - [Epoch 044 | Batch 0000] IWAE-loss 8241.9609 | mean log_px -0.0746 | KL -3451.67 + 1it [00:00, 4.71it/s] 2it [00:00, 6.78it/s] 3it [00:00, 7.91it/s] 4it [00:00, 8.62it/s] 5it [00:00, 9.07it/s] 6it [00:00, 9.36it/s] 8it [00:00, 9.68it/s] 9it [00:01, 9.72it/s] 10it [00:01, 9.79it/s] 12it [00:01, 9.91it/s] 13it [00:01, 9.91it/s] 14it [00:01, 6.73it/s] 15it [00:01, 7.35it/s] 16it [00:01, 7.92it/s] 18it [00:02, 8.72it/s] 19it [00:02, 8.99it/s] 20it [00:02, 9.21it/s] 22it [00:02, 9.53it/s] 23it [00:02, 9.63it/s] 24it [00:02, 9.19it/s] 26it [00:02, 9.19it/s] 27it [00:03, 9.34it/s] 28it [00:03, 9.47it/s] 29it [00:03, 9.57it/s] 30it [00:03, 9.66it/s] 31it [00:03, 9.70it/s] 32it [00:03, 9.77it/s] 33it [00:03, 9.79it/s] 34it [00:03, 9.81it/s] 35it [00:03, 9.37it/s] 36it [00:03, 9.50it/s] 37it [00:04, 9.53it/s] 38it [00:04, 9.59it/s] 39it [00:04, 9.58it/s] 40it [00:04, 9.64it/s] 41it [00:04, 9.67it/s] 42it [00:04, 9.71it/s] 43it [00:04, 9.13it/s] 44it [00:04, 9.32it/s] 45it [00:04, 9.48it/s] 46it [00:05, 9.54it/s] 47it [00:05, 9.63it/s] 48it [00:05, 9.62it/s] 49it [00:05, 9.01it/s] 50it [00:05, 9.10it/s]2025-05-26 03:30:02,026 - INFO - [Epoch 044 | Batch 0050] IWAE-loss 8636.9531 | mean log_px -0.0781 | KL -3454.60 + 51it [00:05, 9.14it/s] 52it [00:05, 9.36it/s] 53it [00:05, 8.96it/s] 54it [00:05, 9.22it/s] 55it [00:06, 9.43it/s] 56it [00:06, 9.58it/s] 57it [00:06, 9.69it/s] 58it [00:06, 9.65it/s] 60it [00:06, 9.81it/s] 62it [00:06, 9.88it/s] 63it [00:06, 9.91it/s] 64it [00:06, 9.92it/s] 65it [00:07, 9.94it/s] 66it [00:07, 9.91it/s] 68it [00:07, 9.93it/s] 69it [00:07, 9.54it/s] 70it [00:07, 9.63it/s] 71it [00:07, 9.70it/s] 72it [00:07, 9.21it/s] 73it [00:07, 9.42it/s] 74it [00:07, 9.56it/s] 76it [00:08, 9.74it/s] 78it [00:08, 9.84it/s] 79it [00:08, 9.86it/s] 80it [00:08, 9.89it/s] 82it [00:08, 9.94it/s] 83it [00:08, 9.58it/s] 84it [00:08, 9.66it/s] 85it [00:09, 9.75it/s] 86it [00:09, 9.79it/s] 88it [00:09, 9.83it/s] 90it [00:09, 9.91it/s] 91it [00:09, 9.92it/s] 92it [00:09, 9.92it/s] 93it [00:09, 9.93it/s] 94it [00:09, 9.89it/s] 95it [00:10, 9.89it/s] 96it [00:10, 9.91it/s] 98it [00:10, 9.94it/s] 99it [00:10, 9.91it/s] 100it [00:10, 9.89it/s]2025-05-26 03:30:07,136 - INFO - [Epoch 044 | Batch 0100] IWAE-loss 4468.0703 | mean log_px -0.0182 | KL -3448.35 + 101it [00:10, 9.91it/s] 102it [00:10, 9.91it/s] 103it [00:10, 9.92it/s] 105it [00:11, 9.48it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.64it/s] 108it [00:11, 9.71it/s] 109it [00:11, 9.72it/s] 110it [00:11, 9.79it/s] 111it [00:11, 9.83it/s] 113it [00:11, 9.52it/s] 114it [00:12, 9.60it/s] 116it [00:12, 9.77it/s] 118it [00:12, 9.83it/s] 119it [00:12, 9.83it/s] 120it [00:12, 9.86it/s] 121it [00:12, 9.37it/s] 122it [00:12, 9.52it/s] 124it [00:13, 9.28it/s] 125it [00:13, 9.30it/s] 126it [00:13, 9.43it/s] 128it [00:13, 9.66it/s] 130it [00:13, 9.78it/s] 131it [00:13, 9.82it/s] 132it [00:13, 9.84it/s] 133it [00:13, 9.88it/s] 134it [00:14, 9.90it/s] 135it [00:14, 9.93it/s] 136it [00:14, 9.93it/s] 138it [00:14, 9.98it/s] 140it [00:14, 9.99it/s] 141it [00:14, 9.99it/s] 142it [00:14, 9.98it/s] 143it [00:15, 9.89it/s] 145it [00:15, 9.96it/s] 146it [00:15, 9.95it/s] 148it [00:15, 10.00it/s] 150it [00:15, 10.01it/s]2025-05-26 03:30:12,250 - INFO - [Epoch 044 | Batch 0150] IWAE-loss 5638.1201 | mean log_px -0.0363 | KL -3448.95 + 151it [00:15, 9.99it/s] 152it [00:15, 9.98it/s] 153it [00:16, 9.96it/s] 154it [00:16, 9.94it/s] 156it [00:16, 9.98it/s] 158it [00:16, 9.99it/s] 159it [00:16, 9.93it/s] 160it [00:16, 9.94it/s] 161it [00:16, 9.95it/s] 162it [00:16, 9.95it/s] 163it [00:17, 9.80it/s] 164it [00:17, 9.77it/s] 165it [00:17, 9.82it/s] 166it [00:17, 9.85it/s] 167it [00:17, 9.26it/s] 168it [00:17, 9.43it/s] 169it [00:17, 9.58it/s] 170it [00:17, 9.10it/s] 171it [00:17, 9.35it/s] 172it [00:17, 9.51it/s] 173it [00:18, 9.60it/s] 174it [00:18, 9.69it/s] 175it [00:18, 9.15it/s] 176it [00:18, 9.38it/s] 177it [00:18, 9.54it/s] 178it [00:18, 9.66it/s] 179it [00:18, 9.75it/s] 180it [00:18, 9.82it/s] 181it [00:18, 9.79it/s] 182it [00:18, 9.84it/s] 184it [00:19, 9.41it/s] 185it [00:19, 9.53it/s] 186it [00:19, 9.64it/s] 187it [00:19, 9.73it/s] 188it [00:19, 9.80it/s] 190it [00:19, 9.90it/s] 191it [00:19, 9.92it/s] 192it [00:20, 9.91it/s] 193it [00:20, 9.91it/s] 194it [00:20, 9.93it/s] 195it [00:20, 9.53it/s] 196it [00:20, 9.56it/s] +2025-05-26 03:30:16,995 - INFO - Epoch: 44, Objective: tensor([5709.1240], device='cuda:0', grad_fn=), Loss: 0.03686925023794174, KL/n: 70.38143920898438 + 0it [00:00, ?it/s]2025-05-26 03:30:17,268 - INFO - [Epoch 045 | Batch 0000] IWAE-loss 6154.7354 | mean log_px -0.0426 | KL -3452.68 + 1it [00:00, 4.80it/s] 2it [00:00, 6.62it/s] 3it [00:00, 7.49it/s] 4it [00:00, 7.74it/s] 6it [00:00, 8.87it/s] 8it [00:00, 9.37it/s] 9it [00:01, 9.08it/s] 10it [00:01, 9.29it/s] 12it [00:01, 9.61it/s] 13it [00:01, 9.23it/s] 15it [00:01, 9.57it/s] 17it [00:01, 9.78it/s] 19it [00:02, 9.51it/s] 20it [00:02, 9.58it/s] 22it [00:02, 9.78it/s] 24it [00:02, 9.89it/s] 26it [00:02, 9.97it/s] 28it [00:02, 10.02it/s] 30it [00:03, 10.07it/s] 32it [00:03, 10.09it/s] 34it [00:03, 10.11it/s] 36it [00:03, 10.13it/s] 38it [00:03, 10.14it/s] 40it [00:04, 10.14it/s] 42it [00:04, 10.14it/s] 44it [00:04, 9.67it/s] 45it [00:04, 9.71it/s] 47it [00:04, 9.84it/s] 48it [00:05, 9.83it/s] 49it [00:05, 9.52it/s] 50it [00:05, 9.59it/s]2025-05-26 03:30:22,409 - INFO - [Epoch 045 | Batch 0050] IWAE-loss 4413.5903 | mean log_px -0.0159 | KL -3443.76 + 51it [00:05, 9.67it/s] 52it [00:05, 9.29it/s] 53it [00:05, 9.46it/s] 55it [00:05, 9.70it/s] 56it [00:05, 9.37it/s] 57it [00:05, 9.49it/s] 58it [00:06, 9.60it/s] 60it [00:06, 9.78it/s] 62it [00:06, 9.88it/s] 64it [00:06, 9.95it/s] 66it [00:06, 9.99it/s] 68it [00:07, 9.85it/s] 69it [00:07, 9.58it/s] 71it [00:07, 9.78it/s] 73it [00:07, 9.90it/s] 74it [00:07, 9.82it/s] 76it [00:07, 9.92it/s] 78it [00:08, 9.61it/s] 79it [00:08, 9.67it/s] 81it [00:08, 9.85it/s] 83it [00:08, 9.95it/s] 85it [00:08, 10.02it/s] 87it [00:09, 9.78it/s] 89it [00:09, 9.87it/s] 91it [00:09, 9.97it/s] 93it [00:09, 9.74it/s] 95it [00:09, 9.85it/s] 97it [00:10, 9.94it/s] 99it [00:10, 9.98it/s] 100it [00:10, 9.90it/s]2025-05-26 03:30:27,502 - INFO - [Epoch 045 | Batch 0100] IWAE-loss 5534.2393 | mean log_px -0.0361 | KL -3439.78 + 101it [00:10, 9.92it/s] 103it [00:10, 10.00it/s] 105it [00:10, 10.06it/s] 107it [00:11, 10.08it/s] 109it [00:11, 9.81it/s] 110it [00:11, 9.79it/s] 112it [00:11, 9.92it/s] 114it [00:11, 10.00it/s] 115it [00:11, 9.94it/s] 116it [00:11, 9.87it/s] 117it [00:12, 9.44it/s] 119it [00:12, 9.72it/s] 120it [00:12, 9.34it/s] 122it [00:12, 9.62it/s] 124it [00:12, 9.81it/s] 126it [00:12, 9.92it/s] 128it [00:13, 10.01it/s] 130it [00:13, 9.76it/s] 132it [00:13, 9.89it/s] 134it [00:13, 9.96it/s] 136it [00:13, 10.03it/s] 138it [00:14, 9.72it/s] 140it [00:14, 9.85it/s] 142it [00:14, 9.94it/s] 144it [00:14, 10.00it/s] 146it [00:14, 10.01it/s] 148it [00:15, 10.06it/s] 150it [00:15, 10.09it/s]2025-05-26 03:30:32,549 - INFO - [Epoch 045 | Batch 0150] IWAE-loss 5436.4814 | mean log_px -0.0340 | KL -3438.98 + 152it [00:15, 10.09it/s] 154it [00:15, 10.11it/s] 156it [00:15, 10.12it/s] 158it [00:16, 10.13it/s] 160it [00:16, 9.80it/s] 162it [00:16, 9.90it/s] 164it [00:16, 9.97it/s] 166it [00:16, 10.03it/s] 168it [00:17, 9.89it/s] 170it [00:17, 9.97it/s] 172it [00:17, 9.90it/s] 174it [00:17, 9.97it/s] 176it [00:17, 10.02it/s] 178it [00:18, 10.05it/s] 180it [00:18, 10.05it/s] 182it [00:18, 9.73it/s] 184it [00:18, 9.85it/s] 185it [00:18, 9.87it/s] 187it [00:19, 9.98it/s] 188it [00:19, 9.87it/s] 189it [00:19, 9.69it/s] 190it [00:19, 9.66it/s] 191it [00:19, 9.70it/s] 192it [00:19, 9.75it/s] 193it [00:19, 9.74it/s] 194it [00:19, 9.66it/s] 195it [00:19, 9.29it/s] 196it [00:20, 9.48it/s] 196it [00:20, 9.76it/s] +2025-05-26 03:30:37,215 - INFO - Epoch: 45, Objective: tensor([5079.6650], device='cuda:0', grad_fn=), Loss: 0.031979966908693314, KL/n: 70.21158599853516 + 0it [00:00, ?it/s]2025-05-26 03:30:37,494 - INFO - [Epoch 046 | Batch 0000] IWAE-loss 4801.6733 | mean log_px -0.0225 | KL -3436.86 + 1it [00:00, 5.34it/s] 2it [00:00, 7.26it/s] 3it [00:00, 8.28it/s] 4it [00:00, 8.85it/s] 5it [00:00, 9.22it/s] 6it [00:00, 9.43it/s] 7it [00:00, 9.59it/s] 8it [00:00, 9.68it/s] 9it [00:00, 9.77it/s] 10it [00:01, 9.81it/s] 11it [00:01, 9.84it/s] 12it [00:01, 9.86it/s] 13it [00:01, 9.88it/s] 14it [00:01, 9.87it/s] 15it [00:01, 9.90it/s] 16it [00:01, 9.89it/s] 18it [00:01, 9.92it/s] 19it [00:02, 9.92it/s] 20it [00:02, 9.88it/s] 21it [00:02, 9.90it/s] 22it [00:02, 9.90it/s] 23it [00:02, 9.91it/s] 24it [00:02, 9.90it/s] 25it [00:02, 9.90it/s] 26it [00:02, 9.89it/s] 27it [00:02, 9.89it/s] 28it [00:02, 9.89it/s] 29it [00:03, 9.90it/s] 30it [00:03, 9.89it/s] 31it [00:03, 9.91it/s] 32it [00:03, 9.90it/s] 33it [00:03, 9.91it/s] 34it [00:03, 6.33it/s] 35it [00:03, 7.08it/s] 36it [00:03, 7.72it/s] 37it [00:04, 8.26it/s] 38it [00:04, 8.68it/s] 39it [00:04, 9.02it/s] 40it [00:04, 9.25it/s] 41it [00:04, 9.44it/s] 42it [00:04, 9.55it/s] 43it [00:04, 9.66it/s] 44it [00:04, 9.71it/s] 45it [00:04, 9.54it/s] 46it [00:04, 9.62it/s] 47it [00:05, 9.70it/s] 48it [00:05, 9.75it/s] 49it [00:05, 9.79it/s] 50it [00:05, 9.80it/s]2025-05-26 03:30:42,753 - INFO - [Epoch 046 | Batch 0050] IWAE-loss 4658.3813 | mean log_px -0.0175 | KL -3431.65 + 51it [00:05, 9.80it/s] 52it [00:05, 9.81it/s] 53it [00:05, 9.81it/s] 54it [00:05, 9.82it/s] 55it [00:05, 9.84it/s] 56it [00:05, 9.83it/s] 57it [00:06, 9.75it/s] 58it [00:06, 9.78it/s] 59it [00:06, 9.78it/s] 60it [00:06, 9.78it/s] 61it [00:06, 9.79it/s] 62it [00:06, 9.81it/s] 63it [00:06, 9.81it/s] 64it [00:06, 9.82it/s] 65it [00:06, 9.81it/s] 66it [00:06, 9.80it/s] 67it [00:07, 9.78it/s] 68it [00:07, 9.79it/s] 69it [00:07, 9.17it/s] 71it [00:07, 9.54it/s] 72it [00:07, 9.54it/s] 73it [00:07, 9.58it/s] 74it [00:07, 9.25it/s] 75it [00:07, 9.44it/s] 76it [00:08, 9.57it/s] 78it [00:08, 9.79it/s] 79it [00:08, 9.81it/s] 80it [00:08, 9.44it/s] 82it [00:08, 9.69it/s] 84it [00:08, 9.85it/s] 86it [00:09, 9.93it/s] 88it [00:09, 9.97it/s] 90it [00:09, 10.02it/s] 91it [00:09, 9.70it/s] 93it [00:09, 9.85it/s] 95it [00:09, 9.94it/s] 97it [00:10, 10.00it/s] 98it [00:10, 9.67it/s] 100it [00:10, 9.73it/s]2025-05-26 03:30:47,882 - INFO - [Epoch 046 | Batch 0100] IWAE-loss 5551.6338 | mean log_px -0.0332 | KL -3436.21 + 101it [00:10, 9.36it/s] 103it [00:10, 9.62it/s] 105it [00:10, 9.78it/s] 107it [00:11, 9.90it/s] 109it [00:11, 9.96it/s] 110it [00:11, 9.92it/s] 111it [00:11, 9.43it/s] 112it [00:11, 9.32it/s] 113it [00:11, 9.47it/s] 115it [00:12, 9.72it/s] 116it [00:12, 9.41it/s] 118it [00:12, 9.66it/s] 119it [00:12, 9.73it/s] 121it [00:12, 9.88it/s] 122it [00:12, 9.86it/s] 124it [00:12, 9.48it/s] 125it [00:13, 9.41it/s] 126it [00:13, 9.24it/s] 127it [00:13, 9.40it/s] 128it [00:13, 9.50it/s] 129it [00:13, 9.61it/s] 130it [00:13, 9.66it/s] 131it [00:13, 9.72it/s] 132it [00:13, 9.77it/s] 133it [00:13, 9.80it/s] 134it [00:13, 9.82it/s] 135it [00:14, 9.85it/s] 136it [00:14, 9.82it/s] 138it [00:14, 9.93it/s] 139it [00:14, 9.45it/s] 141it [00:14, 9.71it/s] 143it [00:14, 9.86it/s] 144it [00:15, 9.84it/s] 145it [00:15, 9.51it/s] 147it [00:15, 9.73it/s] 149it [00:15, 9.85it/s]2025-05-26 03:30:53,044 - INFO - [Epoch 046 | Batch 0150] IWAE-loss 5915.6621 | mean log_px -0.0405 | KL -3435.87 + 151it [00:15, 9.56it/s] 153it [00:15, 9.73it/s] 155it [00:16, 9.86it/s] 157it [00:16, 9.93it/s] 158it [00:16, 9.56it/s] 160it [00:16, 9.75it/s] 162it [00:16, 9.85it/s] 164it [00:17, 9.93it/s] 166it [00:17, 9.98it/s] 168it [00:17, 9.97it/s] 169it [00:17, 9.95it/s] 170it [00:17, 9.93it/s] 171it [00:17, 9.91it/s] 172it [00:17, 9.89it/s] 173it [00:17, 9.87it/s] 175it [00:18, 9.98it/s] 177it [00:18, 10.02it/s] 179it [00:18, 10.05it/s] 181it [00:18, 9.70it/s] 183it [00:18, 9.83it/s] 185it [00:19, 9.92it/s] 187it [00:19, 9.64it/s] 189it [00:19, 9.78it/s] 190it [00:19, 9.82it/s] 192it [00:19, 9.92it/s] 194it [00:20, 9.99it/s] 195it [00:20, 9.71it/s] 196it [00:20, 9.47it/s] 196it [00:20, 9.61it/s] +2025-05-26 03:30:57,743 - INFO - Epoch: 46, Objective: tensor([5599.3286], device='cuda:0', grad_fn=), Loss: 0.028604112565517426, KL/n: 70.04393768310547 + 0it [00:00, ?it/s]2025-05-26 03:30:58,028 - INFO - [Epoch 047 | Batch 0000] IWAE-loss 6606.0967 | mean log_px -0.0507 | KL -3426.96 + 1it [00:00, 5.06it/s] 2it [00:00, 6.55it/s] 3it [00:00, 7.77it/s] 5it [00:00, 8.92it/s] 6it [00:00, 9.20it/s] 7it [00:00, 9.42it/s] 8it [00:00, 9.56it/s] 10it [00:01, 9.72it/s] 12it [00:01, 9.30it/s] 13it [00:01, 9.44it/s] 14it [00:01, 9.46it/s] 15it [00:01, 9.59it/s] 16it [00:01, 9.56it/s] 17it [00:01, 9.54it/s] 18it [00:01, 9.17it/s] 19it [00:02, 9.39it/s] 20it [00:02, 9.54it/s] 21it [00:02, 9.65it/s] 22it [00:02, 9.16it/s] 23it [00:02, 9.39it/s] 24it [00:02, 9.44it/s] 25it [00:02, 9.13it/s] 26it [00:02, 9.34it/s] 28it [00:03, 9.64it/s] 29it [00:03, 9.59it/s] 30it [00:03, 9.62it/s] 31it [00:03, 9.16it/s] 32it [00:03, 9.35it/s] 33it [00:03, 9.43it/s] 34it [00:03, 9.03it/s] 35it [00:03, 9.25it/s] 36it [00:03, 9.42it/s] 37it [00:03, 9.56it/s] 38it [00:04, 9.63it/s] 39it [00:04, 9.22it/s] 40it [00:04, 9.37it/s] 41it [00:04, 9.55it/s] 42it [00:04, 9.64it/s] 43it [00:04, 9.67it/s] 44it [00:04, 9.71it/s] 45it [00:04, 9.29it/s] 46it [00:04, 9.42it/s] 48it [00:05, 9.67it/s] 49it [00:05, 9.74it/s] 50it [00:05, 9.34it/s]2025-05-26 03:31:03,308 - INFO - [Epoch 047 | Batch 0050] IWAE-loss 5071.6953 | mean log_px -0.0309 | KL -3429.48 + 51it [00:05, 9.35it/s] 52it [00:05, 9.44it/s] 53it [00:05, 9.05it/s] 54it [00:05, 9.17it/s] 55it [00:05, 9.39it/s] 56it [00:06, 9.05it/s] 57it [00:06, 9.28it/s] 58it [00:06, 9.31it/s] 59it [00:06, 9.39it/s] 60it [00:06, 9.52it/s] 61it [00:06, 9.60it/s] 62it [00:06, 9.62it/s] 63it [00:06, 9.10it/s] 64it [00:06, 9.14it/s] 65it [00:06, 9.29it/s] 66it [00:07, 9.39it/s] 67it [00:07, 9.48it/s] 68it [00:07, 8.97it/s] 69it [00:07, 9.16it/s] 70it [00:07, 9.37it/s] 71it [00:07, 9.29it/s] 72it [00:07, 9.45it/s] 73it [00:07, 9.09it/s] 74it [00:07, 9.31it/s] 75it [00:08, 9.49it/s] 76it [00:08, 9.62it/s] 77it [00:08, 9.71it/s] 78it [00:08, 9.75it/s] 79it [00:08, 9.79it/s] 80it [00:08, 9.80it/s] 81it [00:08, 9.27it/s] 82it [00:08, 9.40it/s] 83it [00:08, 9.52it/s] 84it [00:09, 9.11it/s] 85it [00:09, 9.21it/s] 86it [00:09, 9.31it/s] 87it [00:09, 8.84it/s] 88it [00:09, 9.01it/s] 90it [00:09, 9.45it/s] 91it [00:09, 9.58it/s] 92it [00:09, 9.64it/s] 93it [00:09, 9.29it/s] 94it [00:10, 9.43it/s] 95it [00:10, 9.57it/s] 96it [00:10, 9.63it/s] 97it [00:10, 9.70it/s] 98it [00:10, 9.76it/s] 99it [00:10, 9.30it/s] 100it [00:10, 9.42it/s]2025-05-26 03:31:08,635 - INFO - [Epoch 047 | Batch 0100] IWAE-loss 4540.6260 | mean log_px -0.0246 | KL -3428.07 + 101it [00:10, 9.43it/s] 102it [00:10, 8.98it/s] 103it [00:11, 9.20it/s] 104it [00:11, 9.36it/s] 105it [00:11, 9.52it/s] 106it [00:11, 9.00it/s] 107it [00:11, 9.21it/s] 108it [00:11, 9.43it/s] 109it [00:11, 9.48it/s] 110it [00:11, 9.58it/s] 112it [00:11, 9.79it/s] 113it [00:12, 9.72it/s] 114it [00:12, 9.77it/s] 116it [00:12, 9.89it/s] 117it [00:12, 9.89it/s] 118it [00:12, 9.81it/s] 119it [00:12, 8.99it/s] 120it [00:12, 9.16it/s] 122it [00:13, 9.52it/s] 124it [00:13, 9.73it/s] 126it [00:13, 9.85it/s] 128it [00:13, 9.92it/s] 130it [00:13, 9.95it/s] 132it [00:14, 9.98it/s] 134it [00:14, 10.01it/s] 136it [00:14, 10.02it/s] 138it [00:14, 10.05it/s] 140it [00:14, 10.05it/s] 142it [00:15, 9.70it/s] 144it [00:15, 9.80it/s] 146it [00:15, 9.86it/s] 148it [00:15, 9.91it/s] 150it [00:15, 9.95it/s]2025-05-26 03:31:13,759 - INFO - [Epoch 047 | Batch 0150] IWAE-loss 4956.0400 | mean log_px -0.0260 | KL -3420.03 + 151it [00:15, 9.58it/s] 153it [00:16, 9.74it/s] 154it [00:16, 9.78it/s] 155it [00:16, 9.69it/s] 156it [00:16, 9.26it/s] 158it [00:16, 9.58it/s] 160it [00:16, 9.34it/s] 161it [00:16, 9.46it/s] 163it [00:17, 9.69it/s] 165it [00:17, 9.44it/s] 166it [00:17, 9.54it/s] 168it [00:17, 9.72it/s] 169it [00:17, 9.45it/s] 170it [00:17, 9.57it/s] 172it [00:18, 9.76it/s] 174it [00:18, 9.86it/s] 176it [00:18, 9.93it/s] 178it [00:18, 9.97it/s] 180it [00:18, 9.97it/s] 182it [00:19, 10.00it/s] 184it [00:19, 9.74it/s] 185it [00:19, 9.78it/s] 187it [00:19, 9.88it/s] 189it [00:19, 9.94it/s] 190it [00:19, 9.95it/s] 192it [00:20, 10.00it/s] 194it [00:20, 10.00it/s] 195it [00:20, 9.70it/s] 196it [00:20, 9.45it/s] 196it [00:20, 9.50it/s] +2025-05-26 03:31:18,506 - INFO - Epoch: 47, Objective: tensor([5860.7812], device='cuda:0', grad_fn=), Loss: 0.03282099589705467, KL/n: 69.88233184814453 + 0it [00:00, ?it/s]2025-05-26 03:31:18,774 - INFO - [Epoch 048 | Batch 0000] IWAE-loss 4398.5654 | mean log_px -0.0148 | KL -3425.91 + 1it [00:00, 5.52it/s] 2it [00:00, 6.86it/s] 4it [00:00, 8.47it/s] 5it [00:00, 8.48it/s] 6it [00:00, 8.89it/s] 8it [00:00, 9.41it/s] 10it [00:01, 9.68it/s] 12it [00:01, 9.81it/s] 14it [00:01, 9.90it/s] 16it [00:01, 9.97it/s] 18it [00:01, 10.01it/s] 20it [00:02, 10.04it/s] 22it [00:02, 9.70it/s] 24it [00:02, 9.53it/s] 26it [00:02, 9.66it/s] 28it [00:02, 9.79it/s] 29it [00:03, 9.74it/s] 30it [00:03, 9.65it/s] 31it [00:03, 9.24it/s] 32it [00:03, 9.39it/s] 34it [00:03, 9.66it/s] 36it [00:03, 9.81it/s] 37it [00:04, 7.13it/s] 38it [00:04, 7.39it/s] 39it [00:04, 7.89it/s] 41it [00:04, 8.66it/s] 43it [00:04, 9.09it/s] 44it [00:04, 9.21it/s] 45it [00:04, 8.94it/s] 47it [00:05, 9.37it/s] 49it [00:05, 9.63it/s]2025-05-26 03:31:24,105 - INFO - [Epoch 048 | Batch 0050] IWAE-loss 5411.3506 | mean log_px -0.0329 | KL -3426.38 + 51it [00:05, 9.77it/s] 53it [00:05, 9.88it/s] 55it [00:05, 9.92it/s] 56it [00:06, 9.84it/s] 57it [00:06, 9.86it/s] 58it [00:06, 9.86it/s] 60it [00:06, 9.94it/s] 62it [00:06, 9.97it/s] 63it [00:06, 9.97it/s] 64it [00:06, 9.98it/s] 65it [00:06, 9.97it/s] 66it [00:07, 9.97it/s] 68it [00:07, 9.99it/s] 70it [00:07, 10.02it/s] 72it [00:07, 10.06it/s] 74it [00:07, 10.08it/s] 76it [00:08, 10.10it/s] 78it [00:08, 10.11it/s] 80it [00:08, 10.12it/s] 82it [00:08, 10.13it/s] 84it [00:08, 10.13it/s] 86it [00:08, 10.13it/s] 88it [00:09, 10.12it/s] 90it [00:09, 10.13it/s] 92it [00:09, 10.13it/s] 94it [00:09, 10.13it/s] 96it [00:09, 10.13it/s] 98it [00:10, 10.13it/s] 100it [00:10, 10.12it/s]2025-05-26 03:31:29,068 - INFO - [Epoch 048 | Batch 0100] IWAE-loss 5481.2749 | mean log_px -0.0403 | KL -3417.41 + 102it [00:10, 10.09it/s] 104it [00:10, 10.09it/s] 106it [00:10, 9.69it/s] 108it [00:11, 9.79it/s] 110it [00:11, 9.86it/s] 111it [00:11, 9.89it/s] 112it [00:11, 9.55it/s] 114it [00:11, 9.73it/s] 116it [00:12, 9.83it/s] 118it [00:12, 9.90it/s] 120it [00:12, 9.94it/s] 121it [00:12, 9.94it/s] 122it [00:12, 9.94it/s] 123it [00:12, 9.61it/s] 124it [00:12, 9.66it/s] 125it [00:12, 9.69it/s] 126it [00:13, 9.29it/s] 127it [00:13, 9.43it/s] 128it [00:13, 9.55it/s] 129it [00:13, 9.65it/s] 130it [00:13, 9.72it/s] 131it [00:13, 9.19it/s] 132it [00:13, 9.40it/s] 134it [00:13, 9.66it/s] 135it [00:13, 9.74it/s] 137it [00:14, 9.86it/s] 138it [00:14, 9.88it/s] 140it [00:14, 9.95it/s] 142it [00:14, 9.98it/s] 143it [00:14, 9.98it/s] 144it [00:14, 9.98it/s] 145it [00:14, 9.99it/s] 146it [00:15, 9.96it/s] 147it [00:15, 9.51it/s] 148it [00:15, 9.64it/s] 150it [00:15, 9.82it/s]2025-05-26 03:31:34,192 - INFO - [Epoch 048 | Batch 0150] IWAE-loss 4167.0127 | mean log_px -0.0108 | KL -3420.06 + 151it [00:15, 9.33it/s] 152it [00:15, 9.49it/s] 154it [00:15, 9.72it/s] 155it [00:16, 9.30it/s] 156it [00:16, 9.46it/s] 158it [00:16, 9.71it/s] 160it [00:16, 9.84it/s] 162it [00:16, 9.93it/s] 164it [00:16, 9.98it/s] 165it [00:17, 9.57it/s] 166it [00:17, 9.65it/s] 168it [00:17, 9.80it/s] 170it [00:17, 9.50it/s] 171it [00:17, 9.59it/s] 172it [00:17, 9.68it/s] 174it [00:17, 9.82it/s] 176it [00:18, 9.90it/s] 178it [00:18, 9.95it/s] 180it [00:18, 9.99it/s] 181it [00:18, 9.96it/s] 182it [00:18, 9.95it/s] 184it [00:18, 9.99it/s] 186it [00:19, 10.01it/s] 188it [00:19, 10.02it/s] 190it [00:19, 10.03it/s] 192it [00:19, 9.72it/s] 193it [00:19, 9.77it/s] 194it [00:19, 9.81it/s] 195it [00:20, 9.51it/s] 196it [00:20, 9.29it/s] 196it [00:20, 9.66it/s] +2025-05-26 03:31:38,926 - INFO - Epoch: 48, Objective: tensor([5577.5146], device='cuda:0', grad_fn=), Loss: 0.034665796905756, KL/n: 69.71744537353516 + 0it [00:00, ?it/s]2025-05-26 03:31:39,204 - INFO - [Epoch 049 | Batch 0000] IWAE-loss 4387.7876 | mean log_px -0.0154 | KL -3415.77 + 1it [00:00, 5.16it/s] 2it [00:00, 6.69it/s] 4it [00:00, 8.47it/s] 6it [00:00, 9.12it/s] 7it [00:00, 8.81it/s] 8it [00:00, 9.09it/s] 10it [00:01, 9.47it/s] 11it [00:01, 9.58it/s] 12it [00:01, 9.66it/s] 13it [00:01, 9.73it/s] 14it [00:01, 9.80it/s] 15it [00:01, 9.80it/s] 16it [00:01, 9.84it/s] 17it [00:01, 9.27it/s] 18it [00:01, 9.46it/s] 20it [00:02, 9.72it/s] 21it [00:02, 9.78it/s] 22it [00:02, 9.83it/s] 23it [00:02, 9.87it/s] 24it [00:02, 9.90it/s] 26it [00:02, 9.94it/s] 27it [00:02, 9.96it/s] 28it [00:02, 9.95it/s] 29it [00:03, 9.95it/s] 30it [00:03, 9.35it/s] 32it [00:03, 9.65it/s] 34it [00:03, 9.81it/s] 36it [00:03, 9.90it/s] 37it [00:03, 9.92it/s] 38it [00:03, 9.92it/s] 39it [00:04, 9.94it/s] 40it [00:04, 9.94it/s] 41it [00:04, 9.95it/s] 42it [00:04, 9.96it/s] 44it [00:04, 10.02it/s] 45it [00:04, 9.95it/s] 46it [00:04, 9.96it/s] 48it [00:04, 9.96it/s] 49it [00:05, 9.44it/s] 50it [00:05, 9.54it/s]2025-05-26 03:31:44,330 - INFO - [Epoch 049 | Batch 0050] IWAE-loss 6286.7646 | mean log_px -0.0480 | KL -3411.50 + 51it [00:05, 9.65it/s] 52it [00:05, 9.13it/s] 53it [00:05, 9.34it/s] 54it [00:05, 9.46it/s] 56it [00:05, 9.66it/s] 58it [00:06, 9.79it/s] 59it [00:06, 9.82it/s] 60it [00:06, 9.85it/s] 61it [00:06, 9.83it/s] 62it [00:06, 9.86it/s] 63it [00:06, 9.88it/s] 64it [00:06, 9.90it/s] 65it [00:06, 9.93it/s] 66it [00:06, 9.90it/s] 68it [00:07, 9.96it/s] 69it [00:07, 9.86it/s] 70it [00:07, 9.33it/s] 72it [00:07, 9.61it/s] 73it [00:07, 9.68it/s] 74it [00:07, 9.74it/s] 76it [00:07, 9.87it/s] 78it [00:08, 9.94it/s] 79it [00:08, 9.94it/s] 81it [00:08, 9.95it/s] 82it [00:08, 9.94it/s] 83it [00:08, 9.94it/s] 84it [00:08, 9.95it/s] 86it [00:08, 9.98it/s] 88it [00:09, 10.01it/s] 89it [00:09, 9.55it/s] 91it [00:09, 9.73it/s] 92it [00:09, 9.79it/s] 93it [00:09, 9.83it/s] 94it [00:09, 9.86it/s] 96it [00:09, 9.93it/s] 97it [00:10, 9.94it/s] 98it [00:10, 9.46it/s] 99it [00:10, 9.50it/s] 100it [00:10, 9.62it/s]2025-05-26 03:31:49,444 - INFO - [Epoch 049 | Batch 0100] IWAE-loss 6288.9609 | mean log_px -0.0417 | KL -3411.01 + 101it [00:10, 9.70it/s] 102it [00:10, 9.78it/s] 103it [00:10, 9.68it/s] 104it [00:10, 9.29it/s] 105it [00:10, 9.48it/s] 106it [00:10, 9.63it/s] 108it [00:11, 9.31it/s] 109it [00:11, 9.45it/s] 110it [00:11, 9.57it/s] 111it [00:11, 9.62it/s] 112it [00:11, 9.67it/s] 113it [00:11, 9.75it/s] 114it [00:11, 9.79it/s] 116it [00:11, 9.90it/s] 117it [00:12, 9.87it/s] 118it [00:12, 9.89it/s] 119it [00:12, 9.87it/s] 120it [00:12, 9.87it/s] 121it [00:12, 9.83it/s] 122it [00:12, 9.85it/s] 123it [00:12, 9.88it/s] 124it [00:12, 9.87it/s] 126it [00:12, 9.93it/s] 127it [00:13, 9.87it/s] 128it [00:13, 9.88it/s] 129it [00:13, 9.86it/s] 130it [00:13, 9.89it/s] 132it [00:13, 9.95it/s] 133it [00:13, 9.89it/s] 134it [00:13, 9.91it/s] 135it [00:13, 9.92it/s] 136it [00:14, 9.93it/s] 137it [00:14, 9.21it/s] 138it [00:14, 9.22it/s] 139it [00:14, 9.27it/s] 140it [00:14, 9.43it/s] 141it [00:14, 9.57it/s] 142it [00:14, 9.19it/s] 143it [00:14, 9.41it/s] 144it [00:14, 9.53it/s] 145it [00:14, 9.17it/s] 146it [00:15, 9.37it/s] 147it [00:15, 9.48it/s] 148it [00:15, 9.11it/s] 149it [00:15, 9.35it/s]2025-05-26 03:31:54,629 - INFO - [Epoch 049 | Batch 0150] IWAE-loss 5174.5752 | mean log_px -0.0317 | KL -3409.79 + 151it [00:15, 9.60it/s] 152it [00:15, 9.69it/s] 154it [00:15, 9.83it/s] 155it [00:16, 9.81it/s] 157it [00:16, 9.91it/s] 158it [00:16, 9.45it/s] 159it [00:16, 9.56it/s] 160it [00:16, 9.65it/s] 161it [00:16, 9.71it/s] 162it [00:16, 9.19it/s] 164it [00:16, 9.53it/s] 165it [00:17, 9.63it/s] 166it [00:17, 9.19it/s] 167it [00:17, 9.38it/s] 169it [00:17, 9.67it/s] 170it [00:17, 9.73it/s] 172it [00:17, 9.85it/s] 174it [00:17, 9.92it/s] 176it [00:18, 9.96it/s] 178it [00:18, 9.99it/s] 179it [00:18, 9.65it/s] 180it [00:18, 9.64it/s] 182it [00:18, 9.80it/s] 184it [00:19, 9.86it/s] 186it [00:19, 9.93it/s] 187it [00:19, 9.94it/s] 188it [00:19, 9.49it/s] 190it [00:19, 9.70it/s] 192it [00:19, 9.83it/s] 193it [00:19, 9.83it/s] 194it [00:20, 9.86it/s] 195it [00:20, 9.01it/s] 196it [00:20, 9.64it/s] +2025-05-26 03:31:59,381 - INFO - Epoch: 49, Objective: tensor([5592.1567], device='cuda:0', grad_fn=), Loss: 0.03624124079942703, KL/n: 69.54737854003906 + 0it [00:00, ?it/s]2025-05-26 03:31:59,659 - INFO - [Epoch 050 | Batch 0000] IWAE-loss 4820.5073 | mean log_px -0.0246 | KL -3407.40 + 1it [00:00, 4.59it/s] 2it [00:00, 6.67it/s] 4it [00:00, 8.50it/s] 6it [00:00, 8.75it/s] 8it [00:00, 9.26it/s] 10it [00:01, 9.57it/s] 11it [00:01, 9.33it/s] 13it [00:01, 9.61it/s] 14it [00:01, 9.68it/s] 15it [00:01, 9.24it/s] 16it [00:01, 9.42it/s] 18it [00:01, 9.69it/s] 20it [00:02, 9.85it/s] 22it [00:02, 9.63it/s] 24it [00:02, 9.79it/s] 25it [00:02, 9.82it/s] 27it [00:02, 9.92it/s] 28it [00:03, 7.22it/s] 29it [00:03, 7.47it/s] 30it [00:03, 7.95it/s] 32it [00:03, 8.36it/s] 34it [00:03, 8.94it/s] 35it [00:03, 9.12it/s] 37it [00:04, 9.46it/s] 39it [00:04, 9.32it/s] 41it [00:04, 9.57it/s] 43it [00:04, 9.73it/s] 44it [00:04, 9.47it/s] 45it [00:04, 9.58it/s] 47it [00:05, 9.77it/s] 49it [00:05, 9.86it/s] 50it [00:05, 9.88it/s]2025-05-26 03:32:05,005 - INFO - [Epoch 050 | Batch 0050] IWAE-loss 6266.3530 | mean log_px -0.0450 | KL -3405.55 + 52it [00:05, 9.95it/s] 54it [00:05, 10.01it/s] 56it [00:06, 10.03it/s] 58it [00:06, 9.78it/s] 60it [00:06, 9.88it/s] 61it [00:06, 9.52it/s] 63it [00:06, 9.72it/s] 65it [00:06, 9.85it/s] 66it [00:07, 9.55it/s] 68it [00:07, 9.74it/s] 70it [00:07, 9.86it/s] 72it [00:07, 9.95it/s] 74it [00:07, 10.00it/s] 76it [00:08, 10.04it/s] 78it [00:08, 10.06it/s] 80it [00:08, 10.06it/s] 82it [00:08, 9.80it/s] 84it [00:08, 9.88it/s] 86it [00:09, 9.95it/s] 88it [00:09, 10.00it/s] 90it [00:09, 10.04it/s] 92it [00:09, 9.94it/s] 94it [00:09, 9.98it/s] 96it [00:10, 10.01it/s] 98it [00:10, 9.71it/s] 100it [00:10, 9.82it/s]2025-05-26 03:32:10,062 - INFO - [Epoch 050 | Batch 0100] IWAE-loss 5081.3320 | mean log_px -0.0248 | KL -3404.80 + 101it [00:10, 9.82it/s] 103it [00:10, 9.55it/s] 104it [00:10, 9.63it/s] 106it [00:11, 9.80it/s] 108it [00:11, 9.90it/s] 110it [00:11, 9.97it/s] 112it [00:11, 10.01it/s] 114it [00:11, 10.04it/s] 116it [00:12, 10.06it/s] 118it [00:12, 10.08it/s] 120it [00:12, 10.08it/s] 122it [00:12, 10.03it/s] 124it [00:12, 9.63it/s] 125it [00:13, 9.68it/s] 126it [00:13, 9.70it/s] 128it [00:13, 9.85it/s] 130it [00:13, 9.94it/s] 132it [00:13, 10.00it/s] 134it [00:13, 10.04it/s] 136it [00:14, 10.06it/s] 138it [00:14, 10.08it/s] 140it [00:14, 10.08it/s] 142it [00:14, 9.74it/s] 143it [00:14, 9.67it/s] 144it [00:14, 9.42it/s] 146it [00:15, 9.60it/s] 147it [00:15, 9.65it/s] 148it [00:15, 9.36it/s] 150it [00:15, 9.65it/s]2025-05-26 03:32:15,146 - INFO - [Epoch 050 | Batch 0150] IWAE-loss 5562.5117 | mean log_px -0.0343 | KL -3396.77 + 151it [00:15, 9.28it/s] 153it [00:15, 9.57it/s] 155it [00:16, 9.38it/s] 157it [00:16, 9.62it/s] 158it [00:16, 9.38it/s] 160it [00:16, 9.63it/s] 161it [00:16, 9.34it/s] 163it [00:16, 9.61it/s] 164it [00:17, 9.26it/s] 166it [00:17, 9.55it/s] 168it [00:17, 9.37it/s] 170it [00:17, 9.58it/s] 172it [00:17, 9.39it/s] 174it [00:18, 9.61it/s] 176it [00:18, 9.44it/s] 178it [00:18, 9.61it/s] 179it [00:18, 9.39it/s] 180it [00:18, 9.50it/s] 181it [00:18, 9.60it/s] 182it [00:18, 9.31it/s] 184it [00:19, 9.61it/s] 185it [00:19, 9.21it/s] 186it [00:19, 9.37it/s] 188it [00:19, 9.64it/s] 189it [00:19, 9.24it/s] 190it [00:19, 9.38it/s] 192it [00:20, 9.67it/s] 194it [00:20, 9.82it/s] 195it [00:20, 9.54it/s] 196it [00:20, 9.33it/s] 196it [00:20, 9.56it/s] +2025-05-26 03:32:20,016 - INFO - Epoch: 50, Objective: tensor([5149.9160], device='cuda:0', grad_fn=), Loss: 0.02591179683804512, KL/n: 69.36389923095703 + 0it [00:00, ?it/s]2025-05-26 03:32:20,297 - INFO - [Epoch 051 | Batch 0000] IWAE-loss 4607.3794 | mean log_px -0.0298 | KL -3396.73 + 1it [00:00, 5.30it/s] 2it [00:00, 7.15it/s] 4it [00:00, 8.75it/s] 5it [00:00, 8.66it/s] 6it [00:00, 9.01it/s] 8it [00:00, 9.47it/s] 9it [00:01, 9.59it/s] 10it [00:01, 9.68it/s] 11it [00:01, 9.70it/s] 13it [00:01, 9.85it/s] 14it [00:01, 9.86it/s] 16it [00:01, 9.95it/s] 17it [00:01, 9.96it/s] 18it [00:01, 9.97it/s] 20it [00:02, 10.00it/s] 21it [00:02, 9.52it/s] 23it [00:02, 9.72it/s] 24it [00:02, 9.77it/s] 26it [00:02, 9.89it/s] 28it [00:02, 9.95it/s] 29it [00:03, 9.96it/s] 30it [00:03, 9.96it/s] 32it [00:03, 10.00it/s] 34it [00:03, 10.00it/s] 36it [00:03, 10.02it/s] 38it [00:03, 10.03it/s] 40it [00:04, 9.68it/s] 42it [00:04, 9.79it/s] 43it [00:04, 9.42it/s] 44it [00:04, 9.29it/s] 45it [00:04, 9.12it/s] 46it [00:04, 8.83it/s] 47it [00:04, 9.03it/s] 48it [00:05, 9.18it/s] 49it [00:05, 9.32it/s] 50it [00:05, 9.40it/s]2025-05-26 03:32:25,459 - INFO - [Epoch 051 | Batch 0050] IWAE-loss 4357.4595 | mean log_px -0.0165 | KL -3393.12 + 51it [00:05, 9.06it/s] 52it [00:05, 9.23it/s] 53it [00:05, 9.01it/s] 54it [00:05, 9.13it/s] 55it [00:05, 9.31it/s] 56it [00:05, 9.24it/s] 57it [00:06, 8.63it/s] 58it [00:06, 8.42it/s] 59it [00:06, 8.61it/s] 60it [00:06, 8.86it/s] 61it [00:06, 8.99it/s] 62it [00:06, 9.11it/s] 63it [00:06, 9.20it/s] 64it [00:06, 9.30it/s] 65it [00:06, 9.32it/s] 66it [00:07, 8.86it/s] 67it [00:07, 9.09it/s] 68it [00:07, 9.17it/s] 69it [00:07, 9.29it/s] 70it [00:07, 8.90it/s] 71it [00:07, 9.12it/s] 72it [00:07, 9.25it/s] 73it [00:07, 8.88it/s] 74it [00:07, 9.07it/s] 75it [00:08, 9.21it/s] 76it [00:08, 8.85it/s] 77it [00:08, 9.03it/s] 78it [00:08, 9.17it/s] 79it [00:08, 9.29it/s] 80it [00:08, 8.85it/s] 81it [00:08, 9.07it/s] 82it [00:08, 9.19it/s] 83it [00:08, 9.32it/s] 84it [00:09, 8.88it/s] 85it [00:09, 9.08it/s] 86it [00:09, 9.20it/s] 87it [00:09, 8.76it/s] 88it [00:09, 8.87it/s] 89it [00:09, 9.06it/s] 90it [00:09, 9.13it/s] 91it [00:09, 8.77it/s] 92it [00:09, 8.96it/s] 93it [00:10, 9.16it/s] 94it [00:10, 9.28it/s] 95it [00:10, 8.88it/s] 96it [00:10, 9.11it/s] 97it [00:10, 9.21it/s] 98it [00:10, 9.29it/s] 99it [00:10, 8.89it/s] 100it [00:10, 9.03it/s]2025-05-26 03:32:30,993 - INFO - [Epoch 051 | Batch 0100] IWAE-loss 4766.6494 | mean log_px -0.0259 | KL -3393.81 + 101it [00:10, 9.22it/s] 102it [00:10, 9.30it/s] 103it [00:11, 8.88it/s] 104it [00:11, 9.05it/s] 105it [00:11, 8.76it/s] 106it [00:11, 8.94it/s] 107it [00:11, 9.18it/s] 108it [00:11, 9.20it/s] 109it [00:11, 9.23it/s] 110it [00:11, 9.32it/s] 111it [00:11, 9.39it/s] 112it [00:12, 9.41it/s] 113it [00:12, 9.46it/s] 114it [00:12, 9.48it/s] 115it [00:12, 9.51it/s] 116it [00:12, 9.52it/s] 117it [00:12, 9.53it/s] 118it [00:12, 9.49it/s] 119it [00:12, 9.50it/s] 120it [00:12, 9.36it/s] 121it [00:13, 9.45it/s] 122it [00:13, 8.93it/s] 123it [00:13, 9.10it/s] 124it [00:13, 9.23it/s] 125it [00:13, 9.30it/s] 126it [00:13, 9.33it/s] 127it [00:13, 9.41it/s] 128it [00:13, 9.45it/s] 129it [00:13, 9.44it/s] 130it [00:14, 8.97it/s] 131it [00:14, 9.14it/s] 132it [00:14, 9.23it/s] 133it [00:14, 9.33it/s] 134it [00:14, 9.38it/s] 135it [00:14, 9.40it/s] 136it [00:14, 9.45it/s] 137it [00:14, 9.49it/s] 138it [00:14, 9.51it/s] 139it [00:14, 9.47it/s] 140it [00:15, 9.49it/s] 141it [00:15, 8.89it/s] 142it [00:15, 9.07it/s] 143it [00:15, 9.20it/s] 144it [00:15, 9.29it/s] 145it [00:15, 9.34it/s] 146it [00:15, 9.44it/s] 147it [00:15, 9.51it/s] 148it [00:15, 9.50it/s] 149it [00:16, 9.50it/s] 150it [00:16, 9.48it/s]2025-05-26 03:32:36,355 - INFO - [Epoch 051 | Batch 0150] IWAE-loss 5195.3750 | mean log_px -0.0258 | KL -3389.90 + 151it [00:16, 8.96it/s] 152it [00:16, 9.13it/s] 153it [00:16, 9.26it/s] 154it [00:16, 9.33it/s] 155it [00:16, 9.26it/s] 156it [00:16, 8.81it/s] 157it [00:16, 9.06it/s] 158it [00:17, 9.21it/s] 159it [00:17, 9.33it/s] 160it [00:17, 9.43it/s] 161it [00:17, 9.51it/s] 162it [00:17, 9.56it/s] 163it [00:17, 9.54it/s] 164it [00:17, 9.54it/s] 165it [00:17, 9.50it/s] 166it [00:17, 9.55it/s] 167it [00:17, 9.09it/s] 168it [00:18, 9.21it/s] 169it [00:18, 9.33it/s] 170it [00:18, 9.45it/s] 171it [00:18, 9.46it/s] 172it [00:18, 9.49it/s] 173it [00:18, 9.50it/s] 174it [00:18, 9.58it/s] 175it [00:18, 9.00it/s] 176it [00:18, 9.16it/s] 177it [00:19, 9.30it/s] 178it [00:19, 9.41it/s] 179it [00:19, 9.46it/s] 180it [00:19, 9.45it/s] 181it [00:19, 9.46it/s] 182it [00:19, 9.53it/s] 183it [00:19, 9.60it/s] 184it [00:19, 9.62it/s] 185it [00:19, 9.59it/s] 186it [00:19, 9.56it/s] 187it [00:20, 9.61it/s] 188it [00:20, 9.64it/s] 189it [00:20, 9.59it/s] 190it [00:20, 9.59it/s] 191it [00:20, 9.16it/s] 192it [00:20, 9.18it/s] 193it [00:20, 9.26it/s] 194it [00:20, 9.30it/s] 195it [00:20, 8.81it/s] 196it [00:21, 9.07it/s] 196it [00:21, 9.28it/s] +2025-05-26 03:32:41,280 - INFO - Epoch: 51, Objective: tensor([5151.0229], device='cuda:0', grad_fn=), Loss: 0.03177899122238159, KL/n: 69.16956329345703 + 0it [00:00, ?it/s]2025-05-26 03:32:41,537 - INFO - [Epoch 052 | Batch 0000] IWAE-loss 4369.1685 | mean log_px -0.0140 | KL -3385.86 + 1it [00:00, 5.29it/s] 2it [00:00, 7.06it/s] 3it [00:00, 8.01it/s] 4it [00:00, 8.54it/s] 5it [00:00, 8.85it/s] 6it [00:00, 9.08it/s] 7it [00:00, 9.24it/s] 8it [00:00, 9.32it/s] 9it [00:01, 9.41it/s] 10it [00:01, 9.44it/s] 11it [00:01, 9.48it/s] 12it [00:01, 9.55it/s] 13it [00:01, 9.56it/s] 14it [00:01, 9.04it/s] 15it [00:01, 9.18it/s] 16it [00:01, 9.17it/s] 17it [00:01, 9.25it/s] 18it [00:01, 9.32it/s] 19it [00:02, 9.37it/s] 20it [00:02, 9.42it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.45it/s] 23it [00:02, 9.48it/s] 24it [00:02, 9.48it/s] 25it [00:02, 9.18it/s] 26it [00:02, 8.94it/s] 27it [00:02, 9.10it/s] 28it [00:03, 9.21it/s] 29it [00:03, 9.29it/s] 30it [00:03, 9.38it/s] 31it [00:03, 9.43it/s] 32it [00:03, 9.43it/s] 33it [00:03, 9.45it/s] 34it [00:03, 9.47it/s] 35it [00:03, 9.49it/s] 36it [00:03, 9.53it/s] 37it [00:04, 9.52it/s] 38it [00:04, 9.49it/s] 39it [00:04, 9.52it/s] 40it [00:04, 9.57it/s] 41it [00:04, 9.54it/s] 42it [00:04, 6.22it/s] 43it [00:04, 6.95it/s] 44it [00:04, 7.56it/s] 45it [00:05, 8.05it/s] 46it [00:05, 8.44it/s] 47it [00:05, 8.71it/s] 48it [00:05, 8.92it/s] 49it [00:05, 9.07it/s] 50it [00:05, 9.19it/s]2025-05-26 03:32:47,052 - INFO - [Epoch 052 | Batch 0050] IWAE-loss 4918.5332 | mean log_px -0.0245 | KL -3388.32 + 51it [00:05, 9.32it/s] 52it [00:05, 9.38it/s] 53it [00:05, 9.46it/s] 54it [00:05, 9.49it/s] 55it [00:06, 9.03it/s] 56it [00:06, 9.15it/s] 57it [00:06, 9.26it/s] 58it [00:06, 9.31it/s] 59it [00:06, 9.44it/s] 60it [00:06, 9.45it/s] 61it [00:06, 9.44it/s] 62it [00:06, 9.48it/s] 63it [00:06, 9.01it/s] 64it [00:07, 9.13it/s] 65it [00:07, 9.27it/s] 66it [00:07, 9.01it/s] 67it [00:07, 9.10it/s] 68it [00:07, 9.21it/s] 69it [00:07, 9.29it/s] 70it [00:07, 9.22it/s] 71it [00:07, 8.98it/s] 72it [00:07, 9.13it/s] 73it [00:08, 8.74it/s] 74it [00:08, 9.01it/s] 75it [00:08, 9.24it/s] 76it [00:08, 8.83it/s] 77it [00:08, 9.12it/s] 78it [00:08, 9.31it/s] 79it [00:08, 8.92it/s] 80it [00:08, 9.18it/s] 81it [00:08, 9.34it/s] 82it [00:09, 9.43it/s] 83it [00:09, 8.98it/s] 84it [00:09, 9.12it/s] 85it [00:09, 9.19it/s] 86it [00:09, 9.28it/s] 87it [00:09, 8.83it/s] 88it [00:09, 9.01it/s] 89it [00:09, 9.05it/s] 90it [00:09, 9.12it/s] 91it [00:10, 8.77it/s] 92it [00:10, 8.96it/s] 93it [00:10, 9.11it/s] 94it [00:10, 9.22it/s] 95it [00:10, 8.87it/s] 96it [00:10, 9.06it/s] 97it [00:10, 9.19it/s] 98it [00:10, 9.20it/s] 99it [00:10, 8.85it/s] 100it [00:11, 9.01it/s]2025-05-26 03:32:52,524 - INFO - [Epoch 052 | Batch 0100] IWAE-loss 4805.5391 | mean log_px -0.0203 | KL -3385.52 + 101it [00:11, 9.17it/s] 102it [00:11, 9.29it/s] 103it [00:11, 8.93it/s] 104it [00:11, 9.08it/s] 105it [00:11, 8.72it/s] 106it [00:11, 8.93it/s] 107it [00:11, 9.10it/s] 108it [00:11, 9.18it/s] 109it [00:12, 8.82it/s] 110it [00:12, 9.01it/s] 111it [00:12, 9.13it/s] 112it [00:12, 9.25it/s] 113it [00:12, 8.84it/s] 114it [00:12, 8.99it/s] 115it [00:12, 9.12it/s] 116it [00:12, 9.20it/s] 117it [00:12, 8.85it/s] 118it [00:13, 9.08it/s] 119it [00:13, 9.19it/s] 120it [00:13, 9.15it/s] 121it [00:13, 8.80it/s] 122it [00:13, 8.96it/s] 123it [00:13, 9.14it/s] 124it [00:13, 9.26it/s] 125it [00:13, 8.88it/s] 126it [00:13, 8.95it/s] 127it [00:14, 9.12it/s] 128it [00:14, 9.24it/s] 129it [00:14, 8.85it/s] 130it [00:14, 9.06it/s] 131it [00:14, 9.19it/s] 132it [00:14, 9.18it/s] 133it [00:14, 8.66it/s] 134it [00:14, 8.76it/s] 135it [00:14, 8.95it/s] 136it [00:15, 9.06it/s] 137it [00:15, 8.69it/s] 138it [00:15, 8.85it/s] 139it [00:15, 9.00it/s] 140it [00:15, 9.11it/s] 141it [00:15, 8.72it/s] 142it [00:15, 8.92it/s] 143it [00:15, 9.04it/s] 144it [00:15, 8.52it/s] 145it [00:16, 8.78it/s] 146it [00:16, 8.99it/s] 147it [00:16, 9.14it/s] 148it [00:16, 8.77it/s] 149it [00:16, 8.94it/s] 150it [00:16, 9.05it/s]2025-05-26 03:32:58,088 - INFO - [Epoch 052 | Batch 0150] IWAE-loss 5867.5352 | mean log_px -0.0419 | KL -3378.72 + 151it [00:16, 9.14it/s] 152it [00:16, 8.63it/s] 153it [00:16, 8.75it/s] 154it [00:17, 8.99it/s] 155it [00:17, 8.70it/s] 156it [00:17, 8.96it/s] 157it [00:17, 9.16it/s] 158it [00:17, 9.26it/s] 159it [00:17, 8.86it/s] 160it [00:17, 9.06it/s] 161it [00:17, 8.68it/s] 162it [00:17, 8.93it/s] 163it [00:18, 9.08it/s] 164it [00:18, 9.22it/s] 165it [00:18, 8.86it/s] 166it [00:18, 9.06it/s] 167it [00:18, 9.24it/s] 168it [00:18, 8.84it/s] 169it [00:18, 9.08it/s] 170it [00:18, 9.18it/s] 171it [00:18, 9.29it/s] 172it [00:19, 8.89it/s] 173it [00:19, 9.08it/s] 174it [00:19, 9.18it/s] 175it [00:19, 9.26it/s] 176it [00:19, 8.87it/s] 177it [00:19, 9.10it/s] 178it [00:19, 9.22it/s] 179it [00:19, 8.84it/s] 180it [00:19, 9.06it/s] 181it [00:20, 9.20it/s] 182it [00:20, 8.81it/s] 183it [00:20, 9.03it/s] 184it [00:20, 9.15it/s] 185it [00:20, 9.27it/s] 186it [00:20, 8.88it/s] 187it [00:20, 9.09it/s] 188it [00:20, 9.20it/s] 189it [00:20, 9.29it/s] 190it [00:21, 8.87it/s] 191it [00:21, 9.05it/s] 192it [00:21, 9.16it/s] 193it [00:21, 9.27it/s] 194it [00:21, 8.85it/s] 195it [00:21, 8.48it/s] 196it [00:21, 8.80it/s] 196it [00:21, 9.00it/s] +2025-05-26 03:33:03,201 - INFO - Epoch: 52, Objective: tensor([5528.3022], device='cuda:0', grad_fn=), Loss: 0.03874513879418373, KL/n: 69.0050048828125 + 0it [00:00, ?it/s]2025-05-26 03:33:03,483 - INFO - [Epoch 053 | Batch 0000] IWAE-loss 5155.4536 | mean log_px -0.0254 | KL -3377.25 + 1it [00:00, 4.61it/s] 2it [00:00, 6.56it/s] 3it [00:00, 7.66it/s] 4it [00:00, 8.26it/s] 5it [00:00, 8.65it/s] 6it [00:00, 8.94it/s] 7it [00:00, 9.14it/s] 8it [00:00, 9.27it/s] 9it [00:01, 9.38it/s] 10it [00:01, 9.42it/s] 11it [00:01, 9.44it/s] 12it [00:01, 9.43it/s] 13it [00:01, 9.52it/s] 14it [00:01, 9.50it/s] 15it [00:01, 9.54it/s] 16it [00:01, 9.55it/s] 17it [00:01, 9.60it/s] 18it [00:01, 9.60it/s] 19it [00:02, 9.61it/s] 20it [00:02, 9.64it/s] 21it [00:02, 9.68it/s] 22it [00:02, 9.69it/s] 23it [00:02, 9.67it/s] 24it [00:02, 9.63it/s] 25it [00:02, 9.57it/s] 26it [00:02, 9.60it/s] 27it [00:02, 9.65it/s] 28it [00:03, 9.58it/s] 29it [00:03, 9.59it/s] 30it [00:03, 9.59it/s] 31it [00:03, 9.56it/s] 32it [00:03, 9.56it/s] 33it [00:03, 9.58it/s] 34it [00:03, 9.58it/s] 35it [00:03, 9.58it/s] 36it [00:03, 9.55it/s] 37it [00:03, 9.56it/s] 38it [00:04, 9.53it/s] 39it [00:04, 9.56it/s] 40it [00:04, 9.55it/s] 41it [00:04, 9.58it/s] 42it [00:04, 9.57it/s] 43it [00:04, 9.32it/s] 44it [00:04, 9.00it/s] 45it [00:04, 9.18it/s] 46it [00:04, 9.30it/s] 47it [00:05, 8.86it/s] 48it [00:05, 9.02it/s] 49it [00:05, 9.19it/s] 50it [00:05, 9.26it/s]2025-05-26 03:33:08,782 - INFO - [Epoch 053 | Batch 0050] IWAE-loss 4669.8696 | mean log_px -0.0194 | KL -3377.31 + 51it [00:05, 8.86it/s] 52it [00:05, 9.06it/s] 53it [00:05, 9.22it/s] 54it [00:05, 8.87it/s] 55it [00:05, 9.09it/s] 56it [00:06, 9.16it/s] 57it [00:06, 9.23it/s] 58it [00:06, 9.33it/s] 59it [00:06, 9.38it/s] 60it [00:06, 9.40it/s] 61it [00:06, 9.47it/s] 62it [00:06, 9.49it/s] 63it [00:06, 9.52it/s] 64it [00:06, 9.53it/s] 65it [00:06, 9.60it/s] 66it [00:07, 9.61it/s] 67it [00:07, 9.64it/s] 68it [00:07, 9.59it/s] 69it [00:07, 9.56it/s] 70it [00:07, 9.56it/s] 71it [00:07, 9.60it/s] 72it [00:07, 9.60it/s] 73it [00:07, 9.24it/s] 74it [00:07, 9.36it/s] 75it [00:08, 9.48it/s] 76it [00:08, 9.53it/s] 77it [00:08, 9.55it/s] 78it [00:08, 9.54it/s] 79it [00:08, 9.60it/s] 80it [00:08, 9.59it/s] 81it [00:08, 9.57it/s] 82it [00:08, 9.57it/s] 83it [00:08, 9.56it/s] 84it [00:08, 9.59it/s] 85it [00:09, 9.57it/s] 86it [00:09, 9.57it/s] 87it [00:09, 9.59it/s] 88it [00:09, 9.58it/s] 89it [00:09, 9.62it/s] 90it [00:09, 9.56it/s] 91it [00:09, 9.60it/s] 92it [00:09, 9.58it/s] 93it [00:09, 9.58it/s] 94it [00:10, 9.55it/s] 95it [00:10, 9.55it/s] 96it [00:10, 9.51it/s] 97it [00:10, 9.53it/s] 98it [00:10, 9.56it/s] 99it [00:10, 9.57it/s] 100it [00:10, 9.58it/s]2025-05-26 03:33:14,055 - INFO - [Epoch 053 | Batch 0100] IWAE-loss 5013.9473 | mean log_px -0.0243 | KL -3370.79 + 101it [00:10, 9.60it/s] 102it [00:10, 9.64it/s] 103it [00:10, 9.60it/s] 104it [00:11, 9.56it/s] 105it [00:11, 9.54it/s] 106it [00:11, 8.97it/s] 107it [00:11, 9.14it/s] 108it [00:11, 9.26it/s] 109it [00:11, 9.35it/s] 110it [00:11, 9.39it/s] 111it [00:11, 9.46it/s] 112it [00:11, 9.50it/s] 113it [00:12, 9.12it/s] 114it [00:12, 9.23it/s] 115it [00:12, 9.35it/s] 116it [00:12, 9.38it/s] 117it [00:12, 9.48it/s] 118it [00:12, 9.46it/s] 119it [00:12, 9.09it/s] 120it [00:12, 9.22it/s] 121it [00:12, 9.08it/s] 122it [00:13, 9.06it/s] 123it [00:13, 9.21it/s] 124it [00:13, 9.37it/s] 125it [00:13, 9.47it/s] 126it [00:13, 9.56it/s] 127it [00:13, 9.55it/s] 128it [00:13, 9.41it/s] 129it [00:13, 9.14it/s] 130it [00:13, 9.20it/s] 131it [00:13, 9.24it/s] 132it [00:14, 8.58it/s] 133it [00:14, 8.80it/s] 134it [00:14, 8.95it/s] 135it [00:14, 9.10it/s] 136it [00:14, 9.33it/s] 137it [00:14, 8.95it/s] 138it [00:14, 9.22it/s] 139it [00:14, 9.43it/s] 141it [00:15, 9.73it/s] 142it [00:15, 9.38it/s] 144it [00:15, 9.66it/s] 146it [00:15, 9.80it/s] 148it [00:15, 9.90it/s] 150it [00:15, 9.95it/s]2025-05-26 03:33:19,373 - INFO - [Epoch 053 | Batch 0150] IWAE-loss 5491.2100 | mean log_px -0.0358 | KL -3374.70 + 152it [00:16, 9.98it/s] 154it [00:16, 10.00it/s] 156it [00:16, 10.03it/s] 158it [00:16, 10.05it/s] 160it [00:16, 10.05it/s] 162it [00:17, 10.06it/s] 164it [00:17, 10.05it/s] 166it [00:17, 10.05it/s] 168it [00:17, 10.05it/s] 170it [00:17, 10.05it/s] 172it [00:18, 10.05it/s] 174it [00:18, 9.79it/s] 176it [00:18, 9.88it/s] 178it [00:18, 9.93it/s] 180it [00:18, 9.98it/s] 182it [00:19, 10.00it/s] 184it [00:19, 10.02it/s] 186it [00:19, 9.68it/s] 187it [00:19, 9.60it/s] 188it [00:19, 9.54it/s] 189it [00:19, 9.54it/s] 191it [00:20, 9.73it/s] 192it [00:20, 9.79it/s] 193it [00:20, 9.34it/s] 194it [00:20, 9.48it/s] 195it [00:20, 9.14it/s] 196it [00:20, 9.46it/s] +2025-05-26 03:33:24,053 - INFO - Epoch: 53, Objective: tensor([5285.0635], device='cuda:0', grad_fn=), Loss: 0.031190963461995125, KL/n: 68.80663299560547 + 0it [00:00, ?it/s]2025-05-26 03:33:24,325 - INFO - [Epoch 054 | Batch 0000] IWAE-loss 4559.8145 | mean log_px -0.0225 | KL -3372.25 + 1it [00:00, 4.80it/s] 2it [00:00, 6.89it/s] 4it [00:00, 8.09it/s] 5it [00:00, 8.52it/s] 6it [00:00, 8.89it/s] 8it [00:00, 9.43it/s] 10it [00:01, 9.68it/s] 12it [00:01, 9.45it/s] 14it [00:01, 9.63it/s] 15it [00:01, 9.70it/s] 17it [00:01, 9.84it/s] 19it [00:02, 9.94it/s] 21it [00:02, 10.00it/s] 23it [00:02, 10.04it/s] 25it [00:02, 10.07it/s] 27it [00:02, 10.08it/s] 29it [00:03, 10.10it/s] 31it [00:03, 9.75it/s] 32it [00:03, 9.64it/s] 33it [00:03, 9.42it/s] 34it [00:03, 8.94it/s] 35it [00:03, 9.13it/s] 36it [00:03, 9.26it/s] 37it [00:03, 9.40it/s] 38it [00:04, 9.50it/s] 39it [00:04, 9.59it/s] 40it [00:04, 9.61it/s] 41it [00:04, 9.63it/s] 42it [00:04, 9.19it/s] 43it [00:04, 9.25it/s] 44it [00:04, 9.39it/s] 46it [00:04, 9.67it/s] 47it [00:04, 9.59it/s] 48it [00:05, 9.67it/s] 49it [00:05, 9.72it/s] 50it [00:05, 9.70it/s]2025-05-26 03:33:29,519 - INFO - [Epoch 054 | Batch 0050] IWAE-loss 4990.6138 | mean log_px -0.0290 | KL -3365.03 + 51it [00:05, 9.59it/s] 52it [00:05, 9.54it/s] 53it [00:05, 9.56it/s] 54it [00:05, 9.64it/s] 55it [00:05, 9.73it/s] 56it [00:05, 9.78it/s] 57it [00:05, 9.82it/s] 58it [00:06, 9.83it/s] 59it [00:06, 9.84it/s] 60it [00:06, 9.81it/s] 61it [00:06, 9.83it/s] 62it [00:06, 9.83it/s] 63it [00:06, 9.77it/s] 64it [00:06, 6.32it/s] 65it [00:06, 7.08it/s] 66it [00:07, 7.73it/s] 67it [00:07, 8.26it/s] 68it [00:07, 8.65it/s] 69it [00:07, 8.97it/s] 70it [00:07, 9.21it/s] 71it [00:07, 9.39it/s] 72it [00:07, 9.50it/s] 73it [00:07, 9.59it/s] 74it [00:07, 9.63it/s] 75it [00:08, 9.21it/s] 76it [00:08, 9.36it/s] 77it [00:08, 9.48it/s] 78it [00:08, 9.57it/s] 79it [00:08, 9.17it/s] 80it [00:08, 9.37it/s] 81it [00:08, 9.53it/s] 82it [00:08, 9.61it/s] 84it [00:08, 9.83it/s] 85it [00:09, 9.83it/s] 86it [00:09, 9.85it/s] 87it [00:09, 9.85it/s] 88it [00:09, 9.27it/s] 89it [00:09, 9.46it/s] 90it [00:09, 9.52it/s] 91it [00:09, 9.63it/s] 92it [00:09, 9.71it/s] 94it [00:09, 9.88it/s] 95it [00:10, 9.90it/s] 96it [00:10, 9.90it/s] 97it [00:10, 9.92it/s] 98it [00:10, 9.94it/s] 99it [00:10, 9.33it/s] 100it [00:10, 9.46it/s]2025-05-26 03:33:34,870 - INFO - [Epoch 054 | Batch 0100] IWAE-loss 5274.8164 | mean log_px -0.0305 | KL -3364.53 + 101it [00:10, 9.59it/s] 102it [00:10, 9.63it/s] 103it [00:10, 9.68it/s] 104it [00:11, 9.76it/s] 105it [00:11, 9.81it/s] 106it [00:11, 9.82it/s] 107it [00:11, 9.83it/s] 108it [00:11, 9.86it/s] 109it [00:11, 9.88it/s] 110it [00:11, 9.89it/s] 111it [00:11, 9.92it/s] 112it [00:11, 9.79it/s] 113it [00:11, 9.55it/s] 114it [00:12, 9.36it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.63it/s] 117it [00:12, 9.71it/s] 118it [00:12, 9.76it/s] 119it [00:12, 9.80it/s] 121it [00:12, 9.92it/s] 122it [00:12, 9.90it/s] 123it [00:12, 9.90it/s] 124it [00:13, 9.85it/s] 125it [00:13, 9.87it/s] 126it [00:13, 9.87it/s] 128it [00:13, 9.98it/s] 129it [00:13, 9.96it/s] 130it [00:13, 9.93it/s] 131it [00:13, 9.93it/s] 132it [00:13, 9.92it/s] 134it [00:14, 9.98it/s] 135it [00:14, 9.97it/s] 136it [00:14, 9.96it/s] 138it [00:14, 10.01it/s] 139it [00:14, 9.99it/s] 140it [00:14, 9.95it/s] 141it [00:14, 9.94it/s] 142it [00:14, 9.94it/s] 144it [00:15, 9.93it/s] 145it [00:15, 9.92it/s] 146it [00:15, 9.89it/s] 147it [00:15, 9.90it/s] 148it [00:15, 9.89it/s] 150it [00:15, 9.96it/s]2025-05-26 03:33:39,932 - INFO - [Epoch 054 | Batch 0150] IWAE-loss 4747.6250 | mean log_px -0.0197 | KL -3364.11 + 151it [00:15, 9.95it/s] 152it [00:15, 9.96it/s] 153it [00:15, 9.94it/s] 155it [00:16, 10.03it/s] 156it [00:16, 9.90it/s] 157it [00:16, 9.82it/s] 159it [00:16, 9.91it/s] 160it [00:16, 9.90it/s] 161it [00:16, 9.91it/s] 162it [00:16, 9.90it/s] 163it [00:16, 9.89it/s] 164it [00:17, 9.90it/s] 165it [00:17, 9.89it/s] 166it [00:17, 9.88it/s] 167it [00:17, 9.88it/s] 168it [00:17, 9.90it/s] 169it [00:17, 9.90it/s] 170it [00:17, 9.88it/s] 171it [00:17, 9.91it/s] 172it [00:17, 9.89it/s] 173it [00:18, 9.75it/s] 174it [00:18, 9.63it/s] 175it [00:18, 9.43it/s] 176it [00:18, 9.53it/s] 178it [00:18, 9.72it/s] 179it [00:18, 9.76it/s] 180it [00:18, 9.82it/s] 181it [00:18, 9.84it/s] 182it [00:18, 9.84it/s] 183it [00:19, 9.86it/s] 184it [00:19, 9.84it/s] 185it [00:19, 9.87it/s] 186it [00:19, 9.87it/s] 187it [00:19, 9.89it/s] 189it [00:19, 9.94it/s] 191it [00:19, 9.97it/s] 192it [00:19, 9.94it/s] 193it [00:20, 9.93it/s] 195it [00:20, 9.67it/s] 196it [00:20, 9.59it/s] +2025-05-26 03:33:44,614 - INFO - Epoch: 54, Objective: tensor([5742.4844], device='cuda:0', grad_fn=), Loss: 0.04035816341638565, KL/n: 68.60377502441406 + 0it [00:00, ?it/s]2025-05-26 03:33:44,901 - INFO - [Epoch 055 | Batch 0000] IWAE-loss 4954.8682 | mean log_px -0.0264 | KL -3363.76 + 1it [00:00, 5.21it/s] 2it [00:00, 7.20it/s] 4it [00:00, 8.80it/s] 6it [00:00, 9.35it/s] 7it [00:00, 9.49it/s] 8it [00:00, 9.60it/s] 10it [00:01, 9.80it/s] 12it [00:01, 9.91it/s] 14it [00:01, 9.98it/s] 15it [00:01, 9.98it/s] 17it [00:01, 10.05it/s] 19it [00:01, 10.08it/s] 21it [00:02, 10.09it/s] 23it [00:02, 10.06it/s] 25it [00:02, 10.08it/s] 27it [00:02, 10.06it/s] 29it [00:02, 10.03it/s] 31it [00:03, 10.03it/s] 33it [00:03, 10.07it/s] 35it [00:03, 10.08it/s] 37it [00:03, 10.07it/s] 39it [00:03, 10.09it/s] 41it [00:04, 10.06it/s] 43it [00:04, 10.09it/s] 45it [00:04, 10.07it/s] 47it [00:04, 10.09it/s] 49it [00:04, 10.11it/s]2025-05-26 03:33:49,869 - INFO - [Epoch 055 | Batch 0050] IWAE-loss 5218.8096 | mean log_px -0.0286 | KL -3357.67 + 51it [00:05, 10.04it/s] 53it [00:05, 10.04it/s] 55it [00:05, 10.06it/s] 57it [00:05, 10.08it/s] 59it [00:05, 10.10it/s] 61it [00:06, 10.11it/s] 63it [00:06, 10.10it/s] 65it [00:06, 10.09it/s] 67it [00:06, 10.08it/s] 69it [00:06, 10.06it/s] 71it [00:07, 9.98it/s] 73it [00:07, 10.02it/s] 75it [00:07, 10.03it/s] 77it [00:07, 10.05it/s] 79it [00:07, 10.02it/s] 81it [00:08, 10.00it/s] 83it [00:08, 10.04it/s] 85it [00:08, 10.05it/s] 87it [00:08, 10.03it/s] 89it [00:08, 10.00it/s] 91it [00:09, 10.04it/s] 93it [00:09, 9.98it/s] 94it [00:09, 9.95it/s] 96it [00:09, 10.00it/s] 97it [00:09, 9.95it/s] 98it [00:09, 9.94it/s] 100it [00:10, 10.00it/s]2025-05-26 03:33:54,856 - INFO - [Epoch 055 | Batch 0100] IWAE-loss 5689.7671 | mean log_px -0.0453 | KL -3352.47 + 101it [00:10, 10.00it/s] 103it [00:10, 10.04it/s] 105it [00:10, 10.07it/s] 107it [00:10, 9.99it/s] 109it [00:10, 10.02it/s] 111it [00:11, 10.06it/s] 113it [00:11, 10.06it/s] 115it [00:11, 10.08it/s] 117it [00:11, 10.07it/s] 119it [00:11, 10.08it/s] 121it [00:12, 10.08it/s] 123it [00:12, 10.08it/s] 125it [00:12, 10.10it/s] 127it [00:12, 10.10it/s] 129it [00:12, 10.10it/s] 131it [00:13, 10.13it/s] 133it [00:13, 10.13it/s] 135it [00:13, 10.05it/s] 137it [00:13, 10.06it/s] 139it [00:13, 10.08it/s] 141it [00:14, 10.06it/s] 143it [00:14, 9.82it/s] 144it [00:14, 9.77it/s] 145it [00:14, 9.81it/s] 146it [00:14, 9.85it/s] 148it [00:14, 9.95it/s] 150it [00:15, 9.97it/s]2025-05-26 03:33:59,844 - INFO - [Epoch 055 | Batch 0150] IWAE-loss 5461.5342 | mean log_px -0.0355 | KL -3352.60 + 151it [00:15, 9.96it/s] 153it [00:15, 9.99it/s] 154it [00:15, 9.96it/s] 156it [00:15, 10.01it/s] 158it [00:15, 10.04it/s] 160it [00:16, 9.98it/s] 162it [00:16, 10.02it/s] 164it [00:16, 10.03it/s] 166it [00:16, 10.03it/s] 168it [00:16, 10.02it/s] 170it [00:17, 10.06it/s] 172it [00:17, 10.07it/s] 174it [00:17, 10.10it/s] 176it [00:17, 10.09it/s] 178it [00:17, 10.08it/s] 180it [00:18, 10.09it/s] 182it [00:18, 10.04it/s] 184it [00:18, 10.02it/s] 186it [00:18, 9.99it/s] 187it [00:18, 9.99it/s] 189it [00:18, 10.03it/s] 191it [00:19, 10.07it/s] 193it [00:19, 10.10it/s] 195it [00:19, 9.85it/s] 196it [00:19, 9.96it/s] +2025-05-26 03:34:04,431 - INFO - Epoch: 55, Objective: tensor([5165.6812], device='cuda:0', grad_fn=), Loss: 0.03494435176253319, KL/n: 68.38105010986328 + 0it [00:00, ?it/s]2025-05-26 03:34:04,704 - INFO - [Epoch 056 | Batch 0000] IWAE-loss 4359.5181 | mean log_px -0.0144 | KL -3346.51 + 1it [00:00, 5.42it/s] 2it [00:00, 7.39it/s] 4it [00:00, 8.94it/s] 6it [00:00, 9.49it/s] 8it [00:00, 9.75it/s] 10it [00:01, 9.90it/s] 12it [00:01, 9.99it/s] 14it [00:01, 10.05it/s] 16it [00:01, 10.09it/s] 18it [00:01, 10.10it/s] 20it [00:02, 10.11it/s] 22it [00:02, 10.13it/s] 24it [00:02, 10.15it/s] 26it [00:02, 10.16it/s] 28it [00:02, 10.15it/s] 30it [00:03, 10.16it/s] 32it [00:03, 10.16it/s] 34it [00:03, 10.14it/s] 36it [00:03, 10.14it/s] 38it [00:03, 10.13it/s] 40it [00:04, 10.15it/s] 42it [00:04, 10.15it/s] 44it [00:04, 10.13it/s] 46it [00:04, 10.09it/s] 48it [00:04, 10.07it/s] 50it [00:05, 10.08it/s]2025-05-26 03:34:09,639 - INFO - [Epoch 056 | Batch 0050] IWAE-loss 7072.4180 | mean log_px -0.0646 | KL -3344.14 + 52it [00:05, 10.09it/s] 54it [00:05, 10.08it/s] 56it [00:05, 7.85it/s] 58it [00:05, 8.42it/s] 60it [00:06, 8.87it/s] 62it [00:06, 9.22it/s] 64it [00:06, 9.47it/s] 66it [00:06, 9.67it/s] 67it [00:06, 9.71it/s] 69it [00:07, 9.85it/s] 71it [00:07, 9.95it/s] 73it [00:07, 10.02it/s] 75it [00:07, 10.07it/s] 77it [00:07, 10.10it/s] 79it [00:08, 10.12it/s] 81it [00:08, 10.14it/s] 83it [00:08, 10.15it/s] 85it [00:08, 10.15it/s] 87it [00:08, 10.14it/s] 89it [00:09, 10.15it/s] 91it [00:09, 10.16it/s] 93it [00:09, 10.13it/s] 95it [00:09, 10.12it/s] 97it [00:09, 10.12it/s] 99it [00:10, 10.09it/s]2025-05-26 03:34:14,767 - INFO - [Epoch 056 | Batch 0100] IWAE-loss 4897.2031 | mean log_px -0.0227 | KL -3343.42 + 101it [00:10, 10.02it/s] 103it [00:10, 10.04it/s] 105it [00:10, 10.07it/s] 107it [00:10, 10.10it/s] 109it [00:11, 10.12it/s] 111it [00:11, 10.14it/s] 113it [00:11, 10.15it/s] 115it [00:11, 10.16it/s] 117it [00:11, 10.15it/s] 119it [00:12, 10.16it/s] 121it [00:12, 10.14it/s] 123it [00:12, 10.11it/s] 125it [00:12, 10.12it/s] 127it [00:12, 10.14it/s] 129it [00:13, 10.14it/s] 131it [00:13, 10.14it/s] 133it [00:13, 10.14it/s] 135it [00:13, 10.14it/s] 137it [00:13, 10.14it/s] 139it [00:13, 10.14it/s] 141it [00:14, 10.15it/s] 143it [00:14, 10.15it/s] 145it [00:14, 10.16it/s] 147it [00:14, 10.15it/s] 149it [00:14, 10.15it/s]2025-05-26 03:34:19,701 - INFO - [Epoch 056 | Batch 0150] IWAE-loss 4315.8975 | mean log_px -0.0143 | KL -3342.45 + 151it [00:15, 10.06it/s] 153it [00:15, 10.09it/s] 155it [00:15, 10.12it/s] 157it [00:15, 9.74it/s] 159it [00:15, 9.84it/s] 161it [00:16, 9.92it/s] 163it [00:16, 9.98it/s] 165it [00:16, 10.04it/s] 167it [00:16, 10.07it/s] 169it [00:16, 10.08it/s] 171it [00:17, 9.76it/s] 173it [00:17, 9.60it/s] 175it [00:17, 9.76it/s] 177it [00:17, 9.86it/s] 179it [00:18, 9.95it/s] 181it [00:18, 10.00it/s] 183it [00:18, 10.05it/s] 185it [00:18, 10.07it/s] 187it [00:18, 10.08it/s] 189it [00:18, 10.10it/s] 191it [00:19, 10.10it/s] 193it [00:19, 10.11it/s] 195it [00:19, 9.61it/s] 196it [00:19, 9.91it/s] +2025-05-26 03:34:24,348 - INFO - Epoch: 56, Objective: tensor([5050.2954], device='cuda:0', grad_fn=), Loss: 0.02728617750108242, KL/n: 68.18730926513672 + 0it [00:00, ?it/s]2025-05-26 03:34:24,616 - INFO - [Epoch 057 | Batch 0000] IWAE-loss 4560.9824 | mean log_px -0.0185 | KL -3340.02 + 1it [00:00, 4.84it/s] 2it [00:00, 6.90it/s] 4it [00:00, 8.60it/s] 6it [00:00, 9.24it/s] 8it [00:00, 9.58it/s] 10it [00:01, 9.75it/s] 12it [00:01, 9.84it/s] 14it [00:01, 9.90it/s] 15it [00:01, 9.90it/s] 16it [00:01, 9.76it/s] 17it [00:01, 9.74it/s] 19it [00:02, 9.90it/s] 21it [00:02, 9.97it/s] 23it [00:02, 10.03it/s] 25it [00:02, 10.07it/s] 27it [00:02, 10.08it/s] 29it [00:02, 10.07it/s] 31it [00:03, 10.08it/s] 33it [00:03, 10.09it/s] 35it [00:03, 10.10it/s] 37it [00:03, 10.10it/s] 39it [00:04, 9.77it/s] 40it [00:04, 9.80it/s] 42it [00:04, 9.53it/s] 44it [00:04, 9.70it/s] 46it [00:04, 9.55it/s] 48it [00:04, 9.71it/s] 50it [00:05, 9.81it/s]2025-05-26 03:34:29,684 - INFO - [Epoch 057 | Batch 0050] IWAE-loss 4015.7031 | mean log_px -0.0109 | KL -3334.84 + 52it [00:05, 9.89it/s] 54it [00:05, 9.96it/s] 56it [00:05, 10.02it/s] 58it [00:05, 9.95it/s] 59it [00:06, 9.83it/s] 60it [00:06, 9.21it/s] 61it [00:06, 9.20it/s] 62it [00:06, 9.25it/s] 63it [00:06, 9.31it/s] 64it [00:06, 9.31it/s] 65it [00:06, 9.35it/s] 66it [00:06, 9.37it/s] 67it [00:06, 9.40it/s] 68it [00:07, 9.36it/s] 69it [00:07, 8.81it/s] 70it [00:07, 9.05it/s] 71it [00:07, 9.08it/s] 72it [00:07, 9.14it/s] 73it [00:07, 8.73it/s] 74it [00:07, 8.92it/s] 75it [00:07, 9.06it/s] 76it [00:07, 9.14it/s] 77it [00:08, 9.17it/s] 78it [00:08, 9.23it/s] 79it [00:08, 9.30it/s] 80it [00:08, 9.32it/s] 81it [00:08, 9.35it/s] 82it [00:08, 9.37it/s] 83it [00:08, 9.40it/s] 84it [00:08, 9.42it/s] 85it [00:08, 9.44it/s] 86it [00:08, 9.43it/s] 87it [00:09, 9.03it/s] 88it [00:09, 9.14it/s] 89it [00:09, 9.24it/s] 90it [00:09, 9.38it/s] 91it [00:09, 9.22it/s] 92it [00:09, 9.38it/s] 93it [00:09, 9.53it/s] 94it [00:09, 9.58it/s] 95it [00:09, 9.65it/s] 96it [00:10, 9.69it/s] 97it [00:10, 9.75it/s] 98it [00:10, 9.28it/s] 99it [00:10, 9.45it/s] 100it [00:10, 9.60it/s]2025-05-26 03:34:35,022 - INFO - [Epoch 057 | Batch 0100] IWAE-loss 4555.8833 | mean log_px -0.0193 | KL -3332.19 + 101it [00:10, 9.03it/s] 102it [00:10, 9.25it/s] 103it [00:10, 9.43it/s] 104it [00:10, 9.54it/s] 105it [00:11, 9.13it/s] 106it [00:11, 9.33it/s] 107it [00:11, 9.51it/s] 108it [00:11, 9.06it/s] 109it [00:11, 9.27it/s] 110it [00:11, 9.42it/s] 111it [00:11, 9.54it/s] 112it [00:11, 9.64it/s] 113it [00:11, 9.68it/s] 114it [00:11, 9.72it/s] 115it [00:12, 9.17it/s] 116it [00:12, 9.32it/s] 117it [00:12, 9.42it/s] 118it [00:12, 9.47it/s] 119it [00:12, 9.07it/s] 120it [00:12, 9.26it/s] 121it [00:12, 9.39it/s] 122it [00:12, 9.01it/s] 123it [00:12, 9.21it/s] 124it [00:13, 9.10it/s] 125it [00:13, 9.23it/s] 126it [00:13, 8.77it/s] 127it [00:13, 8.98it/s] 128it [00:13, 9.12it/s] 129it [00:13, 9.28it/s] 130it [00:13, 9.36it/s] 131it [00:13, 8.98it/s] 132it [00:13, 9.16it/s] 133it [00:14, 9.30it/s] 134it [00:14, 9.41it/s] 135it [00:14, 9.47it/s] 136it [00:14, 8.95it/s] 137it [00:14, 9.08it/s] 138it [00:14, 9.22it/s] 139it [00:14, 9.27it/s] 140it [00:14, 9.35it/s] 141it [00:14, 9.38it/s] 142it [00:15, 9.40it/s] 143it [00:15, 9.44it/s] 144it [00:15, 9.43it/s] 145it [00:15, 9.44it/s] 146it [00:15, 9.41it/s] 147it [00:15, 9.41it/s] 148it [00:15, 8.92it/s] 149it [00:15, 9.09it/s] 150it [00:15, 9.19it/s]2025-05-26 03:34:40,424 - INFO - [Epoch 057 | Batch 0150] IWAE-loss 4984.7964 | mean log_px -0.0261 | KL -3333.72 + 151it [00:15, 9.19it/s] 152it [00:16, 9.24it/s] 153it [00:16, 9.29it/s] 154it [00:16, 9.35it/s] 155it [00:16, 8.79it/s] 156it [00:16, 8.96it/s] 157it [00:16, 9.04it/s] 158it [00:16, 9.11it/s] 159it [00:16, 9.21it/s] 160it [00:16, 9.24it/s] 161it [00:17, 9.31it/s] 162it [00:17, 9.32it/s] 163it [00:17, 8.93it/s] 164it [00:17, 9.07it/s] 165it [00:17, 9.22it/s] 166it [00:17, 9.27it/s] 167it [00:17, 9.36it/s] 168it [00:17, 9.41it/s] 169it [00:17, 9.48it/s] 170it [00:18, 9.50it/s] 171it [00:18, 9.48it/s] 172it [00:18, 8.92it/s] 173it [00:18, 9.08it/s] 174it [00:18, 9.21it/s] 175it [00:18, 9.31it/s] 176it [00:18, 9.39it/s] 177it [00:18, 9.45it/s] 178it [00:18, 9.00it/s] 179it [00:19, 9.15it/s] 180it [00:19, 9.27it/s] 181it [00:19, 9.37it/s] 182it [00:19, 9.37it/s] 183it [00:19, 9.34it/s] 184it [00:19, 9.31it/s] 185it [00:19, 9.32it/s] 186it [00:19, 9.35it/s] 187it [00:19, 9.38it/s] 188it [00:19, 9.35it/s] 189it [00:20, 9.36it/s] 190it [00:20, 8.61it/s] 191it [00:20, 8.80it/s] 192it [00:20, 8.93it/s] 193it [00:20, 9.04it/s] 194it [00:20, 9.19it/s] 195it [00:20, 8.73it/s] 196it [00:20, 9.03it/s] 196it [00:20, 9.36it/s] +2025-05-26 03:34:45,428 - INFO - Epoch: 57, Objective: tensor([5603.3149], device='cuda:0', grad_fn=), Loss: 0.03557281568646431, KL/n: 67.98454284667969 + 0it [00:00, ?it/s]2025-05-26 03:34:45,698 - INFO - [Epoch 058 | Batch 0000] IWAE-loss 4603.7197 | mean log_px -0.0217 | KL -3329.28 + 1it [00:00, 5.41it/s] 2it [00:00, 7.24it/s] 3it [00:00, 8.18it/s] 4it [00:00, 8.72it/s] 5it [00:00, 9.00it/s] 6it [00:00, 9.19it/s] 7it [00:00, 9.30it/s] 8it [00:00, 9.36it/s] 9it [00:01, 9.43it/s] 10it [00:01, 9.46it/s] 11it [00:01, 9.49it/s] 12it [00:01, 9.51it/s] 13it [00:01, 9.49it/s] 14it [00:01, 9.49it/s] 15it [00:01, 9.52it/s] 16it [00:01, 9.54it/s] 17it [00:01, 9.53it/s] 18it [00:01, 9.52it/s] 19it [00:02, 9.56it/s] 20it [00:02, 9.54it/s] 21it [00:02, 9.54it/s] 22it [00:02, 9.54it/s] 23it [00:02, 9.50it/s] 24it [00:02, 9.55it/s] 25it [00:02, 9.50it/s] 26it [00:02, 9.51it/s] 27it [00:02, 9.45it/s] 28it [00:03, 9.48it/s] 29it [00:03, 9.50it/s] 30it [00:03, 9.54it/s] 31it [00:03, 8.84it/s] 32it [00:03, 9.04it/s] 33it [00:03, 9.18it/s] 34it [00:03, 9.24it/s] 35it [00:03, 9.37it/s] 36it [00:03, 9.42it/s] 37it [00:03, 9.46it/s] 38it [00:04, 8.95it/s] 39it [00:04, 9.12it/s] 40it [00:04, 9.26it/s] 41it [00:04, 9.38it/s] 42it [00:04, 9.44it/s] 43it [00:04, 9.46it/s] 44it [00:04, 9.45it/s] 45it [00:04, 8.93it/s] 46it [00:04, 9.07it/s] 47it [00:05, 9.21it/s] 48it [00:05, 9.30it/s] 49it [00:05, 9.38it/s] 50it [00:05, 6.17it/s]2025-05-26 03:34:51,197 - INFO - [Epoch 058 | Batch 0050] IWAE-loss 4924.8784 | mean log_px -0.0293 | KL -3323.80 + 51it [00:05, 6.90it/s] 52it [00:05, 7.50it/s] 53it [00:05, 8.03it/s] 54it [00:05, 8.42it/s] 55it [00:06, 8.76it/s] 56it [00:06, 8.95it/s] 57it [00:06, 9.12it/s] 58it [00:06, 9.20it/s] 59it [00:06, 9.28it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.37it/s] 62it [00:06, 9.41it/s] 63it [00:06, 9.47it/s] 64it [00:07, 9.45it/s] 65it [00:07, 9.48it/s] 66it [00:07, 9.44it/s] 67it [00:07, 9.50it/s] 68it [00:07, 9.48it/s] 69it [00:07, 9.41it/s] 70it [00:07, 9.39it/s] 71it [00:07, 9.47it/s] 72it [00:07, 9.45it/s] 73it [00:08, 9.49it/s] 74it [00:08, 9.50it/s] 75it [00:08, 9.53it/s] 76it [00:08, 9.50it/s] 77it [00:08, 9.50it/s] 78it [00:08, 9.49it/s] 79it [00:08, 9.47it/s] 80it [00:08, 9.52it/s] 81it [00:08, 9.53it/s] 82it [00:08, 9.50it/s] 83it [00:09, 9.50it/s] 84it [00:09, 9.48it/s] 85it [00:09, 9.51it/s] 86it [00:09, 9.47it/s] 87it [00:09, 9.50it/s] 88it [00:09, 9.53it/s] 89it [00:09, 9.56it/s] 90it [00:09, 9.50it/s] 91it [00:09, 9.54it/s] 92it [00:10, 8.97it/s] 93it [00:10, 9.12it/s] 94it [00:10, 9.14it/s] 95it [00:10, 9.22it/s] 96it [00:10, 9.29it/s] 97it [00:10, 9.32it/s] 98it [00:10, 9.35it/s] 99it [00:10, 8.83it/s] 100it [00:10, 8.96it/s]2025-05-26 03:34:56,517 - INFO - [Epoch 058 | Batch 0100] IWAE-loss 4599.8813 | mean log_px -0.0212 | KL -3328.67 + 101it [00:11, 9.12it/s] 102it [00:11, 9.22it/s] 103it [00:11, 9.28it/s] 104it [00:11, 9.31it/s] 105it [00:11, 9.36it/s] 106it [00:11, 9.43it/s] 107it [00:11, 9.39it/s] 108it [00:11, 9.39it/s] 109it [00:11, 9.39it/s] 110it [00:11, 8.94it/s] 111it [00:12, 9.08it/s] 112it [00:12, 9.15it/s] 113it [00:12, 9.21it/s] 114it [00:12, 9.23it/s] 115it [00:12, 9.23it/s] 116it [00:12, 9.24it/s] 117it [00:12, 9.29it/s] 118it [00:12, 9.35it/s] 119it [00:12, 9.40it/s] 120it [00:13, 9.36it/s] 121it [00:13, 9.39it/s] 122it [00:13, 9.43it/s] 123it [00:13, 9.43it/s] 124it [00:13, 9.50it/s] 125it [00:13, 9.53it/s] 126it [00:13, 9.47it/s] 127it [00:13, 9.48it/s] 128it [00:13, 9.44it/s] 129it [00:13, 9.50it/s] 130it [00:14, 8.95it/s] 131it [00:14, 9.12it/s] 132it [00:14, 8.70it/s] 133it [00:14, 8.94it/s] 134it [00:14, 9.12it/s] 135it [00:14, 9.23it/s] 136it [00:14, 9.15it/s] 137it [00:14, 8.67it/s] 138it [00:15, 8.77it/s] 139it [00:15, 8.96it/s] 140it [00:15, 9.01it/s] 141it [00:15, 8.64it/s] 142it [00:15, 8.84it/s] 143it [00:15, 9.01it/s] 144it [00:15, 9.13it/s] 145it [00:15, 8.75it/s] 146it [00:15, 8.85it/s] 147it [00:16, 8.99it/s] 148it [00:16, 9.12it/s] 149it [00:16, 8.72it/s] 150it [00:16, 8.73it/s]2025-05-26 03:35:01,995 - INFO - [Epoch 058 | Batch 0150] IWAE-loss 4261.2881 | mean log_px -0.0143 | KL -3324.48 + 151it [00:16, 8.66it/s] 152it [00:16, 8.18it/s] 153it [00:16, 8.49it/s] 154it [00:16, 8.69it/s] 155it [00:16, 8.94it/s] 156it [00:17, 9.11it/s] 157it [00:17, 9.26it/s] 158it [00:17, 9.36it/s] 159it [00:17, 9.42it/s] 160it [00:17, 9.47it/s] 161it [00:17, 9.05it/s] 162it [00:17, 9.21it/s] 163it [00:17, 9.31it/s] 164it [00:17, 8.89it/s] 165it [00:18, 9.06it/s] 166it [00:18, 9.23it/s] 167it [00:18, 9.31it/s] 168it [00:18, 9.37it/s] 169it [00:18, 9.34it/s] 170it [00:18, 9.38it/s] 171it [00:18, 9.46it/s] 172it [00:18, 9.47it/s] 173it [00:18, 9.46it/s] 174it [00:18, 9.47it/s] 175it [00:19, 9.50it/s] 176it [00:19, 9.55it/s] 177it [00:19, 9.09it/s] 178it [00:19, 9.23it/s] 179it [00:19, 9.27it/s] 180it [00:19, 9.34it/s] 181it [00:19, 9.43it/s] 182it [00:19, 9.46it/s] 183it [00:19, 8.92it/s] 184it [00:20, 9.13it/s] 185it [00:20, 9.27it/s] 186it [00:20, 9.31it/s] 187it [00:20, 8.86it/s] 188it [00:20, 9.06it/s] 189it [00:20, 9.23it/s] 190it [00:20, 9.25it/s] 191it [00:20, 9.36it/s] 192it [00:20, 8.97it/s] 193it [00:21, 9.17it/s] 194it [00:21, 9.26it/s] 195it [00:21, 8.30it/s] 196it [00:21, 8.67it/s] 196it [00:21, 9.13it/s] +2025-05-26 03:35:07,020 - INFO - Epoch: 58, Objective: tensor([4525.3076], device='cuda:0', grad_fn=), Loss: 0.021634532138705254, KL/n: 67.80258178710938 + 0it [00:00, ?it/s]2025-05-26 03:35:07,308 - INFO - [Epoch 059 | Batch 0000] IWAE-loss 4513.4170 | mean log_px -0.0270 | KL -3325.71 + 1it [00:00, 4.92it/s] 2it [00:00, 6.28it/s] 3it [00:00, 7.44it/s] 4it [00:00, 8.13it/s] 5it [00:00, 8.59it/s] 6it [00:00, 8.35it/s] 7it [00:00, 8.68it/s] 8it [00:00, 8.91it/s] 9it [00:01, 9.17it/s] 10it [00:01, 8.88it/s] 11it [00:01, 9.04it/s] 12it [00:01, 9.17it/s] 13it [00:01, 8.77it/s] 14it [00:01, 9.02it/s] 15it [00:01, 9.14it/s] 16it [00:01, 9.26it/s] 17it [00:01, 9.37it/s] 18it [00:02, 9.31it/s] 19it [00:02, 9.34it/s] 20it [00:02, 9.40it/s] 21it [00:02, 9.45it/s] 22it [00:02, 8.70it/s] 23it [00:02, 8.95it/s] 24it [00:02, 9.06it/s] 25it [00:02, 9.25it/s] 26it [00:02, 9.39it/s] 27it [00:03, 9.40it/s] 28it [00:03, 9.36it/s] 29it [00:03, 9.43it/s] 30it [00:03, 9.47it/s] 31it [00:03, 9.54it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.48it/s] 34it [00:03, 9.53it/s] 35it [00:03, 9.51it/s] 36it [00:03, 9.44it/s] 37it [00:04, 9.44it/s] 38it [00:04, 9.38it/s] 39it [00:04, 8.80it/s] 40it [00:04, 8.93it/s] 41it [00:04, 8.88it/s] 42it [00:04, 8.83it/s] 43it [00:04, 8.84it/s] 44it [00:04, 9.05it/s] 45it [00:05, 9.13it/s] 46it [00:05, 9.21it/s] 47it [00:05, 9.27it/s] 48it [00:05, 9.32it/s] 49it [00:05, 9.39it/s] 50it [00:05, 9.45it/s]2025-05-26 03:35:12,739 - INFO - [Epoch 059 | Batch 0050] IWAE-loss 4204.3833 | mean log_px -0.0140 | KL -3318.27 + 51it [00:05, 9.50it/s] 52it [00:05, 9.52it/s] 53it [00:05, 9.49it/s] 54it [00:05, 9.54it/s] 55it [00:06, 9.56it/s] 56it [00:06, 9.55it/s] 57it [00:06, 9.51it/s] 58it [00:06, 9.51it/s] 59it [00:06, 9.56it/s] 60it [00:06, 9.54it/s] 61it [00:06, 9.52it/s] 62it [00:06, 9.53it/s] 63it [00:06, 9.53it/s] 64it [00:07, 9.27it/s] 65it [00:07, 8.83it/s] 66it [00:07, 8.98it/s] 67it [00:07, 9.09it/s] 68it [00:07, 9.26it/s] 69it [00:07, 9.31it/s] 70it [00:07, 9.39it/s] 71it [00:07, 9.47it/s] 72it [00:07, 9.45it/s] 73it [00:07, 9.52it/s] 74it [00:08, 9.51it/s] 75it [00:08, 8.83it/s] 76it [00:08, 8.96it/s] 77it [00:08, 9.13it/s] 78it [00:08, 9.31it/s] 79it [00:08, 9.40it/s] 80it [00:08, 9.46it/s] 81it [00:08, 9.50it/s] 82it [00:08, 9.52it/s] 83it [00:09, 9.55it/s] 84it [00:09, 8.97it/s] 85it [00:09, 9.13it/s] 86it [00:09, 9.25it/s] 87it [00:09, 9.37it/s] 88it [00:09, 9.39it/s] 89it [00:09, 9.04it/s] 90it [00:09, 9.18it/s] 91it [00:09, 9.27it/s] 92it [00:10, 9.36it/s] 93it [00:10, 9.39it/s] 94it [00:10, 9.43it/s] 95it [00:10, 9.52it/s] 96it [00:10, 9.53it/s] 97it [00:10, 9.12it/s] 98it [00:10, 9.22it/s] 99it [00:10, 9.31it/s] 100it [00:10, 9.38it/s]2025-05-26 03:35:18,092 - INFO - [Epoch 059 | Batch 0100] IWAE-loss 4880.2090 | mean log_px -0.0276 | KL -3318.33 + 101it [00:10, 9.45it/s] 102it [00:11, 9.49it/s] 103it [00:11, 9.45it/s] 104it [00:11, 9.50it/s] 105it [00:11, 9.41it/s] 106it [00:11, 9.39it/s] 107it [00:11, 9.46it/s] 108it [00:11, 9.47it/s] 109it [00:11, 9.46it/s] 110it [00:11, 9.49it/s] 111it [00:12, 9.44it/s] 112it [00:12, 8.92it/s] 113it [00:12, 9.09it/s] 114it [00:12, 9.17it/s] 115it [00:12, 9.22it/s] 116it [00:12, 9.33it/s] 117it [00:12, 9.35it/s] 118it [00:12, 9.38it/s] 119it [00:12, 9.41it/s] 120it [00:13, 9.41it/s] 121it [00:13, 9.41it/s] 122it [00:13, 9.43it/s] 123it [00:13, 9.46it/s] 124it [00:13, 9.45it/s] 125it [00:13, 9.47it/s] 126it [00:13, 8.90it/s] 127it [00:13, 9.10it/s] 128it [00:13, 9.17it/s] 129it [00:13, 9.27it/s] 130it [00:14, 9.35it/s] 131it [00:14, 9.39it/s] 132it [00:14, 9.39it/s] 133it [00:14, 9.39it/s] 134it [00:14, 8.91it/s] 135it [00:14, 9.09it/s] 136it [00:14, 9.20it/s] 137it [00:14, 9.27it/s] 138it [00:14, 9.33it/s] 139it [00:15, 9.43it/s] 140it [00:15, 8.90it/s] 141it [00:15, 9.07it/s] 142it [00:15, 9.16it/s] 143it [00:15, 9.31it/s] 144it [00:15, 9.32it/s] 145it [00:15, 9.44it/s] 146it [00:15, 9.47it/s] 147it [00:15, 9.43it/s] 148it [00:16, 9.40it/s] 149it [00:16, 9.50it/s] 150it [00:16, 9.50it/s]2025-05-26 03:35:23,453 - INFO - [Epoch 059 | Batch 0150] IWAE-loss 4119.4390 | mean log_px -0.0125 | KL -3316.20 + 151it [00:16, 9.54it/s] 152it [00:16, 9.57it/s] 153it [00:16, 9.52it/s] 154it [00:16, 9.51it/s] 155it [00:16, 9.51it/s] 156it [00:16, 9.48it/s] 157it [00:16, 9.54it/s] 158it [00:17, 9.49it/s] 159it [00:17, 9.47it/s] 160it [00:17, 9.47it/s] 161it [00:17, 9.55it/s] 162it [00:17, 9.61it/s] 163it [00:17, 9.53it/s] 164it [00:17, 9.54it/s] 165it [00:17, 9.52it/s] 166it [00:17, 9.54it/s] 167it [00:18, 9.60it/s] 168it [00:18, 9.55it/s] 169it [00:18, 9.00it/s] 170it [00:18, 9.12it/s] 171it [00:18, 9.28it/s] 172it [00:18, 9.37it/s] 173it [00:18, 8.87it/s] 174it [00:18, 9.06it/s] 175it [00:18, 9.23it/s] 176it [00:19, 9.35it/s] 177it [00:19, 9.43it/s] 178it [00:19, 8.90it/s] 179it [00:19, 9.10it/s] 180it [00:19, 9.28it/s] 181it [00:19, 9.34it/s] 182it [00:19, 9.40it/s] 183it [00:19, 9.46it/s] 184it [00:19, 9.45it/s] 185it [00:19, 9.51it/s] 186it [00:20, 9.46it/s] 187it [00:20, 9.47it/s] 188it [00:20, 9.51it/s] 189it [00:20, 9.53it/s] 190it [00:20, 9.58it/s] 191it [00:20, 9.00it/s] 192it [00:20, 9.11it/s] 193it [00:20, 9.23it/s] 194it [00:20, 9.36it/s] 195it [00:21, 8.82it/s] 196it [00:21, 9.04it/s] 196it [00:21, 9.23it/s] +2025-05-26 03:35:28,377 - INFO - Epoch: 59, Objective: tensor([5065.8369], device='cuda:0', grad_fn=), Loss: 0.029969044029712677, KL/n: 67.60353088378906 + 0it [00:00, ?it/s]2025-05-26 03:35:28,691 - INFO - [Epoch 060 | Batch 0000] IWAE-loss 5187.5234 | mean log_px -0.0315 | KL -3310.47 + 1it [00:00, 4.03it/s] 2it [00:00, 6.05it/s] 3it [00:00, 7.24it/s] 4it [00:00, 7.97it/s] 5it [00:00, 8.44it/s] 6it [00:00, 8.79it/s] 7it [00:00, 9.04it/s] 8it [00:00, 8.86it/s] 9it [00:01, 9.00it/s] 10it [00:01, 9.06it/s] 11it [00:01, 9.21it/s] 12it [00:01, 9.33it/s] 13it [00:01, 9.40it/s] 14it [00:01, 9.44it/s] 15it [00:01, 9.45it/s] 16it [00:01, 9.49it/s] 17it [00:01, 9.43it/s] 18it [00:02, 9.44it/s] 19it [00:02, 9.12it/s] 20it [00:02, 9.20it/s] 21it [00:02, 9.28it/s] 22it [00:02, 9.36it/s] 23it [00:02, 9.39it/s] 24it [00:02, 9.26it/s] 25it [00:02, 9.33it/s] 26it [00:02, 9.26it/s] 27it [00:03, 9.37it/s] 28it [00:03, 9.44it/s] 29it [00:03, 9.46it/s] 30it [00:03, 9.11it/s] 31it [00:03, 9.21it/s] 32it [00:03, 9.29it/s] 33it [00:03, 9.31it/s] 34it [00:03, 9.39it/s] 35it [00:03, 9.44it/s] 36it [00:03, 9.48it/s] 37it [00:04, 9.51it/s] 38it [00:04, 9.52it/s] 39it [00:04, 8.97it/s] 40it [00:04, 9.10it/s] 41it [00:04, 9.22it/s] 42it [00:04, 9.18it/s] 43it [00:04, 8.59it/s] 44it [00:05, 5.80it/s] 45it [00:05, 6.56it/s] 46it [00:05, 6.91it/s] 47it [00:05, 7.54it/s] 48it [00:05, 8.06it/s] 49it [00:05, 8.47it/s] 50it [00:05, 8.75it/s]2025-05-26 03:35:34,311 - INFO - [Epoch 060 | Batch 0050] IWAE-loss 4562.0859 | mean log_px -0.0215 | KL -3308.93 + 51it [00:05, 8.94it/s] 52it [00:05, 9.07it/s] 53it [00:06, 9.23it/s] 54it [00:06, 9.24it/s] 55it [00:06, 9.32it/s] 56it [00:06, 9.23it/s] 57it [00:06, 9.26it/s] 58it [00:06, 9.26it/s] 59it [00:06, 9.29it/s] 60it [00:06, 9.38it/s] 61it [00:06, 9.42it/s] 62it [00:07, 9.46it/s] 63it [00:07, 9.47it/s] 64it [00:07, 9.48it/s] 65it [00:07, 9.51it/s] 66it [00:07, 9.45it/s] 67it [00:07, 9.49it/s] 68it [00:07, 9.50it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.49it/s] 71it [00:07, 9.02it/s] 72it [00:08, 9.14it/s] 73it [00:08, 9.27it/s] 74it [00:08, 9.31it/s] 75it [00:08, 9.37it/s] 76it [00:08, 9.40it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.45it/s] 79it [00:08, 9.48it/s] 80it [00:08, 9.00it/s] 81it [00:09, 9.15it/s] 82it [00:09, 9.22it/s] 83it [00:09, 9.32it/s] 84it [00:09, 9.38it/s] 85it [00:09, 9.40it/s] 86it [00:09, 9.50it/s] 87it [00:09, 9.51it/s] 88it [00:09, 9.53it/s] 89it [00:09, 9.52it/s] 90it [00:09, 9.53it/s] 91it [00:10, 9.54it/s] 92it [00:10, 9.55it/s] 93it [00:10, 9.53it/s] 94it [00:10, 9.50it/s] 95it [00:10, 9.52it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.51it/s] 98it [00:10, 9.51it/s] 99it [00:10, 9.57it/s] 100it [00:11, 9.60it/s]2025-05-26 03:35:39,614 - INFO - [Epoch 060 | Batch 0100] IWAE-loss 4293.2979 | mean log_px -0.0141 | KL -3304.83 + 101it [00:11, 9.59it/s] 102it [00:11, 9.56it/s] 103it [00:11, 9.56it/s] 104it [00:11, 9.55it/s] 105it [00:11, 9.46it/s] 106it [00:11, 9.46it/s] 107it [00:11, 9.46it/s] 108it [00:11, 9.47it/s] 109it [00:11, 9.50it/s] 110it [00:12, 9.17it/s] 111it [00:12, 9.28it/s] 112it [00:12, 9.38it/s] 113it [00:12, 9.46it/s] 114it [00:12, 9.49it/s] 115it [00:12, 8.97it/s] 116it [00:12, 9.14it/s] 117it [00:12, 9.27it/s] 118it [00:12, 9.36it/s] 119it [00:13, 9.38it/s] 120it [00:13, 9.45it/s] 121it [00:13, 9.49it/s] 122it [00:13, 9.50it/s] 123it [00:13, 9.50it/s] 124it [00:13, 9.53it/s] 125it [00:13, 9.54it/s] 126it [00:13, 9.55it/s] 127it [00:13, 9.56it/s] 128it [00:14, 9.55it/s] 129it [00:14, 9.58it/s] 130it [00:14, 9.56it/s] 131it [00:14, 9.56it/s] 132it [00:14, 9.54it/s] 133it [00:14, 9.48it/s] 134it [00:14, 9.51it/s] 135it [00:14, 9.53it/s] 136it [00:14, 9.53it/s] 137it [00:14, 9.53it/s] 138it [00:15, 9.54it/s] 139it [00:15, 9.53it/s] 140it [00:15, 9.51it/s] 141it [00:15, 9.50it/s] 142it [00:15, 9.42it/s] 143it [00:15, 9.43it/s] 144it [00:15, 9.41it/s] 145it [00:15, 9.50it/s] 146it [00:15, 9.50it/s] 147it [00:16, 9.52it/s] 148it [00:16, 9.47it/s] 149it [00:16, 8.99it/s] 150it [00:16, 9.10it/s]2025-05-26 03:35:44,921 - INFO - [Epoch 060 | Batch 0150] IWAE-loss 4515.0557 | mean log_px -0.0186 | KL -3300.35 + 151it [00:16, 9.18it/s] 152it [00:16, 9.29it/s] 153it [00:16, 9.37it/s] 154it [00:16, 9.41it/s] 155it [00:16, 9.45it/s] 156it [00:16, 9.45it/s] 157it [00:17, 9.00it/s] 158it [00:17, 9.13it/s] 159it [00:17, 9.25it/s] 160it [00:17, 9.31it/s] 161it [00:17, 9.39it/s] 162it [00:17, 9.44it/s] 163it [00:17, 9.46it/s] 164it [00:17, 9.48it/s] 165it [00:17, 9.51it/s] 166it [00:18, 9.34it/s] 167it [00:18, 9.44it/s] 168it [00:18, 9.46it/s] 169it [00:18, 9.49it/s] 170it [00:18, 9.53it/s] 171it [00:18, 9.50it/s] 172it [00:18, 9.38it/s] 173it [00:18, 9.34it/s] 174it [00:18, 9.35it/s] 175it [00:19, 9.43it/s] 176it [00:19, 9.44it/s] 177it [00:19, 9.47it/s] 178it [00:19, 9.48it/s] 179it [00:19, 9.52it/s] 180it [00:19, 9.49it/s] 181it [00:19, 9.49it/s] 182it [00:19, 9.46it/s] 183it [00:19, 9.49it/s] 184it [00:19, 9.55it/s] 185it [00:20, 9.51it/s] 186it [00:20, 8.95it/s] 187it [00:20, 8.98it/s] 188it [00:20, 9.10it/s] 189it [00:20, 9.19it/s] 190it [00:20, 9.31it/s] 191it [00:20, 9.32it/s] 192it [00:20, 9.37it/s] 193it [00:20, 9.43it/s] 194it [00:21, 9.43it/s] 195it [00:21, 8.86it/s] 196it [00:21, 9.10it/s] 196it [00:21, 9.20it/s] +2025-05-26 03:35:49,825 - INFO - Epoch: 60, Objective: tensor([4183.7256], device='cuda:0', grad_fn=), Loss: 0.01641184277832508, KL/n: 67.38818359375 + 0it [00:00, ?it/s]2025-05-26 03:35:50,104 - INFO - [Epoch 061 | Batch 0000] IWAE-loss 4341.6694 | mean log_px -0.0202 | KL -3302.52 + 1it [00:00, 4.73it/s] 2it [00:00, 6.69it/s] 3it [00:00, 7.78it/s] 4it [00:00, 8.36it/s] 5it [00:00, 8.79it/s] 6it [00:00, 9.00it/s] 7it [00:00, 9.20it/s] 8it [00:00, 9.28it/s] 9it [00:01, 9.37it/s] 10it [00:01, 9.47it/s] 11it [00:01, 9.50it/s] 12it [00:01, 8.95it/s] 13it [00:01, 9.14it/s] 14it [00:01, 9.25it/s] 15it [00:01, 9.32it/s] 16it [00:01, 8.88it/s] 17it [00:01, 9.13it/s] 18it [00:02, 9.27it/s] 19it [00:02, 9.35it/s] 20it [00:02, 9.38it/s] 21it [00:02, 9.38it/s] 22it [00:02, 9.40it/s] 23it [00:02, 9.44it/s] 24it [00:02, 9.51it/s] 25it [00:02, 9.48it/s] 26it [00:02, 9.45it/s] 27it [00:02, 9.46it/s] 28it [00:03, 9.47it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.54it/s] 31it [00:03, 9.57it/s] 32it [00:03, 9.54it/s] 33it [00:03, 9.54it/s] 34it [00:03, 9.53it/s] 35it [00:03, 9.58it/s] 36it [00:03, 9.57it/s] 37it [00:04, 9.57it/s] 38it [00:04, 9.54it/s] 39it [00:04, 9.54it/s] 40it [00:04, 9.57it/s] 41it [00:04, 9.48it/s] 42it [00:04, 9.51it/s] 43it [00:04, 9.54it/s] 44it [00:04, 9.00it/s] 45it [00:04, 9.17it/s] 46it [00:04, 9.28it/s] 47it [00:05, 9.36it/s] 48it [00:05, 9.42it/s] 49it [00:05, 9.46it/s] 50it [00:05, 9.51it/s]2025-05-26 03:35:55,432 - INFO - [Epoch 061 | Batch 0050] IWAE-loss 4877.6030 | mean log_px -0.0282 | KL -3295.02 + 51it [00:05, 9.51it/s] 52it [00:05, 8.99it/s] 53it [00:05, 9.19it/s] 54it [00:05, 9.33it/s] 55it [00:05, 9.41it/s] 56it [00:06, 9.43it/s] 57it [00:06, 9.47it/s] 58it [00:06, 9.45it/s] 59it [00:06, 9.49it/s] 60it [00:06, 9.51it/s] 61it [00:06, 9.50it/s] 62it [00:06, 9.52it/s] 63it [00:06, 9.51it/s] 64it [00:06, 9.52it/s] 65it [00:07, 9.52it/s] 66it [00:07, 9.50it/s] 67it [00:07, 9.53it/s] 68it [00:07, 9.51it/s] 69it [00:07, 9.48it/s] 70it [00:07, 9.46it/s] 71it [00:07, 9.07it/s] 72it [00:07, 9.22it/s] 73it [00:07, 9.30it/s] 74it [00:07, 9.31it/s] 75it [00:08, 8.85it/s] 76it [00:08, 9.06it/s] 77it [00:08, 8.81it/s] 78it [00:08, 9.00it/s] 79it [00:08, 9.11it/s] 80it [00:08, 9.26it/s] 81it [00:08, 8.82it/s] 82it [00:08, 9.01it/s] 83it [00:08, 9.18it/s] 84it [00:09, 9.28it/s] 85it [00:09, 8.82it/s] 86it [00:09, 9.01it/s] 87it [00:09, 9.15it/s] 88it [00:09, 9.22it/s] 89it [00:09, 9.33it/s] 90it [00:09, 9.24it/s] 91it [00:09, 8.92it/s] 92it [00:09, 9.10it/s] 93it [00:10, 9.25it/s] 94it [00:10, 9.29it/s] 95it [00:10, 9.34it/s] 96it [00:10, 9.41it/s] 97it [00:10, 8.91it/s] 98it [00:10, 9.03it/s] 99it [00:10, 9.17it/s] 100it [00:10, 9.29it/s]2025-05-26 03:36:00,844 - INFO - [Epoch 061 | Batch 0100] IWAE-loss 4193.9419 | mean log_px -0.0158 | KL -3287.98 + 101it [00:10, 9.39it/s] 102it [00:11, 9.39it/s] 103it [00:11, 9.41it/s] 104it [00:11, 9.03it/s] 105it [00:11, 9.16it/s] 106it [00:11, 9.15it/s] 107it [00:11, 9.28it/s] 108it [00:11, 8.84it/s] 109it [00:11, 9.04it/s] 110it [00:11, 9.18it/s] 111it [00:12, 9.32it/s] 112it [00:12, 8.85it/s] 113it [00:12, 9.03it/s] 114it [00:12, 9.14it/s] 115it [00:12, 9.22it/s] 116it [00:12, 9.30it/s] 117it [00:12, 8.84it/s] 118it [00:12, 9.01it/s] 119it [00:12, 9.18it/s] 120it [00:13, 9.29it/s] 121it [00:13, 8.81it/s] 122it [00:13, 8.73it/s] 123it [00:13, 8.40it/s] 124it [00:13, 8.60it/s] 125it [00:13, 8.96it/s] 126it [00:13, 9.22it/s] 127it [00:13, 9.43it/s] 128it [00:13, 9.56it/s] 129it [00:13, 9.68it/s] 130it [00:14, 9.72it/s] 131it [00:14, 9.79it/s] 132it [00:14, 9.78it/s] 133it [00:14, 9.81it/s] 134it [00:14, 9.85it/s] 135it [00:14, 9.88it/s] 136it [00:14, 9.67it/s] 137it [00:14, 9.35it/s] 138it [00:14, 9.18it/s] 139it [00:15, 8.86it/s] 140it [00:15, 9.10it/s] 141it [00:15, 9.30it/s] 142it [00:15, 9.42it/s] 143it [00:15, 9.51it/s] 144it [00:15, 9.56it/s] 145it [00:15, 9.62it/s] 146it [00:15, 9.14it/s] 147it [00:15, 9.22it/s] 148it [00:16, 9.28it/s] 149it [00:16, 9.34it/s] 150it [00:16, 9.44it/s]2025-05-26 03:36:06,243 - INFO - [Epoch 061 | Batch 0150] IWAE-loss 4477.5815 | mean log_px -0.0203 | KL -3289.90 + 151it [00:16, 9.52it/s] 152it [00:16, 9.13it/s] 153it [00:16, 9.11it/s] 154it [00:16, 9.22it/s] 155it [00:16, 9.39it/s] 156it [00:16, 9.48it/s] 157it [00:16, 9.58it/s] 158it [00:17, 9.64it/s] 159it [00:17, 9.70it/s] 160it [00:17, 9.72it/s] 161it [00:17, 9.69it/s] 162it [00:17, 9.76it/s] 163it [00:17, 9.31it/s] 164it [00:17, 9.47it/s] 165it [00:17, 9.61it/s] 166it [00:17, 9.71it/s] 167it [00:17, 9.79it/s] 168it [00:18, 9.84it/s] 169it [00:18, 9.89it/s] 170it [00:18, 9.30it/s] 171it [00:18, 9.48it/s] 172it [00:18, 9.61it/s] 173it [00:18, 9.69it/s] 174it [00:18, 9.77it/s] 175it [00:18, 9.83it/s] 176it [00:18, 9.87it/s] 177it [00:19, 9.89it/s] 178it [00:19, 9.91it/s] 179it [00:19, 9.91it/s] 180it [00:19, 9.91it/s] 181it [00:19, 9.93it/s] 182it [00:19, 9.84it/s] 183it [00:19, 9.80it/s] 184it [00:19, 9.42it/s] 185it [00:19, 9.58it/s] 186it [00:19, 9.70it/s] 188it [00:20, 9.85it/s] 189it [00:20, 9.87it/s] 190it [00:20, 9.90it/s] 192it [00:20, 9.95it/s] 193it [00:20, 9.96it/s] 194it [00:20, 9.95it/s] 195it [00:20, 9.46it/s] 196it [00:21, 9.32it/s] +2025-05-26 03:36:10,990 - INFO - Epoch: 61, Objective: tensor([6526.4443], device='cuda:0', grad_fn=), Loss: 0.049620795994997025, KL/n: 67.15840148925781 + 0it [00:00, ?it/s]2025-05-26 03:36:11,271 - INFO - [Epoch 062 | Batch 0000] IWAE-loss 4576.0898 | mean log_px -0.0238 | KL -3289.67 + 1it [00:00, 4.71it/s] 2it [00:00, 6.73it/s] 4it [00:00, 8.46it/s] 6it [00:00, 8.68it/s] 7it [00:00, 8.96it/s] 8it [00:00, 9.19it/s] 9it [00:01, 9.38it/s] 10it [00:01, 9.10it/s] 11it [00:01, 9.15it/s] 12it [00:01, 9.32it/s] 13it [00:01, 8.91it/s] 14it [00:01, 9.16it/s] 15it [00:01, 9.37it/s] 16it [00:01, 9.43it/s] 17it [00:01, 8.98it/s] 18it [00:02, 9.18it/s] 19it [00:02, 9.36it/s] 20it [00:02, 9.45it/s] 21it [00:02, 8.92it/s] 22it [00:02, 9.13it/s] 23it [00:02, 9.31it/s] 24it [00:02, 9.42it/s] 25it [00:02, 8.98it/s] 26it [00:02, 9.21it/s] 27it [00:02, 9.39it/s] 28it [00:03, 9.47it/s] 29it [00:03, 9.01it/s] 30it [00:03, 9.26it/s] 31it [00:03, 9.43it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.06it/s] 34it [00:03, 9.27it/s] 35it [00:03, 9.46it/s] 36it [00:03, 9.58it/s] 37it [00:04, 9.09it/s] 38it [00:04, 9.30it/s] 39it [00:04, 9.47it/s] 40it [00:04, 9.58it/s] 41it [00:04, 9.09it/s] 42it [00:04, 9.30it/s] 43it [00:04, 9.49it/s] 44it [00:04, 9.60it/s] 45it [00:04, 9.11it/s] 46it [00:05, 6.10it/s] 47it [00:05, 6.59it/s] 48it [00:05, 7.29it/s] 49it [00:05, 7.92it/s] 50it [00:05, 8.39it/s]2025-05-26 03:36:16,842 - INFO - [Epoch 062 | Batch 0050] IWAE-loss 4915.9707 | mean log_px -0.0268 | KL -3286.16 + 51it [00:05, 8.30it/s] 52it [00:05, 8.71it/s] 53it [00:05, 9.06it/s] 54it [00:06, 9.29it/s] 55it [00:06, 8.91it/s] 56it [00:06, 9.17it/s] 57it [00:06, 9.39it/s] 58it [00:06, 9.53it/s] 59it [00:06, 9.07it/s] 60it [00:06, 9.27it/s] 61it [00:06, 9.45it/s] 62it [00:06, 9.58it/s] 63it [00:07, 9.10it/s] 64it [00:07, 9.33it/s] 65it [00:07, 9.51it/s] 66it [00:07, 9.63it/s] 67it [00:07, 9.14it/s] 68it [00:07, 9.35it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.62it/s] 71it [00:07, 9.02it/s] 72it [00:08, 9.22it/s] 73it [00:08, 8.85it/s] 74it [00:08, 9.06it/s] 75it [00:08, 9.27it/s] 76it [00:08, 9.39it/s] 77it [00:08, 8.98it/s] 78it [00:08, 9.22it/s] 79it [00:08, 8.88it/s] 80it [00:08, 9.09it/s] 81it [00:09, 9.28it/s] 82it [00:09, 9.42it/s] 83it [00:09, 8.92it/s] 84it [00:09, 9.15it/s] 85it [00:09, 9.21it/s] 86it [00:09, 9.34it/s] 87it [00:09, 8.92it/s] 88it [00:09, 9.09it/s] 89it [00:09, 9.31it/s] 90it [00:09, 9.49it/s] 91it [00:10, 9.02it/s] 92it [00:10, 9.25it/s] 93it [00:10, 9.43it/s] 94it [00:10, 9.55it/s] 95it [00:10, 9.06it/s] 96it [00:10, 9.27it/s] 97it [00:10, 9.44it/s] 98it [00:10, 9.56it/s] 99it [00:10, 9.09it/s] 100it [00:11, 9.28it/s]2025-05-26 03:36:22,243 - INFO - [Epoch 062 | Batch 0100] IWAE-loss 4170.7461 | mean log_px -0.0182 | KL -3282.61 + 101it [00:11, 9.45it/s] 102it [00:11, 9.48it/s] 103it [00:11, 9.36it/s] 104it [00:11, 8.95it/s] 105it [00:11, 9.09it/s] 106it [00:11, 9.26it/s] 107it [00:11, 9.32it/s] 108it [00:11, 8.89it/s] 109it [00:12, 9.04it/s] 110it [00:12, 9.21it/s] 111it [00:12, 9.33it/s] 112it [00:12, 9.39it/s] 113it [00:12, 9.44it/s] 114it [00:12, 9.47it/s] 115it [00:12, 9.51it/s] 116it [00:12, 9.51it/s] 117it [00:12, 9.49it/s] 118it [00:12, 9.15it/s] 119it [00:13, 9.25it/s] 120it [00:13, 9.31it/s] 121it [00:13, 8.90it/s] 122it [00:13, 9.06it/s] 123it [00:13, 9.13it/s] 124it [00:13, 9.28it/s] 125it [00:13, 9.34it/s] 126it [00:13, 9.38it/s] 127it [00:13, 9.42it/s] 128it [00:14, 9.45it/s] 129it [00:14, 9.47it/s] 130it [00:14, 9.50it/s] 131it [00:14, 9.48it/s] 132it [00:14, 9.44it/s] 133it [00:14, 9.46it/s] 134it [00:14, 9.44it/s] 135it [00:14, 9.50it/s] 136it [00:14, 9.50it/s] 137it [00:15, 9.55it/s] 138it [00:15, 9.54it/s] 139it [00:15, 9.53it/s] 140it [00:15, 9.49it/s] 141it [00:15, 9.51it/s] 142it [00:15, 9.56it/s] 143it [00:15, 9.55it/s] 144it [00:15, 9.54it/s] 145it [00:15, 9.54it/s] 146it [00:15, 9.53it/s] 147it [00:16, 9.00it/s] 148it [00:16, 9.15it/s] 149it [00:16, 9.23it/s] 150it [00:16, 9.28it/s]2025-05-26 03:36:27,594 - INFO - [Epoch 062 | Batch 0150] IWAE-loss 4884.0713 | mean log_px -0.0360 | KL -3281.47 + 151it [00:16, 9.27it/s] 152it [00:16, 9.30it/s] 153it [00:16, 9.37it/s] 154it [00:16, 9.39it/s] 155it [00:16, 9.44it/s] 156it [00:17, 9.49it/s] 157it [00:17, 9.53it/s] 158it [00:17, 9.02it/s] 159it [00:17, 8.96it/s] 160it [00:17, 9.09it/s] 161it [00:17, 8.87it/s] 162it [00:17, 9.11it/s] 163it [00:17, 9.33it/s] 164it [00:17, 8.92it/s] 165it [00:18, 8.80it/s] 166it [00:18, 9.09it/s] 167it [00:18, 9.24it/s] 168it [00:18, 8.85it/s] 169it [00:18, 9.11it/s] 170it [00:18, 9.31it/s] 171it [00:18, 8.88it/s] 172it [00:18, 9.17it/s] 173it [00:18, 9.35it/s] 174it [00:19, 9.46it/s] 175it [00:19, 9.59it/s] 176it [00:19, 9.63it/s] 177it [00:19, 9.21it/s] 178it [00:19, 9.36it/s] 179it [00:19, 9.51it/s] 180it [00:19, 9.61it/s] 181it [00:19, 9.71it/s] 182it [00:19, 9.77it/s] 183it [00:19, 9.81it/s] 184it [00:20, 9.86it/s] 185it [00:20, 9.84it/s] 186it [00:20, 9.83it/s] 187it [00:20, 9.84it/s] 188it [00:20, 9.87it/s] 189it [00:20, 9.84it/s] 190it [00:20, 9.34it/s] 191it [00:20, 9.52it/s] 192it [00:20, 9.65it/s] 193it [00:20, 9.74it/s] 194it [00:21, 9.78it/s] 195it [00:21, 8.58it/s] 196it [00:21, 9.16it/s] +2025-05-26 03:36:32,519 - INFO - Epoch: 62, Objective: tensor([5284.1826], device='cuda:0', grad_fn=), Loss: 0.03511318191885948, KL/n: 66.92284393310547 + 0it [00:00, ?it/s]2025-05-26 03:36:32,803 - INFO - [Epoch 063 | Batch 0000] IWAE-loss 4192.7603 | mean log_px -0.0176 | KL -3279.23 + 1it [00:00, 5.28it/s] 2it [00:00, 6.74it/s] 3it [00:00, 7.91it/s] 4it [00:00, 8.60it/s] 6it [00:00, 8.90it/s] 7it [00:00, 9.17it/s] 8it [00:00, 9.38it/s] 10it [00:01, 9.66it/s] 12it [00:01, 9.81it/s] 13it [00:01, 9.84it/s] 14it [00:01, 9.47it/s] 15it [00:01, 9.52it/s] 16it [00:01, 9.60it/s] 18it [00:01, 9.78it/s] 20it [00:02, 9.88it/s] 21it [00:02, 9.84it/s] 22it [00:02, 9.87it/s] 23it [00:02, 9.46it/s] 24it [00:02, 9.58it/s] 26it [00:02, 9.80it/s] 27it [00:02, 9.75it/s] 28it [00:02, 9.50it/s] 29it [00:03, 9.37it/s] 30it [00:03, 9.43it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.24it/s] 34it [00:03, 9.59it/s] 35it [00:03, 9.20it/s] 37it [00:03, 9.56it/s] 38it [00:04, 9.65it/s] 40it [00:04, 9.80it/s] 41it [00:04, 9.80it/s] 42it [00:04, 9.70it/s] 43it [00:04, 8.85it/s] 44it [00:04, 9.05it/s] 45it [00:04, 9.24it/s] 46it [00:04, 9.39it/s] 47it [00:05, 9.50it/s] 48it [00:05, 9.59it/s] 49it [00:05, 9.66it/s] 50it [00:05, 9.71it/s]2025-05-26 03:36:38,023 - INFO - [Epoch 063 | Batch 0050] IWAE-loss 4688.5366 | mean log_px -0.0212 | KL -3273.02 + 51it [00:05, 9.14it/s] 52it [00:05, 9.33it/s] 53it [00:05, 9.42it/s] 54it [00:05, 8.96it/s] 56it [00:05, 9.43it/s] 58it [00:06, 9.67it/s] 60it [00:06, 9.79it/s] 62it [00:06, 9.60it/s] 64it [00:06, 9.74it/s] 66it [00:06, 9.84it/s] 67it [00:07, 9.85it/s] 68it [00:07, 9.52it/s] 70it [00:07, 9.69it/s] 71it [00:07, 9.75it/s] 72it [00:07, 9.79it/s] 73it [00:07, 9.44it/s] 74it [00:07, 9.57it/s] 76it [00:08, 9.75it/s] 78it [00:08, 9.87it/s] 80it [00:08, 9.90it/s] 81it [00:08, 9.91it/s] 82it [00:08, 9.92it/s] 83it [00:08, 9.93it/s] 84it [00:08, 9.95it/s] 86it [00:09, 9.99it/s] 88it [00:09, 9.99it/s] 90it [00:09, 9.99it/s] 91it [00:09, 9.99it/s] 92it [00:09, 9.96it/s] 93it [00:09, 9.48it/s] 94it [00:09, 9.58it/s] 95it [00:09, 9.67it/s] 96it [00:10, 9.29it/s] 98it [00:10, 9.61it/s] 99it [00:10, 9.21it/s]2025-05-26 03:36:43,191 - INFO - [Epoch 063 | Batch 0100] IWAE-loss 4749.5503 | mean log_px -0.0224 | KL -3273.87 + 101it [00:10, 9.53it/s] 102it [00:10, 9.62it/s] 104it [00:10, 9.78it/s] 105it [00:10, 9.79it/s] 106it [00:11, 9.67it/s] 107it [00:11, 9.31it/s] 108it [00:11, 9.48it/s] 109it [00:11, 9.53it/s] 110it [00:11, 9.11it/s] 111it [00:11, 9.33it/s] 112it [00:11, 9.49it/s] 113it [00:11, 9.16it/s] 114it [00:11, 9.32it/s] 115it [00:12, 9.47it/s] 116it [00:12, 9.60it/s] 117it [00:12, 9.71it/s] 119it [00:12, 9.90it/s] 121it [00:12, 9.95it/s] 122it [00:12, 9.91it/s] 123it [00:12, 9.44it/s] 124it [00:12, 9.56it/s] 125it [00:13, 9.63it/s] 127it [00:13, 9.81it/s] 129it [00:13, 9.92it/s] 130it [00:13, 9.91it/s] 131it [00:13, 9.85it/s] 132it [00:13, 9.86it/s] 134it [00:13, 9.94it/s] 136it [00:14, 9.98it/s] 138it [00:14, 10.00it/s] 140it [00:14, 10.02it/s] 142it [00:14, 10.02it/s] 144it [00:14, 10.03it/s] 146it [00:15, 10.02it/s] 148it [00:15, 10.04it/s] 150it [00:15, 10.05it/s]2025-05-26 03:36:48,289 - INFO - [Epoch 063 | Batch 0150] IWAE-loss 3977.1768 | mean log_px -0.0134 | KL -3273.26 + 152it [00:15, 10.04it/s] 154it [00:15, 10.05it/s] 156it [00:16, 10.05it/s] 158it [00:16, 10.05it/s] 160it [00:16, 10.03it/s] 162it [00:16, 10.05it/s] 164it [00:16, 9.95it/s] 165it [00:17, 9.64it/s] 166it [00:17, 9.71it/s] 168it [00:17, 9.84it/s] 170it [00:17, 9.91it/s] 172it [00:17, 9.96it/s] 173it [00:17, 9.64it/s] 175it [00:18, 9.78it/s] 177it [00:18, 9.85it/s] 179it [00:18, 9.92it/s] 180it [00:18, 9.91it/s] 181it [00:18, 9.93it/s] 182it [00:18, 9.92it/s] 183it [00:18, 9.38it/s] 185it [00:19, 9.63it/s] 186it [00:19, 9.69it/s] 188it [00:19, 9.83it/s] 189it [00:19, 9.39it/s] 190it [00:19, 9.45it/s] 191it [00:19, 9.55it/s] 192it [00:19, 9.64it/s] 193it [00:19, 9.72it/s] 195it [00:20, 9.51it/s] 196it [00:20, 9.18it/s] 196it [00:20, 9.63it/s] +2025-05-26 03:36:53,010 - INFO - Epoch: 63, Objective: tensor([5113.3408], device='cuda:0', grad_fn=), Loss: 0.03467189148068428, KL/n: 66.71068572998047 + 0it [00:00, ?it/s]2025-05-26 03:36:53,297 - INFO - [Epoch 064 | Batch 0000] IWAE-loss 4048.0391 | mean log_px -0.0111 | KL -3268.86 + 1it [00:00, 5.01it/s] 2it [00:00, 7.03it/s] 4it [00:00, 8.70it/s] 6it [00:00, 9.33it/s] 8it [00:00, 9.65it/s] 9it [00:00, 9.70it/s] 10it [00:01, 9.74it/s] 12it [00:01, 9.88it/s] 13it [00:01, 9.90it/s] 15it [00:01, 10.00it/s] 16it [00:01, 10.00it/s] 18it [00:01, 9.91it/s] 19it [00:02, 9.58it/s] 21it [00:02, 9.77it/s] 22it [00:02, 9.47it/s] 24it [00:02, 9.69it/s] 26it [00:02, 9.83it/s] 28it [00:02, 9.94it/s] 30it [00:03, 9.90it/s] 31it [00:03, 9.60it/s] 33it [00:03, 9.78it/s] 35it [00:03, 9.89it/s] 36it [00:03, 9.91it/s] 38it [00:03, 9.99it/s] 39it [00:04, 9.70it/s] 41it [00:04, 9.84it/s] 43it [00:04, 9.93it/s] 45it [00:04, 10.01it/s] 47it [00:04, 9.68it/s] 49it [00:05, 7.54it/s]2025-05-26 03:36:58,555 - INFO - [Epoch 064 | Batch 0050] IWAE-loss 4078.9944 | mean log_px -0.0116 | KL -3263.32 + 51it [00:05, 8.18it/s] 53it [00:05, 8.69it/s] 55it [00:05, 8.80it/s] 56it [00:05, 8.97it/s] 57it [00:06, 9.15it/s] 59it [00:06, 9.47it/s] 61it [00:06, 9.66it/s] 62it [00:06, 9.72it/s] 64it [00:06, 9.84it/s] 66it [00:06, 9.93it/s] 68it [00:07, 9.98it/s] 70it [00:07, 10.02it/s] 72it [00:07, 10.04it/s] 74it [00:07, 10.06it/s] 76it [00:07, 10.09it/s] 78it [00:08, 10.10it/s] 80it [00:08, 10.12it/s] 82it [00:08, 10.14it/s] 84it [00:08, 10.14it/s] 86it [00:08, 10.08it/s] 88it [00:09, 9.82it/s] 90it [00:09, 9.91it/s] 92it [00:09, 9.99it/s] 94it [00:09, 10.04it/s] 96it [00:09, 10.07it/s] 98it [00:10, 9.74it/s] 100it [00:10, 9.83it/s]2025-05-26 03:37:03,572 - INFO - [Epoch 064 | Batch 0100] IWAE-loss 4177.9673 | mean log_px -0.0192 | KL -3262.71 + 102it [00:10, 9.91it/s] 104it [00:10, 9.65it/s] 106it [00:10, 9.79it/s] 108it [00:11, 9.89it/s] 110it [00:11, 9.95it/s] 112it [00:11, 10.00it/s] 114it [00:11, 10.04it/s] 116it [00:11, 10.07it/s] 118it [00:12, 10.10it/s] 120it [00:12, 10.11it/s] 122it [00:12, 9.85it/s] 124it [00:12, 9.93it/s] 126it [00:12, 9.96it/s] 128it [00:13, 10.01it/s] 130it [00:13, 9.71it/s] 131it [00:13, 9.75it/s] 133it [00:13, 9.85it/s] 134it [00:13, 9.39it/s] 136it [00:14, 9.63it/s] 138it [00:14, 9.76it/s] 139it [00:14, 9.80it/s] 140it [00:14, 9.84it/s] 141it [00:14, 9.38it/s] 143it [00:14, 9.63it/s] 144it [00:14, 9.69it/s] 146it [00:15, 9.87it/s] 148it [00:15, 9.95it/s] 149it [00:15, 9.95it/s] 150it [00:15, 9.82it/s]2025-05-26 03:37:08,662 - INFO - [Epoch 064 | Batch 0150] IWAE-loss 4131.0303 | mean log_px -0.0125 | KL -3256.42 + 151it [00:15, 9.12it/s] 153it [00:15, 9.51it/s] 155it [00:15, 9.72it/s] 156it [00:16, 9.47it/s] 158it [00:16, 9.70it/s] 160it [00:16, 9.84it/s] 162it [00:16, 9.91it/s] 163it [00:16, 9.62it/s] 165it [00:17, 9.79it/s] 167it [00:17, 9.90it/s] 169it [00:17, 9.98it/s] 171it [00:17, 10.02it/s] 173it [00:17, 10.06it/s] 175it [00:17, 10.08it/s] 177it [00:18, 10.09it/s] 179it [00:18, 10.10it/s] 181it [00:18, 10.11it/s] 183it [00:18, 10.11it/s] 185it [00:18, 10.11it/s] 187it [00:19, 10.06it/s] 189it [00:19, 10.07it/s] 191it [00:19, 9.96it/s] 192it [00:19, 9.96it/s] 194it [00:19, 9.97it/s] 195it [00:20, 9.65it/s] 196it [00:20, 9.72it/s] +2025-05-26 03:37:13,305 - INFO - Epoch: 64, Objective: tensor([4486.4854], device='cuda:0', grad_fn=), Loss: 0.017137622460722923, KL/n: 66.45817565917969 + 0it [00:00, ?it/s]2025-05-26 03:37:13,584 - INFO - [Epoch 065 | Batch 0000] IWAE-loss 4915.1265 | mean log_px -0.0304 | KL -3253.02 + 1it [00:00, 5.19it/s] 2it [00:00, 7.04it/s] 3it [00:00, 8.04it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.82it/s] 6it [00:00, 9.05it/s] 7it [00:00, 9.27it/s] 8it [00:00, 8.89it/s] 9it [00:01, 9.18it/s] 10it [00:01, 9.26it/s] 11it [00:01, 9.33it/s] 12it [00:01, 9.45it/s] 13it [00:01, 9.55it/s] 14it [00:01, 9.61it/s] 15it [00:01, 9.68it/s] 16it [00:01, 9.72it/s] 17it [00:01, 9.78it/s] 18it [00:01, 9.78it/s] 19it [00:02, 9.83it/s] 20it [00:02, 9.85it/s] 21it [00:02, 9.87it/s] 22it [00:02, 9.82it/s] 23it [00:02, 9.81it/s] 24it [00:02, 9.82it/s] 25it [00:02, 9.85it/s] 26it [00:02, 9.85it/s] 27it [00:02, 9.85it/s] 28it [00:02, 9.78it/s] 29it [00:03, 9.81it/s] 30it [00:03, 9.82it/s] 31it [00:03, 9.85it/s] 32it [00:03, 9.84it/s] 33it [00:03, 9.82it/s] 34it [00:03, 9.80it/s] 35it [00:03, 9.81it/s] 36it [00:03, 9.81it/s] 37it [00:03, 9.79it/s] 38it [00:04, 9.80it/s] 39it [00:04, 9.78it/s] 40it [00:04, 9.77it/s] 41it [00:04, 9.79it/s] 42it [00:04, 9.57it/s] 43it [00:04, 9.63it/s] 44it [00:04, 9.67it/s] 45it [00:04, 9.73it/s] 46it [00:04, 9.73it/s] 47it [00:04, 9.75it/s] 48it [00:05, 9.76it/s] 49it [00:05, 9.79it/s] 50it [00:05, 9.80it/s]2025-05-26 03:37:18,738 - INFO - [Epoch 065 | Batch 0050] IWAE-loss 4041.6321 | mean log_px -0.0125 | KL -3247.29 + 51it [00:05, 9.80it/s] 52it [00:05, 9.78it/s] 53it [00:05, 9.79it/s] 54it [00:05, 9.80it/s] 55it [00:05, 9.81it/s] 56it [00:05, 9.77it/s] 57it [00:05, 9.80it/s] 58it [00:06, 9.81it/s] 59it [00:06, 9.82it/s] 60it [00:06, 9.79it/s] 61it [00:06, 9.33it/s] 62it [00:06, 9.43it/s] 63it [00:06, 9.57it/s] 64it [00:06, 9.60it/s] 65it [00:06, 9.50it/s] 66it [00:06, 9.52it/s] 67it [00:07, 9.54it/s] 68it [00:07, 9.53it/s] 69it [00:07, 9.55it/s] 70it [00:07, 9.51it/s] 71it [00:07, 9.08it/s] 72it [00:07, 9.20it/s] 73it [00:07, 9.36it/s] 74it [00:07, 9.48it/s] 75it [00:07, 9.50it/s] 76it [00:07, 9.43it/s] 77it [00:08, 9.46it/s] 78it [00:08, 9.47it/s] 79it [00:08, 9.47it/s] 80it [00:08, 9.47it/s] 81it [00:08, 9.60it/s] 82it [00:08, 9.66it/s] 83it [00:08, 9.63it/s] 84it [00:08, 9.68it/s] 85it [00:08, 9.74it/s] 86it [00:08, 9.78it/s] 87it [00:09, 9.77it/s] 88it [00:09, 9.76it/s] 89it [00:09, 9.75it/s] 90it [00:09, 9.71it/s] 92it [00:09, 9.83it/s] 93it [00:09, 9.83it/s] 94it [00:09, 9.85it/s] 95it [00:09, 9.84it/s] 96it [00:10, 9.83it/s] 97it [00:10, 9.74it/s] 98it [00:10, 9.65it/s] 99it [00:10, 9.58it/s] 100it [00:10, 9.56it/s]2025-05-26 03:37:23,941 - INFO - [Epoch 065 | Batch 0100] IWAE-loss 4149.1934 | mean log_px -0.0150 | KL -3245.47 + 101it [00:10, 9.47it/s] 102it [00:10, 9.55it/s] 103it [00:10, 9.64it/s] 104it [00:10, 9.66it/s] 105it [00:10, 9.71it/s] 106it [00:11, 9.75it/s] 107it [00:11, 9.79it/s] 108it [00:11, 9.80it/s] 109it [00:11, 9.82it/s] 110it [00:11, 9.78it/s] 111it [00:11, 9.80it/s] 112it [00:11, 9.78it/s] 113it [00:11, 9.79it/s] 114it [00:11, 9.81it/s] 115it [00:11, 9.84it/s] 116it [00:12, 9.83it/s] 117it [00:12, 9.84it/s] 118it [00:12, 9.85it/s] 119it [00:12, 9.81it/s] 120it [00:12, 9.81it/s] 121it [00:12, 9.82it/s] 122it [00:12, 9.85it/s] 123it [00:12, 9.85it/s] 124it [00:12, 9.83it/s] 125it [00:12, 9.82it/s] 126it [00:13, 9.81it/s] 127it [00:13, 9.82it/s] 128it [00:13, 9.78it/s] 129it [00:13, 9.77it/s] 130it [00:13, 9.76it/s] 131it [00:13, 9.75it/s] 132it [00:13, 9.79it/s] 133it [00:13, 9.82it/s] 134it [00:13, 9.85it/s] 135it [00:14, 9.23it/s] 136it [00:14, 9.38it/s] 137it [00:14, 9.48it/s] 138it [00:14, 9.54it/s] 139it [00:14, 9.62it/s] 140it [00:14, 9.64it/s] 141it [00:14, 9.72it/s] 142it [00:14, 9.74it/s] 143it [00:14, 9.72it/s] 144it [00:14, 9.70it/s] 145it [00:15, 9.73it/s] 146it [00:15, 9.06it/s] 147it [00:15, 9.25it/s] 148it [00:15, 9.31it/s] 149it [00:15, 9.40it/s] 150it [00:15, 9.38it/s]2025-05-26 03:37:29,105 - INFO - [Epoch 065 | Batch 0150] IWAE-loss 5137.2002 | mean log_px -0.0301 | KL -3244.56 + 151it [00:15, 8.92it/s] 152it [00:15, 9.04it/s] 153it [00:15, 9.14it/s] 154it [00:16, 9.22it/s] 155it [00:16, 9.31it/s] 156it [00:16, 9.34it/s] 157it [00:16, 9.07it/s] 158it [00:16, 9.29it/s] 159it [00:16, 8.80it/s] 160it [00:16, 9.07it/s] 161it [00:16, 9.29it/s] 162it [00:16, 9.44it/s] 163it [00:17, 9.56it/s] 164it [00:17, 9.64it/s] 165it [00:17, 9.69it/s] 166it [00:17, 9.73it/s] 167it [00:17, 9.78it/s] 168it [00:17, 9.78it/s] 169it [00:17, 9.77it/s] 170it [00:17, 9.78it/s] 171it [00:17, 9.81it/s] 172it [00:17, 9.81it/s] 173it [00:18, 9.81it/s] 174it [00:18, 9.81it/s] 175it [00:18, 9.78it/s] 176it [00:18, 9.76it/s] 177it [00:18, 9.77it/s] 178it [00:18, 9.80it/s] 179it [00:18, 9.81it/s] 180it [00:18, 9.80it/s] 181it [00:18, 9.81it/s] 182it [00:18, 9.83it/s] 183it [00:19, 9.84it/s] 184it [00:19, 9.84it/s] 185it [00:19, 9.84it/s] 186it [00:19, 9.82it/s] 187it [00:19, 9.85it/s] 188it [00:19, 9.87it/s] 189it [00:19, 9.88it/s] 190it [00:19, 9.88it/s] 191it [00:19, 9.89it/s] 192it [00:19, 9.89it/s] 193it [00:20, 9.87it/s] 194it [00:20, 9.85it/s] 195it [00:20, 9.43it/s] 196it [00:20, 9.59it/s] +2025-05-26 03:37:33,879 - INFO - Epoch: 65, Objective: tensor([4243.4243], device='cuda:0', grad_fn=), Loss: 0.016095492988824844, KL/n: 66.21897888183594 + 0it [00:00, ?it/s]2025-05-26 03:37:34,166 - INFO - [Epoch 066 | Batch 0000] IWAE-loss 4330.0098 | mean log_px -0.0173 | KL -3242.21 + 1it [00:00, 4.46it/s] 2it [00:00, 6.55it/s] 4it [00:00, 8.36it/s] 6it [00:00, 9.08it/s] 8it [00:00, 9.43it/s] 10it [00:01, 9.65it/s] 12it [00:01, 9.78it/s] 13it [00:01, 9.48it/s] 15it [00:01, 9.68it/s] 16it [00:01, 9.74it/s] 17it [00:01, 9.79it/s] 18it [00:01, 9.84it/s] 20it [00:02, 9.91it/s] 21it [00:02, 9.92it/s] 22it [00:02, 9.92it/s] 23it [00:02, 9.94it/s] 24it [00:02, 9.93it/s] 26it [00:02, 9.49it/s] 28it [00:02, 9.70it/s] 30it [00:03, 9.80it/s] 31it [00:03, 9.84it/s] 32it [00:03, 9.87it/s] 33it [00:03, 9.49it/s] 34it [00:03, 9.61it/s] 36it [00:03, 9.77it/s] 38it [00:03, 9.86it/s] 39it [00:04, 9.89it/s] 40it [00:04, 9.89it/s] 42it [00:04, 9.94it/s] 44it [00:04, 9.97it/s] 46it [00:04, 9.98it/s] 47it [00:04, 9.95it/s] 48it [00:04, 9.95it/s] 50it [00:05, 9.95it/s]2025-05-26 03:37:39,259 - INFO - [Epoch 066 | Batch 0050] IWAE-loss 5074.5923 | mean log_px -0.0331 | KL -3240.32 + 51it [00:05, 6.80it/s] 52it [00:05, 7.30it/s] 54it [00:05, 8.20it/s] 55it [00:05, 8.54it/s] 56it [00:06, 8.72it/s] 57it [00:06, 9.00it/s] 58it [00:06, 9.19it/s] 59it [00:06, 8.79it/s] 60it [00:06, 8.89it/s] 61it [00:06, 9.17it/s] 62it [00:06, 9.39it/s] 63it [00:06, 9.55it/s] 64it [00:06, 9.67it/s] 65it [00:06, 9.74it/s] 66it [00:07, 9.78it/s] 67it [00:07, 9.84it/s] 69it [00:07, 9.93it/s] 70it [00:07, 9.94it/s] 71it [00:07, 9.89it/s] 72it [00:07, 9.90it/s] 73it [00:07, 9.92it/s] 74it [00:07, 9.85it/s] 75it [00:07, 9.76it/s] 76it [00:08, 9.80it/s] 77it [00:08, 9.85it/s] 79it [00:08, 9.92it/s] 80it [00:08, 9.94it/s] 82it [00:08, 9.95it/s] 83it [00:08, 9.96it/s] 84it [00:08, 9.97it/s] 85it [00:08, 9.97it/s] 86it [00:09, 9.98it/s] 88it [00:09, 9.99it/s] 90it [00:09, 10.01it/s] 92it [00:09, 10.01it/s] 94it [00:09, 9.71it/s] 95it [00:09, 9.72it/s] 96it [00:10, 9.77it/s] 97it [00:10, 9.81it/s] 98it [00:10, 9.43it/s] 99it [00:10, 9.55it/s] 100it [00:10, 9.66it/s]2025-05-26 03:37:44,582 - INFO - [Epoch 066 | Batch 0100] IWAE-loss 4414.3447 | mean log_px -0.0179 | KL -3239.95 + 101it [00:10, 9.75it/s] 102it [00:10, 9.80it/s] 104it [00:10, 9.89it/s] 106it [00:11, 9.94it/s] 107it [00:11, 9.92it/s] 108it [00:11, 9.93it/s] 109it [00:11, 9.95it/s] 110it [00:11, 9.93it/s] 111it [00:11, 9.95it/s] 112it [00:11, 9.93it/s] 114it [00:11, 9.88it/s] 115it [00:12, 9.88it/s] 116it [00:12, 9.88it/s] 117it [00:12, 9.87it/s] 118it [00:12, 9.89it/s] 119it [00:12, 9.33it/s] 120it [00:12, 9.49it/s] 121it [00:12, 9.53it/s] 122it [00:12, 9.63it/s] 123it [00:12, 9.71it/s] 124it [00:12, 9.76it/s] 125it [00:13, 9.82it/s] 126it [00:13, 9.23it/s] 127it [00:13, 9.37it/s] 128it [00:13, 9.39it/s] 129it [00:13, 9.41it/s] 130it [00:13, 9.43it/s] 131it [00:13, 9.56it/s] 132it [00:13, 9.65it/s] 133it [00:13, 9.74it/s] 134it [00:14, 9.78it/s] 135it [00:14, 9.83it/s] 136it [00:14, 9.86it/s] 137it [00:14, 9.88it/s] 138it [00:14, 9.90it/s] 139it [00:14, 9.91it/s] 140it [00:14, 9.89it/s] 141it [00:14, 9.92it/s] 143it [00:14, 9.98it/s] 145it [00:15, 10.01it/s] 147it [00:15, 10.03it/s] 149it [00:15, 10.04it/s]2025-05-26 03:37:49,675 - INFO - [Epoch 066 | Batch 0150] IWAE-loss 4754.2173 | mean log_px -0.0265 | KL -3233.78 + 151it [00:15, 10.02it/s] 153it [00:15, 10.03it/s] 155it [00:16, 10.05it/s] 157it [00:16, 10.05it/s] 159it [00:16, 10.05it/s] 161it [00:16, 10.06it/s] 163it [00:16, 10.07it/s] 165it [00:17, 10.07it/s] 167it [00:17, 10.05it/s] 169it [00:17, 9.75it/s] 170it [00:17, 9.74it/s] 171it [00:17, 9.78it/s] 172it [00:17, 9.78it/s] 173it [00:17, 9.80it/s] 174it [00:18, 9.83it/s] 175it [00:18, 9.87it/s] 177it [00:18, 9.95it/s] 178it [00:18, 9.82it/s] 179it [00:18, 9.43it/s] 180it [00:18, 9.52it/s] 181it [00:18, 9.61it/s] 182it [00:18, 9.70it/s] 183it [00:18, 9.19it/s] 184it [00:19, 9.39it/s] 185it [00:19, 9.52it/s] 186it [00:19, 9.58it/s] 188it [00:19, 9.80it/s] 190it [00:19, 9.54it/s] 192it [00:19, 9.73it/s] 194it [00:20, 9.85it/s] 195it [00:20, 9.58it/s] 196it [00:20, 9.37it/s] 196it [00:20, 9.61it/s] +2025-05-26 03:37:54,398 - INFO - Epoch: 66, Objective: tensor([4165.6123], device='cuda:0', grad_fn=), Loss: 0.015236176550388336, KL/n: 65.961181640625 + 0it [00:00, ?it/s]2025-05-26 03:37:54,680 - INFO - [Epoch 067 | Batch 0000] IWAE-loss 4508.1504 | mean log_px -0.0203 | KL -3233.36 + 1it [00:00, 5.28it/s] 2it [00:00, 6.69it/s] 4it [00:00, 8.47it/s] 6it [00:00, 9.16it/s] 8it [00:00, 9.50it/s] 10it [00:01, 9.69it/s] 12it [00:01, 9.81it/s] 13it [00:01, 9.83it/s] 14it [00:01, 9.49it/s] 16it [00:01, 9.71it/s] 18it [00:01, 9.76it/s] 20it [00:02, 9.84it/s] 22it [00:02, 9.90it/s] 24it [00:02, 9.93it/s] 25it [00:02, 9.94it/s] 26it [00:02, 9.94it/s] 28it [00:02, 9.56it/s] 30it [00:03, 9.72it/s] 32it [00:03, 9.82it/s] 33it [00:03, 9.45it/s] 34it [00:03, 9.56it/s] 36it [00:03, 9.74it/s] 38it [00:03, 9.85it/s] 40it [00:04, 9.90it/s] 42it [00:04, 9.94it/s] 43it [00:04, 9.91it/s] 44it [00:04, 9.57it/s] 45it [00:04, 9.64it/s] 46it [00:04, 9.72it/s] 47it [00:04, 9.33it/s] 49it [00:05, 9.63it/s]2025-05-26 03:37:59,800 - INFO - [Epoch 067 | Batch 0050] IWAE-loss 4197.2188 | mean log_px -0.0214 | KL -3226.38 + 51it [00:05, 9.36it/s] 52it [00:05, 9.49it/s] 54it [00:05, 9.69it/s] 56it [00:05, 9.82it/s] 57it [00:05, 9.85it/s] 58it [00:06, 9.87it/s] 60it [00:06, 9.94it/s] 61it [00:06, 9.93it/s] 62it [00:06, 9.92it/s] 63it [00:06, 9.94it/s] 64it [00:06, 9.85it/s] 65it [00:06, 9.25it/s] 66it [00:06, 9.42it/s] 67it [00:06, 9.53it/s] 68it [00:07, 9.61it/s] 69it [00:07, 9.70it/s] 70it [00:07, 9.75it/s] 71it [00:07, 9.30it/s] 72it [00:07, 9.35it/s] 73it [00:07, 9.46it/s] 74it [00:07, 9.51it/s] 75it [00:07, 9.64it/s] 76it [00:07, 9.69it/s] 77it [00:08, 9.73it/s] 78it [00:08, 9.77it/s] 79it [00:08, 9.19it/s] 80it [00:08, 9.41it/s] 81it [00:08, 9.51it/s] 83it [00:08, 9.74it/s] 85it [00:08, 9.84it/s] 86it [00:08, 9.86it/s] 88it [00:09, 9.59it/s] 89it [00:09, 9.66it/s] 91it [00:09, 9.79it/s] 92it [00:09, 9.82it/s] 93it [00:09, 9.86it/s] 94it [00:09, 9.89it/s] 96it [00:09, 9.59it/s] 97it [00:10, 9.59it/s] 98it [00:10, 9.65it/s] 99it [00:10, 9.62it/s] 100it [00:10, 9.13it/s]2025-05-26 03:38:04,996 - INFO - [Epoch 067 | Batch 0100] IWAE-loss 4479.0835 | mean log_px -0.0211 | KL -3224.74 + 101it [00:10, 9.34it/s] 102it [00:10, 9.51it/s] 104it [00:10, 9.74it/s] 106it [00:11, 9.83it/s] 107it [00:11, 9.86it/s] 109it [00:11, 9.94it/s] 110it [00:11, 9.56it/s] 111it [00:11, 9.63it/s] 112it [00:11, 9.72it/s] 113it [00:11, 9.79it/s] 114it [00:11, 9.83it/s] 115it [00:11, 9.86it/s] 116it [00:12, 9.89it/s] 117it [00:12, 9.85it/s] 119it [00:12, 9.94it/s] 121it [00:12, 9.98it/s] 123it [00:12, 10.01it/s] 124it [00:12, 9.99it/s] 125it [00:12, 9.98it/s] 127it [00:13, 10.00it/s] 128it [00:13, 9.51it/s] 129it [00:13, 9.59it/s] 130it [00:13, 9.60it/s] 131it [00:13, 9.65it/s] 132it [00:13, 9.70it/s] 133it [00:13, 9.28it/s] 134it [00:13, 9.42it/s] 135it [00:14, 8.92it/s] 136it [00:14, 9.13it/s] 137it [00:14, 9.33it/s] 138it [00:14, 9.44it/s] 139it [00:14, 9.58it/s] 140it [00:14, 9.60it/s] 141it [00:14, 9.66it/s] 142it [00:14, 9.21it/s] 143it [00:14, 9.34it/s] 144it [00:14, 9.47it/s] 145it [00:15, 9.57it/s] 146it [00:15, 9.14it/s] 147it [00:15, 9.30it/s] 148it [00:15, 8.88it/s] 149it [00:15, 9.12it/s] 150it [00:15, 9.29it/s]2025-05-26 03:38:10,197 - INFO - [Epoch 067 | Batch 0150] IWAE-loss 4168.6562 | mean log_px -0.0179 | KL -3215.23 + 151it [00:15, 8.87it/s] 152it [00:15, 9.13it/s] 153it [00:15, 9.34it/s] 154it [00:16, 9.48it/s] 155it [00:16, 9.58it/s] 156it [00:16, 9.14it/s] 157it [00:16, 9.23it/s] 158it [00:16, 9.39it/s] 159it [00:16, 9.54it/s] 160it [00:16, 9.14it/s] 161it [00:16, 9.34it/s] 162it [00:16, 9.46it/s] 163it [00:16, 9.51it/s] 164it [00:17, 9.57it/s] 165it [00:17, 9.07it/s] 166it [00:17, 9.09it/s] 167it [00:17, 9.13it/s] 168it [00:17, 8.70it/s] 169it [00:17, 8.92it/s] 170it [00:17, 9.07it/s] 171it [00:17, 9.04it/s] 172it [00:17, 9.18it/s] 173it [00:18, 8.75it/s] 174it [00:18, 8.98it/s] 175it [00:18, 9.14it/s] 176it [00:18, 9.22it/s] 177it [00:18, 8.76it/s] 178it [00:18, 9.01it/s] 179it [00:18, 9.22it/s] 180it [00:18, 9.36it/s] 181it [00:18, 8.94it/s] 182it [00:19, 9.18it/s] 183it [00:19, 9.36it/s] 184it [00:19, 9.47it/s] 185it [00:19, 8.99it/s] 186it [00:19, 9.18it/s] 187it [00:19, 9.35it/s] 188it [00:19, 8.89it/s] 189it [00:19, 9.07it/s] 190it [00:19, 8.71it/s] 191it [00:20, 9.02it/s] 192it [00:20, 9.22it/s] 193it [00:20, 9.37it/s] 194it [00:20, 8.91it/s] 195it [00:20, 8.70it/s] 196it [00:20, 9.47it/s] +2025-05-26 03:38:15,221 - INFO - Epoch: 67, Objective: tensor([4425.1938], device='cuda:0', grad_fn=), Loss: 0.020734276622533798, KL/n: 65.69780731201172 + 0it [00:00, ?it/s]2025-05-26 03:38:15,687 - INFO - [Epoch 068 | Batch 0000] IWAE-loss 4215.6938 | mean log_px -0.0170 | KL -3219.93 + 1it [00:00, 4.63it/s] 3it [00:00, 7.74it/s] 5it [00:00, 8.74it/s] 6it [00:00, 8.98it/s] 8it [00:00, 8.99it/s] 10it [00:01, 9.37it/s] 11it [00:01, 9.49it/s] 13it [00:01, 9.72it/s] 15it [00:01, 9.86it/s] 17it [00:01, 9.94it/s] 19it [00:02, 9.99it/s] 21it [00:02, 10.02it/s] 23it [00:02, 9.76it/s] 25it [00:02, 9.87it/s] 27it [00:02, 9.93it/s] 29it [00:03, 9.98it/s] 31it [00:03, 10.02it/s] 33it [00:03, 10.04it/s] 35it [00:03, 10.04it/s] 37it [00:03, 10.05it/s] 39it [00:04, 10.06it/s] 41it [00:04, 10.07it/s] 43it [00:04, 10.07it/s] 45it [00:04, 10.08it/s] 47it [00:04, 10.08it/s] 49it [00:05, 9.82it/s]2025-05-26 03:38:20,738 - INFO - [Epoch 068 | Batch 0050] IWAE-loss 4135.7124 | mean log_px -0.0192 | KL -3214.93 + 51it [00:05, 9.87it/s] 53it [00:05, 9.94it/s] 54it [00:05, 9.95it/s] 56it [00:05, 9.99it/s] 57it [00:05, 9.96it/s] 59it [00:06, 10.02it/s] 61it [00:06, 10.05it/s] 63it [00:06, 10.07it/s] 65it [00:06, 10.04it/s] 67it [00:06, 10.06it/s] 69it [00:07, 9.79it/s] 71it [00:07, 9.88it/s] 73it [00:07, 9.94it/s] 75it [00:07, 9.99it/s] 77it [00:07, 10.03it/s] 79it [00:08, 10.05it/s] 81it [00:08, 10.02it/s] 83it [00:08, 10.00it/s] 85it [00:08, 10.02it/s] 87it [00:08, 10.04it/s] 89it [00:09, 10.06it/s] 91it [00:09, 10.04it/s] 93it [00:09, 10.06it/s] 95it [00:09, 9.86it/s] 97it [00:09, 9.93it/s] 99it [00:10, 9.98it/s]2025-05-26 03:38:25,738 - INFO - [Epoch 068 | Batch 0100] IWAE-loss 4981.6865 | mean log_px -0.0295 | KL -3210.19 + 101it [00:10, 9.68it/s] 103it [00:10, 9.80it/s] 105it [00:10, 9.88it/s] 107it [00:10, 9.95it/s] 109it [00:11, 9.99it/s] 111it [00:11, 9.99it/s] 112it [00:11, 9.99it/s] 114it [00:11, 10.03it/s] 116it [00:11, 10.04it/s] 118it [00:11, 9.97it/s] 120it [00:12, 9.66it/s] 122it [00:12, 9.78it/s] 124it [00:12, 9.87it/s] 126it [00:12, 9.94it/s] 128it [00:12, 9.98it/s] 130it [00:13, 9.67it/s] 132it [00:13, 9.80it/s] 133it [00:13, 9.83it/s] 135it [00:13, 9.89it/s] 137it [00:13, 9.94it/s] 138it [00:13, 9.87it/s] 139it [00:14, 9.43it/s] 141it [00:14, 9.66it/s] 143it [00:14, 9.78it/s] 144it [00:14, 9.37it/s] 146it [00:14, 9.60it/s] 148it [00:15, 9.39it/s] 150it [00:15, 9.61it/s]2025-05-26 03:38:30,857 - INFO - [Epoch 068 | Batch 0150] IWAE-loss 3965.0554 | mean log_px -0.0127 | KL -3208.22 + 151it [00:15, 9.37it/s] 153it [00:15, 9.61it/s] 155it [00:15, 9.75it/s] 156it [00:15, 9.75it/s] 158it [00:16, 9.86it/s] 160it [00:16, 9.93it/s] 162it [00:16, 9.98it/s] 164it [00:16, 10.02it/s] 166it [00:16, 10.04it/s] 168it [00:17, 10.06it/s] 170it [00:17, 10.08it/s] 172it [00:17, 10.08it/s] 174it [00:17, 10.09it/s] 176it [00:17, 9.74it/s] 178it [00:18, 9.85it/s] 180it [00:18, 9.92it/s] 182it [00:18, 9.97it/s] 184it [00:18, 10.02it/s] 186it [00:18, 10.02it/s] 188it [00:19, 10.05it/s] 190it [00:19, 10.07it/s] 192it [00:19, 10.09it/s] 194it [00:19, 10.09it/s] 196it [00:19, 9.87it/s] 196it [00:19, 9.83it/s] +2025-05-26 03:38:35,474 - INFO - Epoch: 68, Objective: tensor([4401.1167], device='cuda:0', grad_fn=), Loss: 0.016813162714242935, KL/n: 65.4537582397461 + 0it [00:00, ?it/s]2025-05-26 03:38:35,760 - INFO - [Epoch 069 | Batch 0000] IWAE-loss 3877.0161 | mean log_px -0.0104 | KL -3203.73 + 1it [00:00, 4.49it/s] 2it [00:00, 6.59it/s] 4it [00:00, 8.44it/s] 6it [00:00, 9.17it/s] 7it [00:00, 8.90it/s] 9it [00:01, 9.37it/s] 11it [00:01, 9.64it/s] 13it [00:01, 9.82it/s] 15it [00:01, 9.92it/s] 17it [00:01, 9.98it/s] 19it [00:02, 10.02it/s] 21it [00:02, 10.01it/s] 22it [00:02, 10.00it/s] 24it [00:02, 10.02it/s] 26it [00:02, 10.01it/s] 28it [00:02, 10.02it/s] 30it [00:03, 10.05it/s] 32it [00:03, 9.66it/s] 34it [00:03, 9.77it/s] 36it [00:03, 9.86it/s] 37it [00:03, 9.50it/s] 38it [00:03, 9.60it/s] 40it [00:04, 9.77it/s] 42it [00:04, 9.51it/s] 44it [00:04, 9.69it/s] 46it [00:04, 9.82it/s] 48it [00:04, 9.91it/s] 50it [00:05, 9.96it/s]2025-05-26 03:38:40,848 - INFO - [Epoch 069 | Batch 0050] IWAE-loss 3863.5151 | mean log_px -0.0112 | KL -3199.91 + 51it [00:05, 9.52it/s] 52it [00:05, 9.56it/s] 53it [00:05, 9.58it/s] 54it [00:05, 9.63it/s] 55it [00:05, 9.67it/s] 56it [00:05, 9.69it/s] 58it [00:06, 9.87it/s] 60it [00:06, 9.97it/s] 62it [00:06, 10.01it/s] 64it [00:06, 10.04it/s] 66it [00:06, 10.06it/s] 68it [00:07, 10.06it/s] 70it [00:07, 10.07it/s] 72it [00:07, 9.69it/s] 73it [00:07, 9.70it/s] 74it [00:07, 9.59it/s] 75it [00:07, 9.01it/s] 76it [00:07, 9.11it/s] 77it [00:07, 9.17it/s] 78it [00:08, 8.79it/s] 79it [00:08, 8.93it/s] 80it [00:08, 9.03it/s] 81it [00:08, 8.57it/s] 82it [00:08, 8.69it/s] 83it [00:08, 8.83it/s] 84it [00:08, 8.53it/s] 85it [00:08, 8.73it/s] 86it [00:09, 8.80it/s] 87it [00:09, 8.90it/s] 88it [00:09, 8.65it/s] 89it [00:09, 8.87it/s] 90it [00:09, 8.91it/s] 91it [00:09, 8.91it/s] 92it [00:09, 8.97it/s] 93it [00:09, 9.00it/s] 94it [00:09, 9.05it/s] 95it [00:10, 9.08it/s] 96it [00:10, 9.19it/s] 97it [00:10, 9.17it/s] 98it [00:10, 9.21it/s] 99it [00:10, 9.24it/s] 100it [00:10, 9.31it/s]2025-05-26 03:38:46,229 - INFO - [Epoch 069 | Batch 0100] IWAE-loss 3742.5066 | mean log_px -0.0079 | KL -3197.15 + 101it [00:10, 9.51it/s] 103it [00:10, 9.78it/s] 105it [00:11, 9.91it/s] 107it [00:11, 10.01it/s] 109it [00:11, 10.05it/s] 111it [00:11, 10.08it/s] 113it [00:11, 10.09it/s] 115it [00:12, 10.10it/s] 117it [00:12, 10.11it/s] 119it [00:12, 10.11it/s] 121it [00:12, 10.11it/s] 123it [00:12, 10.12it/s] 125it [00:13, 10.12it/s] 127it [00:13, 9.78it/s] 129it [00:13, 9.88it/s] 131it [00:13, 9.94it/s] 133it [00:13, 9.99it/s] 135it [00:14, 10.02it/s] 137it [00:14, 10.04it/s] 139it [00:14, 10.06it/s] 141it [00:14, 9.99it/s] 143it [00:14, 10.03it/s] 145it [00:15, 10.06it/s] 147it [00:15, 10.07it/s] 149it [00:15, 10.09it/s]2025-05-26 03:38:51,218 - INFO - [Epoch 069 | Batch 0150] IWAE-loss 4124.4932 | mean log_px -0.0141 | KL -3199.10 + 151it [00:15, 9.80it/s] 153it [00:15, 9.56it/s] 155it [00:16, 9.66it/s] 157it [00:16, 9.78it/s] 159it [00:16, 9.88it/s] 160it [00:16, 9.61it/s] 162it [00:16, 9.73it/s] 164it [00:16, 9.85it/s] 165it [00:17, 9.57it/s] 166it [00:17, 9.65it/s] 168it [00:17, 9.48it/s] 169it [00:17, 9.58it/s] 171it [00:17, 9.45it/s] 173it [00:17, 9.69it/s] 175it [00:18, 9.84it/s] 177it [00:18, 9.94it/s] 179it [00:18, 10.01it/s] 180it [00:18, 9.69it/s] 182it [00:18, 9.83it/s] 183it [00:18, 9.54it/s] 184it [00:19, 9.51it/s] 186it [00:19, 9.74it/s] 188it [00:19, 9.87it/s] 190it [00:19, 9.95it/s] 192it [00:19, 10.01it/s] 194it [00:20, 10.05it/s] 196it [00:20, 9.43it/s] 196it [00:20, 9.63it/s] +2025-05-26 03:38:55,959 - INFO - Epoch: 69, Objective: tensor([5429.6377], device='cuda:0', grad_fn=), Loss: 0.039554789662361145, KL/n: 65.18160247802734 + 0it [00:00, ?it/s]2025-05-26 03:38:56,422 - INFO - [Epoch 070 | Batch 0000] IWAE-loss 3927.8982 | mean log_px -0.0122 | KL -3190.02 + 1it [00:00, 5.29it/s] 2it [00:00, 6.74it/s] 4it [00:00, 8.47it/s] 6it [00:00, 9.16it/s] 8it [00:00, 9.50it/s] 10it [00:01, 9.67it/s] 11it [00:01, 9.32it/s] 12it [00:01, 9.45it/s] 14it [00:01, 9.66it/s] 15it [00:01, 9.73it/s] 16it [00:01, 9.31it/s] 18it [00:01, 9.60it/s] 19it [00:02, 9.67it/s] 21it [00:02, 9.82it/s] 22it [00:02, 9.83it/s] 23it [00:02, 9.38it/s] 24it [00:02, 9.48it/s] 25it [00:02, 9.53it/s] 26it [00:02, 9.49it/s] 27it [00:02, 9.05it/s] 28it [00:03, 9.25it/s] 29it [00:03, 9.41it/s] 30it [00:03, 9.52it/s] 31it [00:03, 9.60it/s] 32it [00:03, 9.22it/s] 33it [00:03, 9.40it/s] 34it [00:03, 9.50it/s] 36it [00:03, 9.75it/s] 38it [00:04, 9.84it/s] 39it [00:04, 9.79it/s] 40it [00:04, 9.42it/s] 42it [00:04, 9.66it/s] 43it [00:04, 9.28it/s] 44it [00:04, 9.44it/s] 46it [00:04, 9.66it/s] 48it [00:05, 9.82it/s] 49it [00:05, 9.85it/s] 50it [00:05, 9.78it/s]2025-05-26 03:39:01,627 - INFO - [Epoch 070 | Batch 0050] IWAE-loss 4088.9717 | mean log_px -0.0128 | KL -3193.53 + 51it [00:05, 9.25it/s] 52it [00:05, 9.44it/s] 54it [00:05, 9.66it/s] 56it [00:05, 9.81it/s] 58it [00:06, 9.88it/s] 60it [00:06, 9.92it/s] 61it [00:06, 9.53it/s] 63it [00:06, 9.71it/s] 64it [00:06, 9.76it/s] 66it [00:06, 9.89it/s] 67it [00:07, 9.91it/s] 69it [00:07, 9.95it/s] 70it [00:07, 9.95it/s] 72it [00:07, 10.01it/s] 73it [00:07, 10.00it/s] 75it [00:07, 10.03it/s] 77it [00:08, 10.00it/s] 78it [00:08, 9.98it/s] 80it [00:08, 10.03it/s] 82it [00:08, 10.01it/s] 84it [00:08, 10.03it/s] 86it [00:08, 10.00it/s] 88it [00:09, 10.02it/s] 90it [00:09, 10.05it/s] 92it [00:09, 9.71it/s] 94it [00:09, 9.80it/s] 95it [00:09, 9.84it/s] 96it [00:09, 9.49it/s] 97it [00:10, 9.55it/s] 98it [00:10, 9.61it/s] 99it [00:10, 9.18it/s] 100it [00:10, 9.38it/s]2025-05-26 03:39:06,733 - INFO - [Epoch 070 | Batch 0100] IWAE-loss 4525.4941 | mean log_px -0.0213 | KL -3186.68 + 101it [00:10, 9.47it/s] 103it [00:10, 9.64it/s] 105it [00:10, 9.77it/s] 106it [00:11, 9.81it/s] 108it [00:11, 9.58it/s] 109it [00:11, 9.55it/s] 110it [00:11, 9.60it/s] 111it [00:11, 9.17it/s] 112it [00:11, 9.36it/s] 113it [00:11, 9.52it/s] 114it [00:11, 9.64it/s] 115it [00:11, 9.74it/s] 116it [00:12, 9.80it/s] 117it [00:12, 9.85it/s] 118it [00:12, 9.89it/s] 120it [00:12, 9.96it/s] 121it [00:12, 9.41it/s] 122it [00:12, 9.56it/s] 123it [00:12, 9.65it/s] 124it [00:12, 9.73it/s] 125it [00:12, 9.80it/s] 126it [00:13, 9.84it/s] 128it [00:13, 9.89it/s] 129it [00:13, 9.49it/s] 131it [00:13, 9.69it/s] 132it [00:13, 9.76it/s] 134it [00:13, 9.84it/s] 136it [00:14, 9.90it/s] 137it [00:14, 9.56it/s] 138it [00:14, 9.65it/s] 140it [00:14, 9.81it/s] 142it [00:14, 9.90it/s] 143it [00:14, 9.52it/s] 144it [00:14, 9.62it/s] 146it [00:15, 9.45it/s] 148it [00:15, 9.66it/s] 149it [00:15, 9.71it/s] 150it [00:15, 9.74it/s]2025-05-26 03:39:11,892 - INFO - [Epoch 070 | Batch 0150] IWAE-loss 3830.5117 | mean log_px -0.0118 | KL -3191.07 + 151it [00:15, 9.77it/s] 152it [00:15, 9.26it/s] 154it [00:15, 9.58it/s] 155it [00:16, 9.67it/s] 156it [00:16, 9.69it/s] 157it [00:16, 9.76it/s] 158it [00:16, 9.27it/s] 159it [00:16, 9.45it/s] 160it [00:16, 9.55it/s] 161it [00:16, 9.15it/s] 162it [00:16, 9.33it/s] 163it [00:16, 9.51it/s] 164it [00:17, 9.59it/s] 166it [00:17, 9.77it/s] 167it [00:17, 9.72it/s] 168it [00:17, 9.24it/s] 169it [00:17, 9.31it/s] 170it [00:17, 9.02it/s] 171it [00:17, 8.62it/s] 172it [00:17, 8.91it/s] 173it [00:18, 9.16it/s] 174it [00:18, 9.31it/s] 175it [00:18, 8.88it/s] 176it [00:18, 8.89it/s] 177it [00:18, 8.97it/s] 178it [00:18, 9.21it/s] 179it [00:18, 9.37it/s] 180it [00:18, 9.50it/s] 181it [00:18, 9.59it/s] 182it [00:18, 9.64it/s] 183it [00:19, 9.69it/s] 184it [00:19, 9.09it/s] 185it [00:19, 9.31it/s] 186it [00:19, 9.42it/s] 187it [00:19, 9.41it/s] 188it [00:19, 9.51it/s] 189it [00:19, 9.63it/s] 190it [00:19, 9.62it/s] 191it [00:19, 9.58it/s] 192it [00:20, 9.29it/s] 193it [00:20, 9.29it/s] 194it [00:20, 9.31it/s] 195it [00:20, 8.91it/s] 196it [00:20, 9.14it/s] 196it [00:20, 9.54it/s] +2025-05-26 03:39:16,829 - INFO - Epoch: 70, Objective: tensor([4718.2910], device='cuda:0', grad_fn=), Loss: 0.02613232657313347, KL/n: 64.95722961425781 + 0it [00:00, ?it/s]2025-05-26 03:39:17,083 - INFO - [Epoch 071 | Batch 0000] IWAE-loss 4098.5879 | mean log_px -0.0153 | KL -3181.93 + 1it [00:00, 5.24it/s] 2it [00:00, 7.15it/s] 3it [00:00, 8.10it/s] 4it [00:00, 8.57it/s] 5it [00:00, 8.58it/s] 6it [00:00, 8.26it/s] 7it [00:00, 8.59it/s] 8it [00:00, 8.91it/s] 9it [00:01, 9.09it/s] 10it [00:01, 9.25it/s] 11it [00:01, 9.39it/s] 12it [00:01, 8.97it/s] 13it [00:01, 9.13it/s] 14it [00:01, 9.24it/s] 15it [00:01, 9.26it/s] 16it [00:01, 8.84it/s] 17it [00:01, 9.03it/s] 18it [00:02, 9.17it/s] 19it [00:02, 9.31it/s] 20it [00:02, 8.86it/s] 21it [00:02, 9.10it/s] 22it [00:02, 9.23it/s] 23it [00:02, 9.24it/s] 24it [00:02, 8.81it/s] 25it [00:02, 9.05it/s] 26it [00:02, 8.72it/s] 27it [00:03, 8.96it/s] 28it [00:03, 9.08it/s] 29it [00:03, 9.23it/s] 30it [00:03, 8.84it/s] 31it [00:03, 9.05it/s] 32it [00:03, 9.21it/s] 33it [00:03, 9.33it/s] 34it [00:03, 9.40it/s] 35it [00:03, 9.44it/s] 36it [00:04, 9.52it/s] 37it [00:04, 9.58it/s] 38it [00:04, 9.07it/s] 39it [00:04, 9.20it/s] 40it [00:04, 9.28it/s] 41it [00:04, 9.38it/s] 42it [00:04, 9.09it/s] 43it [00:04, 9.23it/s] 44it [00:04, 9.01it/s] 45it [00:04, 9.19it/s] 46it [00:05, 8.97it/s] 47it [00:05, 9.15it/s] 48it [00:05, 9.18it/s] 49it [00:05, 9.24it/s] 50it [00:05, 9.33it/s]2025-05-26 03:39:22,562 - INFO - [Epoch 071 | Batch 0050] IWAE-loss 3795.4751 | mean log_px -0.0104 | KL -3178.03 + 51it [00:05, 9.36it/s] 52it [00:05, 8.91it/s] 53it [00:05, 9.07it/s] 54it [00:05, 9.19it/s] 55it [00:06, 9.32it/s] 56it [00:06, 9.05it/s] 57it [00:06, 9.22it/s] 58it [00:06, 9.31it/s] 59it [00:06, 8.90it/s] 60it [00:06, 9.10it/s] 61it [00:06, 9.25it/s] 62it [00:06, 9.30it/s] 63it [00:06, 9.40it/s] 64it [00:07, 9.45it/s] 65it [00:07, 9.51it/s] 66it [00:07, 9.17it/s] 67it [00:07, 9.31it/s] 68it [00:07, 8.76it/s] 69it [00:07, 8.95it/s] 70it [00:07, 9.05it/s] 71it [00:07, 9.22it/s] 72it [00:07, 9.32it/s] 73it [00:08, 9.42it/s] 74it [00:08, 9.43it/s] 75it [00:08, 9.52it/s] 76it [00:08, 9.51it/s] 77it [00:08, 9.44it/s] 78it [00:08, 9.47it/s] 79it [00:08, 9.45it/s] 80it [00:08, 8.92it/s] 81it [00:08, 8.90it/s] 82it [00:09, 8.77it/s] 83it [00:09, 9.02it/s] 84it [00:09, 9.21it/s] 85it [00:09, 9.35it/s] 86it [00:09, 9.43it/s] 87it [00:09, 9.51it/s] 88it [00:09, 9.55it/s] 89it [00:09, 9.61it/s] 90it [00:09, 9.52it/s] 91it [00:09, 9.58it/s] 92it [00:10, 9.61it/s] 93it [00:10, 9.60it/s] 94it [00:10, 9.60it/s] 95it [00:10, 9.58it/s] 96it [00:10, 9.57it/s] 97it [00:10, 9.58it/s] 98it [00:10, 9.02it/s] 99it [00:10, 9.09it/s] 100it [00:10, 9.27it/s]2025-05-26 03:39:27,946 - INFO - [Epoch 071 | Batch 0100] IWAE-loss 3703.3640 | mean log_px -0.0093 | KL -3174.69 + 101it [00:11, 9.38it/s] 102it [00:11, 9.48it/s] 103it [00:11, 9.53it/s] 104it [00:11, 9.55it/s] 105it [00:11, 9.57it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.60it/s] 108it [00:11, 9.58it/s] 109it [00:11, 9.59it/s] 110it [00:11, 9.59it/s] 111it [00:12, 9.44it/s] 112it [00:12, 8.87it/s] 113it [00:12, 8.83it/s] 114it [00:12, 9.04it/s] 115it [00:12, 9.17it/s] 116it [00:12, 8.74it/s] 117it [00:12, 9.01it/s] 118it [00:12, 9.14it/s] 119it [00:12, 9.20it/s] 120it [00:13, 9.39it/s] 121it [00:13, 9.56it/s] 122it [00:13, 9.65it/s] 123it [00:13, 9.68it/s] 124it [00:13, 9.77it/s] 125it [00:13, 9.80it/s] 127it [00:13, 9.93it/s] 129it [00:13, 10.00it/s] 131it [00:14, 10.05it/s] 133it [00:14, 10.10it/s] 135it [00:14, 10.11it/s] 137it [00:14, 10.07it/s] 139it [00:14, 10.09it/s] 141it [00:15, 10.03it/s] 143it [00:15, 9.71it/s] 145it [00:15, 9.83it/s] 147it [00:15, 9.92it/s] 148it [00:15, 9.90it/s] 150it [00:16, 9.97it/s]2025-05-26 03:39:33,101 - INFO - [Epoch 071 | Batch 0150] IWAE-loss 3954.1804 | mean log_px -0.0154 | KL -3167.20 + 151it [00:16, 9.94it/s] 153it [00:16, 10.00it/s] 155it [00:16, 9.74it/s] 156it [00:16, 9.69it/s] 158it [00:16, 9.82it/s] 160it [00:17, 9.92it/s] 162it [00:17, 9.98it/s] 164it [00:17, 10.03it/s] 166it [00:17, 10.06it/s] 168it [00:17, 10.10it/s] 170it [00:18, 10.11it/s] 172it [00:18, 10.09it/s] 174it [00:18, 10.11it/s] 176it [00:18, 9.98it/s] 177it [00:18, 9.92it/s] 179it [00:18, 9.98it/s] 180it [00:19, 9.96it/s] 182it [00:19, 10.03it/s] 184it [00:19, 10.08it/s] 186it [00:19, 10.08it/s] 188it [00:19, 10.10it/s] 190it [00:20, 10.13it/s] 192it [00:20, 10.14it/s] 194it [00:20, 10.15it/s] 196it [00:20, 9.87it/s] 196it [00:20, 9.45it/s] +2025-05-26 03:39:37,701 - INFO - Epoch: 71, Objective: tensor([4948.8066], device='cuda:0', grad_fn=), Loss: 0.03435065969824791, KL/n: 64.70899200439453 + 0it [00:00, ?it/s]2025-05-26 03:39:38,159 - INFO - [Epoch 072 | Batch 0000] IWAE-loss 4508.8237 | mean log_px -0.0191 | KL -3173.76 + 1it [00:00, 5.48it/s] 2it [00:00, 7.44it/s] 4it [00:00, 8.95it/s] 6it [00:00, 9.47it/s] 8it [00:00, 9.75it/s] 10it [00:01, 9.87it/s] 12it [00:01, 9.95it/s] 14it [00:01, 10.01it/s] 16it [00:01, 10.05it/s] 18it [00:01, 10.08it/s] 20it [00:02, 10.09it/s] 22it [00:02, 10.05it/s] 24it [00:02, 9.58it/s] 25it [00:02, 9.53it/s] 27it [00:02, 9.71it/s] 29it [00:02, 9.84it/s] 31it [00:03, 9.91it/s] 32it [00:03, 9.92it/s] 34it [00:03, 9.99it/s] 36it [00:03, 10.02it/s] 38it [00:03, 10.03it/s] 40it [00:04, 10.07it/s] 42it [00:04, 10.09it/s] 44it [00:04, 10.05it/s] 46it [00:04, 10.08it/s] 48it [00:04, 10.08it/s] 50it [00:05, 10.11it/s]2025-05-26 03:39:43,155 - INFO - [Epoch 072 | Batch 0050] IWAE-loss 4654.4067 | mean log_px -0.0212 | KL -3164.67 + 52it [00:05, 10.10it/s] 54it [00:05, 10.12it/s] 56it [00:05, 10.13it/s] 58it [00:05, 10.11it/s] 60it [00:06, 10.10it/s] 62it [00:06, 10.10it/s] 64it [00:06, 10.00it/s] 66it [00:06, 9.54it/s] 68it [00:06, 9.70it/s] 70it [00:07, 9.82it/s] 72it [00:07, 9.89it/s] 74it [00:07, 9.95it/s] 76it [00:07, 10.00it/s] 78it [00:07, 9.60it/s] 79it [00:08, 9.55it/s] 80it [00:08, 9.56it/s] 82it [00:08, 9.45it/s] 84it [00:08, 9.67it/s] 86it [00:08, 9.82it/s] 88it [00:08, 9.92it/s] 90it [00:09, 9.95it/s] 92it [00:09, 9.69it/s] 94it [00:09, 9.74it/s] 95it [00:09, 9.73it/s] 96it [00:09, 9.34it/s] 98it [00:09, 9.61it/s] 100it [00:10, 9.72it/s]2025-05-26 03:39:48,264 - INFO - [Epoch 072 | Batch 0100] IWAE-loss 5721.9814 | mean log_px -0.0405 | KL -3163.68 + 101it [00:10, 9.34it/s] 103it [00:10, 9.62it/s] 105it [00:10, 9.78it/s] 106it [00:10, 9.49it/s] 107it [00:10, 9.59it/s] 109it [00:11, 9.79it/s] 110it [00:11, 9.39it/s] 112it [00:11, 9.65it/s] 114it [00:11, 9.81it/s] 116it [00:11, 9.90it/s] 118it [00:12, 9.97it/s] 120it [00:12, 10.01it/s] 121it [00:12, 9.61it/s] 123it [00:12, 9.78it/s] 125it [00:12, 9.89it/s] 127it [00:12, 9.97it/s] 129it [00:13, 10.02it/s] 131it [00:13, 10.04it/s] 133it [00:13, 10.02it/s] 134it [00:13, 9.71it/s] 136it [00:13, 9.84it/s] 138it [00:14, 9.92it/s] 140it [00:14, 9.98it/s] 142it [00:14, 10.02it/s] 144it [00:14, 10.04it/s] 146it [00:14, 10.05it/s] 148it [00:15, 10.06it/s] 150it [00:15, 10.08it/s]2025-05-26 03:39:53,324 - INFO - [Epoch 072 | Batch 0150] IWAE-loss 4235.5010 | mean log_px -0.0156 | KL -3162.35 + 152it [00:15, 9.76it/s] 154it [00:15, 9.54it/s] 156it [00:15, 9.70it/s] 158it [00:16, 9.82it/s] 160it [00:16, 9.59it/s] 162it [00:16, 9.74it/s] 164it [00:16, 9.86it/s] 166it [00:16, 9.94it/s] 168it [00:17, 10.00it/s] 170it [00:17, 9.76it/s] 171it [00:17, 9.80it/s] 172it [00:17, 9.50it/s] 173it [00:17, 9.60it/s] 175it [00:17, 9.82it/s] 177it [00:18, 9.54it/s] 179it [00:18, 9.72it/s] 180it [00:18, 9.45it/s] 182it [00:18, 9.69it/s] 184it [00:18, 9.82it/s] 185it [00:18, 9.46it/s] 187it [00:19, 9.68it/s] 189it [00:19, 9.82it/s] 191it [00:19, 9.91it/s] 192it [00:19, 9.60it/s] 194it [00:19, 9.77it/s] 195it [00:19, 9.52it/s] 196it [00:20, 9.30it/s] 196it [00:20, 9.76it/s] +2025-05-26 03:39:58,103 - INFO - Epoch: 72, Objective: tensor([3779.6716], device='cuda:0', grad_fn=), Loss: 0.01213796902447939, KL/n: 64.47173309326172 + 0it [00:00, ?it/s]2025-05-26 03:39:58,380 - INFO - [Epoch 073 | Batch 0000] IWAE-loss 4182.9614 | mean log_px -0.0191 | KL -3160.06 + 1it [00:00, 5.42it/s] 2it [00:00, 6.79it/s] 4it [00:00, 8.53it/s] 6it [00:00, 9.17it/s] 7it [00:00, 9.28it/s] 8it [00:00, 9.33it/s] 9it [00:01, 8.99it/s] 10it [00:01, 9.25it/s] 12it [00:01, 9.12it/s] 14it [00:01, 9.46it/s] 15it [00:01, 9.56it/s] 16it [00:01, 9.65it/s] 18it [00:01, 9.81it/s] 20it [00:02, 9.89it/s] 22it [00:02, 9.95it/s] 23it [00:02, 9.64it/s] 24it [00:02, 9.71it/s] 26it [00:02, 9.82it/s] 27it [00:02, 9.85it/s] 28it [00:02, 9.48it/s] 30it [00:03, 9.64it/s] 32it [00:03, 9.73it/s] 33it [00:03, 9.35it/s] 34it [00:03, 9.33it/s] 35it [00:03, 9.44it/s] 36it [00:03, 9.55it/s] 37it [00:03, 9.67it/s] 38it [00:04, 9.75it/s] 40it [00:04, 9.85it/s] 42it [00:04, 9.91it/s] 43it [00:04, 9.86it/s] 44it [00:04, 9.70it/s] 45it [00:04, 9.67it/s] 46it [00:04, 9.71it/s] 47it [00:04, 9.72it/s] 48it [00:05, 9.79it/s] 50it [00:05, 9.90it/s]2025-05-26 03:40:03,550 - INFO - [Epoch 073 | Batch 0050] IWAE-loss 4043.1121 | mean log_px -0.0134 | KL -3153.70 + 51it [00:05, 9.90it/s] 52it [00:05, 9.91it/s] 54it [00:05, 9.98it/s] 56it [00:05, 10.01it/s] 58it [00:06, 10.00it/s] 60it [00:06, 10.02it/s] 62it [00:06, 9.74it/s] 64it [00:06, 9.83it/s] 66it [00:06, 9.89it/s] 68it [00:07, 9.94it/s] 70it [00:07, 9.98it/s] 72it [00:07, 9.65it/s] 74it [00:07, 9.77it/s] 76it [00:07, 9.85it/s] 77it [00:07, 9.87it/s] 78it [00:08, 9.90it/s] 80it [00:08, 9.95it/s] 82it [00:08, 9.99it/s] 84it [00:08, 10.00it/s] 86it [00:08, 10.01it/s] 88it [00:09, 10.02it/s] 90it [00:09, 10.03it/s] 92it [00:09, 10.01it/s] 94it [00:09, 9.68it/s] 95it [00:09, 9.73it/s] 97it [00:10, 9.84it/s] 98it [00:10, 9.45it/s] 100it [00:10, 9.65it/s]2025-05-26 03:40:08,623 - INFO - [Epoch 073 | Batch 0100] IWAE-loss 4164.0747 | mean log_px -0.0208 | KL -3156.93 + 101it [00:10, 9.29it/s] 102it [00:10, 9.40it/s] 104it [00:10, 9.63it/s] 106it [00:10, 9.77it/s] 107it [00:11, 9.46it/s] 109it [00:11, 9.67it/s] 111it [00:11, 9.46it/s] 112it [00:11, 9.55it/s] 114it [00:11, 9.72it/s] 115it [00:11, 9.34it/s] 116it [00:12, 9.47it/s] 117it [00:12, 9.52it/s] 118it [00:12, 9.62it/s] 120it [00:12, 9.79it/s] 121it [00:12, 9.83it/s] 122it [00:12, 9.87it/s] 123it [00:12, 9.90it/s] 124it [00:12, 9.93it/s] 126it [00:13, 9.96it/s] 127it [00:13, 9.96it/s] 128it [00:13, 9.96it/s] 129it [00:13, 9.97it/s] 131it [00:13, 9.99it/s] 132it [00:13, 9.98it/s] 133it [00:13, 9.98it/s] 134it [00:13, 9.97it/s] 136it [00:14, 9.98it/s] 138it [00:14, 9.99it/s] 139it [00:14, 9.51it/s] 140it [00:14, 9.61it/s] 142it [00:14, 9.78it/s] 143it [00:14, 9.82it/s] 144it [00:14, 9.86it/s] 145it [00:14, 9.89it/s] 146it [00:15, 9.92it/s] 148it [00:15, 9.91it/s] 150it [00:15, 9.95it/s]2025-05-26 03:40:13,742 - INFO - [Epoch 073 | Batch 0150] IWAE-loss 4541.8203 | mean log_px -0.0273 | KL -3146.10 + 151it [00:15, 9.48it/s] 152it [00:15, 9.58it/s] 153it [00:15, 9.66it/s] 155it [00:15, 9.34it/s] 156it [00:16, 9.46it/s] 157it [00:16, 9.51it/s] 158it [00:16, 9.63it/s] 159it [00:16, 9.24it/s] 161it [00:16, 9.58it/s] 162it [00:16, 9.65it/s] 164it [00:16, 9.81it/s] 166it [00:17, 9.90it/s] 168it [00:17, 9.93it/s] 169it [00:17, 9.60it/s] 170it [00:17, 9.68it/s] 171it [00:17, 9.75it/s] 173it [00:17, 9.88it/s] 174it [00:17, 9.90it/s] 176it [00:18, 9.94it/s] 178it [00:18, 9.66it/s] 180it [00:18, 9.77it/s] 181it [00:18, 9.80it/s] 183it [00:18, 9.88it/s] 184it [00:18, 9.84it/s] 185it [00:19, 9.28it/s] 186it [00:19, 9.31it/s] 187it [00:19, 9.46it/s] 188it [00:19, 9.60it/s] 189it [00:19, 9.70it/s] 190it [00:19, 9.18it/s] 192it [00:19, 9.54it/s] 194it [00:20, 9.74it/s] 195it [00:20, 9.11it/s] 196it [00:20, 9.65it/s] +2025-05-26 03:40:18,541 - INFO - Epoch: 73, Objective: tensor([3657.3047], device='cuda:0', grad_fn=), Loss: 0.007871869951486588, KL/n: 64.23025512695312 + 0it [00:00, ?it/s]2025-05-26 03:40:18,996 - INFO - [Epoch 074 | Batch 0000] IWAE-loss 4381.4062 | mean log_px -0.0209 | KL -3141.13 + 1it [00:00, 5.46it/s] 2it [00:00, 6.84it/s] 4it [00:00, 8.53it/s] 5it [00:00, 8.42it/s] 7it [00:00, 9.10it/s] 8it [00:00, 8.83it/s] 10it [00:01, 9.32it/s] 12it [00:01, 9.56it/s] 13it [00:01, 9.61it/s] 15it [00:01, 9.78it/s] 17it [00:01, 9.56it/s] 18it [00:01, 9.62it/s] 20it [00:02, 9.79it/s] 22it [00:02, 9.90it/s] 24it [00:02, 9.97it/s] 26it [00:02, 10.01it/s] 27it [00:02, 9.42it/s] 28it [00:02, 9.44it/s] 30it [00:03, 9.66it/s] 31it [00:03, 9.29it/s] 33it [00:03, 9.57it/s] 35it [00:03, 9.75it/s] 37it [00:03, 9.87it/s] 39it [00:04, 9.96it/s] 40it [00:04, 9.93it/s] 42it [00:04, 9.99it/s] 44it [00:04, 10.03it/s] 45it [00:04, 9.71it/s] 47it [00:04, 9.84it/s] 49it [00:05, 9.92it/s]2025-05-26 03:40:24,136 - INFO - [Epoch 074 | Batch 0050] IWAE-loss 4331.8213 | mean log_px -0.0203 | KL -3145.59 + 51it [00:05, 9.62it/s] 53it [00:05, 9.77it/s] 55it [00:05, 9.87it/s] 57it [00:05, 9.94it/s] 59it [00:06, 9.99it/s] 61it [00:06, 10.02it/s] 63it [00:06, 10.05it/s] 65it [00:06, 10.08it/s] 67it [00:06, 9.74it/s] 68it [00:07, 9.78it/s] 70it [00:07, 9.88it/s] 72it [00:07, 9.94it/s] 74it [00:07, 9.98it/s] 75it [00:07, 9.67it/s] 77it [00:07, 9.81it/s] 79it [00:08, 9.91it/s] 81it [00:08, 9.98it/s] 82it [00:08, 9.65it/s] 84it [00:08, 9.80it/s] 85it [00:08, 9.52it/s] 87it [00:08, 9.72it/s] 89it [00:09, 9.84it/s] 91it [00:09, 9.94it/s] 92it [00:09, 9.63it/s] 94it [00:09, 9.79it/s] 96it [00:09, 9.90it/s] 98it [00:10, 9.95it/s] 99it [00:10, 9.94it/s] 100it [00:10, 9.84it/s]2025-05-26 03:40:29,217 - INFO - [Epoch 074 | Batch 0100] IWAE-loss 3966.7395 | mean log_px -0.0130 | KL -3133.57 + 101it [00:10, 9.37it/s] 103it [00:10, 9.64it/s] 104it [00:10, 9.71it/s] 106it [00:10, 9.43it/s] 108it [00:11, 9.64it/s] 110it [00:11, 9.79it/s] 112it [00:11, 9.89it/s] 114it [00:11, 9.95it/s] 116it [00:11, 10.00it/s] 118it [00:12, 10.03it/s] 120it [00:12, 10.05it/s] 122it [00:12, 10.06it/s] 124it [00:12, 10.08it/s] 126it [00:12, 10.08it/s] 128it [00:13, 10.09it/s] 130it [00:13, 10.10it/s] 132it [00:13, 10.09it/s] 134it [00:13, 10.09it/s] 136it [00:13, 10.08it/s] 138it [00:14, 10.05it/s] 140it [00:14, 9.93it/s] 142it [00:14, 9.63it/s] 144it [00:14, 9.75it/s] 146it [00:14, 9.52it/s] 148it [00:15, 9.67it/s] 150it [00:15, 9.80it/s]2025-05-26 03:40:34,281 - INFO - [Epoch 074 | Batch 0150] IWAE-loss 3943.3928 | mean log_px -0.0122 | KL -3135.55 + 151it [00:15, 9.46it/s] 153it [00:15, 9.58it/s] 154it [00:15, 9.65it/s] 156it [00:15, 9.81it/s] 158it [00:16, 9.91it/s] 159it [00:16, 9.92it/s] 160it [00:16, 9.84it/s] 161it [00:16, 9.45it/s] 163it [00:16, 9.71it/s] 165it [00:16, 9.44it/s] 167it [00:17, 9.66it/s] 169it [00:17, 9.77it/s] 171it [00:17, 9.87it/s] 173it [00:17, 9.95it/s] 175it [00:17, 9.99it/s] 177it [00:18, 10.03it/s] 179it [00:18, 10.06it/s] 181it [00:18, 10.07it/s] 183it [00:18, 10.07it/s] 185it [00:18, 10.09it/s] 187it [00:19, 9.82it/s] 189it [00:19, 9.91it/s] 191it [00:19, 9.71it/s] 192it [00:19, 9.73it/s] 194it [00:19, 9.86it/s] 195it [00:19, 9.59it/s] 196it [00:20, 9.28it/s] 196it [00:20, 9.73it/s] +2025-05-26 03:40:38,999 - INFO - Epoch: 74, Objective: tensor([3946.5691], device='cuda:0', grad_fn=), Loss: 0.01754077710211277, KL/n: 63.97822570800781 + 0it [00:00, ?it/s]2025-05-26 03:40:39,297 - INFO - [Epoch 075 | Batch 0000] IWAE-loss 4051.3987 | mean log_px -0.0158 | KL -3134.45 + 1it [00:00, 5.07it/s] 2it [00:00, 7.13it/s] 3it [00:00, 8.15it/s] 4it [00:00, 8.11it/s] 5it [00:00, 8.70it/s] 6it [00:00, 9.09it/s] 7it [00:00, 9.36it/s] 8it [00:00, 9.52it/s] 9it [00:01, 9.63it/s] 11it [00:01, 9.83it/s] 12it [00:01, 9.85it/s] 14it [00:01, 9.48it/s] 15it [00:01, 9.60it/s] 16it [00:01, 9.66it/s] 18it [00:01, 9.82it/s] 20it [00:02, 9.91it/s] 21it [00:02, 9.90it/s] 23it [00:02, 9.97it/s] 24it [00:02, 9.51it/s] 26it [00:02, 9.70it/s] 28it [00:02, 9.80it/s] 30it [00:03, 9.52it/s] 32it [00:03, 9.67it/s] 33it [00:03, 9.33it/s] 35it [00:03, 9.55it/s] 36it [00:03, 9.63it/s] 38it [00:04, 9.79it/s] 40it [00:04, 9.84it/s] 42it [00:04, 9.91it/s] 44it [00:04, 9.96it/s] 46it [00:04, 9.63it/s] 47it [00:04, 9.65it/s] 48it [00:05, 9.71it/s] 49it [00:05, 9.31it/s] 50it [00:05, 9.45it/s]2025-05-26 03:40:44,469 - INFO - [Epoch 075 | Batch 0050] IWAE-loss 3742.8145 | mean log_px -0.0096 | KL -3130.84 + 51it [00:05, 9.42it/s] 52it [00:05, 9.52it/s] 53it [00:05, 9.20it/s] 54it [00:05, 9.40it/s] 56it [00:05, 9.68it/s] 58it [00:06, 9.80it/s] 60it [00:06, 9.89it/s] 62it [00:06, 9.94it/s] 64it [00:06, 9.62it/s] 66it [00:06, 9.75it/s] 68it [00:07, 9.85it/s] 69it [00:07, 9.87it/s] 70it [00:07, 9.45it/s] 71it [00:07, 9.56it/s] 72it [00:07, 9.66it/s] 74it [00:07, 9.80it/s] 76it [00:07, 9.89it/s] 78it [00:08, 9.92it/s] 80it [00:08, 9.98it/s] 81it [00:08, 9.97it/s] 82it [00:08, 9.93it/s] 83it [00:08, 9.45it/s] 85it [00:08, 9.69it/s] 86it [00:08, 9.76it/s] 88it [00:09, 9.85it/s] 89it [00:09, 9.43it/s] 90it [00:09, 9.43it/s] 91it [00:09, 9.47it/s] 92it [00:09, 9.39it/s] 93it [00:09, 9.48it/s] 94it [00:09, 9.59it/s] 95it [00:09, 9.68it/s] 96it [00:10, 9.74it/s] 97it [00:10, 9.76it/s] 98it [00:10, 9.78it/s] 99it [00:10, 9.80it/s] 100it [00:10, 9.80it/s]2025-05-26 03:40:49,609 - INFO - [Epoch 075 | Batch 0100] IWAE-loss 4642.5938 | mean log_px -0.0251 | KL -3130.53 + 101it [00:10, 9.21it/s] 102it [00:10, 9.38it/s] 103it [00:10, 9.53it/s] 104it [00:10, 9.47it/s] 105it [00:10, 9.60it/s] 106it [00:11, 9.71it/s] 108it [00:11, 9.86it/s] 109it [00:11, 9.90it/s] 111it [00:11, 9.96it/s] 113it [00:11, 9.99it/s] 115it [00:11, 10.01it/s] 116it [00:12, 10.01it/s] 118it [00:12, 10.02it/s] 120it [00:12, 10.00it/s] 121it [00:12, 9.98it/s] 122it [00:12, 9.97it/s] 123it [00:12, 9.97it/s] 124it [00:12, 9.98it/s] 125it [00:12, 9.52it/s] 126it [00:13, 9.51it/s] 127it [00:13, 9.63it/s] 129it [00:13, 9.82it/s] 130it [00:13, 9.80it/s] 132it [00:13, 9.87it/s] 133it [00:13, 9.48it/s] 134it [00:13, 9.59it/s] 136it [00:14, 9.38it/s] 137it [00:14, 9.51it/s] 138it [00:14, 9.62it/s] 140it [00:14, 9.75it/s] 142it [00:14, 9.53it/s] 143it [00:14, 9.61it/s] 145it [00:15, 9.74it/s] 146it [00:15, 9.43it/s] 147it [00:15, 9.51it/s] 148it [00:15, 9.58it/s] 149it [00:15, 9.67it/s] 150it [00:15, 9.17it/s]2025-05-26 03:40:54,777 - INFO - [Epoch 075 | Batch 0150] IWAE-loss 4248.3130 | mean log_px -0.0234 | KL -3122.70 + 151it [00:15, 9.35it/s] 153it [00:15, 9.66it/s] 154it [00:15, 9.67it/s] 156it [00:16, 9.83it/s] 158it [00:16, 9.90it/s] 159it [00:16, 9.90it/s] 160it [00:16, 9.86it/s] 162it [00:16, 9.42it/s] 163it [00:16, 9.53it/s] 164it [00:17, 9.64it/s] 165it [00:17, 9.72it/s] 166it [00:17, 9.74it/s] 168it [00:17, 9.87it/s] 170it [00:17, 9.94it/s] 171it [00:17, 9.88it/s] 172it [00:17, 9.88it/s] 174it [00:18, 9.93it/s] 176it [00:18, 9.97it/s] 178it [00:18, 9.99it/s] 179it [00:18, 9.56it/s] 180it [00:18, 9.65it/s] 181it [00:18, 9.73it/s] 182it [00:18, 9.27it/s] 184it [00:19, 9.58it/s] 185it [00:19, 9.20it/s] 186it [00:19, 9.34it/s] 187it [00:19, 9.48it/s] 188it [00:19, 9.57it/s] 189it [00:19, 9.69it/s] 191it [00:19, 9.85it/s] 192it [00:19, 9.35it/s] 193it [00:20, 9.42it/s] 194it [00:20, 9.04it/s] 195it [00:20, 8.90it/s] 196it [00:20, 9.60it/s] +2025-05-26 03:40:59,552 - INFO - Epoch: 75, Objective: tensor([4487.3818], device='cuda:0', grad_fn=), Loss: 0.022050147876143456, KL/n: 63.74296569824219 + 0it [00:00, ?it/s]2025-05-26 03:40:59,988 - INFO - [Epoch 076 | Batch 0000] IWAE-loss 3891.9312 | mean log_px -0.0134 | KL -3123.93 + 1it [00:00, 5.40it/s] 2it [00:00, 7.34it/s] 4it [00:00, 8.87it/s] 6it [00:00, 9.41it/s] 8it [00:00, 9.69it/s] 10it [00:01, 9.81it/s] 12it [00:01, 9.90it/s] 14it [00:01, 9.75it/s] 16it [00:01, 9.85it/s] 18it [00:01, 9.94it/s] 20it [00:02, 10.00it/s] 22it [00:02, 10.03it/s] 24it [00:02, 9.70it/s] 26it [00:02, 9.81it/s] 28it [00:02, 9.89it/s] 30it [00:03, 9.96it/s] 32it [00:03, 9.99it/s] 34it [00:03, 10.02it/s] 36it [00:03, 10.04it/s] 38it [00:03, 10.06it/s] 40it [00:04, 10.07it/s] 42it [00:04, 10.05it/s] 44it [00:04, 9.71it/s] 46it [00:04, 9.83it/s] 48it [00:04, 9.90it/s] 50it [00:05, 9.96it/s]2025-05-26 03:41:05,034 - INFO - [Epoch 076 | Batch 0050] IWAE-loss 3677.9912 | mean log_px -0.0094 | KL -3120.58 + 51it [00:05, 9.58it/s] 53it [00:05, 9.73it/s] 54it [00:05, 9.77it/s] 56it [00:05, 9.87it/s] 57it [00:05, 9.47it/s] 58it [00:05, 9.56it/s] 60it [00:06, 9.75it/s] 62it [00:06, 9.85it/s] 64it [00:06, 9.92it/s] 65it [00:06, 9.53it/s] 67it [00:06, 9.71it/s] 69it [00:07, 9.83it/s] 71it [00:07, 9.91it/s] 72it [00:07, 9.91it/s] 73it [00:07, 9.92it/s] 74it [00:07, 9.39it/s] 75it [00:07, 9.51it/s] 77it [00:07, 9.29it/s] 78it [00:08, 9.44it/s] 79it [00:08, 9.55it/s] 81it [00:08, 9.32it/s] 82it [00:08, 9.45it/s] 84it [00:08, 9.67it/s] 86it [00:08, 9.81it/s] 88it [00:09, 9.89it/s] 90it [00:09, 9.95it/s] 91it [00:09, 9.95it/s] 93it [00:09, 10.00it/s] 95it [00:09, 9.64it/s] 97it [00:09, 9.78it/s] 98it [00:10, 9.82it/s] 99it [00:10, 9.83it/s] 100it [00:10, 9.46it/s]2025-05-26 03:41:10,205 - INFO - [Epoch 076 | Batch 0100] IWAE-loss 4684.5400 | mean log_px -0.0297 | KL -3118.37 + 101it [00:10, 9.57it/s] 102it [00:10, 9.68it/s] 103it [00:10, 9.74it/s] 104it [00:10, 9.23it/s] 106it [00:10, 9.57it/s] 108it [00:11, 9.75it/s] 109it [00:11, 9.77it/s] 110it [00:11, 9.76it/s] 111it [00:11, 9.40it/s] 113it [00:11, 9.66it/s] 114it [00:11, 9.73it/s] 115it [00:11, 9.78it/s] 116it [00:11, 9.83it/s] 117it [00:12, 9.83it/s] 119it [00:12, 9.94it/s] 120it [00:12, 9.93it/s] 122it [00:12, 9.98it/s] 124it [00:12, 10.00it/s] 126it [00:12, 10.02it/s] 128it [00:13, 10.04it/s] 130it [00:13, 9.69it/s] 132it [00:13, 9.80it/s] 134it [00:13, 9.89it/s] 136it [00:13, 9.94it/s] 137it [00:14, 9.94it/s] 138it [00:14, 9.92it/s] 140it [00:14, 9.97it/s] 142it [00:14, 10.01it/s] 143it [00:14, 9.58it/s] 144it [00:14, 9.66it/s] 146it [00:14, 9.82it/s] 147it [00:15, 9.83it/s] 148it [00:15, 9.46it/s] 150it [00:15, 9.70it/s]2025-05-26 03:41:15,304 - INFO - [Epoch 076 | Batch 0150] IWAE-loss 4113.5596 | mean log_px -0.0186 | KL -3107.95 + 151it [00:15, 9.31it/s] 153it [00:15, 9.60it/s] 154it [00:15, 9.23it/s] 156it [00:16, 9.54it/s] 158it [00:16, 9.73it/s] 159it [00:16, 9.77it/s] 160it [00:16, 9.45it/s] 162it [00:16, 9.68it/s] 164it [00:16, 9.82it/s] 166it [00:17, 9.91it/s] 167it [00:17, 9.60it/s] 169it [00:17, 9.76it/s] 171it [00:17, 9.87it/s] 172it [00:17, 9.88it/s] 173it [00:17, 9.55it/s] 175it [00:17, 9.75it/s] 177it [00:18, 9.57it/s] 179it [00:18, 9.72it/s] 180it [00:18, 9.75it/s] 181it [00:18, 9.32it/s] 182it [00:18, 9.40it/s] 184it [00:18, 9.55it/s] 185it [00:19, 9.58it/s] 186it [00:19, 9.19it/s] 187it [00:19, 9.18it/s] 188it [00:19, 8.85it/s] 189it [00:19, 9.11it/s] 190it [00:19, 9.32it/s] 192it [00:19, 9.65it/s] 194it [00:19, 9.32it/s] 195it [00:20, 8.96it/s] 196it [00:20, 9.11it/s] 196it [00:20, 9.66it/s] +2025-05-26 03:41:20,158 - INFO - Epoch: 76, Objective: tensor([3478.5898], device='cuda:0', grad_fn=), Loss: 0.005448373034596443, KL/n: 63.492427825927734 + 0it [00:00, ?it/s]2025-05-26 03:41:20,427 - INFO - [Epoch 077 | Batch 0000] IWAE-loss 3869.8042 | mean log_px -0.0148 | KL -3113.27 + 1it [00:00, 5.61it/s] 2it [00:00, 6.91it/s] 4it [00:00, 8.61it/s] 6it [00:00, 9.26it/s] 7it [00:00, 9.41it/s] 8it [00:00, 9.56it/s] 9it [00:01, 9.24it/s] 11it [00:01, 9.59it/s] 13it [00:01, 9.78it/s] 15it [00:01, 9.89it/s] 17it [00:01, 9.96it/s] 19it [00:02, 10.00it/s] 20it [00:02, 9.67it/s] 22it [00:02, 9.80it/s] 24it [00:02, 9.91it/s] 26it [00:02, 9.98it/s] 28it [00:02, 10.03it/s] 30it [00:03, 9.77it/s] 32it [00:03, 9.86it/s] 34it [00:03, 9.94it/s] 36it [00:03, 10.00it/s] 38it [00:03, 10.03it/s] 40it [00:04, 9.96it/s] 41it [00:04, 9.56it/s] 42it [00:04, 9.57it/s] 43it [00:04, 9.64it/s] 44it [00:04, 9.72it/s] 46it [00:04, 9.88it/s] 48it [00:04, 9.96it/s] 49it [00:05, 9.95it/s] 50it [00:05, 9.57it/s]2025-05-26 03:41:25,522 - INFO - [Epoch 077 | Batch 0050] IWAE-loss 4025.5740 | mean log_px -0.0166 | KL -3104.95 + 51it [00:05, 9.67it/s] 53it [00:05, 9.36it/s] 54it [00:05, 9.41it/s] 56it [00:05, 9.65it/s] 57it [00:05, 9.36it/s] 58it [00:06, 9.48it/s] 60it [00:06, 9.37it/s] 61it [00:06, 9.46it/s] 63it [00:06, 9.66it/s] 64it [00:06, 9.73it/s] 66it [00:06, 9.87it/s] 68it [00:07, 9.93it/s] 69it [00:07, 9.52it/s] 71it [00:07, 9.72it/s] 72it [00:07, 9.31it/s] 74it [00:07, 9.58it/s] 75it [00:07, 9.66it/s] 77it [00:07, 9.82it/s] 78it [00:08, 9.84it/s] 79it [00:08, 9.40it/s] 80it [00:08, 9.53it/s] 82it [00:08, 9.74it/s] 84it [00:08, 9.85it/s] 86it [00:08, 9.51it/s] 88it [00:09, 9.68it/s] 90it [00:09, 9.80it/s] 92it [00:09, 9.89it/s] 94it [00:09, 9.95it/s] 96it [00:09, 9.91it/s] 97it [00:10, 9.55it/s] 98it [00:10, 9.63it/s] 100it [00:10, 9.80it/s]2025-05-26 03:41:30,693 - INFO - [Epoch 077 | Batch 0100] IWAE-loss 3877.6897 | mean log_px -0.0162 | KL -3102.57 + 101it [00:10, 9.83it/s] 102it [00:10, 9.48it/s] 104it [00:10, 9.69it/s] 106it [00:10, 9.81it/s] 108it [00:11, 9.89it/s] 110it [00:11, 9.95it/s] 112it [00:11, 10.00it/s] 114it [00:11, 10.03it/s] 116it [00:11, 10.04it/s] 118it [00:12, 10.06it/s] 120it [00:12, 10.07it/s] 122it [00:12, 10.07it/s] 124it [00:12, 10.08it/s] 126it [00:12, 10.06it/s] 128it [00:13, 10.05it/s] 130it [00:13, 10.07it/s] 132it [00:13, 10.06it/s] 134it [00:13, 9.79it/s] 135it [00:13, 9.80it/s] 136it [00:13, 9.42it/s] 138it [00:14, 9.64it/s] 139it [00:14, 9.37it/s] 140it [00:14, 9.47it/s] 142it [00:14, 9.70it/s] 143it [00:14, 9.33it/s] 145it [00:14, 9.61it/s] 147it [00:15, 9.78it/s] 149it [00:15, 9.88it/s] 150it [00:15, 9.51it/s]2025-05-26 03:41:35,788 - INFO - [Epoch 077 | Batch 0150] IWAE-loss 3844.5071 | mean log_px -0.0126 | KL -3099.34 + 151it [00:15, 9.58it/s] 153it [00:15, 9.77it/s] 155it [00:15, 9.89it/s] 156it [00:16, 9.48it/s] 158it [00:16, 9.68it/s] 160it [00:16, 9.81it/s] 161it [00:16, 9.83it/s] 163it [00:16, 9.93it/s] 165it [00:16, 9.98it/s] 167it [00:17, 10.03it/s] 169it [00:17, 10.05it/s] 171it [00:17, 10.08it/s] 173it [00:17, 10.09it/s] 175it [00:17, 10.10it/s] 177it [00:18, 9.74it/s] 179it [00:18, 9.84it/s] 181it [00:18, 9.92it/s] 182it [00:18, 9.92it/s] 184it [00:18, 9.98it/s] 185it [00:18, 9.58it/s] 187it [00:19, 9.75it/s] 189it [00:19, 9.86it/s] 191it [00:19, 9.61it/s] 192it [00:19, 9.66it/s] 194it [00:19, 9.75it/s] 195it [00:20, 9.50it/s] 196it [00:20, 9.72it/s] +2025-05-26 03:41:40,460 - INFO - Epoch: 77, Objective: tensor([3908.6809], device='cuda:0', grad_fn=), Loss: 0.015703242272138596, KL/n: 63.27415466308594 + 0it [00:00, ?it/s]2025-05-26 03:41:40,923 - INFO - [Epoch 078 | Batch 0000] IWAE-loss 3679.0872 | mean log_px -0.0106 | KL -3098.49 + 1it [00:00, 4.79it/s] 2it [00:00, 6.84it/s] 4it [00:00, 8.57it/s] 6it [00:00, 9.22it/s] 7it [00:00, 9.03it/s] 8it [00:00, 9.22it/s] 9it [00:01, 9.42it/s] 11it [00:01, 9.71it/s] 13it [00:01, 9.85it/s] 14it [00:01, 9.88it/s] 16it [00:01, 9.95it/s] 18it [00:01, 9.99it/s] 20it [00:02, 10.03it/s] 22it [00:02, 10.05it/s] 24it [00:02, 10.05it/s] 26it [00:02, 10.05it/s] 28it [00:02, 10.06it/s] 30it [00:03, 10.06it/s] 32it [00:03, 10.06it/s] 34it [00:03, 9.77it/s] 36it [00:03, 9.53it/s] 37it [00:03, 9.60it/s] 39it [00:04, 9.76it/s] 40it [00:04, 9.47it/s] 42it [00:04, 9.66it/s] 44it [00:04, 9.79it/s] 46it [00:04, 9.88it/s] 48it [00:04, 9.94it/s] 50it [00:05, 9.98it/s]2025-05-26 03:41:46,006 - INFO - [Epoch 078 | Batch 0050] IWAE-loss 4400.3760 | mean log_px -0.0214 | KL -3091.28 + 52it [00:05, 10.01it/s] 54it [00:05, 10.03it/s] 56it [00:05, 9.78it/s] 58it [00:05, 9.86it/s] 59it [00:06, 9.87it/s] 61it [00:06, 9.89it/s] 62it [00:06, 9.90it/s] 64it [00:06, 9.97it/s] 66it [00:06, 10.00it/s] 68it [00:06, 9.99it/s] 70it [00:07, 10.01it/s] 72it [00:07, 10.03it/s] 74it [00:07, 10.05it/s] 76it [00:07, 9.71it/s] 78it [00:07, 9.81it/s] 80it [00:08, 9.88it/s] 82it [00:08, 9.63it/s] 84it [00:08, 9.75it/s] 85it [00:08, 9.79it/s] 86it [00:08, 9.83it/s] 87it [00:08, 9.84it/s] 88it [00:09, 9.81it/s] 89it [00:09, 9.41it/s] 91it [00:09, 9.69it/s] 92it [00:09, 9.28it/s] 94it [00:09, 9.58it/s] 95it [00:09, 9.23it/s] 97it [00:09, 9.53it/s] 99it [00:10, 9.72it/s] 100it [00:10, 9.77it/s]2025-05-26 03:41:51,119 - INFO - [Epoch 078 | Batch 0100] IWAE-loss 4047.0798 | mean log_px -0.0176 | KL -3091.62 + 101it [00:10, 9.31it/s] 102it [00:10, 9.30it/s] 103it [00:10, 9.34it/s] 104it [00:10, 9.44it/s] 105it [00:10, 9.55it/s] 106it [00:10, 9.62it/s] 107it [00:11, 9.69it/s] 108it [00:11, 9.14it/s] 109it [00:11, 9.33it/s] 110it [00:11, 9.46it/s] 111it [00:11, 9.56it/s] 112it [00:11, 9.61it/s] 113it [00:11, 9.64it/s] 114it [00:11, 9.10it/s] 116it [00:11, 9.53it/s] 118it [00:12, 9.73it/s] 119it [00:12, 9.68it/s] 120it [00:12, 9.70it/s] 121it [00:12, 9.77it/s] 123it [00:12, 9.88it/s] 124it [00:12, 9.90it/s] 126it [00:12, 9.96it/s] 128it [00:13, 10.02it/s] 130it [00:13, 10.03it/s] 132it [00:13, 9.67it/s] 134it [00:13, 9.78it/s] 136it [00:14, 9.87it/s] 138it [00:14, 9.94it/s] 140it [00:14, 9.72it/s] 142it [00:14, 9.82it/s] 144it [00:14, 9.90it/s] 146it [00:15, 9.96it/s] 148it [00:15, 10.00it/s] 150it [00:15, 10.03it/s]2025-05-26 03:41:56,251 - INFO - [Epoch 078 | Batch 0150] IWAE-loss 4209.9824 | mean log_px -0.0231 | KL -3090.24 + 152it [00:15, 9.65it/s] 154it [00:15, 9.79it/s] 156it [00:16, 9.87it/s] 158it [00:16, 9.93it/s] 160it [00:16, 9.97it/s] 162it [00:16, 10.01it/s] 164it [00:16, 9.68it/s] 166it [00:17, 9.81it/s] 168it [00:17, 9.88it/s] 170it [00:17, 9.95it/s] 172it [00:17, 9.99it/s] 174it [00:17, 9.64it/s] 175it [00:17, 9.58it/s] 176it [00:18, 9.44it/s] 177it [00:18, 9.50it/s] 178it [00:18, 9.59it/s] 180it [00:18, 9.34it/s] 182it [00:18, 9.61it/s] 184it [00:18, 9.74it/s] 186it [00:19, 9.65it/s] 188it [00:19, 9.78it/s] 190it [00:19, 9.86it/s] 192it [00:19, 9.66it/s] 193it [00:19, 9.71it/s] 194it [00:19, 9.77it/s] 195it [00:20, 9.47it/s] 196it [00:20, 9.70it/s] +2025-05-26 03:42:00,994 - INFO - Epoch: 78, Objective: tensor([4202.6504], device='cuda:0', grad_fn=), Loss: 0.022261351346969604, KL/n: 63.005916595458984 + 0it [00:00, ?it/s]2025-05-26 03:42:01,262 - INFO - [Epoch 079 | Batch 0000] IWAE-loss 3951.9302 | mean log_px -0.0140 | KL -3084.01 + 1it [00:00, 4.83it/s] 2it [00:00, 6.88it/s] 4it [00:00, 8.59it/s] 6it [00:00, 9.23it/s] 8it [00:00, 9.56it/s] 9it [00:01, 9.62it/s] 10it [00:01, 9.69it/s] 11it [00:01, 9.71it/s] 13it [00:01, 9.40it/s] 14it [00:01, 9.53it/s] 15it [00:01, 9.44it/s] 16it [00:01, 9.58it/s] 18it [00:01, 9.80it/s] 19it [00:02, 9.33it/s] 20it [00:02, 9.49it/s] 21it [00:02, 9.62it/s] 22it [00:02, 9.23it/s] 24it [00:02, 9.56it/s] 26it [00:02, 9.75it/s] 28it [00:02, 9.87it/s] 29it [00:03, 9.47it/s] 30it [00:03, 9.54it/s] 31it [00:03, 9.53it/s] 32it [00:03, 9.14it/s] 34it [00:03, 9.49it/s] 35it [00:03, 9.11it/s] 37it [00:03, 9.45it/s] 39it [00:04, 9.68it/s] 41it [00:04, 9.81it/s] 42it [00:04, 9.82it/s] 44it [00:04, 9.91it/s] 46it [00:04, 9.97it/s] 48it [00:05, 10.01it/s] 50it [00:05, 9.67it/s]2025-05-26 03:42:06,454 - INFO - [Epoch 079 | Batch 0050] IWAE-loss 4607.3691 | mean log_px -0.0238 | KL -3084.28 + 51it [00:05, 9.73it/s] 52it [00:05, 9.78it/s] 54it [00:05, 9.90it/s] 56it [00:05, 9.96it/s] 58it [00:06, 10.00it/s] 60it [00:06, 10.04it/s] 62it [00:06, 10.00it/s] 64it [00:06, 10.02it/s] 66it [00:06, 10.04it/s] 68it [00:07, 10.03it/s] 70it [00:07, 10.05it/s] 72it [00:07, 10.05it/s] 74it [00:07, 10.06it/s] 76it [00:07, 10.08it/s] 78it [00:08, 9.73it/s] 80it [00:08, 9.81it/s] 82it [00:08, 9.90it/s] 84it [00:08, 9.95it/s] 85it [00:08, 9.71it/s] 87it [00:08, 9.83it/s] 88it [00:09, 9.86it/s] 89it [00:09, 9.43it/s] 91it [00:09, 9.67it/s] 93it [00:09, 9.51it/s] 95it [00:09, 9.70it/s] 97it [00:10, 9.82it/s] 99it [00:10, 9.61it/s] 100it [00:10, 9.68it/s]2025-05-26 03:42:11,520 - INFO - [Epoch 079 | Batch 0100] IWAE-loss 4182.2646 | mean log_px -0.0189 | KL -3085.25 + 102it [00:10, 9.51it/s] 104it [00:10, 9.71it/s] 106it [00:10, 9.54it/s] 107it [00:11, 9.57it/s] 108it [00:11, 9.63it/s] 110it [00:11, 9.79it/s] 112it [00:11, 9.87it/s] 114it [00:11, 9.94it/s] 116it [00:11, 9.98it/s] 118it [00:12, 10.02it/s] 120it [00:12, 10.03it/s] 122it [00:12, 10.05it/s] 124it [00:12, 10.05it/s] 126it [00:12, 10.05it/s] 128it [00:13, 9.71it/s] 130it [00:13, 9.81it/s] 131it [00:13, 9.79it/s] 132it [00:13, 9.30it/s] 133it [00:13, 9.37it/s] 134it [00:13, 9.50it/s] 135it [00:13, 9.59it/s] 136it [00:14, 9.24it/s] 137it [00:14, 9.43it/s] 138it [00:14, 9.54it/s] 139it [00:14, 9.63it/s] 140it [00:14, 9.68it/s] 141it [00:14, 9.60it/s] 142it [00:14, 9.58it/s] 143it [00:14, 9.59it/s] 144it [00:14, 9.66it/s] 145it [00:14, 9.69it/s] 146it [00:15, 9.73it/s] 147it [00:15, 9.77it/s] 148it [00:15, 9.77it/s] 149it [00:15, 9.81it/s] 150it [00:15, 9.80it/s]2025-05-26 03:42:16,657 - INFO - [Epoch 079 | Batch 0150] IWAE-loss 3905.8240 | mean log_px -0.0154 | KL -3072.65 + 151it [00:15, 9.80it/s] 152it [00:15, 9.80it/s] 153it [00:15, 9.81it/s] 154it [00:15, 9.82it/s] 155it [00:15, 9.82it/s] 156it [00:16, 9.82it/s] 157it [00:16, 9.84it/s] 158it [00:16, 9.82it/s] 159it [00:16, 9.83it/s] 160it [00:16, 9.82it/s] 161it [00:16, 9.84it/s] 162it [00:16, 9.83it/s] 163it [00:16, 9.84it/s] 164it [00:16, 9.85it/s] 165it [00:16, 9.84it/s] 166it [00:17, 9.84it/s] 167it [00:17, 9.85it/s] 168it [00:17, 9.83it/s] 169it [00:17, 9.83it/s] 170it [00:17, 9.80it/s] 171it [00:17, 9.77it/s] 172it [00:17, 9.78it/s] 173it [00:17, 9.81it/s] 174it [00:17, 9.79it/s] 175it [00:18, 9.78it/s] 176it [00:18, 9.78it/s] 177it [00:18, 9.78it/s] 178it [00:18, 9.78it/s] 179it [00:18, 9.76it/s] 180it [00:18, 9.78it/s] 181it [00:18, 9.78it/s] 182it [00:18, 9.78it/s] 183it [00:18, 9.79it/s] 184it [00:18, 9.81it/s] 185it [00:19, 9.81it/s] 186it [00:19, 9.81it/s] 187it [00:19, 9.82it/s] 188it [00:19, 9.82it/s] 189it [00:19, 9.81it/s] 190it [00:19, 9.80it/s] 191it [00:19, 9.80it/s] 192it [00:19, 9.81it/s] 193it [00:19, 9.82it/s] 194it [00:19, 9.82it/s] 195it [00:20, 9.36it/s] 196it [00:20, 9.69it/s] +2025-05-26 03:42:21,353 - INFO - Epoch: 79, Objective: tensor([3949.7637], device='cuda:0', grad_fn=), Loss: 0.015167269855737686, KL/n: 62.748844146728516 + 0it [00:00, ?it/s]2025-05-26 03:42:21,821 - INFO - [Epoch 080 | Batch 0000] IWAE-loss 4421.7627 | mean log_px -0.0238 | KL -3073.79 + 1it [00:00, 5.17it/s] 2it [00:00, 7.07it/s] 3it [00:00, 8.09it/s] 4it [00:00, 8.69it/s] 5it [00:00, 9.07it/s] 6it [00:00, 9.29it/s] 7it [00:00, 9.40it/s] 8it [00:00, 9.33it/s] 9it [00:01, 9.26it/s] 10it [00:01, 9.10it/s] 11it [00:01, 9.29it/s] 12it [00:01, 9.42it/s] 13it [00:01, 9.53it/s] 14it [00:01, 9.59it/s] 15it [00:01, 9.63it/s] 16it [00:01, 9.68it/s] 17it [00:01, 9.71it/s] 18it [00:01, 9.71it/s] 19it [00:02, 9.74it/s] 20it [00:02, 9.70it/s] 21it [00:02, 9.72it/s] 22it [00:02, 9.32it/s] 23it [00:02, 9.16it/s] 24it [00:02, 9.17it/s] 25it [00:02, 9.30it/s] 26it [00:02, 9.36it/s] 27it [00:02, 9.44it/s] 28it [00:03, 9.48it/s] 29it [00:03, 9.53it/s] 30it [00:03, 9.55it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.57it/s] 33it [00:03, 9.59it/s] 34it [00:03, 9.60it/s] 35it [00:03, 9.52it/s] 36it [00:03, 9.57it/s] 37it [00:03, 9.62it/s] 38it [00:04, 9.64it/s] 39it [00:04, 9.68it/s] 40it [00:04, 9.68it/s] 41it [00:04, 9.72it/s] 42it [00:04, 9.66it/s] 43it [00:04, 9.70it/s] 44it [00:04, 9.71it/s] 45it [00:04, 9.73it/s] 46it [00:04, 9.75it/s] 47it [00:04, 9.77it/s] 48it [00:05, 9.77it/s] 49it [00:05, 9.78it/s] 50it [00:05, 9.75it/s]2025-05-26 03:42:27,036 - INFO - [Epoch 080 | Batch 0050] IWAE-loss 4183.6655 | mean log_px -0.0173 | KL -3067.25 + 51it [00:05, 9.60it/s] 52it [00:05, 9.63it/s] 53it [00:05, 9.68it/s] 54it [00:05, 9.70it/s] 55it [00:05, 9.74it/s] 56it [00:05, 9.74it/s] 57it [00:06, 9.74it/s] 58it [00:06, 9.75it/s] 59it [00:06, 9.78it/s] 60it [00:06, 9.78it/s] 61it [00:06, 9.78it/s] 62it [00:06, 9.78it/s] 63it [00:06, 9.71it/s] 64it [00:06, 9.75it/s] 65it [00:06, 9.81it/s] 66it [00:06, 9.82it/s] 67it [00:07, 9.84it/s] 68it [00:07, 9.84it/s] 69it [00:07, 9.85it/s] 70it [00:07, 9.83it/s] 71it [00:07, 9.84it/s] 72it [00:07, 9.81it/s] 73it [00:07, 9.83it/s] 74it [00:07, 9.84it/s] 75it [00:07, 9.86it/s] 76it [00:07, 9.82it/s] 77it [00:08, 9.85it/s] 78it [00:08, 9.84it/s] 79it [00:08, 9.86it/s] 80it [00:08, 9.88it/s] 81it [00:08, 9.88it/s] 82it [00:08, 9.88it/s] 83it [00:08, 9.89it/s] 84it [00:08, 9.88it/s] 85it [00:08, 9.89it/s] 86it [00:08, 9.87it/s] 87it [00:09, 9.86it/s] 88it [00:09, 9.86it/s] 89it [00:09, 9.88it/s] 90it [00:09, 9.87it/s] 91it [00:09, 9.86it/s] 92it [00:09, 9.85it/s] 93it [00:09, 9.78it/s] 94it [00:09, 9.79it/s] 96it [00:09, 9.91it/s] 97it [00:10, 9.92it/s] 98it [00:10, 9.94it/s] 99it [00:10, 9.37it/s] 100it [00:10, 9.50it/s]2025-05-26 03:42:32,143 - INFO - [Epoch 080 | Batch 0100] IWAE-loss 3951.3103 | mean log_px -0.0163 | KL -3071.85 + 101it [00:10, 9.58it/s] 102it [00:10, 9.66it/s] 103it [00:10, 9.74it/s] 104it [00:10, 9.78it/s] 106it [00:11, 9.42it/s] 107it [00:11, 9.50it/s] 109it [00:11, 9.72it/s] 110it [00:11, 9.70it/s] 112it [00:11, 9.83it/s] 113it [00:11, 9.85it/s] 114it [00:11, 9.87it/s] 115it [00:11, 9.87it/s] 116it [00:12, 9.90it/s] 117it [00:12, 9.32it/s] 118it [00:12, 9.46it/s] 119it [00:12, 9.60it/s] 120it [00:12, 9.66it/s] 121it [00:12, 9.75it/s] 122it [00:12, 9.81it/s] 123it [00:12, 9.85it/s] 124it [00:12, 9.85it/s] 125it [00:12, 9.89it/s] 126it [00:13, 9.24it/s] 127it [00:13, 9.44it/s] 129it [00:13, 9.76it/s] 130it [00:13, 9.80it/s] 131it [00:13, 9.85it/s] 132it [00:13, 9.88it/s] 134it [00:13, 9.96it/s] 135it [00:13, 9.96it/s] 136it [00:14, 9.38it/s] 138it [00:14, 9.67it/s] 139it [00:14, 9.72it/s] 141it [00:14, 9.87it/s] 142it [00:14, 9.87it/s] 144it [00:14, 9.62it/s] 146it [00:15, 9.79it/s] 148it [00:15, 9.90it/s] 150it [00:15, 9.97it/s]2025-05-26 03:42:37,262 - INFO - [Epoch 080 | Batch 0150] IWAE-loss 3631.5173 | mean log_px -0.0095 | KL -3060.06 + 151it [00:15, 9.97it/s] 153it [00:15, 9.65it/s] 154it [00:15, 9.70it/s] 156it [00:16, 9.45it/s] 158it [00:16, 9.65it/s] 160it [00:16, 9.77it/s] 162it [00:16, 9.86it/s] 163it [00:16, 9.76it/s] 164it [00:16, 9.45it/s] 165it [00:17, 9.57it/s] 167it [00:17, 9.78it/s] 169it [00:17, 9.70it/s] 170it [00:17, 9.42it/s] 172it [00:17, 9.67it/s] 173it [00:17, 9.23it/s] 175it [00:18, 9.54it/s] 177it [00:18, 9.73it/s] 179it [00:18, 9.85it/s] 181it [00:18, 9.93it/s] 183it [00:18, 9.99it/s] 185it [00:19, 10.03it/s] 187it [00:19, 10.05it/s] 189it [00:19, 10.06it/s] 191it [00:19, 9.73it/s] 193it [00:19, 9.84it/s] 195it [00:20, 9.34it/s] 196it [00:20, 9.64it/s] +2025-05-26 03:42:42,006 - INFO - Epoch: 80, Objective: tensor([3925.0637], device='cuda:0', grad_fn=), Loss: 0.012692895717918873, KL/n: 62.49341583251953 + 0it [00:00, ?it/s]2025-05-26 03:42:42,279 - INFO - [Epoch 081 | Batch 0000] IWAE-loss 4076.6638 | mean log_px -0.0189 | KL -3062.57 + 1it [00:00, 5.39it/s] 2it [00:00, 7.33it/s] 4it [00:00, 8.85it/s] 6it [00:00, 9.42it/s] 8it [00:00, 9.68it/s] 10it [00:01, 9.84it/s] 12it [00:01, 9.92it/s] 14it [00:01, 9.98it/s] 16it [00:01, 9.67it/s] 18it [00:01, 9.80it/s] 20it [00:02, 9.88it/s] 22it [00:02, 9.51it/s] 24it [00:02, 9.67it/s] 26it [00:02, 9.78it/s] 28it [00:02, 9.87it/s] 30it [00:03, 9.94it/s] 32it [00:03, 9.63it/s] 34it [00:03, 9.75it/s] 36it [00:03, 9.58it/s] 37it [00:03, 9.59it/s] 38it [00:03, 9.66it/s] 39it [00:04, 9.72it/s] 40it [00:04, 9.78it/s] 42it [00:04, 9.90it/s] 43it [00:04, 9.42it/s] 44it [00:04, 9.48it/s] 45it [00:04, 9.58it/s] 47it [00:04, 9.77it/s] 48it [00:05, 9.33it/s] 50it [00:05, 9.61it/s]2025-05-26 03:42:47,404 - INFO - [Epoch 081 | Batch 0050] IWAE-loss 3596.1819 | mean log_px -0.0087 | KL -3056.84 + 51it [00:05, 9.69it/s] 52it [00:05, 9.76it/s] 54it [00:05, 9.87it/s] 55it [00:05, 9.90it/s] 56it [00:05, 9.92it/s] 58it [00:06, 9.97it/s] 59it [00:06, 9.97it/s] 60it [00:06, 9.98it/s] 62it [00:06, 10.00it/s] 64it [00:06, 10.02it/s] 66it [00:06, 10.02it/s] 68it [00:07, 9.66it/s] 69it [00:07, 9.72it/s] 71it [00:07, 9.84it/s] 72it [00:07, 9.86it/s] 74it [00:07, 9.94it/s] 75it [00:07, 9.88it/s] 76it [00:07, 9.87it/s] 78it [00:08, 9.95it/s] 80it [00:08, 9.99it/s] 82it [00:08, 10.02it/s] 84it [00:08, 10.03it/s] 86it [00:08, 10.04it/s] 88it [00:09, 9.69it/s] 90it [00:09, 9.80it/s] 92it [00:09, 9.88it/s] 93it [00:09, 9.52it/s] 94it [00:09, 9.61it/s] 96it [00:09, 9.37it/s] 98it [00:10, 9.58it/s] 99it [00:10, 9.66it/s]2025-05-26 03:42:52,483 - INFO - [Epoch 081 | Batch 0100] IWAE-loss 4514.4556 | mean log_px -0.0243 | KL -3053.01 + 101it [00:10, 9.78it/s] 103it [00:10, 9.87it/s] 104it [00:10, 9.89it/s] 105it [00:10, 9.91it/s] 106it [00:10, 9.92it/s] 107it [00:11, 9.39it/s] 108it [00:11, 9.54it/s] 110it [00:11, 9.74it/s] 112it [00:11, 9.44it/s] 113it [00:11, 9.55it/s] 115it [00:11, 9.74it/s] 117it [00:12, 9.84it/s] 119it [00:12, 9.91it/s] 120it [00:12, 9.90it/s] 122it [00:12, 9.58it/s] 123it [00:12, 9.65it/s] 124it [00:12, 9.73it/s] 125it [00:12, 9.38it/s] 126it [00:12, 9.51it/s] 127it [00:13, 9.60it/s] 128it [00:13, 9.60it/s] 129it [00:13, 9.03it/s] 130it [00:13, 9.15it/s] 131it [00:13, 9.33it/s] 132it [00:13, 8.91it/s] 134it [00:13, 9.40it/s] 136it [00:14, 9.64it/s] 137it [00:14, 9.71it/s] 138it [00:14, 9.77it/s] 140it [00:14, 9.86it/s] 141it [00:14, 9.89it/s] 142it [00:14, 9.91it/s] 144it [00:14, 9.97it/s] 145it [00:14, 9.50it/s] 146it [00:15, 9.61it/s] 147it [00:15, 9.71it/s] 148it [00:15, 9.78it/s] 150it [00:15, 9.90it/s]2025-05-26 03:42:57,655 - INFO - [Epoch 081 | Batch 0150] IWAE-loss 3807.7285 | mean log_px -0.0127 | KL -3054.70 + 151it [00:15, 9.92it/s] 152it [00:15, 9.92it/s] 153it [00:15, 9.37it/s] 154it [00:15, 9.53it/s] 156it [00:16, 9.75it/s] 158it [00:16, 9.87it/s] 160it [00:16, 9.93it/s] 162it [00:16, 9.97it/s] 164it [00:16, 9.95it/s] 165it [00:16, 9.61it/s] 166it [00:17, 9.66it/s] 168it [00:17, 9.80it/s] 169it [00:17, 9.83it/s] 170it [00:17, 9.84it/s] 171it [00:17, 9.35it/s] 172it [00:17, 9.50it/s] 173it [00:17, 9.63it/s] 174it [00:17, 9.72it/s] 175it [00:18, 9.80it/s] 176it [00:18, 9.84it/s] 177it [00:18, 9.28it/s] 178it [00:18, 9.44it/s] 180it [00:18, 9.70it/s] 181it [00:18, 9.75it/s] 182it [00:18, 9.80it/s] 184it [00:18, 9.78it/s] 186it [00:19, 9.83it/s] 187it [00:19, 9.78it/s] 189it [00:19, 9.91it/s] 190it [00:19, 9.92it/s] 191it [00:19, 9.43it/s] 192it [00:19, 9.50it/s] 193it [00:19, 9.62it/s] 194it [00:20, 9.12it/s] 195it [00:20, 8.99it/s] 196it [00:20, 9.66it/s] +2025-05-26 03:43:02,419 - INFO - Epoch: 81, Objective: tensor([4405.5898], device='cuda:0', grad_fn=), Loss: 0.024367935955524445, KL/n: 62.24941635131836 + 0it [00:00, ?it/s]2025-05-26 03:43:02,870 - INFO - [Epoch 082 | Batch 0000] IWAE-loss 4408.0596 | mean log_px -0.0199 | KL -3051.39 + 1it [00:00, 4.79it/s] 2it [00:00, 6.88it/s] 4it [00:00, 8.60it/s] 6it [00:00, 9.28it/s] 8it [00:00, 9.61it/s] 10it [00:01, 9.79it/s] 12it [00:01, 9.91it/s] 14it [00:01, 9.84it/s] 15it [00:01, 9.59it/s] 16it [00:01, 9.67it/s] 17it [00:01, 9.67it/s] 18it [00:01, 9.73it/s] 20it [00:02, 9.91it/s] 22it [00:02, 9.99it/s] 24it [00:02, 10.05it/s] 26it [00:02, 10.09it/s] 28it [00:02, 10.11it/s] 30it [00:03, 9.84it/s] 32it [00:03, 9.92it/s] 34it [00:03, 9.98it/s] 36it [00:03, 10.03it/s] 38it [00:03, 9.78it/s] 40it [00:04, 9.90it/s] 42it [00:04, 9.98it/s] 44it [00:04, 10.02it/s] 46it [00:04, 9.81it/s] 48it [00:04, 9.91it/s] 50it [00:05, 9.99it/s]2025-05-26 03:43:07,919 - INFO - [Epoch 082 | Batch 0050] IWAE-loss 4216.4087 | mean log_px -0.0181 | KL -3045.86 + 51it [00:05, 9.98it/s] 52it [00:05, 9.92it/s] 54it [00:05, 9.99it/s] 56it [00:05, 10.04it/s] 58it [00:05, 10.07it/s] 60it [00:06, 10.09it/s] 62it [00:06, 10.10it/s] 64it [00:06, 9.73it/s] 66it [00:06, 9.85it/s] 68it [00:06, 9.65it/s] 70it [00:07, 9.79it/s] 71it [00:07, 9.52it/s] 73it [00:07, 9.71it/s] 75it [00:07, 9.84it/s] 77it [00:07, 9.92it/s] 79it [00:08, 9.99it/s] 81it [00:08, 10.05it/s] 83it [00:08, 9.73it/s] 85it [00:08, 9.85it/s] 87it [00:08, 9.93it/s] 89it [00:09, 9.98it/s] 91it [00:09, 10.02it/s] 93it [00:09, 10.04it/s] 95it [00:09, 10.07it/s] 97it [00:09, 9.80it/s] 98it [00:09, 9.80it/s] 100it [00:10, 9.91it/s]2025-05-26 03:43:12,972 - INFO - [Epoch 082 | Batch 0100] IWAE-loss 4081.9727 | mean log_px -0.0158 | KL -3040.89 + 102it [00:10, 9.62it/s] 104it [00:10, 9.77it/s] 105it [00:10, 9.52it/s] 107it [00:10, 9.72it/s] 109it [00:11, 9.86it/s] 111it [00:11, 9.94it/s] 113it [00:11, 10.00it/s] 115it [00:11, 10.02it/s] 116it [00:11, 9.98it/s] 117it [00:11, 9.60it/s] 118it [00:12, 9.67it/s] 119it [00:12, 9.71it/s] 120it [00:12, 9.74it/s] 121it [00:12, 9.34it/s] 122it [00:12, 9.50it/s] 123it [00:12, 9.63it/s] 124it [00:12, 9.71it/s] 125it [00:12, 9.74it/s] 126it [00:12, 9.79it/s] 127it [00:12, 9.84it/s] 128it [00:13, 9.87it/s] 129it [00:13, 9.25it/s] 130it [00:13, 9.45it/s] 132it [00:13, 9.71it/s] 133it [00:13, 9.39it/s] 134it [00:13, 9.46it/s] 135it [00:13, 9.03it/s] 136it [00:13, 9.26it/s] 137it [00:14, 9.37it/s] 138it [00:14, 9.07it/s] 139it [00:14, 9.26it/s] 140it [00:14, 9.45it/s] 141it [00:14, 9.54it/s] 142it [00:14, 9.64it/s] 143it [00:14, 9.42it/s] 144it [00:14, 8.99it/s] 145it [00:14, 8.90it/s] 146it [00:15, 8.52it/s] 147it [00:15, 8.83it/s] 148it [00:15, 9.03it/s] 149it [00:15, 9.23it/s] 150it [00:15, 9.38it/s]2025-05-26 03:43:18,240 - INFO - [Epoch 082 | Batch 0150] IWAE-loss 3857.5825 | mean log_px -0.0146 | KL -3036.50 + 151it [00:15, 9.47it/s] 152it [00:15, 9.09it/s] 153it [00:15, 9.21it/s] 154it [00:15, 9.31it/s] 155it [00:16, 8.86it/s] 156it [00:16, 9.05it/s] 157it [00:16, 9.18it/s] 158it [00:16, 9.28it/s] 159it [00:16, 9.26it/s] 160it [00:16, 8.74it/s] 161it [00:16, 9.04it/s] 162it [00:16, 9.20it/s] 163it [00:16, 9.25it/s] 164it [00:16, 9.38it/s] 165it [00:17, 8.88it/s] 166it [00:17, 9.06it/s] 167it [00:17, 9.20it/s] 168it [00:17, 9.25it/s] 169it [00:17, 9.37it/s] 170it [00:17, 8.82it/s] 171it [00:17, 9.05it/s] 172it [00:17, 9.16it/s] 173it [00:17, 9.30it/s] 174it [00:18, 9.47it/s] 175it [00:18, 9.57it/s] 176it [00:18, 9.65it/s] 177it [00:18, 9.73it/s] 178it [00:18, 9.26it/s] 179it [00:18, 9.36it/s] 180it [00:18, 9.49it/s] 181it [00:18, 8.85it/s] 182it [00:18, 8.99it/s] 183it [00:19, 8.74it/s] 184it [00:19, 8.98it/s] 185it [00:19, 9.20it/s] 186it [00:19, 9.29it/s] 187it [00:19, 9.41it/s] 188it [00:19, 9.48it/s] 189it [00:19, 8.94it/s] 190it [00:19, 9.10it/s] 191it [00:19, 9.21it/s] 192it [00:20, 9.30it/s] 193it [00:20, 8.94it/s] 194it [00:20, 9.10it/s] 195it [00:20, 8.76it/s] 196it [00:20, 9.05it/s] 196it [00:20, 9.54it/s] +2025-05-26 03:43:23,266 - INFO - Epoch: 82, Objective: tensor([3370.0046], device='cuda:0', grad_fn=), Loss: 0.005570830777287483, KL/n: 62.00031280517578 + 0it [00:00, ?it/s]2025-05-26 03:43:23,523 - INFO - [Epoch 083 | Batch 0000] IWAE-loss 4002.6240 | mean log_px -0.0153 | KL -3036.43 + 1it [00:00, 5.20it/s] 2it [00:00, 7.09it/s] 3it [00:00, 8.03it/s] 4it [00:00, 8.54it/s] 5it [00:00, 8.84it/s] 6it [00:00, 8.89it/s] 7it [00:00, 9.09it/s] 8it [00:00, 9.18it/s] 9it [00:01, 9.30it/s] 10it [00:01, 9.43it/s] 11it [00:01, 9.44it/s] 12it [00:01, 9.08it/s] 13it [00:01, 9.15it/s] 14it [00:01, 9.28it/s] 15it [00:01, 9.35it/s] 16it [00:01, 9.39it/s] 17it [00:01, 9.43it/s] 18it [00:02, 9.46it/s] 19it [00:02, 9.49it/s] 20it [00:02, 9.53it/s] 21it [00:02, 9.55it/s] 22it [00:02, 9.57it/s] 23it [00:02, 9.57it/s] 24it [00:02, 9.62it/s] 25it [00:02, 9.59it/s] 26it [00:02, 9.58it/s] 27it [00:02, 9.01it/s] 28it [00:03, 9.16it/s] 29it [00:03, 9.28it/s] 30it [00:03, 9.35it/s] 31it [00:03, 8.71it/s] 32it [00:03, 8.75it/s] 33it [00:03, 8.95it/s] 34it [00:03, 9.17it/s] 35it [00:03, 9.33it/s] 36it [00:03, 9.45it/s] 37it [00:04, 9.01it/s] 38it [00:04, 9.16it/s] 39it [00:04, 9.29it/s] 40it [00:04, 9.30it/s] 41it [00:04, 9.36it/s] 42it [00:04, 8.79it/s] 43it [00:04, 8.98it/s] 44it [00:04, 9.16it/s] 45it [00:04, 9.28it/s] 46it [00:05, 9.39it/s] 47it [00:05, 9.41it/s] 48it [00:05, 9.47it/s] 49it [00:05, 9.54it/s] 50it [00:05, 9.54it/s]2025-05-26 03:43:28,911 - INFO - [Epoch 083 | Batch 0050] IWAE-loss 3834.6262 | mean log_px -0.0148 | KL -3028.71 + 51it [00:05, 9.56it/s] 52it [00:05, 9.53it/s] 53it [00:05, 9.05it/s] 54it [00:05, 9.24it/s] 55it [00:05, 9.37it/s] 56it [00:06, 8.95it/s] 57it [00:06, 8.78it/s] 58it [00:06, 8.88it/s] 59it [00:06, 9.02it/s] 60it [00:06, 9.21it/s] 61it [00:06, 8.79it/s] 62it [00:06, 9.01it/s] 63it [00:06, 9.18it/s] 64it [00:06, 9.06it/s] 65it [00:07, 9.23it/s] 66it [00:07, 9.38it/s] 67it [00:07, 8.97it/s] 68it [00:07, 9.12it/s] 69it [00:07, 9.31it/s] 70it [00:07, 9.43it/s] 71it [00:07, 9.52it/s] 72it [00:07, 9.57it/s] 73it [00:07, 9.64it/s] 74it [00:08, 9.63it/s] 75it [00:08, 9.69it/s] 76it [00:08, 9.71it/s] 77it [00:08, 9.68it/s] 78it [00:08, 9.69it/s] 79it [00:08, 9.71it/s] 80it [00:08, 9.73it/s] 81it [00:08, 9.70it/s] 82it [00:08, 9.69it/s] 83it [00:08, 9.72it/s] 84it [00:09, 9.67it/s] 85it [00:09, 9.68it/s] 86it [00:09, 9.68it/s] 87it [00:09, 9.68it/s] 88it [00:09, 9.70it/s] 89it [00:09, 9.71it/s] 90it [00:09, 9.70it/s] 91it [00:09, 9.71it/s] 92it [00:09, 9.72it/s] 93it [00:10, 9.70it/s] 94it [00:10, 9.70it/s] 95it [00:10, 9.70it/s] 96it [00:10, 9.69it/s] 97it [00:10, 9.74it/s] 98it [00:10, 9.71it/s] 99it [00:10, 9.71it/s] 100it [00:10, 9.69it/s]2025-05-26 03:43:34,190 - INFO - [Epoch 083 | Batch 0100] IWAE-loss 4239.6172 | mean log_px -0.0240 | KL -3028.14 + 101it [00:10, 9.54it/s] 102it [00:10, 9.60it/s] 103it [00:11, 9.63it/s] 104it [00:11, 9.67it/s] 105it [00:11, 9.66it/s] 106it [00:11, 9.69it/s] 107it [00:11, 9.72it/s] 108it [00:11, 9.72it/s] 109it [00:11, 9.73it/s] 110it [00:11, 9.70it/s] 111it [00:11, 9.70it/s] 112it [00:11, 9.69it/s] 113it [00:12, 9.60it/s] 114it [00:12, 9.59it/s] 115it [00:12, 9.61it/s] 116it [00:12, 9.65it/s] 117it [00:12, 9.70it/s] 118it [00:12, 9.68it/s] 119it [00:12, 9.69it/s] 120it [00:12, 9.68it/s] 121it [00:12, 9.68it/s] 122it [00:13, 9.72it/s] 123it [00:13, 9.73it/s] 124it [00:13, 9.74it/s] 125it [00:13, 9.74it/s] 126it [00:13, 9.73it/s] 127it [00:13, 9.73it/s] 128it [00:13, 9.74it/s] 129it [00:13, 9.77it/s] 130it [00:13, 9.74it/s] 131it [00:13, 9.75it/s] 132it [00:14, 9.74it/s] 133it [00:14, 9.75it/s] 134it [00:14, 9.72it/s] 135it [00:14, 9.73it/s] 136it [00:14, 9.71it/s] 137it [00:14, 9.71it/s] 138it [00:14, 9.73it/s] 139it [00:14, 9.76it/s] 140it [00:14, 9.77it/s] 141it [00:14, 9.79it/s] 142it [00:15, 9.76it/s] 143it [00:15, 9.77it/s] 144it [00:15, 9.77it/s] 145it [00:15, 9.78it/s] 146it [00:15, 9.77it/s] 147it [00:15, 9.69it/s] 148it [00:15, 9.70it/s] 149it [00:15, 9.10it/s] 150it [00:15, 9.29it/s]2025-05-26 03:43:39,363 - INFO - [Epoch 083 | Batch 0150] IWAE-loss 3907.8083 | mean log_px -0.0154 | KL -3022.59 + 151it [00:16, 9.40it/s] 152it [00:16, 9.52it/s] 153it [00:16, 9.60it/s] 154it [00:16, 9.65it/s] 155it [00:16, 9.70it/s] 156it [00:16, 9.71it/s] 157it [00:16, 9.70it/s] 158it [00:16, 9.69it/s] 159it [00:16, 9.72it/s] 160it [00:16, 9.12it/s] 161it [00:17, 9.32it/s] 162it [00:17, 9.46it/s] 163it [00:17, 9.56it/s] 164it [00:17, 9.60it/s] 165it [00:17, 9.67it/s] 166it [00:17, 9.71it/s] 167it [00:17, 9.73it/s] 168it [00:17, 9.70it/s] 169it [00:17, 9.66it/s] 170it [00:17, 9.64it/s] 171it [00:18, 9.63it/s] 172it [00:18, 9.64it/s] 173it [00:18, 9.68it/s] 174it [00:18, 9.68it/s] 175it [00:18, 9.09it/s] 176it [00:18, 9.28it/s] 177it [00:18, 9.43it/s] 178it [00:18, 9.54it/s] 179it [00:18, 9.59it/s] 180it [00:19, 9.66it/s] 181it [00:19, 9.68it/s] 182it [00:19, 9.70it/s] 183it [00:19, 9.71it/s] 184it [00:19, 9.16it/s] 185it [00:19, 9.29it/s] 186it [00:19, 9.43it/s] 187it [00:19, 9.52it/s] 188it [00:19, 9.58it/s] 189it [00:19, 9.61it/s] 190it [00:20, 9.57it/s] 191it [00:20, 9.61it/s] 192it [00:20, 9.62it/s] 193it [00:20, 9.64it/s] 194it [00:20, 9.62it/s] 195it [00:20, 9.07it/s] 196it [00:20, 9.44it/s] +2025-05-26 03:43:44,162 - INFO - Epoch: 83, Objective: tensor([3918.3167], device='cuda:0', grad_fn=), Loss: 0.013034864328801632, KL/n: 61.751060485839844 + 0it [00:00, ?it/s]2025-05-26 03:43:44,615 - INFO - [Epoch 084 | Batch 0000] IWAE-loss 3879.0281 | mean log_px -0.0132 | KL -3020.57 + 1it [00:00, 4.71it/s] 2it [00:00, 6.69it/s] 3it [00:00, 7.82it/s] 4it [00:00, 8.47it/s] 5it [00:00, 8.90it/s] 6it [00:00, 9.18it/s] 7it [00:00, 9.38it/s] 8it [00:00, 9.47it/s] 9it [00:01, 9.55it/s] 10it [00:01, 9.63it/s] 11it [00:01, 9.06it/s] 12it [00:01, 9.27it/s] 13it [00:01, 9.40it/s] 14it [00:01, 9.50it/s] 15it [00:01, 9.63it/s] 16it [00:01, 9.68it/s] 17it [00:01, 9.71it/s] 18it [00:01, 9.72it/s] 19it [00:02, 9.73it/s] 20it [00:02, 9.76it/s] 21it [00:02, 9.75it/s] 22it [00:02, 9.76it/s] 23it [00:02, 9.04it/s] 24it [00:02, 9.23it/s] 25it [00:02, 9.40it/s] 26it [00:02, 9.51it/s] 27it [00:02, 9.53it/s] 28it [00:03, 9.60it/s] 29it [00:03, 9.69it/s] 30it [00:03, 9.70it/s] 31it [00:03, 9.26it/s] 32it [00:03, 9.42it/s] 33it [00:03, 9.55it/s] 34it [00:03, 9.60it/s] 35it [00:03, 9.67it/s] 36it [00:03, 9.64it/s] 37it [00:03, 9.69it/s] 38it [00:04, 9.29it/s] 39it [00:04, 9.46it/s] 40it [00:04, 9.54it/s] 41it [00:04, 9.62it/s] 42it [00:04, 9.65it/s] 43it [00:04, 9.73it/s] 44it [00:04, 9.20it/s] 45it [00:04, 9.36it/s] 46it [00:04, 9.42it/s] 47it [00:05, 9.54it/s] 48it [00:05, 9.58it/s] 49it [00:05, 9.62it/s] 50it [00:05, 9.08it/s]2025-05-26 03:43:49,897 - INFO - [Epoch 084 | Batch 0050] IWAE-loss 3803.3413 | mean log_px -0.0113 | KL -3022.37 + 51it [00:05, 9.09it/s] 52it [00:05, 9.26it/s] 53it [00:05, 9.42it/s] 54it [00:05, 9.52it/s] 55it [00:05, 9.54it/s] 56it [00:05, 9.62it/s] 57it [00:06, 9.62it/s] 58it [00:06, 9.55it/s] 59it [00:06, 9.52it/s] 60it [00:06, 8.93it/s] 61it [00:06, 8.59it/s] 62it [00:06, 8.76it/s] 63it [00:06, 8.95it/s] 64it [00:06, 9.08it/s] 65it [00:06, 9.20it/s] 66it [00:07, 9.25it/s] 67it [00:07, 9.31it/s] 68it [00:07, 9.35it/s] 69it [00:07, 9.36it/s] 70it [00:07, 9.36it/s] 71it [00:07, 9.46it/s] 72it [00:07, 9.44it/s] 73it [00:07, 9.40it/s] 74it [00:07, 9.40it/s] 75it [00:08, 9.43it/s] 76it [00:08, 9.49it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.53it/s] 79it [00:08, 9.53it/s] 80it [00:08, 9.53it/s] 81it [00:08, 8.99it/s] 82it [00:08, 9.12it/s] 83it [00:08, 9.16it/s] 84it [00:09, 9.25it/s] 85it [00:09, 9.33it/s] 86it [00:09, 9.38it/s] 87it [00:09, 9.47it/s] 88it [00:09, 9.02it/s] 89it [00:09, 9.14it/s] 90it [00:09, 9.22it/s] 91it [00:09, 9.29it/s] 92it [00:09, 8.81it/s] 93it [00:09, 9.00it/s] 94it [00:10, 9.08it/s] 95it [00:10, 9.08it/s] 96it [00:10, 8.60it/s] 97it [00:10, 8.83it/s] 98it [00:10, 8.67it/s] 99it [00:10, 8.97it/s] 100it [00:10, 9.21it/s]2025-05-26 03:43:55,307 - INFO - [Epoch 084 | Batch 0100] IWAE-loss 6303.6221 | mean log_px -0.0504 | KL -3017.94 + 101it [00:10, 9.40it/s] 102it [00:11, 8.91it/s] 103it [00:11, 9.16it/s] 104it [00:11, 9.36it/s] 105it [00:11, 9.46it/s] 106it [00:11, 9.04it/s] 107it [00:11, 9.29it/s] 108it [00:11, 9.48it/s] 109it [00:11, 9.59it/s] 110it [00:11, 9.68it/s] 111it [00:11, 9.75it/s] 112it [00:12, 9.81it/s] 113it [00:12, 9.86it/s] 114it [00:12, 9.84it/s] 115it [00:12, 9.87it/s] 116it [00:12, 9.25it/s] 117it [00:12, 9.38it/s] 118it [00:12, 9.49it/s] 119it [00:12, 9.60it/s] 120it [00:12, 9.66it/s] 121it [00:12, 9.69it/s] 122it [00:13, 9.74it/s] 123it [00:13, 9.76it/s] 124it [00:13, 9.78it/s] 125it [00:13, 9.78it/s] 126it [00:13, 9.78it/s] 127it [00:13, 9.79it/s] 128it [00:13, 9.80it/s] 129it [00:13, 9.11it/s] 130it [00:13, 9.30it/s] 131it [00:14, 9.33it/s] 132it [00:14, 9.21it/s] 133it [00:14, 8.76it/s] 134it [00:14, 9.03it/s] 135it [00:14, 9.27it/s] 136it [00:14, 9.35it/s] 137it [00:14, 9.46it/s] 138it [00:14, 9.57it/s] 139it [00:14, 9.63it/s] 140it [00:14, 9.66it/s] 141it [00:15, 9.70it/s] 142it [00:15, 9.19it/s] 143it [00:15, 9.30it/s] 144it [00:15, 9.42it/s] 145it [00:15, 9.51it/s] 146it [00:15, 9.57it/s] 147it [00:15, 9.66it/s] 148it [00:15, 9.69it/s] 149it [00:15, 9.73it/s] 150it [00:16, 9.77it/s]2025-05-26 03:44:00,558 - INFO - [Epoch 084 | Batch 0150] IWAE-loss 3802.7544 | mean log_px -0.0130 | KL -3015.59 + 151it [00:16, 9.78it/s] 152it [00:16, 9.78it/s] 153it [00:16, 9.78it/s] 154it [00:16, 9.79it/s] 155it [00:16, 9.79it/s] 156it [00:16, 9.80it/s] 157it [00:16, 9.82it/s] 158it [00:16, 9.82it/s] 159it [00:16, 9.82it/s] 160it [00:17, 9.81it/s] 161it [00:17, 9.83it/s] 162it [00:17, 9.80it/s] 163it [00:17, 9.81it/s] 164it [00:17, 9.17it/s] 165it [00:17, 9.34it/s] 166it [00:17, 9.48it/s] 167it [00:17, 9.57it/s] 168it [00:17, 9.62it/s] 169it [00:17, 9.70it/s] 170it [00:18, 9.68it/s] 171it [00:18, 9.71it/s] 172it [00:18, 9.75it/s] 173it [00:18, 9.77it/s] 174it [00:18, 9.77it/s] 175it [00:18, 9.67it/s] 176it [00:18, 9.70it/s] 177it [00:18, 9.74it/s] 178it [00:18, 9.72it/s] 179it [00:19, 9.24it/s] 180it [00:19, 9.34it/s] 181it [00:19, 9.51it/s] 182it [00:19, 9.60it/s] 183it [00:19, 9.68it/s] 184it [00:19, 9.23it/s] 185it [00:19, 9.39it/s] 186it [00:19, 9.53it/s] 187it [00:19, 9.37it/s] 188it [00:19, 9.50it/s] 189it [00:20, 9.59it/s] 190it [00:20, 9.15it/s] 191it [00:20, 9.37it/s] 192it [00:20, 9.48it/s] 193it [00:20, 9.56it/s] 194it [00:20, 9.65it/s] 195it [00:20, 9.11it/s] 196it [00:20, 9.38it/s] +2025-05-26 03:44:05,369 - INFO - Epoch: 84, Objective: tensor([4500.4517], device='cuda:0', grad_fn=), Loss: 0.03310453146696091, KL/n: 61.500885009765625 + 0it [00:00, ?it/s]2025-05-26 03:44:05,644 - INFO - [Epoch 085 | Batch 0000] IWAE-loss 3595.1533 | mean log_px -0.0110 | KL -3013.15 + 1it [00:00, 4.83it/s] 2it [00:00, 6.83it/s] 3it [00:00, 7.79it/s] 4it [00:00, 8.48it/s] 5it [00:00, 8.93it/s] 6it [00:00, 9.23it/s] 7it [00:00, 9.17it/s] 8it [00:00, 9.34it/s] 9it [00:01, 9.44it/s] 10it [00:01, 9.54it/s] 11it [00:01, 9.66it/s] 12it [00:01, 9.67it/s] 13it [00:01, 9.69it/s] 14it [00:01, 9.71it/s] 15it [00:01, 9.71it/s] 16it [00:01, 9.72it/s] 17it [00:01, 9.75it/s] 18it [00:01, 9.75it/s] 19it [00:02, 9.77it/s] 20it [00:02, 9.79it/s] 21it [00:02, 9.76it/s] 22it [00:02, 9.77it/s] 23it [00:02, 9.78it/s] 24it [00:02, 9.80it/s] 25it [00:02, 9.85it/s] 26it [00:02, 9.80it/s] 27it [00:02, 9.79it/s] 28it [00:02, 9.78it/s] 29it [00:03, 9.80it/s] 30it [00:03, 9.60it/s] 31it [00:03, 9.56it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.48it/s] 34it [00:03, 9.49it/s] 35it [00:03, 9.43it/s] 36it [00:03, 9.40it/s] 37it [00:03, 9.47it/s] 38it [00:04, 9.47it/s] 39it [00:04, 8.84it/s] 40it [00:04, 9.03it/s] 41it [00:04, 9.17it/s] 42it [00:04, 9.25it/s] 43it [00:04, 9.28it/s] 44it [00:04, 9.33it/s] 45it [00:04, 8.88it/s] 46it [00:04, 9.06it/s] 47it [00:05, 9.21it/s] 48it [00:05, 9.24it/s] 49it [00:05, 9.29it/s] 50it [00:05, 9.34it/s]2025-05-26 03:44:10,938 - INFO - [Epoch 085 | Batch 0050] IWAE-loss 3756.6094 | mean log_px -0.0141 | KL -3010.08 + 51it [00:05, 8.49it/s] 52it [00:05, 8.88it/s] 53it [00:05, 9.19it/s] 54it [00:05, 9.40it/s] 55it [00:05, 9.56it/s] 56it [00:05, 9.67it/s] 57it [00:06, 9.74it/s] 58it [00:06, 9.78it/s] 59it [00:06, 9.81it/s] 60it [00:06, 9.85it/s] 61it [00:06, 9.89it/s] 62it [00:06, 9.91it/s] 64it [00:06, 9.96it/s] 66it [00:07, 9.96it/s] 68it [00:07, 9.97it/s] 69it [00:07, 9.96it/s] 70it [00:07, 9.96it/s] 72it [00:07, 9.97it/s] 73it [00:07, 9.97it/s] 74it [00:07, 9.96it/s] 75it [00:07, 9.96it/s] 76it [00:08, 9.96it/s] 77it [00:08, 9.95it/s] 78it [00:08, 9.94it/s] 80it [00:08, 9.96it/s] 81it [00:08, 9.94it/s] 82it [00:08, 9.77it/s] 83it [00:08, 9.42it/s] 84it [00:08, 9.45it/s] 85it [00:08, 9.26it/s] 86it [00:09, 9.29it/s] 87it [00:09, 9.13it/s] 88it [00:09, 9.16it/s] 89it [00:09, 9.25it/s] 90it [00:09, 9.26it/s] 91it [00:09, 9.24it/s] 92it [00:09, 9.30it/s] 93it [00:09, 9.36it/s] 94it [00:09, 9.38it/s] 95it [00:10, 9.44it/s] 96it [00:10, 9.41it/s] 97it [00:10, 9.44it/s] 98it [00:10, 9.35it/s] 99it [00:10, 9.31it/s] 100it [00:10, 9.24it/s]2025-05-26 03:44:16,136 - INFO - [Epoch 085 | Batch 0100] IWAE-loss 3645.5867 | mean log_px -0.0103 | KL -3006.17 + 101it [00:10, 9.21it/s] 102it [00:10, 9.16it/s] 103it [00:10, 9.27it/s] 104it [00:10, 9.32it/s] 105it [00:11, 9.35it/s] 106it [00:11, 9.38it/s] 107it [00:11, 9.41it/s] 108it [00:11, 9.39it/s] 109it [00:11, 9.46it/s] 110it [00:11, 9.47it/s] 111it [00:11, 9.51it/s] 112it [00:11, 9.51it/s] 113it [00:11, 9.47it/s] 114it [00:12, 9.45it/s] 115it [00:12, 9.29it/s] 116it [00:12, 9.34it/s] 117it [00:12, 9.31it/s] 118it [00:12, 9.23it/s] 119it [00:12, 9.30it/s] 120it [00:12, 9.37it/s] 121it [00:12, 9.39it/s] 122it [00:12, 9.39it/s] 123it [00:13, 9.42it/s] 124it [00:13, 9.44it/s] 125it [00:13, 9.50it/s] 126it [00:13, 9.39it/s] 127it [00:13, 9.34it/s] 128it [00:13, 9.39it/s] 129it [00:13, 9.39it/s] 130it [00:13, 8.92it/s] 131it [00:13, 9.19it/s] 132it [00:13, 9.36it/s] 133it [00:14, 9.51it/s] 134it [00:14, 9.33it/s] 135it [00:14, 9.26it/s] 136it [00:14, 9.37it/s] 137it [00:14, 9.51it/s] 138it [00:14, 9.57it/s] 139it [00:14, 9.62it/s] 140it [00:14, 9.62it/s] 141it [00:14, 9.68it/s] 142it [00:15, 9.70it/s] 143it [00:15, 9.75it/s] 144it [00:15, 9.75it/s] 145it [00:15, 9.75it/s] 146it [00:15, 9.63it/s] 147it [00:15, 9.71it/s] 148it [00:15, 9.76it/s] 149it [00:15, 9.76it/s] 150it [00:15, 9.76it/s]2025-05-26 03:44:21,413 - INFO - [Epoch 085 | Batch 0150] IWAE-loss 4150.4175 | mean log_px -0.0174 | KL -3003.18 + 151it [00:15, 9.78it/s] 152it [00:16, 9.78it/s] 153it [00:16, 9.59it/s] 154it [00:16, 9.58it/s] 155it [00:16, 9.67it/s] 156it [00:16, 9.71it/s] 157it [00:16, 9.27it/s] 158it [00:16, 9.32it/s] 159it [00:16, 9.43it/s] 160it [00:16, 9.46it/s] 161it [00:17, 9.52it/s] 162it [00:17, 9.49it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.51it/s] 165it [00:17, 9.53it/s] 166it [00:17, 9.52it/s] 167it [00:17, 9.54it/s] 168it [00:17, 9.53it/s] 169it [00:17, 9.54it/s] 170it [00:17, 9.49it/s] 171it [00:18, 9.49it/s] 172it [00:18, 9.50it/s] 173it [00:18, 9.51it/s] 174it [00:18, 9.50it/s] 175it [00:18, 9.53it/s] 176it [00:18, 9.49it/s] 177it [00:18, 9.52it/s] 178it [00:18, 9.48it/s] 179it [00:18, 9.49it/s] 180it [00:19, 9.50it/s] 181it [00:19, 9.54it/s] 182it [00:19, 9.50it/s] 183it [00:19, 9.52it/s] 184it [00:19, 9.49it/s] 185it [00:19, 9.49it/s] 186it [00:19, 9.50it/s] 187it [00:19, 9.53it/s] 188it [00:19, 9.49it/s] 189it [00:19, 9.53it/s] 190it [00:20, 9.50it/s] 191it [00:20, 9.48it/s] 192it [00:20, 9.51it/s] 193it [00:20, 9.54it/s] 194it [00:20, 9.53it/s] 195it [00:20, 8.91it/s] 196it [00:20, 9.12it/s] 196it [00:20, 9.44it/s] +2025-05-26 03:44:26,270 - INFO - Epoch: 85, Objective: tensor([3568.9839], device='cuda:0', grad_fn=), Loss: 0.01087101548910141, KL/n: 61.26937484741211 + 0it [00:00, ?it/s]2025-05-26 03:44:26,739 - INFO - [Epoch 086 | Batch 0000] IWAE-loss 3738.7234 | mean log_px -0.0156 | KL -3002.08 + 1it [00:00, 4.69it/s] 2it [00:00, 6.14it/s] 3it [00:00, 7.42it/s] 4it [00:00, 7.75it/s] 5it [00:00, 8.40it/s] 6it [00:00, 8.81it/s] 7it [00:00, 9.10it/s] 8it [00:00, 8.78it/s] 9it [00:01, 9.07it/s] 10it [00:01, 9.30it/s] 11it [00:01, 9.49it/s] 12it [00:01, 9.57it/s] 13it [00:01, 8.95it/s] 14it [00:01, 9.12it/s] 15it [00:01, 9.33it/s] 16it [00:01, 9.44it/s] 17it [00:01, 9.56it/s] 18it [00:02, 9.01it/s] 19it [00:02, 9.25it/s] 20it [00:02, 9.43it/s] 21it [00:02, 9.57it/s] 22it [00:02, 9.58it/s] 23it [00:02, 9.10it/s] 24it [00:02, 9.28it/s] 25it [00:02, 9.40it/s] 26it [00:02, 9.50it/s] 27it [00:03, 9.55it/s] 28it [00:03, 9.61it/s] 29it [00:03, 9.51it/s] 30it [00:03, 8.92it/s] 31it [00:03, 8.93it/s] 32it [00:03, 9.14it/s] 33it [00:03, 9.16it/s] 34it [00:03, 8.96it/s] 36it [00:04, 9.00it/s] 38it [00:04, 9.38it/s] 40it [00:04, 9.63it/s] 42it [00:04, 9.77it/s] 44it [00:04, 9.88it/s] 46it [00:04, 9.95it/s] 48it [00:05, 10.01it/s] 50it [00:05, 10.04it/s]2025-05-26 03:44:32,049 - INFO - [Epoch 086 | Batch 0050] IWAE-loss 3615.4333 | mean log_px -0.0113 | KL -2999.07 + 52it [00:05, 9.70it/s] 53it [00:05, 9.68it/s] 55it [00:05, 9.76it/s] 56it [00:06, 9.79it/s] 58it [00:06, 9.90it/s] 60it [00:06, 9.98it/s] 62it [00:06, 10.02it/s] 64it [00:06, 10.05it/s] 66it [00:07, 10.07it/s] 68it [00:07, 10.08it/s] 70it [00:07, 10.09it/s] 72it [00:07, 10.09it/s] 74it [00:07, 9.80it/s] 76it [00:08, 9.89it/s] 77it [00:08, 9.54it/s] 79it [00:08, 9.71it/s] 81it [00:08, 9.82it/s] 83it [00:08, 9.90it/s] 85it [00:08, 9.95it/s] 87it [00:09, 9.65it/s] 88it [00:09, 9.59it/s] 89it [00:09, 9.54it/s] 90it [00:09, 9.50it/s] 91it [00:09, 9.47it/s] 92it [00:09, 9.39it/s] 93it [00:09, 9.44it/s] 94it [00:09, 9.40it/s] 95it [00:10, 8.94it/s] 96it [00:10, 9.15it/s] 97it [00:10, 9.26it/s] 98it [00:10, 9.34it/s] 99it [00:10, 8.87it/s] 100it [00:10, 9.00it/s]2025-05-26 03:44:37,238 - INFO - [Epoch 086 | Batch 0100] IWAE-loss 4592.9512 | mean log_px -0.0254 | KL -2993.21 + 101it [00:10, 9.09it/s] 102it [00:10, 9.20it/s] 103it [00:10, 9.26it/s] 104it [00:11, 9.31it/s] 105it [00:11, 9.37it/s] 106it [00:11, 9.36it/s] 107it [00:11, 9.42it/s] 108it [00:11, 9.46it/s] 109it [00:11, 9.46it/s] 110it [00:11, 9.10it/s] 111it [00:11, 9.19it/s] 112it [00:11, 9.31it/s] 113it [00:11, 9.33it/s] 114it [00:12, 9.37it/s] 115it [00:12, 9.39it/s] 116it [00:12, 9.39it/s] 117it [00:12, 9.38it/s] 118it [00:12, 9.39it/s] 119it [00:12, 9.36it/s] 120it [00:12, 9.03it/s] 121it [00:12, 9.13it/s] 122it [00:12, 9.22it/s] 123it [00:13, 9.32it/s] 124it [00:13, 9.39it/s] 125it [00:13, 9.41it/s] 126it [00:13, 9.39it/s] 127it [00:13, 9.47it/s] 128it [00:13, 9.43it/s] 129it [00:13, 9.46it/s] 130it [00:13, 9.46it/s] 131it [00:13, 9.46it/s] 132it [00:13, 9.45it/s] 133it [00:14, 9.51it/s] 134it [00:14, 9.43it/s] 135it [00:14, 9.41it/s] 136it [00:14, 9.45it/s] 137it [00:14, 9.48it/s] 138it [00:14, 9.46it/s] 139it [00:14, 9.51it/s] 140it [00:14, 9.47it/s] 141it [00:14, 9.43it/s] 142it [00:15, 9.47it/s] 143it [00:15, 9.43it/s] 144it [00:15, 9.41it/s] 145it [00:15, 9.42it/s] 146it [00:15, 9.45it/s] 147it [00:15, 9.18it/s] 148it [00:15, 9.25it/s] 149it [00:15, 9.30it/s] 150it [00:15, 9.36it/s]2025-05-26 03:44:42,569 - INFO - [Epoch 086 | Batch 0150] IWAE-loss 3799.1528 | mean log_px -0.0115 | KL -2990.14 + 151it [00:16, 9.39it/s] 152it [00:16, 9.33it/s] 153it [00:16, 9.41it/s] 154it [00:16, 9.42it/s] 155it [00:16, 9.41it/s] 156it [00:16, 9.44it/s] 157it [00:16, 9.50it/s] 158it [00:16, 9.49it/s] 159it [00:16, 9.45it/s] 160it [00:16, 9.43it/s] 161it [00:17, 9.31it/s] 162it [00:17, 9.36it/s] 163it [00:17, 9.36it/s] 164it [00:17, 9.35it/s] 165it [00:17, 9.28it/s] 166it [00:17, 9.28it/s] 167it [00:17, 9.26it/s] 168it [00:17, 8.73it/s] 169it [00:17, 8.89it/s] 170it [00:18, 8.90it/s] 171it [00:18, 9.02it/s] 172it [00:18, 9.09it/s] 173it [00:18, 9.06it/s] 174it [00:18, 9.14it/s] 175it [00:18, 9.23it/s] 176it [00:18, 8.74it/s] 177it [00:18, 8.90it/s] 178it [00:18, 8.93it/s] 179it [00:19, 9.01it/s] 180it [00:19, 9.15it/s] 181it [00:19, 9.23it/s] 182it [00:19, 9.28it/s] 183it [00:19, 9.34it/s] 184it [00:19, 9.30it/s] 185it [00:19, 9.40it/s] 186it [00:19, 9.41it/s] 187it [00:19, 9.48it/s] 188it [00:20, 9.52it/s] 189it [00:20, 9.55it/s] 190it [00:20, 9.55it/s] 191it [00:20, 9.59it/s] 192it [00:20, 9.60it/s] 193it [00:20, 9.61it/s] 194it [00:20, 9.54it/s] 195it [00:20, 8.93it/s] 196it [00:20, 9.15it/s] 196it [00:20, 9.36it/s] +2025-05-26 03:44:47,538 - INFO - Epoch: 86, Objective: tensor([3665.3276], device='cuda:0', grad_fn=), Loss: 0.01617186702787876, KL/n: 61.00396728515625 + 0it [00:00, ?it/s]2025-05-26 03:44:47,828 - INFO - [Epoch 087 | Batch 0000] IWAE-loss 3902.4707 | mean log_px -0.0153 | KL -2986.10 + 1it [00:00, 4.44it/s] 2it [00:00, 6.42it/s] 3it [00:00, 7.59it/s] 4it [00:00, 8.23it/s] 5it [00:00, 8.26it/s] 6it [00:00, 8.65it/s] 7it [00:00, 8.99it/s] 8it [00:00, 9.13it/s] 9it [00:01, 8.93it/s] 10it [00:01, 9.09it/s] 11it [00:01, 9.20it/s] 12it [00:01, 8.78it/s] 13it [00:01, 8.96it/s] 14it [00:01, 9.18it/s] 15it [00:01, 9.30it/s] 16it [00:01, 9.35it/s] 17it [00:01, 9.38it/s] 18it [00:02, 8.91it/s] 19it [00:02, 9.02it/s] 20it [00:02, 9.13it/s] 21it [00:02, 9.15it/s] 22it [00:02, 9.26it/s] 23it [00:02, 9.34it/s] 24it [00:02, 9.40it/s] 25it [00:02, 9.46it/s] 26it [00:02, 9.47it/s] 27it [00:03, 9.48it/s] 28it [00:03, 9.49it/s] 29it [00:03, 9.50it/s] 30it [00:03, 9.52it/s] 31it [00:03, 9.49it/s] 32it [00:03, 9.50it/s] 33it [00:03, 8.97it/s] 34it [00:03, 9.10it/s] 35it [00:03, 9.25it/s] 36it [00:03, 9.31it/s] 37it [00:04, 9.38it/s] 38it [00:04, 8.88it/s] 39it [00:04, 9.06it/s] 40it [00:04, 9.20it/s] 41it [00:04, 9.28it/s] 42it [00:04, 9.33it/s] 43it [00:04, 9.39it/s] 44it [00:04, 9.37it/s] 45it [00:04, 9.39it/s] 46it [00:05, 9.42it/s] 47it [00:05, 9.45it/s] 48it [00:05, 9.48it/s] 49it [00:05, 9.49it/s] 50it [00:05, 9.50it/s]2025-05-26 03:44:53,230 - INFO - [Epoch 087 | Batch 0050] IWAE-loss 4207.4248 | mean log_px -0.0193 | KL -2987.37 + 51it [00:05, 9.47it/s] 52it [00:05, 9.53it/s] 53it [00:05, 9.54it/s] 54it [00:05, 9.51it/s] 55it [00:06, 9.47it/s] 56it [00:06, 9.49it/s] 57it [00:06, 8.99it/s] 58it [00:06, 9.12it/s] 59it [00:06, 9.23it/s] 60it [00:06, 9.24it/s] 61it [00:06, 9.38it/s] 62it [00:06, 9.47it/s] 63it [00:06, 8.93it/s] 64it [00:07, 9.08it/s] 65it [00:07, 9.18it/s] 66it [00:07, 9.03it/s] 67it [00:07, 9.08it/s] 68it [00:07, 9.22it/s] 69it [00:07, 9.39it/s] 70it [00:07, 9.48it/s] 71it [00:07, 8.94it/s] 72it [00:07, 9.13it/s] 73it [00:07, 9.18it/s] 74it [00:08, 9.32it/s] 75it [00:08, 8.85it/s] 76it [00:08, 9.11it/s] 77it [00:08, 9.17it/s] 78it [00:08, 9.27it/s] 79it [00:08, 9.32it/s] 80it [00:08, 9.34it/s] 81it [00:08, 9.40it/s] 82it [00:08, 9.40it/s] 83it [00:09, 9.47it/s] 84it [00:09, 9.40it/s] 85it [00:09, 9.46it/s] 86it [00:09, 9.50it/s] 87it [00:09, 9.53it/s] 88it [00:09, 9.55it/s] 89it [00:09, 9.51it/s] 90it [00:09, 9.47it/s] 91it [00:09, 9.39it/s] 92it [00:10, 9.40it/s] 93it [00:10, 9.38it/s] 94it [00:10, 8.94it/s] 95it [00:10, 8.85it/s] 96it [00:10, 9.03it/s] 97it [00:10, 9.10it/s] 98it [00:10, 9.12it/s] 99it [00:10, 9.23it/s] 100it [00:10, 9.26it/s]2025-05-26 03:44:58,632 - INFO - [Epoch 087 | Batch 0100] IWAE-loss 3976.6338 | mean log_px -0.0192 | KL -2984.05 + 101it [00:11, 9.26it/s] 102it [00:11, 9.31it/s] 103it [00:11, 9.34it/s] 104it [00:11, 9.33it/s] 105it [00:11, 9.42it/s] 106it [00:11, 9.47it/s] 107it [00:11, 9.49it/s] 108it [00:11, 9.50it/s] 109it [00:11, 9.50it/s] 110it [00:11, 9.45it/s] 111it [00:12, 9.53it/s] 112it [00:12, 8.95it/s] 113it [00:12, 9.07it/s] 114it [00:12, 9.20it/s] 115it [00:12, 9.32it/s] 116it [00:12, 8.92it/s] 117it [00:12, 9.11it/s] 118it [00:12, 9.20it/s] 119it [00:12, 9.30it/s] 120it [00:13, 8.82it/s] 121it [00:13, 9.01it/s] 122it [00:13, 9.13it/s] 123it [00:13, 9.23it/s] 124it [00:13, 9.31it/s] 125it [00:13, 8.63it/s] 126it [00:13, 8.65it/s] 127it [00:13, 8.81it/s] 128it [00:13, 9.03it/s] 129it [00:14, 9.17it/s] 130it [00:14, 9.29it/s] 131it [00:14, 9.16it/s] 132it [00:14, 9.09it/s] 133it [00:14, 8.53it/s] 134it [00:14, 8.74it/s] 135it [00:14, 8.97it/s] 136it [00:14, 9.09it/s] 137it [00:14, 9.22it/s] 138it [00:15, 9.28it/s] 139it [00:15, 9.32it/s] 140it [00:15, 9.20it/s] 141it [00:15, 9.23it/s] 142it [00:15, 9.30it/s] 143it [00:15, 9.35it/s] 144it [00:15, 9.37it/s] 145it [00:15, 9.39it/s] 146it [00:15, 9.41it/s] 147it [00:16, 9.48it/s] 148it [00:16, 9.47it/s] 149it [00:16, 8.98it/s] 150it [00:16, 9.14it/s]2025-05-26 03:45:04,078 - INFO - [Epoch 087 | Batch 0150] IWAE-loss 3641.0764 | mean log_px -0.0103 | KL -2975.16 + 151it [00:16, 9.28it/s] 152it [00:16, 9.32it/s] 153it [00:16, 9.39it/s] 154it [00:16, 9.42it/s] 155it [00:16, 9.44it/s] 156it [00:16, 9.43it/s] 157it [00:17, 9.13it/s] 158it [00:17, 9.25it/s] 159it [00:17, 9.38it/s] 160it [00:17, 9.42it/s] 161it [00:17, 9.46it/s] 162it [00:17, 9.46it/s] 163it [00:17, 9.48it/s] 164it [00:17, 9.48it/s] 165it [00:17, 9.46it/s] 166it [00:18, 9.45it/s] 167it [00:18, 9.47it/s] 168it [00:18, 9.47it/s] 169it [00:18, 9.48it/s] 170it [00:18, 9.52it/s] 171it [00:18, 9.50it/s] 172it [00:18, 9.40it/s] 173it [00:18, 9.43it/s] 174it [00:18, 9.44it/s] 175it [00:18, 9.50it/s] 176it [00:19, 9.47it/s] 177it [00:19, 9.47it/s] 178it [00:19, 9.49it/s] 179it [00:19, 9.48it/s] 180it [00:19, 9.12it/s] 181it [00:19, 9.23it/s] 182it [00:19, 9.31it/s] 183it [00:19, 9.36it/s] 184it [00:19, 9.38it/s] 185it [00:20, 9.35it/s] 186it [00:20, 8.87it/s] 187it [00:20, 8.95it/s] 188it [00:20, 9.09it/s] 189it [00:20, 9.20it/s] 190it [00:20, 9.29it/s] 191it [00:20, 9.29it/s] 192it [00:20, 9.13it/s] 193it [00:20, 9.19it/s] 194it [00:21, 9.27it/s] 195it [00:21, 8.77it/s] 196it [00:21, 9.06it/s] 196it [00:21, 9.19it/s] +2025-05-26 03:45:09,011 - INFO - Epoch: 87, Objective: tensor([3995.7356], device='cuda:0', grad_fn=), Loss: 0.013150476850569248, KL/n: 60.77505874633789 + 0it [00:00, ?it/s]2025-05-26 03:45:09,475 - INFO - [Epoch 088 | Batch 0000] IWAE-loss 3533.7141 | mean log_px -0.0108 | KL -2978.48 + 1it [00:00, 4.76it/s] 2it [00:00, 6.64it/s] 3it [00:00, 7.75it/s] 4it [00:00, 8.34it/s] 5it [00:00, 8.78it/s] 6it [00:00, 9.06it/s] 7it [00:00, 9.17it/s] 8it [00:00, 9.23it/s] 9it [00:01, 9.28it/s] 10it [00:01, 9.33it/s] 11it [00:01, 9.39it/s] 12it [00:01, 9.47it/s] 13it [00:01, 9.46it/s] 14it [00:01, 9.40it/s] 15it [00:01, 9.45it/s] 16it [00:01, 9.46it/s] 17it [00:01, 9.50it/s] 18it [00:02, 9.48it/s] 19it [00:02, 9.45it/s] 20it [00:02, 9.45it/s] 21it [00:02, 9.52it/s] 22it [00:02, 9.56it/s] 23it [00:02, 9.01it/s] 24it [00:02, 9.08it/s] 25it [00:02, 9.25it/s] 26it [00:02, 9.31it/s] 27it [00:02, 9.34it/s] 28it [00:03, 9.25it/s] 29it [00:03, 9.36it/s] 30it [00:03, 9.39it/s] 31it [00:03, 9.39it/s] 32it [00:03, 9.36it/s] 33it [00:03, 9.43it/s] 34it [00:03, 9.43it/s] 35it [00:03, 9.41it/s] 36it [00:03, 9.43it/s] 37it [00:04, 9.46it/s] 38it [00:04, 9.50it/s] 39it [00:04, 9.48it/s] 40it [00:04, 9.48it/s] 41it [00:04, 9.49it/s] 42it [00:04, 8.99it/s] 43it [00:04, 9.19it/s] 44it [00:04, 9.25it/s] 45it [00:04, 9.29it/s] 46it [00:05, 9.33it/s] 47it [00:05, 9.37it/s] 48it [00:05, 9.40it/s] 49it [00:05, 9.36it/s] 50it [00:05, 9.38it/s]2025-05-26 03:45:14,821 - INFO - [Epoch 088 | Batch 0050] IWAE-loss 4089.7800 | mean log_px -0.0202 | KL -2976.60 + 51it [00:05, 9.43it/s] 52it [00:05, 9.06it/s] 53it [00:05, 9.18it/s] 54it [00:05, 9.23it/s] 55it [00:05, 9.27it/s] 56it [00:06, 8.99it/s] 57it [00:06, 9.13it/s] 58it [00:06, 9.23it/s] 59it [00:06, 8.78it/s] 60it [00:06, 8.92it/s] 61it [00:06, 9.06it/s] 62it [00:06, 9.10it/s] 63it [00:06, 9.01it/s] 64it [00:06, 8.68it/s] 65it [00:07, 8.89it/s] 66it [00:07, 8.61it/s] 67it [00:07, 8.87it/s] 68it [00:07, 9.03it/s] 69it [00:07, 8.69it/s] 70it [00:07, 8.86it/s] 71it [00:07, 9.06it/s] 72it [00:07, 9.19it/s] 73it [00:08, 8.78it/s] 74it [00:08, 8.98it/s] 75it [00:08, 9.16it/s] 76it [00:08, 8.70it/s] 77it [00:08, 8.85it/s] 78it [00:08, 9.00it/s] 79it [00:08, 9.14it/s] 80it [00:08, 8.78it/s] 81it [00:08, 8.98it/s] 82it [00:08, 9.10it/s] 83it [00:09, 9.20it/s] 84it [00:09, 8.84it/s] 85it [00:09, 8.99it/s] 86it [00:09, 9.11it/s] 87it [00:09, 9.22it/s] 88it [00:09, 8.84it/s] 89it [00:09, 9.02it/s] 90it [00:09, 9.17it/s] 91it [00:09, 9.27it/s] 92it [00:10, 8.83it/s] 93it [00:10, 9.01it/s] 94it [00:10, 9.13it/s] 95it [00:10, 9.24it/s] 96it [00:10, 8.86it/s] 97it [00:10, 9.05it/s] 98it [00:10, 9.18it/s] 99it [00:10, 9.29it/s] 100it [00:10, 8.86it/s]2025-05-26 03:45:20,383 - INFO - [Epoch 088 | Batch 0100] IWAE-loss 3568.9946 | mean log_px -0.0101 | KL -2965.73 + 101it [00:11, 9.06it/s] 102it [00:11, 9.19it/s] 103it [00:11, 8.84it/s] 104it [00:11, 9.01it/s] 105it [00:11, 9.10it/s] 106it [00:11, 9.24it/s] 107it [00:11, 8.85it/s] 108it [00:11, 9.02it/s] 109it [00:11, 9.16it/s] 110it [00:12, 9.27it/s] 111it [00:12, 8.87it/s] 112it [00:12, 9.02it/s] 113it [00:12, 9.16it/s] 114it [00:12, 9.28it/s] 115it [00:12, 8.88it/s] 116it [00:12, 9.08it/s] 117it [00:12, 9.20it/s] 118it [00:12, 9.27it/s] 119it [00:13, 8.87it/s] 120it [00:13, 9.01it/s] 121it [00:13, 9.14it/s] 122it [00:13, 9.25it/s] 123it [00:13, 8.85it/s] 124it [00:13, 9.00it/s] 125it [00:13, 9.15it/s] 126it [00:13, 9.25it/s] 127it [00:13, 8.85it/s] 128it [00:14, 8.99it/s] 129it [00:14, 9.13it/s] 130it [00:14, 9.27it/s] 131it [00:14, 8.86it/s] 132it [00:14, 9.05it/s] 133it [00:14, 9.20it/s] 134it [00:14, 8.82it/s] 135it [00:14, 9.03it/s] 136it [00:14, 9.12it/s] 137it [00:15, 9.23it/s] 138it [00:15, 8.82it/s] 139it [00:15, 9.02it/s] 140it [00:15, 9.11it/s] 141it [00:15, 9.19it/s] 142it [00:15, 8.78it/s] 143it [00:15, 8.94it/s] 144it [00:15, 9.07it/s] 145it [00:15, 9.20it/s] 146it [00:16, 8.82it/s] 147it [00:16, 9.01it/s] 148it [00:16, 9.16it/s] 149it [00:16, 9.26it/s] 150it [00:16, 9.02it/s]2025-05-26 03:45:25,901 - INFO - [Epoch 088 | Batch 0150] IWAE-loss 3878.7766 | mean log_px -0.0216 | KL -2965.69 + 151it [00:16, 9.06it/s] 152it [00:16, 9.19it/s] 153it [00:16, 9.30it/s] 154it [00:16, 9.36it/s] 155it [00:17, 9.46it/s] 156it [00:17, 9.49it/s] 157it [00:17, 9.48it/s] 158it [00:17, 8.99it/s] 159it [00:17, 9.16it/s] 160it [00:17, 9.26it/s] 161it [00:17, 9.34it/s] 162it [00:17, 9.36it/s] 163it [00:17, 9.42it/s] 164it [00:17, 9.49it/s] 165it [00:18, 9.50it/s] 166it [00:18, 9.48it/s] 167it [00:18, 9.45it/s] 168it [00:18, 9.52it/s] 169it [00:18, 9.46it/s] 170it [00:18, 8.72it/s] 171it [00:18, 8.80it/s] 172it [00:18, 9.06it/s] 173it [00:18, 8.76it/s] 174it [00:19, 9.08it/s] 175it [00:19, 9.32it/s] 176it [00:19, 8.92it/s] 177it [00:19, 9.09it/s] 178it [00:19, 8.95it/s] 179it [00:19, 8.82it/s] 180it [00:19, 8.56it/s] 181it [00:19, 8.91it/s] 182it [00:19, 9.17it/s] 183it [00:20, 8.89it/s] 184it [00:20, 9.16it/s] 185it [00:20, 9.36it/s] 186it [00:20, 9.01it/s] 187it [00:20, 9.25it/s] 188it [00:20, 9.44it/s] 189it [00:20, 9.03it/s] 190it [00:20, 9.29it/s] 191it [00:20, 9.46it/s] 192it [00:21, 9.58it/s] 193it [00:21, 9.11it/s] 194it [00:21, 9.33it/s] 195it [00:21, 8.96it/s] 196it [00:21, 8.88it/s] 196it [00:21, 9.08it/s] +2025-05-26 03:45:30,916 - INFO - Epoch: 88, Objective: tensor([3712.7053], device='cuda:0', grad_fn=), Loss: 0.014657406136393547, KL/n: 60.55072784423828 + 0it [00:00, ?it/s]2025-05-26 03:45:31,203 - INFO - [Epoch 089 | Batch 0000] IWAE-loss 3791.1438 | mean log_px -0.0117 | KL -2966.70 + 1it [00:00, 5.23it/s] 2it [00:00, 6.58it/s] 4it [00:00, 8.41it/s] 5it [00:00, 8.84it/s] 7it [00:00, 8.90it/s] 8it [00:00, 9.15it/s] 10it [00:01, 9.52it/s] 11it [00:01, 9.19it/s] 13it [00:01, 9.53it/s] 14it [00:01, 9.57it/s] 15it [00:01, 9.05it/s] 16it [00:01, 8.91it/s] 17it [00:01, 9.12it/s] 19it [00:02, 9.50it/s] 21it [00:02, 9.71it/s] 23it [00:02, 9.85it/s] 24it [00:02, 9.87it/s] 26it [00:02, 9.89it/s] 27it [00:02, 9.47it/s] 28it [00:03, 9.53it/s] 29it [00:03, 9.63it/s] 30it [00:03, 9.72it/s] 31it [00:03, 9.25it/s] 32it [00:03, 9.28it/s] 33it [00:03, 9.44it/s] 34it [00:03, 9.58it/s] 36it [00:03, 9.77it/s] 38it [00:04, 9.88it/s] 40it [00:04, 9.93it/s] 41it [00:04, 9.95it/s] 42it [00:04, 9.48it/s] 44it [00:04, 9.69it/s] 46it [00:04, 9.81it/s] 47it [00:05, 9.40it/s] 49it [00:05, 9.63it/s] 50it [00:05, 9.70it/s]2025-05-26 03:45:36,419 - INFO - [Epoch 089 | Batch 0050] IWAE-loss 3452.4019 | mean log_px -0.0074 | KL -2963.17 + 51it [00:05, 9.76it/s] 52it [00:05, 9.81it/s] 53it [00:05, 9.33it/s] 55it [00:05, 9.63it/s] 56it [00:05, 9.69it/s] 57it [00:06, 9.34it/s] 58it [00:06, 9.48it/s] 60it [00:06, 9.70it/s] 62it [00:06, 9.81it/s] 63it [00:06, 9.38it/s] 64it [00:06, 9.51it/s] 65it [00:06, 9.62it/s] 66it [00:06, 9.72it/s] 68it [00:07, 9.84it/s] 70it [00:07, 9.93it/s] 72it [00:07, 9.97it/s] 74it [00:07, 10.00it/s] 76it [00:07, 10.01it/s] 77it [00:08, 10.01it/s] 78it [00:08, 10.00it/s] 80it [00:08, 9.66it/s] 82it [00:08, 9.77it/s] 84it [00:08, 9.85it/s] 85it [00:08, 9.87it/s] 86it [00:08, 9.89it/s] 88it [00:09, 9.49it/s] 89it [00:09, 9.58it/s] 90it [00:09, 9.53it/s] 91it [00:09, 9.60it/s] 93it [00:09, 9.77it/s] 95it [00:09, 9.88it/s] 96it [00:10, 9.89it/s] 98it [00:10, 9.95it/s] 99it [00:10, 9.96it/s]2025-05-26 03:45:41,533 - INFO - [Epoch 089 | Batch 0100] IWAE-loss 3771.1143 | mean log_px -0.0146 | KL -2961.73 + 101it [00:10, 9.97it/s] 102it [00:10, 9.55it/s] 103it [00:10, 9.63it/s] 104it [00:10, 9.70it/s] 106it [00:11, 9.84it/s] 108it [00:11, 9.54it/s] 110it [00:11, 9.70it/s] 112it [00:11, 9.81it/s] 114it [00:11, 9.87it/s] 116it [00:12, 9.92it/s] 117it [00:12, 9.93it/s] 119it [00:12, 9.97it/s] 121it [00:12, 10.00it/s] 122it [00:12, 9.58it/s] 124it [00:12, 9.73it/s] 125it [00:12, 9.78it/s] 126it [00:13, 9.82it/s] 127it [00:13, 9.86it/s] 128it [00:13, 9.89it/s] 130it [00:13, 9.96it/s] 131it [00:13, 9.96it/s] 132it [00:13, 9.43it/s] 134it [00:13, 9.68it/s] 136it [00:14, 9.42it/s] 138it [00:14, 9.65it/s] 140it [00:14, 9.78it/s] 141it [00:14, 9.43it/s] 143it [00:14, 9.64it/s] 145it [00:15, 9.76it/s] 146it [00:15, 9.78it/s] 147it [00:15, 9.43it/s] 148it [00:15, 9.54it/s] 149it [00:15, 9.65it/s] 150it [00:15, 9.18it/s]2025-05-26 03:45:46,702 - INFO - [Epoch 089 | Batch 0150] IWAE-loss 3447.8906 | mean log_px -0.0127 | KL -2953.03 + 152it [00:15, 9.50it/s] 154it [00:16, 9.28it/s] 156it [00:16, 9.54it/s] 158it [00:16, 9.71it/s] 160it [00:16, 9.45it/s] 162it [00:16, 9.62it/s] 163it [00:16, 9.69it/s] 165it [00:17, 9.81it/s] 166it [00:17, 9.84it/s] 168it [00:17, 9.91it/s] 169it [00:17, 9.93it/s] 170it [00:17, 9.44it/s] 171it [00:17, 9.56it/s] 172it [00:17, 9.66it/s] 173it [00:17, 9.73it/s] 175it [00:18, 9.87it/s] 176it [00:18, 9.90it/s] 177it [00:18, 9.36it/s] 179it [00:18, 9.62it/s] 180it [00:18, 9.70it/s] 181it [00:18, 9.35it/s] 182it [00:18, 9.51it/s] 184it [00:19, 9.72it/s] 185it [00:19, 9.78it/s] 186it [00:19, 9.83it/s] 188it [00:19, 9.92it/s] 189it [00:19, 9.93it/s] 190it [00:19, 9.94it/s] 192it [00:19, 9.99it/s] 193it [00:19, 9.99it/s] 194it [00:20, 9.95it/s] 195it [00:20, 9.56it/s] 196it [00:20, 9.62it/s] +2025-05-26 03:45:51,423 - INFO - Epoch: 89, Objective: tensor([3744.3455], device='cuda:0', grad_fn=), Loss: 0.016745569184422493, KL/n: 60.30201721191406 + 0it [00:00, ?it/s]2025-05-26 03:45:51,884 - INFO - [Epoch 090 | Batch 0000] IWAE-loss 4105.8560 | mean log_px -0.0164 | KL -2952.96 + 1it [00:00, 4.73it/s] 3it [00:00, 7.82it/s] 4it [00:00, 8.39it/s] 5it [00:00, 8.41it/s] 6it [00:00, 8.85it/s] 8it [00:00, 9.39it/s] 10it [00:01, 9.66it/s] 12it [00:01, 9.80it/s] 14it [00:01, 9.61it/s] 15it [00:01, 9.67it/s] 16it [00:01, 9.72it/s] 17it [00:01, 9.30it/s] 18it [00:01, 9.46it/s] 20it [00:02, 9.36it/s] 22it [00:02, 9.59it/s] 23it [00:02, 9.67it/s] 24it [00:02, 9.74it/s] 25it [00:02, 9.38it/s] 27it [00:02, 9.65it/s] 28it [00:03, 9.71it/s] 29it [00:03, 9.23it/s] 30it [00:03, 9.39it/s] 32it [00:03, 9.68it/s] 34it [00:03, 9.83it/s] 35it [00:03, 9.42it/s] 36it [00:03, 9.52it/s] 38it [00:04, 9.73it/s] 40it [00:04, 9.47it/s] 42it [00:04, 9.62it/s] 43it [00:04, 9.61it/s] 45it [00:04, 9.76it/s] 46it [00:04, 9.78it/s] 48it [00:05, 9.90it/s] 50it [00:05, 9.97it/s]2025-05-26 03:45:57,073 - INFO - [Epoch 090 | Batch 0050] IWAE-loss 3642.5940 | mean log_px -0.0134 | KL -2952.94 + 51it [00:05, 9.93it/s] 53it [00:05, 10.00it/s] 54it [00:05, 9.99it/s] 56it [00:05, 10.03it/s] 58it [00:06, 10.05it/s] 60it [00:06, 10.06it/s] 62it [00:06, 10.07it/s] 64it [00:06, 10.07it/s] 66it [00:06, 10.07it/s] 68it [00:07, 10.04it/s] 70it [00:07, 9.65it/s] 71it [00:07, 9.71it/s] 72it [00:07, 9.32it/s] 73it [00:07, 9.13it/s] 74it [00:07, 9.31it/s] 75it [00:07, 9.04it/s] 76it [00:07, 9.05it/s] 77it [00:08, 9.23it/s] 78it [00:08, 9.35it/s] 80it [00:08, 9.65it/s] 81it [00:08, 9.73it/s] 82it [00:08, 9.74it/s] 83it [00:08, 9.36it/s] 85it [00:08, 9.66it/s] 86it [00:09, 9.36it/s] 87it [00:09, 9.51it/s] 89it [00:09, 9.75it/s] 90it [00:09, 9.80it/s] 91it [00:09, 9.27it/s] 92it [00:09, 9.42it/s] 93it [00:09, 9.46it/s] 94it [00:09, 9.00it/s] 95it [00:09, 9.26it/s] 96it [00:10, 9.43it/s] 97it [00:10, 9.58it/s] 98it [00:10, 9.52it/s] 99it [00:10, 9.49it/s] 100it [00:10, 9.36it/s]2025-05-26 03:46:02,289 - INFO - [Epoch 090 | Batch 0100] IWAE-loss 4252.8389 | mean log_px -0.0252 | KL -2944.33 + 101it [00:10, 9.26it/s] 102it [00:10, 9.20it/s] 103it [00:10, 9.18it/s] 104it [00:10, 9.06it/s] 105it [00:11, 9.05it/s] 106it [00:11, 9.10it/s] 107it [00:11, 9.17it/s] 108it [00:11, 9.20it/s] 109it [00:11, 9.28it/s] 110it [00:11, 9.33it/s] 111it [00:11, 9.33it/s] 112it [00:11, 8.77it/s] 113it [00:11, 8.85it/s] 114it [00:12, 8.90it/s] 115it [00:12, 8.94it/s] 116it [00:12, 8.49it/s] 117it [00:12, 8.59it/s] 118it [00:12, 8.50it/s] 119it [00:12, 8.65it/s] 120it [00:12, 8.37it/s] 121it [00:12, 8.69it/s] 122it [00:12, 8.97it/s] 123it [00:13, 8.55it/s] 124it [00:13, 8.83it/s] 125it [00:13, 9.01it/s] 126it [00:13, 9.10it/s] 127it [00:13, 9.24it/s] 128it [00:13, 8.75it/s] 129it [00:13, 9.01it/s] 130it [00:13, 9.16it/s] 131it [00:13, 9.20it/s] 132it [00:14, 9.25it/s] 133it [00:14, 9.28it/s] 134it [00:14, 9.33it/s] 135it [00:14, 8.91it/s] 136it [00:14, 8.96it/s] 137it [00:14, 9.12it/s] 138it [00:14, 8.91it/s] 139it [00:14, 9.02it/s] 140it [00:14, 8.67it/s] 141it [00:15, 8.90it/s] 142it [00:15, 9.09it/s] 143it [00:15, 9.24it/s] 144it [00:15, 8.88it/s] 145it [00:15, 9.08it/s] 146it [00:15, 9.15it/s] 147it [00:15, 8.77it/s] 148it [00:15, 8.97it/s] 149it [00:15, 9.14it/s] 150it [00:16, 9.23it/s]2025-05-26 03:46:07,854 - INFO - [Epoch 090 | Batch 0150] IWAE-loss 3503.3472 | mean log_px -0.0103 | KL -2943.74 + 151it [00:16, 8.81it/s] 152it [00:16, 9.04it/s] 153it [00:16, 9.14it/s] 154it [00:16, 9.27it/s] 155it [00:16, 8.83it/s] 156it [00:16, 9.06it/s] 157it [00:16, 9.23it/s] 158it [00:16, 9.25it/s] 159it [00:17, 8.77it/s] 160it [00:17, 8.99it/s] 161it [00:17, 9.16it/s] 162it [00:17, 9.26it/s] 163it [00:17, 9.33it/s] 164it [00:17, 9.35it/s] 165it [00:17, 9.37it/s] 166it [00:17, 9.41it/s] 167it [00:17, 9.46it/s] 168it [00:18, 9.52it/s] 169it [00:18, 9.49it/s] 170it [00:18, 9.47it/s] 171it [00:18, 9.43it/s] 172it [00:18, 8.87it/s] 173it [00:18, 8.92it/s] 174it [00:18, 8.97it/s] 175it [00:18, 9.15it/s] 176it [00:18, 9.26it/s] 177it [00:18, 9.37it/s] 178it [00:19, 8.84it/s] 179it [00:19, 9.07it/s] 180it [00:19, 9.14it/s] 181it [00:19, 9.25it/s] 182it [00:19, 9.34it/s] 183it [00:19, 9.32it/s] 184it [00:19, 9.42it/s] 185it [00:19, 9.45it/s] 186it [00:19, 9.05it/s] 187it [00:20, 9.15it/s] 188it [00:20, 9.23it/s] 189it [00:20, 9.33it/s] 190it [00:20, 9.38it/s] 191it [00:20, 9.36it/s] 192it [00:20, 9.40it/s] 193it [00:20, 9.38it/s] 194it [00:20, 9.41it/s] 195it [00:20, 8.89it/s] 196it [00:21, 9.15it/s] 196it [00:21, 9.28it/s] +2025-05-26 03:46:12,855 - INFO - Epoch: 90, Objective: tensor([3948.3491], device='cuda:0', grad_fn=), Loss: 0.02164594642817974, KL/n: 60.072139739990234 + 0it [00:00, ?it/s]2025-05-26 03:46:13,125 - INFO - [Epoch 091 | Batch 0000] IWAE-loss 3966.0691 | mean log_px -0.0175 | KL -2943.96 + 1it [00:00, 4.80it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.79it/s] 4it [00:00, 8.32it/s] 5it [00:00, 8.75it/s] 6it [00:00, 8.44it/s] 7it [00:00, 8.77it/s] 8it [00:00, 8.99it/s] 9it [00:01, 9.13it/s] 10it [00:01, 8.75it/s] 11it [00:01, 9.02it/s] 12it [00:01, 9.14it/s] 13it [00:01, 8.85it/s] 14it [00:01, 9.04it/s] 15it [00:01, 9.17it/s] 16it [00:01, 9.19it/s] 17it [00:01, 8.77it/s] 18it [00:02, 9.01it/s] 19it [00:02, 9.14it/s] 20it [00:02, 9.29it/s] 21it [00:02, 8.89it/s] 22it [00:02, 9.09it/s] 23it [00:02, 9.27it/s] 24it [00:02, 8.83it/s] 25it [00:02, 9.00it/s] 26it [00:02, 9.18it/s] 27it [00:03, 9.34it/s] 28it [00:03, 8.89it/s] 29it [00:03, 9.13it/s] 30it [00:03, 9.24it/s] 31it [00:03, 9.38it/s] 32it [00:03, 8.91it/s] 33it [00:03, 8.85it/s] 34it [00:03, 8.98it/s] 35it [00:03, 8.63it/s] 36it [00:04, 8.86it/s] 37it [00:04, 8.98it/s] 38it [00:04, 9.06it/s] 39it [00:04, 8.69it/s] 40it [00:04, 8.85it/s] 41it [00:04, 9.00it/s] 42it [00:04, 8.63it/s] 43it [00:04, 8.84it/s] 44it [00:04, 8.98it/s] 45it [00:05, 9.08it/s] 46it [00:05, 8.76it/s] 47it [00:05, 9.04it/s] 48it [00:05, 9.23it/s] 49it [00:05, 8.88it/s] 50it [00:05, 9.11it/s]2025-05-26 03:46:18,678 - INFO - [Epoch 091 | Batch 0050] IWAE-loss 3997.3748 | mean log_px -0.0152 | KL -2940.93 + 51it [00:05, 9.28it/s] 52it [00:05, 8.89it/s] 53it [00:05, 9.13it/s] 54it [00:06, 9.29it/s] 55it [00:06, 9.42it/s] 56it [00:06, 8.98it/s] 57it [00:06, 9.18it/s] 58it [00:06, 9.33it/s] 59it [00:06, 8.91it/s] 60it [00:06, 9.14it/s] 61it [00:06, 9.31it/s] 62it [00:06, 9.42it/s] 63it [00:07, 8.99it/s] 64it [00:07, 9.16it/s] 65it [00:07, 9.32it/s] 66it [00:07, 9.08it/s] 67it [00:07, 9.26it/s] 68it [00:07, 8.87it/s] 69it [00:07, 9.08it/s] 70it [00:07, 9.25it/s] 71it [00:07, 8.87it/s] 72it [00:08, 9.10it/s] 73it [00:08, 9.28it/s] 74it [00:08, 8.86it/s] 75it [00:08, 9.11it/s] 76it [00:08, 8.77it/s] 77it [00:08, 9.04it/s] 78it [00:08, 9.21it/s] 79it [00:08, 9.34it/s] 80it [00:08, 8.92it/s] 81it [00:09, 9.14it/s] 82it [00:09, 9.25it/s] 83it [00:09, 8.88it/s] 84it [00:09, 9.07it/s] 85it [00:09, 8.75it/s] 86it [00:09, 9.01it/s] 87it [00:09, 9.21it/s] 88it [00:09, 8.81it/s] 89it [00:09, 9.04it/s] 90it [00:10, 9.22it/s] 91it [00:10, 8.82it/s] 92it [00:10, 8.78it/s] 93it [00:10, 8.98it/s] 94it [00:10, 8.64it/s] 95it [00:10, 8.86it/s] 96it [00:10, 9.01it/s] 97it [00:10, 9.08it/s] 98it [00:10, 8.69it/s] 99it [00:11, 8.84it/s] 100it [00:11, 9.05it/s]2025-05-26 03:46:24,205 - INFO - [Epoch 091 | Batch 0100] IWAE-loss 3747.8899 | mean log_px -0.0144 | KL -2939.49 + 101it [00:11, 9.14it/s] 102it [00:11, 8.72it/s] 103it [00:11, 8.90it/s] 104it [00:11, 8.89it/s] 105it [00:11, 9.06it/s] 106it [00:11, 9.13it/s] 107it [00:11, 9.21it/s] 108it [00:12, 9.26it/s] 109it [00:12, 9.32it/s] 110it [00:12, 8.77it/s] 111it [00:12, 9.02it/s] 112it [00:12, 9.05it/s] 113it [00:12, 9.23it/s] 114it [00:12, 8.90it/s] 115it [00:12, 9.13it/s] 116it [00:12, 9.27it/s] 117it [00:13, 8.84it/s] 118it [00:13, 9.06it/s] 119it [00:13, 9.13it/s] 120it [00:13, 9.22it/s] 121it [00:13, 8.82it/s] 122it [00:13, 9.07it/s] 123it [00:13, 9.26it/s] 124it [00:13, 9.39it/s] 125it [00:13, 8.96it/s] 126it [00:14, 9.17it/s] 127it [00:14, 9.33it/s] 128it [00:14, 9.43it/s] 129it [00:14, 8.98it/s] 130it [00:14, 9.17it/s] 131it [00:14, 9.31it/s] 132it [00:14, 9.43it/s] 133it [00:14, 9.00it/s] 134it [00:14, 9.20it/s] 135it [00:14, 9.36it/s] 136it [00:15, 8.94it/s] 137it [00:15, 9.16it/s] 138it [00:15, 9.25it/s] 139it [00:15, 9.02it/s] 140it [00:15, 9.21it/s] 141it [00:15, 8.84it/s] 142it [00:15, 9.08it/s] 143it [00:15, 9.26it/s] 144it [00:15, 9.39it/s] 145it [00:16, 8.96it/s] 146it [00:16, 9.16it/s] 147it [00:16, 9.33it/s] 148it [00:16, 9.05it/s] 149it [00:16, 9.25it/s] 150it [00:16, 8.87it/s]2025-05-26 03:46:29,693 - INFO - [Epoch 091 | Batch 0150] IWAE-loss 4462.9419 | mean log_px -0.0253 | KL -2929.27 + 151it [00:16, 9.08it/s] 152it [00:16, 9.26it/s] 153it [00:16, 9.41it/s] 154it [00:17, 8.98it/s] 155it [00:17, 9.20it/s] 156it [00:17, 9.35it/s] 157it [00:17, 8.94it/s] 158it [00:17, 9.17it/s] 159it [00:17, 9.35it/s] 160it [00:17, 9.46it/s] 161it [00:17, 9.55it/s] 162it [00:17, 9.61it/s] 163it [00:18, 9.67it/s] 164it [00:18, 9.69it/s] 165it [00:18, 9.70it/s] 166it [00:18, 9.72it/s] 167it [00:18, 9.17it/s] 168it [00:18, 9.32it/s] 169it [00:18, 9.46it/s] 170it [00:18, 9.54it/s] 171it [00:18, 9.62it/s] 172it [00:18, 9.66it/s] 173it [00:19, 9.70it/s] 174it [00:19, 9.72it/s] 175it [00:19, 9.73it/s] 176it [00:19, 9.73it/s] 177it [00:19, 9.74it/s] 178it [00:19, 9.19it/s] 179it [00:19, 9.36it/s] 180it [00:19, 9.47it/s] 181it [00:19, 9.56it/s] 182it [00:20, 9.61it/s] 183it [00:20, 9.66it/s] 184it [00:20, 9.69it/s] 185it [00:20, 9.72it/s] 186it [00:20, 9.16it/s] 187it [00:20, 9.34it/s] 188it [00:20, 9.44it/s] 189it [00:20, 9.53it/s] 190it [00:20, 9.60it/s] 191it [00:20, 9.66it/s] 192it [00:21, 9.69it/s] 193it [00:21, 9.16it/s] 194it [00:21, 9.34it/s] 195it [00:21, 8.87it/s] 196it [00:21, 8.68it/s] 196it [00:21, 9.08it/s] +2025-05-26 03:46:34,573 - INFO - Epoch: 91, Objective: tensor([3768.4514], device='cuda:0', grad_fn=), Loss: 0.01296775322407484, KL/n: 59.81892013549805 + 0it [00:00, ?it/s]2025-05-26 03:46:35,035 - INFO - [Epoch 092 | Batch 0000] IWAE-loss 3812.1208 | mean log_px -0.0154 | KL -2928.92 + 1it [00:00, 5.35it/s] 2it [00:00, 7.19it/s] 3it [00:00, 8.19it/s] 4it [00:00, 8.25it/s] 5it [00:00, 8.65it/s] 6it [00:00, 8.85it/s] 7it [00:00, 8.63it/s] 8it [00:00, 8.93it/s] 9it [00:01, 9.17it/s] 10it [00:01, 9.34it/s] 11it [00:01, 9.45it/s] 12it [00:01, 9.54it/s] 13it [00:01, 9.59it/s] 14it [00:01, 9.61it/s] 15it [00:01, 9.66it/s] 16it [00:01, 9.45it/s] 17it [00:01, 9.50it/s] 18it [00:01, 9.56it/s] 19it [00:02, 9.61it/s] 20it [00:02, 9.65it/s] 21it [00:02, 9.69it/s] 22it [00:02, 9.71it/s] 23it [00:02, 9.72it/s] 24it [00:02, 9.48it/s] 25it [00:02, 9.42it/s] 26it [00:02, 9.48it/s] 27it [00:02, 9.55it/s] 28it [00:03, 9.62it/s] 29it [00:03, 9.65it/s] 30it [00:03, 9.69it/s] 31it [00:03, 9.69it/s] 32it [00:03, 9.71it/s] 33it [00:03, 9.73it/s] 34it [00:03, 9.73it/s] 35it [00:03, 9.76it/s] 36it [00:03, 9.77it/s] 37it [00:03, 9.78it/s] 38it [00:04, 9.78it/s] 39it [00:04, 9.76it/s] 40it [00:04, 9.77it/s] 41it [00:04, 9.78it/s] 42it [00:04, 9.20it/s] 43it [00:04, 9.27it/s] 44it [00:04, 9.33it/s] 45it [00:04, 9.39it/s] 46it [00:04, 9.46it/s] 47it [00:05, 9.16it/s] 48it [00:05, 9.22it/s] 49it [00:05, 9.28it/s] 50it [00:05, 9.35it/s]2025-05-26 03:46:40,296 - INFO - [Epoch 092 | Batch 0050] IWAE-loss 3494.9722 | mean log_px -0.0081 | KL -2923.38 + 51it [00:05, 9.43it/s] 52it [00:05, 9.47it/s] 53it [00:05, 9.51it/s] 54it [00:05, 9.45it/s] 55it [00:05, 9.44it/s] 56it [00:05, 9.43it/s] 57it [00:06, 9.41it/s] 58it [00:06, 9.40it/s] 59it [00:06, 9.47it/s] 60it [00:06, 9.48it/s] 61it [00:06, 9.49it/s] 62it [00:06, 9.46it/s] 63it [00:06, 9.50it/s] 64it [00:06, 9.13it/s] 65it [00:06, 9.21it/s] 66it [00:07, 9.30it/s] 67it [00:07, 9.37it/s] 68it [00:07, 9.43it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.47it/s] 71it [00:07, 9.46it/s] 72it [00:07, 8.98it/s] 73it [00:07, 9.20it/s] 74it [00:07, 9.24it/s] 75it [00:08, 9.31it/s] 76it [00:08, 9.36it/s] 77it [00:08, 9.39it/s] 78it [00:08, 9.42it/s] 79it [00:08, 9.46it/s] 80it [00:08, 9.47it/s] 81it [00:08, 9.48it/s] 82it [00:08, 8.98it/s] 83it [00:08, 9.18it/s] 84it [00:08, 9.26it/s] 85it [00:09, 9.27it/s] 86it [00:09, 9.12it/s] 87it [00:09, 8.64it/s] 88it [00:09, 8.95it/s] 89it [00:09, 9.21it/s] 90it [00:09, 9.43it/s] 91it [00:09, 9.56it/s] 92it [00:09, 9.15it/s] 93it [00:09, 9.32it/s] 94it [00:10, 9.41it/s] 96it [00:10, 9.69it/s] 97it [00:10, 9.74it/s] 98it [00:10, 9.77it/s] 99it [00:10, 9.26it/s] 100it [00:10, 9.38it/s]2025-05-26 03:46:45,639 - INFO - [Epoch 092 | Batch 0100] IWAE-loss 3449.9321 | mean log_px -0.0083 | KL -2921.72 + 101it [00:10, 9.48it/s] 102it [00:10, 9.50it/s] 103it [00:10, 9.50it/s] 104it [00:11, 9.09it/s] 105it [00:11, 9.28it/s] 106it [00:11, 9.44it/s] 107it [00:11, 9.58it/s] 108it [00:11, 9.64it/s] 109it [00:11, 9.71it/s] 110it [00:11, 9.69it/s] 111it [00:11, 9.71it/s] 112it [00:11, 9.76it/s] 114it [00:12, 9.86it/s] 115it [00:12, 9.84it/s] 116it [00:12, 9.85it/s] 117it [00:12, 9.88it/s] 118it [00:12, 9.87it/s] 119it [00:12, 9.88it/s] 120it [00:12, 9.90it/s] 121it [00:12, 9.39it/s] 122it [00:12, 9.50it/s] 123it [00:13, 9.64it/s] 124it [00:13, 9.69it/s] 125it [00:13, 9.73it/s] 126it [00:13, 9.78it/s] 127it [00:13, 9.82it/s] 128it [00:13, 9.83it/s] 130it [00:13, 9.88it/s] 131it [00:13, 9.88it/s] 132it [00:13, 9.86it/s] 133it [00:14, 9.86it/s] 134it [00:14, 9.68it/s] 135it [00:14, 9.69it/s] 136it [00:14, 9.72it/s] 137it [00:14, 9.75it/s] 138it [00:14, 9.76it/s] 139it [00:14, 9.79it/s] 140it [00:14, 9.68it/s] 141it [00:14, 9.69it/s] 142it [00:15, 9.73it/s] 143it [00:15, 9.75it/s] 144it [00:15, 9.77it/s] 145it [00:15, 9.77it/s] 146it [00:15, 9.76it/s] 147it [00:15, 9.79it/s] 148it [00:15, 9.79it/s] 149it [00:15, 9.77it/s] 150it [00:15, 9.76it/s]2025-05-26 03:46:50,778 - INFO - [Epoch 092 | Batch 0150] IWAE-loss 3478.1560 | mean log_px -0.0111 | KL -2921.63 + 151it [00:15, 9.74it/s] 152it [00:16, 9.76it/s] 153it [00:16, 9.78it/s] 154it [00:16, 9.77it/s] 155it [00:16, 9.79it/s] 156it [00:16, 9.78it/s] 157it [00:16, 9.74it/s] 158it [00:16, 9.76it/s] 159it [00:16, 9.78it/s] 160it [00:16, 9.77it/s] 161it [00:16, 9.78it/s] 162it [00:17, 9.79it/s] 163it [00:17, 9.82it/s] 164it [00:17, 9.82it/s] 165it [00:17, 9.83it/s] 166it [00:17, 9.82it/s] 167it [00:17, 9.83it/s] 168it [00:17, 9.84it/s] 169it [00:17, 9.84it/s] 170it [00:17, 9.82it/s] 171it [00:17, 9.82it/s] 172it [00:18, 9.82it/s] 173it [00:18, 9.81it/s] 174it [00:18, 9.81it/s] 175it [00:18, 9.82it/s] 176it [00:18, 9.81it/s] 177it [00:18, 9.83it/s] 178it [00:18, 9.83it/s] 179it [00:18, 9.84it/s] 180it [00:18, 9.83it/s] 181it [00:18, 9.84it/s] 182it [00:19, 9.82it/s] 183it [00:19, 9.83it/s] 184it [00:19, 9.61it/s] 185it [00:19, 9.67it/s] 186it [00:19, 9.71it/s] 187it [00:19, 9.71it/s] 188it [00:19, 9.53it/s] 189it [00:19, 8.93it/s] 190it [00:19, 8.90it/s] 191it [00:20, 9.19it/s] 193it [00:20, 9.60it/s] 195it [00:20, 9.07it/s] 196it [00:20, 9.49it/s] +2025-05-26 03:46:55,549 - INFO - Epoch: 92, Objective: tensor([3705.5750], device='cuda:0', grad_fn=), Loss: 0.016982443630695343, KL/n: 59.582088470458984 + 0it [00:00, ?it/s]2025-05-26 03:46:55,832 - INFO - [Epoch 093 | Batch 0000] IWAE-loss 4068.8088 | mean log_px -0.0203 | KL -2920.25 + 1it [00:00, 5.38it/s] 2it [00:00, 7.34it/s] 4it [00:00, 8.87it/s] 6it [00:00, 9.37it/s] 7it [00:00, 9.51it/s] 8it [00:00, 9.60it/s] 9it [00:00, 9.68it/s] 10it [00:01, 9.74it/s] 11it [00:01, 9.78it/s] 12it [00:01, 9.82it/s] 13it [00:01, 9.86it/s] 14it [00:01, 9.86it/s] 15it [00:01, 9.89it/s] 16it [00:01, 9.86it/s] 17it [00:01, 9.87it/s] 18it [00:01, 9.88it/s] 19it [00:02, 9.83it/s] 20it [00:02, 9.83it/s] 21it [00:02, 9.84it/s] 22it [00:02, 9.81it/s] 23it [00:02, 9.83it/s] 24it [00:02, 9.82it/s] 25it [00:02, 9.83it/s] 26it [00:02, 9.84it/s] 27it [00:02, 9.68it/s] 28it [00:02, 9.70it/s] 29it [00:03, 9.76it/s] 30it [00:03, 9.79it/s] 31it [00:03, 9.83it/s] 32it [00:03, 9.80it/s] 33it [00:03, 9.83it/s] 34it [00:03, 9.81it/s] 35it [00:03, 9.83it/s] 36it [00:03, 9.79it/s] 37it [00:03, 9.82it/s] 38it [00:03, 9.80it/s] 39it [00:04, 9.83it/s] 40it [00:04, 9.84it/s] 41it [00:04, 9.86it/s] 42it [00:04, 9.87it/s] 43it [00:04, 9.89it/s] 44it [00:04, 9.88it/s] 45it [00:04, 9.65it/s] 46it [00:04, 9.71it/s] 47it [00:04, 9.58it/s] 48it [00:04, 9.62it/s] 49it [00:05, 9.66it/s] 50it [00:05, 9.73it/s]2025-05-26 03:47:00,920 - INFO - [Epoch 093 | Batch 0050] IWAE-loss 4193.2715 | mean log_px -0.0235 | KL -2915.12 + 51it [00:05, 9.75it/s] 52it [00:05, 9.78it/s] 53it [00:05, 9.82it/s] 54it [00:05, 9.83it/s] 55it [00:05, 9.77it/s] 56it [00:05, 9.80it/s] 57it [00:05, 9.83it/s] 58it [00:05, 9.85it/s] 59it [00:06, 9.87it/s] 60it [00:06, 9.67it/s] 61it [00:06, 9.65it/s] 62it [00:06, 9.71it/s] 63it [00:06, 9.76it/s] 64it [00:06, 9.76it/s] 65it [00:06, 9.79it/s] 66it [00:06, 9.81it/s] 67it [00:06, 9.80it/s] 68it [00:07, 9.82it/s] 69it [00:07, 9.79it/s] 70it [00:07, 9.43it/s] 71it [00:07, 9.52it/s] 72it [00:07, 9.57it/s] 73it [00:07, 9.66it/s] 74it [00:07, 9.73it/s] 75it [00:07, 9.75it/s] 76it [00:07, 9.78it/s] 77it [00:07, 9.81it/s] 78it [00:08, 9.77it/s] 79it [00:08, 9.80it/s] 80it [00:08, 9.82it/s] 81it [00:08, 9.84it/s] 82it [00:08, 9.84it/s] 83it [00:08, 9.83it/s] 84it [00:08, 9.84it/s] 85it [00:08, 9.87it/s] 86it [00:08, 9.88it/s] 87it [00:08, 9.88it/s] 88it [00:09, 9.88it/s] 89it [00:09, 9.90it/s] 90it [00:09, 9.89it/s] 91it [00:09, 9.89it/s] 92it [00:09, 9.88it/s] 93it [00:09, 9.89it/s] 94it [00:09, 9.88it/s] 95it [00:09, 9.89it/s] 96it [00:09, 9.89it/s] 97it [00:09, 9.90it/s] 98it [00:10, 9.89it/s] 99it [00:10, 9.91it/s] 100it [00:10, 9.90it/s]2025-05-26 03:47:06,017 - INFO - [Epoch 093 | Batch 0100] IWAE-loss 3753.0735 | mean log_px -0.0142 | KL -2914.49 + 101it [00:10, 9.88it/s] 102it [00:10, 9.87it/s] 103it [00:10, 9.90it/s] 104it [00:10, 9.89it/s] 105it [00:10, 9.89it/s] 106it [00:10, 9.89it/s] 107it [00:10, 9.90it/s] 108it [00:11, 9.88it/s] 109it [00:11, 9.89it/s] 110it [00:11, 9.79it/s] 111it [00:11, 9.66it/s] 112it [00:11, 9.38it/s] 113it [00:11, 9.47it/s] 114it [00:11, 9.55it/s] 115it [00:11, 9.62it/s] 116it [00:11, 9.64it/s] 117it [00:12, 9.66it/s] 118it [00:12, 9.68it/s] 119it [00:12, 9.70it/s] 120it [00:12, 9.71it/s] 121it [00:12, 9.71it/s] 122it [00:12, 9.68it/s] 123it [00:12, 9.71it/s] 124it [00:12, 9.74it/s] 125it [00:12, 9.80it/s] 126it [00:12, 9.83it/s] 127it [00:13, 9.86it/s] 128it [00:13, 9.86it/s] 129it [00:13, 9.89it/s] 130it [00:13, 9.90it/s] 131it [00:13, 9.91it/s] 132it [00:13, 9.74it/s] 133it [00:13, 9.69it/s] 134it [00:13, 9.72it/s] 135it [00:13, 9.77it/s] 136it [00:13, 9.75it/s] 137it [00:14, 9.79it/s] 138it [00:14, 9.80it/s] 139it [00:14, 9.82it/s] 140it [00:14, 9.83it/s] 141it [00:14, 9.85it/s] 142it [00:14, 9.87it/s] 143it [00:14, 9.83it/s] 144it [00:14, 9.82it/s] 145it [00:14, 9.84it/s] 146it [00:14, 9.82it/s] 147it [00:15, 9.84it/s] 148it [00:15, 9.85it/s] 149it [00:15, 9.89it/s] 150it [00:15, 9.90it/s]2025-05-26 03:47:11,129 - INFO - [Epoch 093 | Batch 0150] IWAE-loss 3694.4592 | mean log_px -0.0135 | KL -2910.63 + 151it [00:15, 9.89it/s] 152it [00:15, 9.89it/s] 153it [00:15, 9.91it/s] 154it [00:15, 9.92it/s] 155it [00:15, 9.93it/s] 156it [00:15, 9.92it/s] 157it [00:16, 9.93it/s] 158it [00:16, 9.77it/s] 159it [00:16, 9.78it/s] 160it [00:16, 9.80it/s] 161it [00:16, 9.84it/s] 162it [00:16, 9.87it/s] 163it [00:16, 9.88it/s] 164it [00:16, 9.89it/s] 165it [00:16, 9.91it/s] 166it [00:17, 9.90it/s] 167it [00:17, 9.91it/s] 168it [00:17, 9.92it/s] 169it [00:17, 9.93it/s] 170it [00:17, 9.92it/s] 171it [00:17, 9.92it/s] 172it [00:17, 9.92it/s] 173it [00:17, 9.94it/s] 174it [00:17, 9.94it/s] 175it [00:17, 9.94it/s] 176it [00:18, 9.94it/s] 177it [00:18, 9.94it/s] 178it [00:18, 9.93it/s] 179it [00:18, 9.90it/s] 180it [00:18, 9.90it/s] 181it [00:18, 9.90it/s] 182it [00:18, 9.90it/s] 183it [00:18, 9.91it/s] 184it [00:18, 9.78it/s] 185it [00:18, 9.68it/s] 186it [00:19, 9.69it/s] 187it [00:19, 9.77it/s] 188it [00:19, 9.81it/s] 189it [00:19, 9.85it/s] 190it [00:19, 9.87it/s] 191it [00:19, 9.89it/s] 192it [00:19, 9.88it/s] 193it [00:19, 9.90it/s] 194it [00:19, 9.90it/s] 195it [00:19, 9.41it/s] 196it [00:20, 9.75it/s] +2025-05-26 03:47:15,798 - INFO - Epoch: 93, Objective: tensor([3518.6760], device='cuda:0', grad_fn=), Loss: 0.009369171224534512, KL/n: 59.381324768066406 + 0it [00:00, ?it/s]2025-05-26 03:47:16,259 - INFO - [Epoch 094 | Batch 0000] IWAE-loss 3675.7261 | mean log_px -0.0113 | KL -2903.85 + 1it [00:00, 5.34it/s] 2it [00:00, 7.14it/s] 3it [00:00, 8.18it/s] 4it [00:00, 8.76it/s] 5it [00:00, 9.11it/s] 6it [00:00, 9.33it/s] 7it [00:00, 9.49it/s] 8it [00:00, 9.58it/s] 9it [00:01, 9.63it/s] 10it [00:01, 9.68it/s] 11it [00:01, 9.73it/s] 12it [00:01, 9.74it/s] 13it [00:01, 9.77it/s] 14it [00:01, 9.58it/s] 15it [00:01, 9.60it/s] 16it [00:01, 9.65it/s] 17it [00:01, 9.72it/s] 18it [00:01, 9.74it/s] 19it [00:02, 9.79it/s] 20it [00:02, 9.81it/s] 21it [00:02, 9.83it/s] 22it [00:02, 9.82it/s] 23it [00:02, 9.85it/s] 24it [00:02, 9.85it/s] 25it [00:02, 9.86it/s] 26it [00:02, 9.87it/s] 27it [00:02, 9.88it/s] 28it [00:02, 9.88it/s] 29it [00:03, 9.89it/s] 30it [00:03, 9.87it/s] 31it [00:03, 9.88it/s] 32it [00:03, 9.89it/s] 33it [00:03, 9.90it/s] 34it [00:03, 9.68it/s] 35it [00:03, 9.74it/s] 36it [00:03, 9.77it/s] 37it [00:03, 9.81it/s] 38it [00:03, 9.82it/s] 39it [00:04, 9.85it/s] 40it [00:04, 9.84it/s] 41it [00:04, 9.87it/s] 42it [00:04, 9.86it/s] 43it [00:04, 9.88it/s] 44it [00:04, 9.87it/s] 45it [00:04, 9.87it/s] 46it [00:04, 9.86it/s] 47it [00:04, 9.86it/s] 48it [00:04, 9.85it/s] 49it [00:05, 9.86it/s] 50it [00:05, 9.86it/s]2025-05-26 03:47:21,358 - INFO - [Epoch 094 | Batch 0050] IWAE-loss 4268.3975 | mean log_px -0.0242 | KL -2905.98 + 51it [00:05, 9.85it/s] 52it [00:05, 9.85it/s] 53it [00:05, 9.85it/s] 54it [00:05, 9.85it/s] 55it [00:05, 9.87it/s] 56it [00:05, 9.86it/s] 57it [00:05, 9.85it/s] 58it [00:05, 9.85it/s] 59it [00:06, 9.86it/s] 60it [00:06, 9.86it/s] 61it [00:06, 9.86it/s] 62it [00:06, 9.85it/s] 63it [00:06, 9.85it/s] 64it [00:06, 9.84it/s] 65it [00:06, 9.84it/s] 66it [00:06, 9.83it/s] 67it [00:06, 9.86it/s] 68it [00:07, 9.84it/s] 69it [00:07, 9.70it/s] 70it [00:07, 9.73it/s] 71it [00:07, 9.77it/s] 72it [00:07, 9.80it/s] 73it [00:07, 9.82it/s] 74it [00:07, 9.81it/s] 75it [00:07, 9.82it/s] 76it [00:07, 9.81it/s] 77it [00:07, 9.85it/s] 78it [00:08, 9.84it/s] 79it [00:08, 9.83it/s] 80it [00:08, 9.82it/s] 81it [00:08, 9.83it/s] 82it [00:08, 9.82it/s] 83it [00:08, 9.82it/s] 84it [00:08, 9.82it/s] 85it [00:08, 9.84it/s] 86it [00:08, 9.84it/s] 87it [00:08, 9.84it/s] 88it [00:09, 9.84it/s] 89it [00:09, 9.85it/s] 90it [00:09, 9.84it/s] 91it [00:09, 9.85it/s] 92it [00:09, 9.84it/s] 93it [00:09, 9.85it/s] 94it [00:09, 9.83it/s] 95it [00:09, 9.84it/s] 96it [00:09, 9.83it/s] 97it [00:09, 9.84it/s] 98it [00:10, 9.84it/s] 99it [00:10, 9.85it/s] 100it [00:10, 9.85it/s]2025-05-26 03:47:26,444 - INFO - [Epoch 094 | Batch 0100] IWAE-loss 3504.3542 | mean log_px -0.0100 | KL -2904.47 + 101it [00:10, 9.83it/s] 102it [00:10, 9.83it/s] 103it [00:10, 9.85it/s] 104it [00:10, 9.88it/s] 106it [00:10, 9.96it/s] 108it [00:11, 10.01it/s] 110it [00:11, 10.03it/s] 112it [00:11, 10.05it/s] 114it [00:11, 9.69it/s] 116it [00:11, 9.81it/s] 118it [00:12, 9.89it/s] 120it [00:12, 9.94it/s] 122it [00:12, 9.98it/s] 124it [00:12, 10.00it/s] 126it [00:12, 10.00it/s] 128it [00:13, 10.01it/s] 130it [00:13, 9.69it/s] 131it [00:13, 9.50it/s] 132it [00:13, 9.59it/s] 133it [00:13, 9.22it/s] 134it [00:13, 9.39it/s] 136it [00:13, 9.65it/s] 138it [00:14, 9.80it/s] 140it [00:14, 9.88it/s] 142it [00:14, 9.91it/s] 144it [00:14, 9.98it/s] 146it [00:14, 10.01it/s] 148it [00:15, 9.69it/s] 150it [00:15, 9.80it/s]2025-05-26 03:47:31,532 - INFO - [Epoch 094 | Batch 0150] IWAE-loss 3472.2581 | mean log_px -0.0113 | KL -2900.82 + 151it [00:15, 9.83it/s] 153it [00:15, 9.62it/s] 155it [00:15, 9.76it/s] 156it [00:15, 9.80it/s] 158it [00:16, 9.89it/s] 159it [00:16, 9.90it/s] 160it [00:16, 9.91it/s] 162it [00:16, 9.96it/s] 163it [00:16, 9.97it/s] 165it [00:16, 10.00it/s] 167it [00:17, 10.03it/s] 169it [00:17, 9.66it/s] 170it [00:17, 9.72it/s] 171it [00:17, 9.75it/s] 172it [00:17, 9.28it/s] 174it [00:17, 9.58it/s] 175it [00:17, 9.67it/s] 176it [00:18, 9.74it/s] 177it [00:18, 9.80it/s] 178it [00:18, 9.84it/s] 179it [00:18, 9.85it/s] 180it [00:18, 9.89it/s] 181it [00:18, 9.77it/s] 182it [00:18, 9.69it/s] 183it [00:18, 9.72it/s] 184it [00:18, 9.77it/s] 185it [00:18, 9.34it/s] 186it [00:19, 9.50it/s] 187it [00:19, 9.64it/s] 189it [00:19, 9.83it/s] 191it [00:19, 9.46it/s] 192it [00:19, 9.57it/s] 194it [00:19, 9.74it/s] 195it [00:20, 9.03it/s] 196it [00:20, 9.71it/s] +2025-05-26 03:47:36,291 - INFO - Epoch: 94, Objective: tensor([3317.0979], device='cuda:0', grad_fn=), Loss: 0.006679388228803873, KL/n: 59.15084457397461 + 0it [00:00, ?it/s]2025-05-26 03:47:36,564 - INFO - [Epoch 095 | Batch 0000] IWAE-loss 3526.1443 | mean log_px -0.0090 | KL -2896.83 + 1it [00:00, 5.45it/s] 2it [00:00, 6.67it/s] 3it [00:00, 7.86it/s] 5it [00:00, 8.98it/s] 6it [00:00, 9.24it/s] 8it [00:00, 9.61it/s] 10it [00:01, 9.78it/s] 12it [00:01, 9.88it/s] 14it [00:01, 9.93it/s] 16it [00:01, 9.97it/s] 18it [00:01, 9.60it/s] 19it [00:02, 9.51it/s] 20it [00:02, 9.01it/s] 21it [00:02, 9.18it/s] 22it [00:02, 9.29it/s] 23it [00:02, 9.43it/s] 24it [00:02, 9.17it/s] 25it [00:02, 9.33it/s] 26it [00:02, 9.47it/s] 27it [00:02, 9.58it/s] 28it [00:03, 9.59it/s] 29it [00:03, 9.04it/s] 30it [00:03, 9.22it/s] 31it [00:03, 9.36it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.50it/s] 34it [00:03, 9.52it/s] 35it [00:03, 9.15it/s] 36it [00:03, 9.36it/s] 37it [00:03, 9.53it/s] 38it [00:04, 9.64it/s] 39it [00:04, 9.73it/s] 40it [00:04, 9.13it/s] 41it [00:04, 9.37it/s] 42it [00:04, 9.52it/s] 43it [00:04, 9.65it/s] 44it [00:04, 9.74it/s] 45it [00:04, 9.80it/s] 46it [00:04, 9.82it/s] 47it [00:04, 9.86it/s] 48it [00:05, 9.89it/s] 50it [00:05, 9.93it/s]2025-05-26 03:47:41,785 - INFO - [Epoch 095 | Batch 0050] IWAE-loss 3349.6074 | mean log_px -0.0067 | KL -2888.48 + 51it [00:05, 9.39it/s] 52it [00:05, 9.54it/s] 53it [00:05, 9.65it/s] 54it [00:05, 9.73it/s] 55it [00:05, 9.31it/s] 56it [00:05, 9.48it/s] 57it [00:06, 9.63it/s] 58it [00:06, 9.71it/s] 59it [00:06, 9.78it/s] 60it [00:06, 9.83it/s] 61it [00:06, 9.87it/s] 62it [00:06, 9.88it/s] 63it [00:06, 9.88it/s] 64it [00:06, 9.29it/s] 66it [00:06, 9.61it/s] 67it [00:07, 9.67it/s] 68it [00:07, 9.18it/s] 69it [00:07, 9.38it/s] 70it [00:07, 9.54it/s] 71it [00:07, 9.66it/s] 72it [00:07, 9.68it/s] 73it [00:07, 9.77it/s] 74it [00:07, 9.79it/s] 76it [00:08, 9.89it/s] 77it [00:08, 9.38it/s] 78it [00:08, 9.51it/s] 79it [00:08, 9.63it/s] 80it [00:08, 9.24it/s] 81it [00:08, 9.43it/s] 82it [00:08, 9.57it/s] 84it [00:08, 9.77it/s] 85it [00:08, 9.82it/s] 86it [00:09, 9.86it/s] 87it [00:09, 9.89it/s] 88it [00:09, 9.33it/s] 90it [00:09, 9.62it/s] 91it [00:09, 9.70it/s] 92it [00:09, 9.26it/s] 93it [00:09, 9.44it/s] 94it [00:09, 9.57it/s] 95it [00:09, 9.68it/s] 96it [00:10, 9.77it/s] 98it [00:10, 9.39it/s] 100it [00:10, 9.63it/s]2025-05-26 03:47:47,003 - INFO - [Epoch 095 | Batch 0100] IWAE-loss 3535.2415 | mean log_px -0.0105 | KL -2890.72 + 101it [00:10, 9.67it/s] 102it [00:10, 9.74it/s] 103it [00:10, 9.79it/s] 105it [00:11, 9.90it/s] 106it [00:11, 9.92it/s] 107it [00:11, 9.92it/s] 108it [00:11, 9.91it/s] 109it [00:11, 9.33it/s] 110it [00:11, 9.50it/s] 112it [00:11, 9.74it/s] 114it [00:11, 9.43it/s] 115it [00:12, 9.49it/s] 116it [00:12, 9.49it/s] 117it [00:12, 9.59it/s] 118it [00:12, 9.70it/s] 120it [00:12, 9.85it/s] 121it [00:12, 9.86it/s] 122it [00:12, 9.32it/s] 124it [00:13, 9.57it/s] 125it [00:13, 9.65it/s] 126it [00:13, 9.72it/s] 128it [00:13, 9.86it/s] 130it [00:13, 9.90it/s] 131it [00:13, 9.81it/s] 132it [00:13, 9.45it/s] 134it [00:14, 9.68it/s] 136it [00:14, 9.81it/s] 138it [00:14, 9.88it/s] 139it [00:14, 9.90it/s] 141it [00:14, 9.94it/s] 142it [00:14, 9.94it/s] 144it [00:15, 9.97it/s] 145it [00:15, 9.97it/s] 146it [00:15, 9.96it/s] 147it [00:15, 9.96it/s] 149it [00:15, 9.99it/s] 150it [00:15, 9.98it/s]2025-05-26 03:47:52,111 - INFO - [Epoch 095 | Batch 0150] IWAE-loss 4350.0732 | mean log_px -0.0231 | KL -2887.25 + 151it [00:15, 9.43it/s] 153it [00:15, 9.67it/s] 154it [00:16, 9.73it/s] 155it [00:16, 9.77it/s] 156it [00:16, 9.83it/s] 157it [00:16, 9.86it/s] 158it [00:16, 9.89it/s] 159it [00:16, 9.76it/s] 160it [00:16, 9.31it/s] 161it [00:16, 9.50it/s] 162it [00:16, 9.63it/s] 164it [00:17, 9.81it/s] 165it [00:17, 9.86it/s] 166it [00:17, 9.88it/s] 167it [00:17, 9.90it/s] 169it [00:17, 9.96it/s] 170it [00:17, 9.97it/s] 171it [00:17, 9.41it/s] 172it [00:17, 9.55it/s] 173it [00:18, 9.62it/s] 174it [00:18, 9.72it/s] 175it [00:18, 9.33it/s] 176it [00:18, 9.49it/s] 177it [00:18, 9.63it/s] 178it [00:18, 9.12it/s] 180it [00:18, 9.51it/s] 181it [00:18, 9.22it/s] 182it [00:18, 9.40it/s] 183it [00:19, 9.55it/s] 184it [00:19, 9.65it/s] 186it [00:19, 9.80it/s] 187it [00:19, 9.44it/s] 188it [00:19, 9.55it/s] 189it [00:19, 9.66it/s] 190it [00:19, 9.74it/s] 191it [00:19, 9.19it/s] 192it [00:20, 9.39it/s] 193it [00:20, 9.56it/s] 195it [00:20, 9.43it/s] 196it [00:20, 9.22it/s] 196it [00:20, 9.56it/s] +2025-05-26 03:47:56,925 - INFO - Epoch: 95, Objective: tensor([3332.1047], device='cuda:0', grad_fn=), Loss: 0.008258700370788574, KL/n: 58.8862190246582 + 0it [00:00, ?it/s]2025-05-26 03:47:57,394 - INFO - [Epoch 096 | Batch 0000] IWAE-loss 4336.8301 | mean log_px -0.0305 | KL -2885.20 + 1it [00:00, 5.34it/s] 2it [00:00, 6.76it/s] 4it [00:00, 8.49it/s] 6it [00:00, 9.16it/s] 7it [00:00, 8.89it/s] 8it [00:00, 9.16it/s] 10it [00:01, 9.52it/s] 12it [00:01, 9.73it/s] 14it [00:01, 9.84it/s] 15it [00:01, 9.44it/s] 16it [00:01, 9.49it/s] 18it [00:01, 9.67it/s] 20it [00:02, 9.75it/s] 22it [00:02, 9.82it/s] 23it [00:02, 9.84it/s] 24it [00:02, 9.87it/s] 25it [00:02, 9.52it/s] 26it [00:02, 9.63it/s] 28it [00:02, 9.79it/s] 29it [00:03, 9.84it/s] 30it [00:03, 9.87it/s] 32it [00:03, 9.47it/s] 33it [00:03, 9.55it/s] 34it [00:03, 9.65it/s] 36it [00:03, 9.82it/s] 37it [00:03, 9.86it/s] 38it [00:03, 9.87it/s] 39it [00:04, 9.90it/s] 40it [00:04, 9.43it/s] 42it [00:04, 9.68it/s] 43it [00:04, 9.74it/s] 44it [00:04, 9.74it/s] 45it [00:04, 9.75it/s] 46it [00:04, 9.35it/s] 48it [00:05, 9.64it/s] 49it [00:05, 9.71it/s] 50it [00:05, 9.22it/s]2025-05-26 03:48:02,579 - INFO - [Epoch 096 | Batch 0050] IWAE-loss 3660.0618 | mean log_px -0.0111 | KL -2883.02 + 51it [00:05, 9.33it/s] 52it [00:05, 9.50it/s] 54it [00:05, 9.72it/s] 55it [00:05, 9.78it/s] 56it [00:05, 9.82it/s] 57it [00:05, 9.31it/s] 59it [00:06, 9.60it/s] 61it [00:06, 9.77it/s] 62it [00:06, 9.80it/s] 63it [00:06, 9.83it/s] 64it [00:06, 9.84it/s] 66it [00:06, 9.91it/s] 68it [00:07, 9.54it/s] 69it [00:07, 9.63it/s] 70it [00:07, 9.56it/s] 71it [00:07, 9.52it/s] 72it [00:07, 9.03it/s] 73it [00:07, 9.27it/s] 74it [00:07, 9.45it/s] 75it [00:07, 9.60it/s] 76it [00:07, 9.65it/s] 77it [00:08, 9.63it/s] 78it [00:08, 9.50it/s] 80it [00:08, 9.75it/s] 81it [00:08, 9.29it/s] 82it [00:08, 9.44it/s] 83it [00:08, 9.58it/s] 84it [00:08, 9.68it/s] 86it [00:08, 9.84it/s] 87it [00:09, 9.78it/s] 88it [00:09, 9.40it/s] 89it [00:09, 9.54it/s] 90it [00:09, 9.64it/s] 92it [00:09, 9.80it/s] 94it [00:09, 9.88it/s] 96it [00:10, 9.93it/s] 98it [00:10, 9.96it/s] 99it [00:10, 9.95it/s] 100it [00:10, 9.95it/s]2025-05-26 03:48:07,732 - INFO - [Epoch 096 | Batch 0100] IWAE-loss 3525.8738 | mean log_px -0.0101 | KL -2880.33 + 101it [00:10, 9.44it/s] 102it [00:10, 9.57it/s] 104it [00:10, 9.75it/s] 105it [00:10, 9.78it/s] 106it [00:11, 9.83it/s] 107it [00:11, 9.79it/s] 109it [00:11, 9.90it/s] 110it [00:11, 9.92it/s] 111it [00:11, 9.86it/s] 112it [00:11, 9.81it/s] 113it [00:11, 9.81it/s] 114it [00:11, 9.22it/s] 115it [00:11, 9.42it/s] 116it [00:12, 9.45it/s] 117it [00:12, 9.10it/s] 118it [00:12, 9.18it/s] 119it [00:12, 9.18it/s] 120it [00:12, 9.28it/s] 121it [00:12, 9.41it/s] 122it [00:12, 9.03it/s] 123it [00:12, 9.18it/s] 124it [00:12, 9.31it/s] 125it [00:13, 9.44it/s] 126it [00:13, 9.52it/s] 127it [00:13, 9.58it/s] 128it [00:13, 9.60it/s] 129it [00:13, 9.62it/s] 130it [00:13, 9.64it/s] 131it [00:13, 9.56it/s] 132it [00:13, 9.47it/s] 133it [00:13, 9.02it/s] 134it [00:14, 9.26it/s] 135it [00:14, 9.45it/s] 136it [00:14, 9.54it/s] 137it [00:14, 9.63it/s] 138it [00:14, 9.07it/s] 139it [00:14, 9.28it/s] 140it [00:14, 9.42it/s] 141it [00:14, 9.48it/s] 142it [00:14, 8.94it/s] 143it [00:14, 9.16it/s] 144it [00:15, 9.33it/s] 146it [00:15, 9.65it/s] 148it [00:15, 9.79it/s] 149it [00:15, 9.83it/s] 150it [00:15, 9.85it/s]2025-05-26 03:48:13,000 - INFO - [Epoch 096 | Batch 0150] IWAE-loss 3406.4150 | mean log_px -0.0099 | KL -2879.07 + 151it [00:15, 9.34it/s] 153it [00:16, 9.63it/s] 154it [00:16, 9.70it/s] 156it [00:16, 9.83it/s] 157it [00:16, 9.87it/s] 158it [00:16, 9.88it/s] 159it [00:16, 9.91it/s] 160it [00:16, 9.92it/s] 161it [00:16, 9.91it/s] 162it [00:16, 9.52it/s] 164it [00:17, 9.72it/s] 166it [00:17, 9.84it/s] 167it [00:17, 9.86it/s] 169it [00:17, 9.93it/s] 170it [00:17, 9.93it/s] 172it [00:17, 9.96it/s] 174it [00:18, 9.99it/s] 176it [00:18, 10.00it/s] 178it [00:18, 10.00it/s] 179it [00:18, 9.99it/s] 181it [00:18, 10.01it/s] 182it [00:18, 10.00it/s] 183it [00:19, 9.98it/s] 184it [00:19, 9.98it/s] 185it [00:19, 9.98it/s] 186it [00:19, 9.98it/s] 187it [00:19, 9.98it/s] 188it [00:19, 9.98it/s] 190it [00:19, 10.00it/s] 191it [00:19, 9.99it/s] 192it [00:19, 9.97it/s] 193it [00:20, 9.98it/s] 194it [00:20, 9.97it/s] 195it [00:20, 9.55it/s] 196it [00:20, 9.28it/s] 196it [00:20, 9.59it/s] +2025-05-26 03:48:17,680 - INFO - Epoch: 96, Objective: tensor([3542.8840], device='cuda:0', grad_fn=), Loss: 0.012501702643930912, KL/n: 58.68415069580078 + 0it [00:00, ?it/s]2025-05-26 03:48:17,962 - INFO - [Epoch 097 | Batch 0000] IWAE-loss 4043.2427 | mean log_px -0.0168 | KL -2875.78 + 1it [00:00, 5.34it/s] 2it [00:00, 6.77it/s] 4it [00:00, 8.53it/s] 6it [00:00, 9.22it/s] 8it [00:00, 9.55it/s] 10it [00:01, 9.72it/s] 12it [00:01, 9.85it/s] 14it [00:01, 9.55it/s] 16it [00:01, 9.72it/s] 18it [00:01, 9.84it/s] 20it [00:02, 9.92it/s] 22it [00:02, 9.95it/s] 23it [00:02, 9.91it/s] 24it [00:02, 9.91it/s] 26it [00:02, 9.67it/s] 28it [00:02, 9.80it/s] 29it [00:03, 9.83it/s] 31it [00:03, 9.92it/s] 33it [00:03, 9.98it/s] 35it [00:03, 10.03it/s] 37it [00:03, 10.06it/s] 39it [00:04, 10.07it/s] 41it [00:04, 10.08it/s] 43it [00:04, 10.08it/s] 45it [00:04, 9.74it/s] 47it [00:04, 9.85it/s] 49it [00:05, 9.92it/s]2025-05-26 03:48:23,012 - INFO - [Epoch 097 | Batch 0050] IWAE-loss 3348.9727 | mean log_px -0.0105 | KL -2877.25 + 51it [00:05, 9.63it/s] 53it [00:05, 9.76it/s] 55it [00:05, 9.86it/s] 57it [00:05, 9.94it/s] 59it [00:06, 9.98it/s] 61it [00:06, 10.02it/s] 63it [00:06, 10.03it/s] 65it [00:06, 9.80it/s] 67it [00:06, 9.89it/s] 68it [00:06, 9.89it/s] 70it [00:07, 9.95it/s] 72it [00:07, 9.99it/s] 74it [00:07, 10.03it/s] 76it [00:07, 10.04it/s] 78it [00:07, 10.05it/s] 80it [00:08, 9.72it/s] 82it [00:08, 9.83it/s] 84it [00:08, 9.92it/s] 86it [00:08, 9.97it/s] 88it [00:08, 10.00it/s] 90it [00:09, 10.03it/s] 92it [00:09, 10.05it/s] 94it [00:09, 9.72it/s] 96it [00:09, 9.83it/s] 97it [00:09, 9.50it/s] 99it [00:10, 9.67it/s]2025-05-26 03:48:28,080 - INFO - [Epoch 097 | Batch 0100] IWAE-loss 3721.4724 | mean log_px -0.0175 | KL -2865.73 + 101it [00:10, 9.44it/s] 102it [00:10, 9.53it/s] 103it [00:10, 9.55it/s] 104it [00:10, 9.24it/s] 105it [00:10, 9.41it/s] 106it [00:10, 9.53it/s] 107it [00:10, 9.64it/s] 108it [00:11, 9.27it/s] 109it [00:11, 9.44it/s] 110it [00:11, 9.57it/s] 111it [00:11, 9.02it/s] 112it [00:11, 9.26it/s] 113it [00:11, 9.40it/s] 114it [00:11, 9.54it/s] 115it [00:11, 9.02it/s] 116it [00:11, 9.26it/s] 117it [00:12, 9.47it/s] 119it [00:12, 9.75it/s] 121it [00:12, 9.88it/s] 123it [00:12, 9.95it/s] 124it [00:12, 9.61it/s] 126it [00:12, 9.79it/s] 128it [00:13, 9.89it/s] 130it [00:13, 9.96it/s] 132it [00:13, 10.01it/s] 134it [00:13, 10.04it/s] 135it [00:13, 9.98it/s] 136it [00:13, 9.93it/s] 138it [00:14, 9.98it/s] 140it [00:14, 9.63it/s] 142it [00:14, 9.78it/s] 144it [00:14, 9.88it/s] 146it [00:14, 9.94it/s] 148it [00:15, 9.99it/s] 149it [00:15, 9.96it/s] 150it [00:15, 9.51it/s]2025-05-26 03:48:33,253 - INFO - [Epoch 097 | Batch 0150] IWAE-loss 3712.6641 | mean log_px -0.0218 | KL -2866.04 + 151it [00:15, 9.57it/s] 152it [00:15, 9.66it/s] 154it [00:15, 9.82it/s] 155it [00:15, 9.43it/s] 157it [00:16, 9.65it/s] 158it [00:16, 9.71it/s] 159it [00:16, 9.75it/s] 160it [00:16, 9.81it/s] 162it [00:16, 9.91it/s] 163it [00:16, 9.54it/s] 165it [00:16, 9.76it/s] 167it [00:17, 9.88it/s] 169it [00:17, 9.96it/s] 171it [00:17, 10.00it/s] 173it [00:17, 10.04it/s] 175it [00:17, 10.06it/s] 177it [00:18, 9.80it/s] 179it [00:18, 9.89it/s] 180it [00:18, 9.60it/s] 182it [00:18, 9.77it/s] 184it [00:18, 9.87it/s] 185it [00:18, 9.80it/s] 186it [00:19, 9.38it/s] 187it [00:19, 9.45it/s] 189it [00:19, 9.71it/s] 191it [00:19, 9.85it/s] 193it [00:19, 9.95it/s] 195it [00:19, 9.73it/s] 196it [00:20, 9.74it/s] +2025-05-26 03:48:37,942 - INFO - Epoch: 97, Objective: tensor([3453.2244], device='cuda:0', grad_fn=), Loss: 0.01020082551985979, KL/n: 58.48168182373047 + 0it [00:00, ?it/s]2025-05-26 03:48:38,405 - INFO - [Epoch 098 | Batch 0000] IWAE-loss 3513.9075 | mean log_px -0.0093 | KL -2864.63 + 1it [00:00, 4.67it/s] 2it [00:00, 6.74it/s] 4it [00:00, 8.49it/s] 5it [00:00, 8.85it/s] 6it [00:00, 9.15it/s] 7it [00:00, 9.35it/s] 8it [00:00, 9.52it/s] 9it [00:01, 9.64it/s] 10it [00:01, 9.69it/s] 11it [00:01, 9.73it/s] 12it [00:01, 9.79it/s] 14it [00:01, 9.90it/s] 15it [00:01, 9.74it/s] 16it [00:01, 9.22it/s] 17it [00:01, 9.40it/s] 19it [00:02, 9.65it/s] 20it [00:02, 9.70it/s] 22it [00:02, 9.80it/s] 23it [00:02, 9.77it/s] 24it [00:02, 9.75it/s] 25it [00:02, 9.76it/s] 26it [00:02, 9.76it/s] 27it [00:02, 9.19it/s] 28it [00:03, 9.34it/s] 29it [00:03, 9.40it/s] 30it [00:03, 9.49it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.66it/s] 33it [00:03, 9.70it/s] 34it [00:03, 9.03it/s] 35it [00:03, 9.25it/s] 36it [00:03, 9.39it/s] 37it [00:03, 9.47it/s] 38it [00:04, 9.56it/s] 39it [00:04, 8.95it/s] 40it [00:04, 9.06it/s] 41it [00:04, 9.25it/s] 42it [00:04, 9.45it/s] 44it [00:04, 9.73it/s] 46it [00:04, 9.87it/s] 48it [00:05, 9.95it/s] 50it [00:05, 10.02it/s]2025-05-26 03:48:43,607 - INFO - [Epoch 098 | Batch 0050] IWAE-loss 4490.0361 | mean log_px -0.0283 | KL -2859.88 + 51it [00:05, 10.01it/s] 53it [00:05, 10.04it/s] 55it [00:05, 9.62it/s] 56it [00:05, 9.30it/s] 58it [00:06, 9.52it/s] 59it [00:06, 9.21it/s] 61it [00:06, 9.51it/s] 63it [00:06, 9.71it/s] 65it [00:06, 9.84it/s] 67it [00:07, 9.94it/s] 69it [00:07, 9.99it/s] 71it [00:07, 10.03it/s] 72it [00:07, 9.71it/s] 74it [00:07, 9.85it/s] 76it [00:07, 9.94it/s] 78it [00:08, 10.00it/s] 80it [00:08, 10.04it/s] 82it [00:08, 10.08it/s] 84it [00:08, 10.09it/s] 86it [00:08, 10.10it/s] 88it [00:09, 10.11it/s] 90it [00:09, 10.11it/s] 92it [00:09, 9.77it/s] 94it [00:09, 9.84it/s] 96it [00:09, 9.88it/s] 97it [00:10, 9.89it/s] 98it [00:10, 9.90it/s] 99it [00:10, 9.90it/s] 100it [00:10, 9.91it/s]2025-05-26 03:48:48,681 - INFO - [Epoch 098 | Batch 0100] IWAE-loss 3895.4548 | mean log_px -0.0165 | KL -2864.15 + 101it [00:10, 9.51it/s] 102it [00:10, 9.63it/s] 104it [00:10, 9.33it/s] 105it [00:10, 9.48it/s] 106it [00:10, 9.59it/s] 107it [00:11, 9.33it/s] 108it [00:11, 9.49it/s] 109it [00:11, 9.18it/s] 110it [00:11, 9.35it/s] 112it [00:11, 9.66it/s] 113it [00:11, 9.26it/s] 115it [00:11, 9.58it/s] 116it [00:12, 9.22it/s] 118it [00:12, 9.55it/s] 120it [00:12, 9.74it/s] 122it [00:12, 9.87it/s] 124it [00:12, 9.95it/s] 126it [00:13, 10.00it/s] 128it [00:13, 10.03it/s] 130it [00:13, 10.06it/s] 132it [00:13, 10.09it/s] 134it [00:13, 10.10it/s] 136it [00:14, 9.76it/s] 138it [00:14, 9.86it/s] 140it [00:14, 9.92it/s] 142it [00:14, 9.97it/s] 144it [00:14, 10.01it/s] 146it [00:15, 10.04it/s] 148it [00:15, 10.06it/s] 150it [00:15, 9.92it/s]2025-05-26 03:48:53,801 - INFO - [Epoch 098 | Batch 0150] IWAE-loss 3752.1211 | mean log_px -0.0133 | KL -2858.67 + 151it [00:15, 9.84it/s] 152it [00:15, 9.76it/s] 153it [00:15, 9.34it/s] 154it [00:15, 9.29it/s] 155it [00:16, 9.39it/s] 156it [00:16, 9.46it/s] 157it [00:16, 9.52it/s] 158it [00:16, 9.57it/s] 159it [00:16, 9.02it/s] 160it [00:16, 9.12it/s] 161it [00:16, 9.22it/s] 162it [00:16, 9.19it/s] 163it [00:16, 9.38it/s] 164it [00:16, 9.07it/s] 165it [00:17, 8.94it/s] 166it [00:17, 8.67it/s] 167it [00:17, 8.80it/s] 168it [00:17, 8.53it/s] 169it [00:17, 8.84it/s] 170it [00:17, 9.07it/s] 171it [00:17, 9.24it/s] 172it [00:17, 8.85it/s] 173it [00:18, 9.03it/s] 174it [00:18, 9.23it/s] 175it [00:18, 8.84it/s] 176it [00:18, 9.10it/s] 177it [00:18, 9.29it/s] 178it [00:18, 9.42it/s] 179it [00:18, 8.98it/s] 180it [00:18, 9.15it/s] 181it [00:18, 9.23it/s] 182it [00:19, 8.73it/s] 183it [00:19, 9.00it/s] 184it [00:19, 9.12it/s] 185it [00:19, 9.12it/s] 186it [00:19, 9.30it/s] 187it [00:19, 9.44it/s] 188it [00:19, 9.53it/s] 189it [00:19, 9.59it/s] 190it [00:19, 9.64it/s] 191it [00:19, 9.70it/s] 192it [00:20, 9.71it/s] 193it [00:20, 9.73it/s] 194it [00:20, 9.75it/s] 195it [00:20, 9.31it/s] 196it [00:20, 9.54it/s] +2025-05-26 03:48:58,799 - INFO - Epoch: 98, Objective: tensor([3792.0647], device='cuda:0', grad_fn=), Loss: 0.014100815169513226, KL/n: 58.269466400146484 + 0it [00:00, ?it/s]2025-05-26 03:48:59,084 - INFO - [Epoch 099 | Batch 0000] IWAE-loss 3312.5208 | mean log_px -0.0071 | KL -2853.84 + 1it [00:00, 5.32it/s] 2it [00:00, 6.69it/s] 3it [00:00, 7.49it/s] 4it [00:00, 8.25it/s] 5it [00:00, 8.18it/s] 6it [00:00, 8.61it/s] 7it [00:00, 8.96it/s] 8it [00:00, 9.18it/s] 9it [00:01, 9.39it/s] 10it [00:01, 8.94it/s] 11it [00:01, 9.18it/s] 12it [00:01, 9.32it/s] 13it [00:01, 9.29it/s] 14it [00:01, 9.27it/s] 15it [00:01, 8.74it/s] 16it [00:01, 8.97it/s] 17it [00:01, 9.05it/s] 18it [00:02, 9.24it/s] 19it [00:02, 8.85it/s] 20it [00:02, 9.08it/s] 21it [00:02, 9.30it/s] 22it [00:02, 9.43it/s] 23it [00:02, 8.99it/s] 24it [00:02, 9.19it/s] 25it [00:02, 9.36it/s] 26it [00:02, 9.49it/s] 27it [00:03, 9.04it/s] 28it [00:03, 9.22it/s] 29it [00:03, 9.40it/s] 30it [00:03, 9.50it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.64it/s] 33it [00:03, 9.68it/s] 34it [00:03, 9.69it/s] 35it [00:03, 9.73it/s] 36it [00:03, 9.74it/s] 37it [00:04, 9.75it/s] 38it [00:04, 9.74it/s] 39it [00:04, 9.77it/s] 40it [00:04, 9.13it/s] 41it [00:04, 9.29it/s] 42it [00:04, 9.41it/s] 43it [00:04, 9.51it/s] 44it [00:04, 9.55it/s] 45it [00:04, 9.60it/s] 46it [00:05, 9.63it/s] 47it [00:05, 9.06it/s] 48it [00:05, 9.21it/s] 49it [00:05, 9.37it/s] 50it [00:05, 9.34it/s]2025-05-26 03:49:04,458 - INFO - [Epoch 099 | Batch 0050] IWAE-loss 3289.7585 | mean log_px -0.0074 | KL -2854.63 + 51it [00:05, 9.32it/s] 52it [00:05, 9.33it/s] 53it [00:05, 9.34it/s] 54it [00:05, 9.36it/s] 55it [00:05, 9.16it/s] 56it [00:06, 8.75it/s] 57it [00:06, 8.96it/s] 58it [00:06, 9.12it/s] 59it [00:06, 8.74it/s] 60it [00:06, 8.93it/s] 61it [00:06, 9.10it/s] 62it [00:06, 8.72it/s] 63it [00:06, 8.94it/s] 64it [00:07, 8.92it/s] 65it [00:07, 8.82it/s] 66it [00:07, 8.45it/s] 67it [00:07, 8.73it/s] 68it [00:07, 8.88it/s] 69it [00:07, 8.99it/s] 70it [00:07, 9.11it/s] 71it [00:07, 8.69it/s] 72it [00:07, 8.80it/s] 73it [00:08, 9.00it/s] 74it [00:08, 9.06it/s] 75it [00:08, 9.15it/s] 76it [00:08, 8.70it/s] 77it [00:08, 8.86it/s] 78it [00:08, 8.95it/s] 79it [00:08, 9.03it/s] 80it [00:08, 9.11it/s] 81it [00:08, 9.12it/s] 82it [00:09, 8.72it/s] 83it [00:09, 9.04it/s] 85it [00:09, 9.48it/s] 87it [00:09, 9.70it/s] 89it [00:09, 9.83it/s] 90it [00:09, 9.85it/s] 91it [00:09, 9.88it/s] 93it [00:10, 9.96it/s] 94it [00:10, 9.96it/s] 96it [00:10, 9.57it/s] 97it [00:10, 9.65it/s] 99it [00:10, 9.81it/s]2025-05-26 03:49:09,858 - INFO - [Epoch 099 | Batch 0100] IWAE-loss 3397.9956 | mean log_px -0.0134 | KL -2848.25 + 101it [00:10, 9.51it/s] 103it [00:11, 9.71it/s] 104it [00:11, 9.77it/s] 106it [00:11, 9.87it/s] 107it [00:11, 9.48it/s] 109it [00:11, 9.69it/s] 111it [00:11, 9.82it/s] 112it [00:12, 9.44it/s] 114it [00:12, 9.66it/s] 115it [00:12, 9.72it/s] 117it [00:12, 9.45it/s] 119it [00:12, 9.66it/s] 121it [00:13, 9.79it/s] 123it [00:13, 9.60it/s] 125it [00:13, 9.74it/s] 126it [00:13, 9.41it/s] 128it [00:13, 9.63it/s] 130it [00:13, 9.78it/s] 132it [00:14, 9.88it/s] 134it [00:14, 9.94it/s] 136it [00:14, 9.98it/s] 138it [00:14, 9.75it/s] 139it [00:14, 9.78it/s] 140it [00:14, 9.76it/s] 141it [00:15, 9.24it/s] 142it [00:15, 9.35it/s] 144it [00:15, 9.63it/s] 146it [00:15, 9.79it/s] 147it [00:15, 9.82it/s] 149it [00:15, 9.92it/s] 150it [00:16, 9.93it/s]2025-05-26 03:49:15,014 - INFO - [Epoch 099 | Batch 0150] IWAE-loss 3503.2078 | mean log_px -0.0094 | KL -2843.22 + 151it [00:16, 9.43it/s] 152it [00:16, 9.54it/s] 154it [00:16, 9.76it/s] 156it [00:16, 9.87it/s] 158it [00:16, 9.63it/s] 160it [00:17, 9.78it/s] 162it [00:17, 9.87it/s] 163it [00:17, 9.49it/s] 165it [00:17, 9.70it/s] 167it [00:17, 9.45it/s] 169it [00:17, 9.65it/s] 171it [00:18, 9.78it/s] 173it [00:18, 9.88it/s] 174it [00:18, 9.65it/s] 176it [00:18, 9.80it/s] 178it [00:18, 9.90it/s] 180it [00:19, 9.96it/s] 181it [00:19, 9.91it/s] 182it [00:19, 9.93it/s] 183it [00:19, 9.47it/s] 185it [00:19, 9.71it/s] 187it [00:19, 9.85it/s] 189it [00:20, 9.93it/s] 191it [00:20, 10.00it/s] 193it [00:20, 9.76it/s] 194it [00:20, 9.80it/s] 195it [00:20, 9.34it/s] 196it [00:20, 9.42it/s] +2025-05-26 03:49:19,749 - INFO - Epoch: 99, Objective: tensor([3379.9856], device='cuda:0', grad_fn=), Loss: 0.00989951379597187, KL/n: 58.04240417480469 +2025-05-26 03:49:19,752 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 2it [00:00, 15.71it/s] 5it [00:00, 22.66it/s] 8it [00:00, 24.55it/s] 11it [00:00, 26.32it/s] 14it [00:00, 27.43it/s] 17it [00:00, 28.00it/s] 20it [00:00, 28.36it/s] 23it [00:00, 28.65it/s] 26it [00:00, 28.84it/s] 29it [00:01, 29.01it/s] 32it [00:01, 29.21it/s] 35it [00:01, 29.28it/s] 38it [00:01, 29.37it/s] 41it [00:01, 29.38it/s] 44it [00:01, 29.38it/s] 47it [00:01, 29.20it/s] 50it [00:01, 29.25it/s] 53it [00:01, 29.21it/s] 56it [00:01, 29.22it/s] 59it [00:02, 28.38it/s] 62it [00:02, 28.35it/s] 65it [00:02, 28.28it/s] 68it [00:02, 28.66it/s] 72it [00:02, 29.16it/s] 76it [00:02, 29.49it/s] 79it [00:02, 29.40it/s] 82it [00:02, 29.40it/s] 85it [00:02, 29.47it/s] 88it [00:03, 29.42it/s] 91it [00:03, 29.45it/s] 94it [00:03, 29.47it/s] 97it [00:03, 29.60it/s] 101it [00:03, 29.78it/s] 105it [00:03, 29.91it/s] 109it [00:03, 30.02it/s] 113it [00:03, 30.06it/s] 117it [00:04, 30.11it/s] 121it [00:04, 30.11it/s] 125it [00:04, 30.16it/s] 129it [00:04, 30.22it/s] 133it [00:04, 30.19it/s] 137it [00:04, 30.11it/s] 141it [00:04, 30.09it/s] 145it [00:04, 30.10it/s] 149it [00:05, 30.14it/s] 153it [00:05, 30.14it/s] 157it [00:05, 30.16it/s] 161it [00:05, 30.20it/s] 165it [00:05, 30.19it/s] 169it [00:05, 30.17it/s] 173it [00:05, 30.22it/s] 177it [00:06, 30.18it/s] 181it [00:06, 30.24it/s] 185it [00:06, 30.21it/s] 189it [00:06, 30.22it/s] 193it [00:06, 30.21it/s] 197it [00:06, 30.26it/s] 201it [00:06, 30.23it/s] 205it [00:06, 30.24it/s] 209it [00:07, 30.21it/s] 213it [00:07, 30.21it/s] 217it [00:07, 30.25it/s] 221it [00:07, 30.18it/s] 225it [00:07, 30.20it/s] 229it [00:07, 30.22it/s] 233it [00:07, 30.22it/s] 237it [00:08, 30.18it/s] 241it [00:08, 30.19it/s] 245it [00:08, 30.17it/s] 249it [00:08, 30.19it/s] 253it [00:08, 30.22it/s] 257it [00:08, 30.20it/s] 261it [00:08, 30.21it/s] 265it [00:08, 30.10it/s] 269it [00:09, 30.09it/s] 273it [00:09, 30.12it/s] 277it [00:09, 30.27it/s] 280it [00:09, 29.39it/s] +2025-05-26 03:49:29,623 - INFO - Epoch: 0, Objective: 0.030164141207933426, Loss: 0.02757582627236843, KL/n: 0.002588314935564995 + 0%| | 0/84 [00:00), Loss: 0.43466299772262573, KL/n: 68.75403594970703 + 0it [00:00, ?it/s]2025-05-26 03:52:02,748 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 28074.5488 | mean log_px -0.3577 | KL -3369.96 + 1it [00:00, 4.86it/s] 2it [00:00, 6.81it/s] 3it [00:00, 7.84it/s] 4it [00:00, 7.90it/s] 5it [00:00, 8.44it/s] 6it [00:00, 8.80it/s] 7it [00:00, 9.06it/s] 8it [00:00, 8.64it/s] 9it [00:01, 8.93it/s] 10it [00:01, 9.07it/s] 11it [00:01, 9.23it/s] 12it [00:01, 8.75it/s] 13it [00:01, 8.95it/s] 14it [00:01, 9.11it/s] 15it [00:01, 9.22it/s] 16it [00:01, 8.84it/s] 17it [00:01, 9.04it/s] 18it [00:02, 9.14it/s] 19it [00:02, 8.80it/s] 20it [00:02, 9.03it/s] 21it [00:02, 9.10it/s] 22it [00:02, 9.26it/s] 23it [00:02, 8.77it/s] 24it [00:02, 8.97it/s] 25it [00:02, 9.07it/s] 26it [00:02, 9.11it/s] 27it [00:03, 9.12it/s] 28it [00:03, 9.17it/s] 29it [00:03, 9.17it/s] 30it [00:03, 9.20it/s] 31it [00:03, 9.25it/s] 32it [00:03, 9.26it/s] 33it [00:03, 9.33it/s] 34it [00:03, 9.31it/s] 35it [00:03, 9.24it/s] 36it [00:04, 9.22it/s] 37it [00:04, 9.22it/s] 38it [00:04, 9.25it/s] 39it [00:04, 9.29it/s] 40it [00:04, 9.30it/s] 41it [00:04, 9.32it/s] 42it [00:04, 9.34it/s] 43it [00:04, 9.37it/s] 44it [00:04, 9.34it/s] 45it [00:05, 9.35it/s] 46it [00:05, 9.34it/s] 47it [00:05, 9.40it/s] 48it [00:05, 9.38it/s] 49it [00:05, 9.43it/s] 50it [00:05, 9.38it/s]2025-05-26 03:52:08,208 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 26761.6230 | mean log_px -0.3389 | KL -3393.95 + 51it [00:05, 9.44it/s] 52it [00:05, 9.48it/s] 53it [00:05, 9.52it/s] 54it [00:05, 9.50it/s] 55it [00:06, 9.47it/s] 56it [00:06, 9.44it/s] 57it [00:06, 9.44it/s] 58it [00:06, 9.47it/s] 59it [00:06, 9.43it/s] 60it [00:06, 9.42it/s] 61it [00:06, 9.47it/s] 62it [00:06, 9.48it/s] 63it [00:06, 9.44it/s] 64it [00:07, 9.44it/s] 65it [00:07, 9.46it/s] 66it [00:07, 9.47it/s] 67it [00:07, 9.49it/s] 68it [00:07, 9.37it/s] 69it [00:07, 9.35it/s] 70it [00:07, 9.35it/s] 71it [00:07, 9.46it/s] 72it [00:07, 9.49it/s] 73it [00:07, 9.49it/s] 74it [00:08, 9.39it/s] 75it [00:08, 9.10it/s] 76it [00:08, 9.20it/s] 77it [00:08, 9.29it/s] 78it [00:08, 9.31it/s] 79it [00:08, 9.21it/s] 80it [00:08, 9.23it/s] 81it [00:08, 9.25it/s] 82it [00:08, 9.25it/s] 83it [00:09, 9.28it/s] 84it [00:09, 9.32it/s] 85it [00:09, 9.30it/s] 86it [00:09, 9.31it/s] 87it [00:09, 9.34it/s] 88it [00:09, 9.37it/s] 89it [00:09, 9.36it/s] 90it [00:09, 8.98it/s] 91it [00:09, 9.13it/s] 92it [00:10, 9.20it/s] 93it [00:10, 9.29it/s] 94it [00:10, 9.33it/s] 95it [00:10, 9.38it/s] 96it [00:10, 9.41it/s] 97it [00:10, 9.44it/s] 98it [00:10, 9.48it/s] 99it [00:10, 9.48it/s] 100it [00:10, 9.43it/s]2025-05-26 03:52:13,546 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 28285.6133 | mean log_px -0.3769 | KL -3410.21 + 101it [00:10, 9.44it/s] 102it [00:11, 9.41it/s] 103it [00:11, 9.41it/s] 104it [00:11, 9.39it/s] 105it [00:11, 9.46it/s] 106it [00:11, 9.48it/s] 107it [00:11, 9.49it/s] 108it [00:11, 9.48it/s] 109it [00:11, 9.50it/s] 110it [00:11, 9.52it/s] 111it [00:12, 8.93it/s] 112it [00:12, 9.02it/s] 113it [00:12, 9.14it/s] 114it [00:12, 9.25it/s] 115it [00:12, 9.32it/s] 116it [00:12, 8.87it/s] 117it [00:12, 9.01it/s] 118it [00:12, 9.16it/s] 119it [00:12, 9.27it/s] 120it [00:13, 9.34it/s] 121it [00:13, 9.34it/s] 122it [00:13, 9.40it/s] 123it [00:13, 9.42it/s] 124it [00:13, 9.41it/s] 125it [00:13, 8.92it/s] 126it [00:13, 9.09it/s] 127it [00:13, 9.22it/s] 128it [00:13, 9.32it/s] 129it [00:14, 9.35it/s] 130it [00:14, 9.41it/s] 131it [00:14, 9.36it/s] 132it [00:14, 8.88it/s] 133it [00:14, 9.03it/s] 134it [00:14, 9.16it/s] 135it [00:14, 9.25it/s] 136it [00:14, 9.33it/s] 137it [00:14, 9.38it/s] 138it [00:14, 9.40it/s] 139it [00:15, 9.42it/s] 140it [00:15, 9.25it/s] 141it [00:15, 8.90it/s] 142it [00:15, 9.06it/s] 143it [00:15, 9.17it/s] 144it [00:15, 8.74it/s] 145it [00:15, 8.94it/s] 146it [00:15, 9.07it/s] 147it [00:15, 9.09it/s] 148it [00:16, 9.16it/s] 149it [00:16, 9.23it/s] 150it [00:16, 8.78it/s]2025-05-26 03:52:18,985 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 24188.4082 | mean log_px -0.3034 | KL -3424.15 + 151it [00:16, 8.95it/s] 152it [00:16, 9.08it/s] 153it [00:16, 9.20it/s] 154it [00:16, 9.27it/s] 155it [00:16, 9.34it/s] 156it [00:16, 9.35it/s] 157it [00:17, 9.39it/s] 158it [00:17, 9.41it/s] 159it [00:17, 9.42it/s] 160it [00:17, 9.40it/s] 161it [00:17, 9.44it/s] 162it [00:17, 9.43it/s] 163it [00:17, 9.41it/s] 164it [00:17, 9.40it/s] 165it [00:17, 9.40it/s] 166it [00:18, 9.42it/s] 167it [00:18, 9.47it/s] 168it [00:18, 9.51it/s] 169it [00:18, 9.53it/s] 170it [00:18, 9.42it/s] 171it [00:18, 9.47it/s] 172it [00:18, 9.42it/s] 173it [00:18, 9.40it/s] 174it [00:18, 9.20it/s] 175it [00:18, 9.28it/s] 176it [00:19, 9.32it/s] 177it [00:19, 9.36it/s] 178it [00:19, 9.39it/s] 179it [00:19, 9.41it/s] 180it [00:19, 9.41it/s] 181it [00:19, 9.38it/s] 182it [00:19, 9.37it/s] 183it [00:19, 9.39it/s] 184it [00:19, 9.27it/s] 185it [00:20, 8.97it/s] 186it [00:20, 9.03it/s] 187it [00:20, 9.14it/s] 188it [00:20, 9.23it/s] 189it [00:20, 9.27it/s] 190it [00:20, 9.31it/s] 191it [00:20, 9.36it/s] 192it [00:20, 9.35it/s] 193it [00:20, 9.34it/s] 194it [00:21, 9.36it/s] 195it [00:21, 8.90it/s] 196it [00:21, 9.15it/s] 196it [00:21, 9.20it/s] +2025-05-26 03:52:23,912 - INFO - Epoch: 1, Objective: tensor([25134.6309], device='cuda:0', grad_fn=), Loss: 0.3120049238204956, KL/n: 70.07382202148438 + 0it [00:00, ?it/s]2025-05-26 03:52:24,198 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 26034.8926 | mean log_px -0.3319 | KL -3429.36 + 1it [00:00, 4.94it/s] 2it [00:00, 6.84it/s] 3it [00:00, 7.95it/s] 4it [00:00, 8.55it/s] 5it [00:00, 8.91it/s] 6it [00:00, 9.15it/s] 7it [00:00, 9.31it/s] 8it [00:00, 9.38it/s] 9it [00:01, 8.88it/s] 10it [00:01, 9.06it/s] 11it [00:01, 9.25it/s] 12it [00:01, 9.33it/s] 13it [00:01, 9.40it/s] 14it [00:01, 9.41it/s] 15it [00:01, 9.44it/s] 16it [00:01, 9.51it/s] 17it [00:01, 9.58it/s] 18it [00:01, 9.54it/s] 19it [00:02, 9.57it/s] 20it [00:02, 9.56it/s] 21it [00:02, 9.56it/s] 22it [00:02, 9.55it/s] 23it [00:02, 9.56it/s] 24it [00:02, 9.52it/s] 25it [00:02, 9.55it/s] 26it [00:02, 9.46it/s] 27it [00:02, 9.49it/s] 28it [00:03, 9.54it/s] 29it [00:03, 9.56it/s] 30it [00:03, 9.55it/s] 31it [00:03, 9.12it/s] 32it [00:03, 9.28it/s] 33it [00:03, 9.37it/s] 34it [00:03, 9.43it/s] 35it [00:03, 9.51it/s] 36it [00:03, 9.51it/s] 37it [00:03, 9.59it/s] 38it [00:04, 9.58it/s] 39it [00:04, 9.61it/s] 40it [00:04, 9.59it/s] 41it [00:04, 9.63it/s] 42it [00:04, 9.28it/s] 43it [00:04, 9.38it/s] 44it [00:04, 9.45it/s] 45it [00:04, 9.12it/s] 46it [00:04, 9.27it/s] 47it [00:05, 9.34it/s] 48it [00:05, 8.93it/s] 49it [00:05, 9.14it/s] 50it [00:05, 9.24it/s]2025-05-26 03:52:29,502 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 24607.2324 | mean log_px -0.3063 | KL -3444.27 + 51it [00:05, 9.33it/s] 52it [00:05, 8.90it/s] 53it [00:05, 9.13it/s] 54it [00:05, 9.21it/s] 55it [00:05, 9.36it/s] 56it [00:06, 8.93it/s] 57it [00:06, 9.14it/s] 58it [00:06, 9.29it/s] 59it [00:06, 9.39it/s] 60it [00:06, 9.06it/s] 61it [00:06, 9.20it/s] 62it [00:06, 9.34it/s] 63it [00:06, 8.94it/s] 64it [00:06, 9.10it/s] 65it [00:07, 9.23it/s] 66it [00:07, 9.35it/s] 67it [00:07, 9.45it/s] 68it [00:07, 9.48it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.54it/s] 71it [00:07, 9.53it/s] 72it [00:07, 9.52it/s] 73it [00:07, 9.51it/s] 74it [00:07, 9.56it/s] 75it [00:08, 9.53it/s] 76it [00:08, 9.53it/s] 77it [00:08, 9.55it/s] 78it [00:08, 9.58it/s] 79it [00:08, 9.64it/s] 80it [00:08, 9.66it/s] 81it [00:08, 9.63it/s] 82it [00:08, 9.59it/s] 83it [00:08, 9.20it/s] 84it [00:09, 9.36it/s] 85it [00:09, 9.47it/s] 86it [00:09, 9.51it/s] 87it [00:09, 9.57it/s] 88it [00:09, 9.61it/s] 89it [00:09, 9.63it/s] 90it [00:09, 9.61it/s] 91it [00:09, 9.64it/s] 92it [00:09, 9.66it/s] 93it [00:09, 9.70it/s] 94it [00:10, 6.37it/s] 95it [00:10, 7.11it/s] 96it [00:10, 7.67it/s] 97it [00:10, 8.18it/s] 98it [00:10, 8.52it/s] 99it [00:10, 8.86it/s] 100it [00:10, 9.06it/s]2025-05-26 03:52:34,968 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 20464.7461 | mean log_px -0.2492 | KL -3452.10 + 101it [00:10, 9.22it/s] 102it [00:11, 9.33it/s] 103it [00:11, 9.39it/s] 104it [00:11, 9.26it/s] 105it [00:11, 9.34it/s] 106it [00:11, 9.45it/s] 107it [00:11, 9.56it/s] 108it [00:11, 9.44it/s] 109it [00:11, 9.55it/s] 110it [00:11, 9.58it/s] 111it [00:12, 9.65it/s] 112it [00:12, 9.63it/s] 113it [00:12, 9.64it/s] 114it [00:12, 9.66it/s] 115it [00:12, 9.71it/s] 116it [00:12, 9.63it/s] 117it [00:12, 9.66it/s] 118it [00:12, 9.47it/s] 119it [00:12, 9.49it/s] 120it [00:12, 9.46it/s] 121it [00:13, 9.55it/s] 122it [00:13, 9.57it/s] 123it [00:13, 9.59it/s] 124it [00:13, 9.62it/s] 125it [00:13, 9.41it/s] 126it [00:13, 9.47it/s] 127it [00:13, 9.52it/s] 128it [00:13, 9.53it/s] 129it [00:13, 9.61it/s] 130it [00:14, 9.66it/s] 131it [00:14, 9.69it/s] 132it [00:14, 9.69it/s] 133it [00:14, 9.69it/s] 134it [00:14, 9.71it/s] 135it [00:14, 9.73it/s] 136it [00:14, 9.73it/s] 137it [00:14, 9.72it/s] 138it [00:14, 9.62it/s] 139it [00:14, 9.62it/s] 140it [00:15, 9.61it/s] 141it [00:15, 9.65it/s] 142it [00:15, 9.64it/s] 143it [00:15, 9.66it/s] 144it [00:15, 9.65it/s] 145it [00:15, 9.65it/s] 146it [00:15, 8.94it/s] 147it [00:15, 9.17it/s] 148it [00:15, 9.25it/s] 149it [00:15, 9.38it/s] 150it [00:16, 9.47it/s]2025-05-26 03:52:40,201 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 18063.8633 | mean log_px -0.2179 | KL -3453.99 + 151it [00:16, 9.07it/s] 152it [00:16, 9.14it/s] 153it [00:16, 9.17it/s] 154it [00:16, 9.33it/s] 155it [00:16, 9.38it/s] 156it [00:16, 9.01it/s] 157it [00:16, 9.22it/s] 158it [00:16, 9.32it/s] 159it [00:17, 9.33it/s] 160it [00:17, 9.42it/s] 161it [00:17, 9.47it/s] 162it [00:17, 9.47it/s] 163it [00:17, 9.54it/s] 164it [00:17, 9.03it/s] 165it [00:17, 9.20it/s] 166it [00:17, 9.34it/s] 167it [00:17, 9.41it/s] 168it [00:18, 9.46it/s] 169it [00:18, 9.53it/s] 170it [00:18, 9.54it/s] 171it [00:18, 9.58it/s] 172it [00:18, 9.60it/s] 173it [00:18, 9.57it/s] 174it [00:18, 9.61it/s] 175it [00:18, 9.67it/s] 176it [00:18, 9.66it/s] 177it [00:18, 9.66it/s] 178it [00:19, 9.63it/s] 179it [00:19, 9.66it/s] 180it [00:19, 9.63it/s] 181it [00:19, 9.58it/s] 182it [00:19, 9.60it/s] 183it [00:19, 9.63it/s] 184it [00:19, 9.61it/s] 185it [00:19, 9.57it/s] 186it [00:19, 9.54it/s] 187it [00:20, 9.60it/s] 188it [00:20, 9.56it/s] 189it [00:20, 9.46it/s] 190it [00:20, 9.52it/s] 191it [00:20, 9.60it/s] 192it [00:20, 9.57it/s] 193it [00:20, 9.60it/s] 194it [00:20, 9.61it/s] 195it [00:20, 8.54it/s] 196it [00:20, 8.87it/s] 196it [00:21, 9.31it/s] +2025-05-26 03:52:45,100 - INFO - Epoch: 2, Objective: tensor([23773.6406], device='cuda:0', grad_fn=), Loss: 0.30370157957077026, KL/n: 70.60922241210938 + 0it [00:00, ?it/s]2025-05-26 03:52:45,376 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 22127.6270 | mean log_px -0.2715 | KL -3458.96 + 1it [00:00, 5.42it/s] 2it [00:00, 7.21it/s] 3it [00:00, 8.16it/s] 4it [00:00, 8.03it/s] 5it [00:00, 8.51it/s] 6it [00:00, 8.85it/s] 7it [00:00, 9.13it/s] 8it [00:00, 9.28it/s] 9it [00:01, 9.36it/s] 10it [00:01, 9.44it/s] 11it [00:01, 9.47it/s] 12it [00:01, 9.48it/s] 13it [00:01, 9.51it/s] 14it [00:01, 9.51it/s] 15it [00:01, 9.52it/s] 16it [00:01, 9.48it/s] 17it [00:01, 9.53it/s] 18it [00:01, 9.54it/s] 19it [00:02, 9.54it/s] 20it [00:02, 9.50it/s] 21it [00:02, 9.51it/s] 22it [00:02, 9.52it/s] 23it [00:02, 9.54it/s] 24it [00:02, 9.54it/s] 25it [00:02, 9.58it/s] 26it [00:02, 9.56it/s] 27it [00:02, 9.57it/s] 28it [00:03, 9.57it/s] 29it [00:03, 9.58it/s] 30it [00:03, 9.03it/s] 31it [00:03, 9.18it/s] 32it [00:03, 9.30it/s] 33it [00:03, 9.36it/s] 34it [00:03, 8.89it/s] 35it [00:03, 9.13it/s] 36it [00:03, 9.24it/s] 37it [00:04, 9.32it/s] 38it [00:04, 9.34it/s] 39it [00:04, 8.97it/s] 40it [00:04, 9.12it/s] 41it [00:04, 9.27it/s] 42it [00:04, 9.38it/s] 43it [00:04, 9.43it/s] 44it [00:04, 9.46it/s] 45it [00:04, 9.49it/s] 46it [00:04, 9.39it/s] 47it [00:05, 9.45it/s] 48it [00:05, 9.51it/s] 49it [00:05, 9.53it/s] 50it [00:05, 9.46it/s]2025-05-26 03:52:50,697 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 18690.7363 | mean log_px -0.2205 | KL -3462.40 + 51it [00:05, 9.49it/s] 52it [00:05, 9.49it/s] 53it [00:05, 9.54it/s] 54it [00:05, 9.50it/s] 55it [00:05, 9.47it/s] 56it [00:06, 9.47it/s] 57it [00:06, 9.52it/s] 58it [00:06, 9.56it/s] 59it [00:06, 9.60it/s] 60it [00:06, 9.59it/s] 61it [00:06, 9.00it/s] 62it [00:06, 9.16it/s] 63it [00:06, 9.25it/s] 64it [00:06, 9.34it/s] 65it [00:07, 8.89it/s] 66it [00:07, 9.05it/s] 67it [00:07, 9.21it/s] 68it [00:07, 9.29it/s] 69it [00:07, 9.34it/s] 70it [00:07, 9.38it/s] 71it [00:07, 9.45it/s] 72it [00:07, 9.48it/s] 73it [00:07, 9.45it/s] 74it [00:07, 8.89it/s] 75it [00:08, 9.13it/s] 76it [00:08, 9.18it/s] 77it [00:08, 9.25it/s] 78it [00:08, 9.29it/s] 79it [00:08, 9.37it/s] 80it [00:08, 9.38it/s] 81it [00:08, 8.80it/s] 82it [00:08, 8.88it/s] 83it [00:08, 8.94it/s] 84it [00:09, 9.13it/s] 85it [00:09, 8.84it/s] 86it [00:09, 9.05it/s] 87it [00:09, 9.23it/s] 88it [00:09, 9.36it/s] 89it [00:09, 8.91it/s] 90it [00:09, 9.09it/s] 91it [00:09, 9.18it/s] 92it [00:09, 9.22it/s] 93it [00:10, 8.85it/s] 94it [00:10, 9.08it/s] 95it [00:10, 9.24it/s] 96it [00:10, 9.21it/s] 97it [00:10, 8.84it/s] 98it [00:10, 9.06it/s] 99it [00:10, 9.22it/s] 100it [00:10, 9.35it/s]2025-05-26 03:52:56,120 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 22098.5781 | mean log_px -0.2703 | KL -3471.58 + 101it [00:10, 8.87it/s] 102it [00:11, 9.08it/s] 103it [00:11, 9.26it/s] 104it [00:11, 9.37it/s] 105it [00:11, 8.90it/s] 106it [00:11, 9.07it/s] 107it [00:11, 9.25it/s] 108it [00:11, 9.37it/s] 109it [00:11, 8.89it/s] 110it [00:11, 9.08it/s] 111it [00:12, 9.26it/s] 112it [00:12, 9.34it/s] 113it [00:12, 8.91it/s] 114it [00:12, 9.13it/s] 115it [00:12, 9.30it/s] 116it [00:12, 9.38it/s] 117it [00:12, 8.90it/s] 118it [00:12, 9.13it/s] 119it [00:12, 9.30it/s] 120it [00:13, 9.35it/s] 121it [00:13, 8.86it/s] 122it [00:13, 9.07it/s] 123it [00:13, 9.24it/s] 124it [00:13, 9.33it/s] 125it [00:13, 8.89it/s] 126it [00:13, 9.10it/s] 127it [00:13, 9.24it/s] 128it [00:13, 9.33it/s] 129it [00:14, 8.90it/s] 130it [00:14, 9.10it/s] 131it [00:14, 9.28it/s] 132it [00:14, 9.36it/s] 133it [00:14, 9.32it/s] 134it [00:14, 8.90it/s] 135it [00:14, 9.10it/s] 136it [00:14, 9.24it/s] 137it [00:14, 9.24it/s] 138it [00:14, 8.82it/s] 139it [00:15, 9.01it/s] 140it [00:15, 9.21it/s] 141it [00:15, 9.29it/s] 142it [00:15, 8.87it/s] 143it [00:15, 9.06it/s] 144it [00:15, 9.20it/s] 145it [00:15, 8.83it/s] 146it [00:15, 8.97it/s] 147it [00:15, 9.18it/s] 148it [00:16, 9.32it/s] 149it [00:16, 9.02it/s] 150it [00:16, 9.11it/s]2025-05-26 03:53:01,605 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 23228.7480 | mean log_px -0.2856 | KL -3470.63 + 151it [00:16, 9.24it/s] 152it [00:16, 8.82it/s] 153it [00:16, 9.07it/s] 154it [00:16, 9.24it/s] 155it [00:16, 9.31it/s] 156it [00:16, 8.84it/s] 157it [00:17, 8.97it/s] 158it [00:17, 9.18it/s] 159it [00:17, 9.26it/s] 160it [00:17, 8.84it/s] 161it [00:17, 9.06it/s] 162it [00:17, 9.19it/s] 163it [00:17, 9.32it/s] 164it [00:17, 8.89it/s] 165it [00:17, 9.08it/s] 166it [00:18, 9.22it/s] 167it [00:18, 9.39it/s] 168it [00:18, 9.49it/s] 169it [00:18, 9.56it/s] 170it [00:18, 9.57it/s] 171it [00:18, 9.63it/s] 172it [00:18, 9.60it/s] 173it [00:18, 9.63it/s] 174it [00:18, 9.59it/s] 175it [00:18, 9.61it/s] 176it [00:19, 9.60it/s] 177it [00:19, 9.62it/s] 178it [00:19, 9.43it/s] 179it [00:19, 9.44it/s] 180it [00:19, 9.50it/s] 181it [00:19, 9.57it/s] 182it [00:19, 9.60it/s] 183it [00:19, 9.64it/s] 184it [00:19, 9.65it/s] 185it [00:20, 9.62it/s] 186it [00:20, 9.57it/s] 187it [00:20, 9.59it/s] 188it [00:20, 9.62it/s] 189it [00:20, 9.64it/s] 190it [00:20, 9.62it/s] 191it [00:20, 9.62it/s] 192it [00:20, 9.59it/s] 193it [00:20, 9.41it/s] 194it [00:20, 9.47it/s] 195it [00:21, 8.95it/s] 196it [00:21, 9.16it/s] 196it [00:21, 9.21it/s] +2025-05-26 03:53:06,508 - INFO - Epoch: 3, Objective: tensor([23300.8750], device='cuda:0', grad_fn=), Loss: 0.2900332510471344, KL/n: 70.9906005859375 + 0it [00:00, ?it/s]2025-05-26 03:53:06,970 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 12282.2793 | mean log_px -0.1411 | KL -3474.90 + 1it [00:00, 4.60it/s] 2it [00:00, 6.65it/s] 3it [00:00, 7.78it/s] 4it [00:00, 8.46it/s] 5it [00:00, 8.89it/s] 6it [00:00, 9.11it/s] 7it [00:00, 9.32it/s] 8it [00:00, 9.46it/s] 9it [00:01, 9.53it/s] 10it [00:01, 9.54it/s] 11it [00:01, 9.54it/s] 12it [00:01, 9.50it/s] 13it [00:01, 9.58it/s] 14it [00:01, 9.53it/s] 15it [00:01, 9.58it/s] 16it [00:01, 8.89it/s] 17it [00:01, 9.08it/s] 18it [00:02, 9.19it/s] 19it [00:02, 9.31it/s] 20it [00:02, 9.22it/s] 21it [00:02, 9.35it/s] 22it [00:02, 9.01it/s] 23it [00:02, 9.08it/s] 24it [00:02, 9.21it/s] 25it [00:02, 9.31it/s] 26it [00:02, 9.38it/s] 27it [00:02, 9.48it/s] 28it [00:03, 9.53it/s] 29it [00:03, 8.98it/s] 30it [00:03, 9.09it/s] 31it [00:03, 9.20it/s] 32it [00:03, 9.34it/s] 33it [00:03, 9.43it/s] 34it [00:03, 9.41it/s] 35it [00:03, 9.37it/s] 36it [00:03, 9.41it/s] 37it [00:04, 9.41it/s] 38it [00:04, 9.47it/s] 39it [00:04, 9.54it/s] 40it [00:04, 9.00it/s] 41it [00:04, 9.18it/s] 42it [00:04, 9.24it/s] 43it [00:04, 9.38it/s] 44it [00:04, 9.45it/s] 45it [00:04, 9.56it/s] 46it [00:05, 9.58it/s] 47it [00:05, 9.61it/s] 48it [00:05, 9.63it/s] 49it [00:05, 9.66it/s] 50it [00:05, 9.61it/s]2025-05-26 03:53:12,305 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 23196.6523 | mean log_px -0.2816 | KL -3483.42 + 51it [00:05, 9.60it/s] 52it [00:05, 9.62it/s] 53it [00:05, 9.68it/s] 54it [00:05, 9.62it/s] 55it [00:05, 9.64it/s] 56it [00:06, 9.58it/s] 57it [00:06, 9.60it/s] 58it [00:06, 9.58it/s] 59it [00:06, 9.61it/s] 60it [00:06, 9.60it/s] 61it [00:06, 9.60it/s] 62it [00:06, 9.58it/s] 63it [00:06, 9.56it/s] 64it [00:06, 9.54it/s] 65it [00:06, 9.56it/s] 66it [00:07, 9.56it/s] 67it [00:07, 9.54it/s] 68it [00:07, 9.54it/s] 69it [00:07, 9.58it/s] 70it [00:07, 9.61it/s] 71it [00:07, 9.62it/s] 72it [00:07, 9.65it/s] 73it [00:07, 9.63it/s] 74it [00:07, 9.66it/s] 75it [00:08, 9.68it/s] 76it [00:08, 9.66it/s] 77it [00:08, 9.64it/s] 78it [00:08, 9.63it/s] 79it [00:08, 9.65it/s] 80it [00:08, 9.61it/s] 81it [00:08, 9.61it/s] 82it [00:08, 9.63it/s] 83it [00:08, 9.60it/s] 84it [00:08, 9.55it/s] 85it [00:09, 9.55it/s] 86it [00:09, 9.59it/s] 87it [00:09, 9.62it/s] 88it [00:09, 9.63it/s] 89it [00:09, 9.09it/s] 90it [00:09, 9.27it/s] 91it [00:09, 9.38it/s] 92it [00:09, 9.41it/s] 93it [00:09, 9.43it/s] 94it [00:10, 9.42it/s] 95it [00:10, 9.50it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.54it/s] 98it [00:10, 9.56it/s] 99it [00:10, 9.07it/s] 100it [00:10, 9.24it/s]2025-05-26 03:53:17,553 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 22043.1543 | mean log_px -0.2736 | KL -3483.78 + 101it [00:10, 9.26it/s] 102it [00:10, 9.35it/s] 103it [00:10, 9.42it/s] 104it [00:11, 9.44it/s] 105it [00:11, 8.91it/s] 106it [00:11, 9.14it/s] 107it [00:11, 9.26it/s] 108it [00:11, 9.34it/s] 109it [00:11, 9.26it/s] 110it [00:11, 9.30it/s] 111it [00:11, 9.40it/s] 112it [00:11, 9.42it/s] 113it [00:12, 9.10it/s] 114it [00:12, 9.25it/s] 115it [00:12, 9.34it/s] 116it [00:12, 9.41it/s] 117it [00:12, 8.98it/s] 118it [00:12, 9.13it/s] 119it [00:12, 9.27it/s] 120it [00:12, 9.38it/s] 121it [00:12, 9.01it/s] 122it [00:13, 9.19it/s] 123it [00:13, 9.36it/s] 124it [00:13, 8.91it/s] 125it [00:13, 9.10it/s] 126it [00:13, 9.23it/s] 127it [00:13, 9.31it/s] 128it [00:13, 8.86it/s] 129it [00:13, 9.07it/s] 130it [00:13, 9.18it/s] 131it [00:14, 9.25it/s] 132it [00:14, 8.81it/s] 133it [00:14, 9.04it/s] 134it [00:14, 9.20it/s] 135it [00:14, 9.32it/s] 136it [00:14, 9.43it/s] 137it [00:14, 9.39it/s] 138it [00:14, 8.88it/s] 139it [00:14, 9.11it/s] 140it [00:15, 9.27it/s] 141it [00:15, 9.43it/s] 142it [00:15, 9.55it/s] 143it [00:15, 9.60it/s] 144it [00:15, 9.59it/s] 145it [00:15, 9.61it/s] 146it [00:15, 9.62it/s] 147it [00:15, 9.63it/s] 148it [00:15, 9.60it/s] 149it [00:15, 9.61it/s] 150it [00:16, 9.61it/s]2025-05-26 03:53:22,932 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 22188.4727 | mean log_px -0.2672 | KL -3485.55 + 151it [00:16, 9.07it/s] 152it [00:16, 9.05it/s] 153it [00:16, 9.28it/s] 154it [00:16, 9.46it/s] 155it [00:16, 9.57it/s] 156it [00:16, 9.65it/s] 157it [00:16, 9.69it/s] 158it [00:16, 9.69it/s] 159it [00:16, 9.75it/s] 160it [00:17, 9.77it/s] 161it [00:17, 9.80it/s] 162it [00:17, 9.23it/s] 163it [00:17, 9.41it/s] 164it [00:17, 9.53it/s] 165it [00:17, 9.65it/s] 166it [00:17, 9.72it/s] 167it [00:17, 9.78it/s] 168it [00:17, 9.81it/s] 169it [00:18, 9.84it/s] 170it [00:18, 9.87it/s] 171it [00:18, 9.82it/s] 172it [00:18, 9.74it/s] 173it [00:18, 9.79it/s] 174it [00:18, 9.04it/s] 175it [00:18, 8.91it/s] 176it [00:18, 8.79it/s] 177it [00:18, 9.02it/s] 178it [00:19, 9.20it/s] 179it [00:19, 9.33it/s] 180it [00:19, 9.43it/s] 181it [00:19, 9.52it/s] 182it [00:19, 9.56it/s] 183it [00:19, 9.32it/s] 184it [00:19, 9.06it/s] 185it [00:19, 9.20it/s] 186it [00:19, 9.30it/s] 187it [00:19, 9.47it/s] 188it [00:20, 9.54it/s] 189it [00:20, 8.99it/s] 190it [00:20, 9.24it/s] 191it [00:20, 9.38it/s] 192it [00:20, 9.47it/s] 193it [00:20, 9.59it/s] 194it [00:20, 9.61it/s] 195it [00:20, 9.10it/s] 196it [00:20, 9.34it/s] +2025-05-26 03:53:27,816 - INFO - Epoch: 4, Objective: tensor([19702.6348], device='cuda:0', grad_fn=), Loss: 0.23782320320606232, KL/n: 71.2601089477539 + 0it [00:00, ?it/s]2025-05-26 03:53:28,090 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 16530.5488 | mean log_px -0.1878 | KL -3492.38 + 1it [00:00, 5.35it/s] 2it [00:00, 6.63it/s] 3it [00:00, 7.81it/s] 4it [00:00, 8.52it/s] 5it [00:00, 8.93it/s] 6it [00:00, 9.21it/s] 7it [00:00, 9.44it/s] 8it [00:00, 9.57it/s] 9it [00:01, 9.64it/s] 10it [00:01, 9.69it/s] 11it [00:01, 9.74it/s] 12it [00:01, 9.75it/s] 13it [00:01, 9.75it/s] 14it [00:01, 9.16it/s] 15it [00:01, 9.26it/s] 16it [00:01, 9.17it/s] 17it [00:01, 9.23it/s] 18it [00:01, 9.27it/s] 19it [00:02, 9.38it/s] 20it [00:02, 9.48it/s] 21it [00:02, 9.56it/s] 22it [00:02, 9.63it/s] 23it [00:02, 9.63it/s] 24it [00:02, 9.70it/s] 25it [00:02, 9.13it/s] 26it [00:02, 9.30it/s] 27it [00:02, 9.45it/s] 28it [00:03, 9.08it/s] 29it [00:03, 9.27it/s] 30it [00:03, 9.42it/s] 31it [00:03, 9.53it/s] 32it [00:03, 9.61it/s] 33it [00:03, 9.67it/s] 34it [00:03, 9.71it/s] 35it [00:03, 9.74it/s] 36it [00:03, 9.77it/s] 37it [00:03, 9.78it/s] 38it [00:04, 9.77it/s] 39it [00:04, 9.76it/s] 40it [00:04, 9.74it/s] 41it [00:04, 9.14it/s] 42it [00:04, 9.33it/s] 43it [00:04, 9.45it/s] 44it [00:04, 9.52it/s] 45it [00:04, 9.60it/s] 46it [00:04, 9.67it/s] 47it [00:05, 9.71it/s] 48it [00:05, 9.73it/s] 49it [00:05, 9.73it/s] 50it [00:05, 9.75it/s]2025-05-26 03:53:33,330 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 17774.5938 | mean log_px -0.2058 | KL -3492.53 + 51it [00:05, 9.78it/s] 52it [00:05, 9.77it/s] 53it [00:05, 9.16it/s] 54it [00:05, 9.33it/s] 55it [00:05, 9.45it/s] 56it [00:05, 9.53it/s] 57it [00:06, 9.16it/s] 58it [00:06, 9.30it/s] 59it [00:06, 9.46it/s] 60it [00:06, 9.54it/s] 61it [00:06, 9.62it/s] 62it [00:06, 9.20it/s] 63it [00:06, 9.32it/s] 64it [00:06, 9.43it/s] 65it [00:06, 9.54it/s] 66it [00:07, 9.61it/s] 67it [00:07, 9.67it/s] 68it [00:07, 9.70it/s] 69it [00:07, 9.72it/s] 70it [00:07, 9.73it/s] 71it [00:07, 9.74it/s] 72it [00:07, 9.75it/s] 73it [00:07, 9.77it/s] 74it [00:07, 9.77it/s] 75it [00:07, 9.72it/s] 76it [00:08, 9.23it/s] 77it [00:08, 9.36it/s] 78it [00:08, 9.48it/s] 79it [00:08, 8.98it/s] 80it [00:08, 9.18it/s] 81it [00:08, 9.30it/s] 82it [00:08, 9.43it/s] 83it [00:08, 9.56it/s] 84it [00:08, 9.61it/s] 85it [00:09, 9.69it/s] 86it [00:09, 9.68it/s] 87it [00:09, 9.20it/s] 88it [00:09, 9.35it/s] 89it [00:09, 9.49it/s] 90it [00:09, 8.97it/s] 91it [00:09, 9.16it/s] 92it [00:09, 9.35it/s] 93it [00:09, 9.48it/s] 94it [00:09, 9.15it/s] 95it [00:10, 9.32it/s] 96it [00:10, 9.46it/s] 97it [00:10, 9.57it/s] 98it [00:10, 9.63it/s] 99it [00:10, 9.69it/s] 100it [00:10, 9.23it/s]2025-05-26 03:53:38,629 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 13819.5430 | mean log_px -0.1567 | KL -3497.92 + 101it [00:10, 9.37it/s] 102it [00:10, 9.50it/s] 103it [00:10, 9.57it/s] 104it [00:11, 9.65it/s] 105it [00:11, 9.68it/s] 106it [00:11, 9.72it/s] 107it [00:11, 9.76it/s] 108it [00:11, 9.75it/s] 109it [00:11, 9.74it/s] 110it [00:11, 9.74it/s] 111it [00:11, 9.75it/s] 112it [00:11, 9.75it/s] 113it [00:11, 9.77it/s] 114it [00:12, 9.77it/s] 115it [00:12, 9.75it/s] 116it [00:12, 9.10it/s] 117it [00:12, 9.26it/s] 118it [00:12, 9.41it/s] 119it [00:12, 9.54it/s] 120it [00:12, 9.57it/s] 121it [00:12, 9.65it/s] 122it [00:12, 9.66it/s] 123it [00:13, 9.71it/s] 124it [00:13, 9.75it/s] 125it [00:13, 9.69it/s] 126it [00:13, 9.72it/s] 127it [00:13, 8.94it/s] 128it [00:13, 9.13it/s] 129it [00:13, 9.32it/s] 130it [00:13, 9.43it/s] 131it [00:13, 9.54it/s] 132it [00:13, 9.60it/s] 133it [00:14, 9.65it/s] 134it [00:14, 9.66it/s] 135it [00:14, 9.72it/s] 136it [00:14, 9.70it/s] 137it [00:14, 9.70it/s] 138it [00:14, 9.69it/s] 139it [00:14, 9.67it/s] 140it [00:14, 9.66it/s] 141it [00:14, 9.70it/s] 142it [00:14, 9.69it/s] 143it [00:15, 9.72it/s] 144it [00:15, 9.72it/s] 145it [00:15, 9.74it/s] 146it [00:15, 9.68it/s] 147it [00:15, 9.58it/s] 148it [00:15, 9.62it/s] 149it [00:15, 9.11it/s] 150it [00:15, 9.27it/s]2025-05-26 03:53:43,843 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 18954.9707 | mean log_px -0.2272 | KL -3503.50 + 151it [00:15, 9.40it/s] 152it [00:16, 9.49it/s] 153it [00:16, 9.58it/s] 154it [00:16, 9.66it/s] 155it [00:16, 9.71it/s] 156it [00:16, 9.71it/s] 157it [00:16, 9.74it/s] 158it [00:16, 9.75it/s] 159it [00:16, 9.76it/s] 160it [00:16, 9.73it/s] 161it [00:16, 9.73it/s] 162it [00:17, 9.74it/s] 163it [00:17, 9.78it/s] 164it [00:17, 9.73it/s] 165it [00:17, 9.76it/s] 166it [00:17, 9.77it/s] 167it [00:17, 9.79it/s] 168it [00:17, 9.78it/s] 169it [00:17, 9.81it/s] 170it [00:17, 9.79it/s] 171it [00:17, 9.77it/s] 172it [00:18, 9.77it/s] 173it [00:18, 9.76it/s] 174it [00:18, 9.24it/s] 175it [00:18, 9.39it/s] 176it [00:18, 9.54it/s] 177it [00:18, 9.64it/s] 178it [00:18, 9.68it/s] 179it [00:18, 9.72it/s] 180it [00:18, 9.75it/s] 181it [00:19, 9.77it/s] 182it [00:19, 9.80it/s] 183it [00:19, 9.79it/s] 184it [00:19, 9.79it/s] 185it [00:19, 9.81it/s] 186it [00:19, 9.29it/s] 187it [00:19, 9.46it/s] 188it [00:19, 9.56it/s] 189it [00:19, 9.63it/s] 190it [00:19, 9.68it/s] 191it [00:20, 9.72it/s] 192it [00:20, 9.74it/s] 193it [00:20, 9.77it/s] 194it [00:20, 9.76it/s] 195it [00:20, 9.22it/s] 196it [00:20, 9.49it/s] +2025-05-26 03:53:48,596 - INFO - Epoch: 5, Objective: tensor([12165.8643], device='cuda:0', grad_fn=), Loss: 0.1356792002916336, KL/n: 71.50433349609375 + 0it [00:00, ?it/s]2025-05-26 03:53:49,052 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 17046.0859 | mean log_px -0.1989 | KL -3502.32 + 1it [00:00, 5.37it/s] 2it [00:00, 7.22it/s] 3it [00:00, 8.24it/s] 4it [00:00, 8.78it/s] 5it [00:00, 9.13it/s] 6it [00:00, 9.33it/s] 7it [00:00, 9.48it/s] 8it [00:00, 9.58it/s] 9it [00:01, 9.64it/s] 10it [00:01, 9.69it/s] 11it [00:01, 9.72it/s] 12it [00:01, 9.72it/s] 13it [00:01, 9.76it/s] 14it [00:01, 9.77it/s] 15it [00:01, 9.79it/s] 16it [00:01, 9.80it/s] 17it [00:01, 9.82it/s] 18it [00:01, 9.81it/s] 19it [00:02, 9.83it/s] 20it [00:02, 9.85it/s] 21it [00:02, 9.84it/s] 22it [00:02, 9.85it/s] 23it [00:02, 9.84it/s] 24it [00:02, 9.83it/s] 25it [00:02, 9.85it/s] 26it [00:02, 9.79it/s] 27it [00:02, 9.78it/s] 28it [00:02, 9.79it/s] 29it [00:03, 9.81it/s] 30it [00:03, 9.79it/s] 31it [00:03, 9.78it/s] 32it [00:03, 9.80it/s] 33it [00:03, 9.79it/s] 34it [00:03, 9.79it/s] 35it [00:03, 9.82it/s] 36it [00:03, 9.80it/s] 37it [00:03, 9.77it/s] 38it [00:03, 9.64it/s] 39it [00:04, 9.64it/s] 40it [00:04, 9.68it/s] 41it [00:04, 9.67it/s] 42it [00:04, 9.68it/s] 43it [00:04, 9.70it/s] 44it [00:04, 9.73it/s] 45it [00:04, 9.71it/s] 46it [00:04, 9.69it/s] 47it [00:04, 9.72it/s] 48it [00:04, 9.72it/s] 49it [00:05, 9.64it/s] 50it [00:05, 9.67it/s]2025-05-26 03:53:54,176 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 15465.3457 | mean log_px -0.1867 | KL -3503.66 + 51it [00:05, 9.66it/s] 52it [00:05, 9.67it/s] 53it [00:05, 9.64it/s] 54it [00:05, 9.64it/s] 55it [00:05, 9.44it/s] 56it [00:05, 9.51it/s] 57it [00:05, 9.55it/s] 58it [00:06, 9.60it/s] 59it [00:06, 9.49it/s] 60it [00:06, 9.55it/s] 61it [00:06, 9.64it/s] 62it [00:06, 9.72it/s] 63it [00:06, 9.73it/s] 64it [00:06, 9.70it/s] 65it [00:06, 9.66it/s] 66it [00:06, 9.69it/s] 67it [00:06, 9.70it/s] 68it [00:07, 9.71it/s] 69it [00:07, 9.72it/s] 70it [00:07, 9.73it/s] 71it [00:07, 9.39it/s] 72it [00:07, 9.27it/s] 73it [00:07, 9.21it/s] 74it [00:07, 9.23it/s] 75it [00:07, 9.31it/s] 76it [00:07, 9.35it/s] 77it [00:08, 9.37it/s] 78it [00:08, 9.45it/s] 79it [00:08, 9.52it/s] 80it [00:08, 9.16it/s] 81it [00:08, 9.30it/s] 82it [00:08, 9.41it/s] 83it [00:08, 9.40it/s] 84it [00:08, 9.48it/s] 85it [00:08, 9.30it/s] 86it [00:09, 8.77it/s] 87it [00:09, 8.62it/s] 88it [00:09, 8.91it/s] 89it [00:09, 9.18it/s] 90it [00:09, 9.33it/s] 91it [00:09, 9.46it/s] 92it [00:09, 9.57it/s] 93it [00:09, 9.66it/s] 94it [00:09, 9.68it/s] 95it [00:09, 9.72it/s] 96it [00:10, 9.77it/s] 97it [00:10, 9.75it/s] 98it [00:10, 9.76it/s] 99it [00:10, 9.21it/s] 100it [00:10, 9.37it/s]2025-05-26 03:53:59,465 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 16232.7539 | mean log_px -0.1872 | KL -3505.36 + 101it [00:10, 9.49it/s] 102it [00:10, 9.57it/s] 103it [00:10, 9.66it/s] 104it [00:10, 9.10it/s] 105it [00:11, 9.30it/s] 106it [00:11, 9.45it/s] 107it [00:11, 9.57it/s] 108it [00:11, 9.61it/s] 109it [00:11, 9.12it/s] 110it [00:11, 9.32it/s] 111it [00:11, 9.47it/s] 112it [00:11, 9.55it/s] 113it [00:11, 9.63it/s] 114it [00:11, 9.60it/s] 115it [00:12, 9.68it/s] 116it [00:12, 9.72it/s] 117it [00:12, 9.75it/s] 118it [00:12, 9.78it/s] 119it [00:12, 9.77it/s] 120it [00:12, 9.68it/s] 121it [00:12, 9.64it/s] 122it [00:12, 9.67it/s] 123it [00:12, 9.70it/s] 124it [00:12, 9.73it/s] 125it [00:13, 9.78it/s] 126it [00:13, 9.79it/s] 127it [00:13, 9.83it/s] 128it [00:13, 9.82it/s] 129it [00:13, 9.83it/s] 130it [00:13, 9.82it/s] 131it [00:13, 9.85it/s] 132it [00:13, 9.86it/s] 133it [00:13, 9.27it/s] 134it [00:14, 9.29it/s] 135it [00:14, 9.40it/s] 136it [00:14, 9.49it/s] 137it [00:14, 9.60it/s] 138it [00:14, 9.66it/s] 139it [00:14, 9.74it/s] 140it [00:14, 9.75it/s] 141it [00:14, 9.80it/s] 142it [00:14, 9.80it/s] 143it [00:14, 9.79it/s] 144it [00:15, 9.23it/s] 145it [00:15, 9.38it/s] 146it [00:15, 9.48it/s] 147it [00:15, 9.49it/s] 148it [00:15, 9.59it/s] 149it [00:15, 9.63it/s] 150it [00:15, 9.67it/s]2025-05-26 03:54:04,664 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 16457.2578 | mean log_px -0.1880 | KL -3506.98 + 151it [00:15, 9.73it/s] 152it [00:15, 9.74it/s] 153it [00:16, 9.73it/s] 154it [00:16, 9.73it/s] 155it [00:16, 9.78it/s] 156it [00:16, 9.75it/s] 157it [00:16, 9.75it/s] 158it [00:16, 9.73it/s] 159it [00:16, 9.74it/s] 160it [00:16, 9.74it/s] 161it [00:16, 9.77it/s] 162it [00:16, 9.77it/s] 163it [00:17, 9.78it/s] 164it [00:17, 9.76it/s] 165it [00:17, 9.80it/s] 166it [00:17, 9.82it/s] 167it [00:17, 9.84it/s] 168it [00:17, 9.82it/s] 169it [00:17, 9.81it/s] 170it [00:17, 9.83it/s] 171it [00:17, 9.83it/s] 172it [00:17, 9.82it/s] 173it [00:18, 9.83it/s] 174it [00:18, 9.79it/s] 175it [00:18, 9.67it/s] 176it [00:18, 9.69it/s] 177it [00:18, 9.74it/s] 178it [00:18, 9.76it/s] 179it [00:18, 9.81it/s] 180it [00:18, 9.80it/s] 181it [00:18, 9.81it/s] 182it [00:18, 9.82it/s] 183it [00:19, 9.80it/s] 184it [00:19, 9.64it/s] 185it [00:19, 9.70it/s] 186it [00:19, 9.46it/s] 187it [00:19, 9.14it/s] 188it [00:19, 9.33it/s] 189it [00:19, 9.47it/s] 190it [00:19, 9.36it/s] 191it [00:19, 9.08it/s] 192it [00:20, 8.72it/s] 193it [00:20, 8.41it/s] 194it [00:20, 8.76it/s] 195it [00:20, 8.59it/s] 196it [00:20, 9.52it/s] +2025-05-26 03:54:09,490 - INFO - Epoch: 6, Objective: tensor([15376.6016], device='cuda:0', grad_fn=), Loss: 0.17358337342739105, KL/n: 71.75361633300781 + 0it [00:00, ?it/s]2025-05-26 03:54:09,751 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 17575.0977 | mean log_px -0.2084 | KL -3514.32 + 1it [00:00, 5.96it/s] 2it [00:00, 7.10it/s] 3it [00:00, 7.99it/s] 4it [00:00, 8.64it/s] 5it [00:00, 8.99it/s] 6it [00:00, 9.25it/s] 7it [00:00, 9.41it/s] 8it [00:00, 9.54it/s] 9it [00:01, 9.60it/s] 10it [00:01, 9.51it/s] 11it [00:01, 9.41it/s] 12it [00:01, 9.53it/s] 13it [00:01, 9.58it/s] 14it [00:01, 9.63it/s] 15it [00:01, 9.61it/s] 16it [00:01, 9.66it/s] 17it [00:01, 9.71it/s] 18it [00:01, 9.75it/s] 19it [00:02, 9.79it/s] 20it [00:02, 9.77it/s] 21it [00:02, 9.52it/s] 22it [00:02, 9.59it/s] 23it [00:02, 9.68it/s] 24it [00:02, 9.72it/s] 25it [00:02, 9.75it/s] 26it [00:02, 9.79it/s] 27it [00:02, 9.35it/s] 28it [00:02, 9.48it/s] 29it [00:03, 9.56it/s] 30it [00:03, 9.61it/s] 31it [00:03, 9.66it/s] 32it [00:03, 9.68it/s] 33it [00:03, 9.73it/s] 34it [00:03, 9.74it/s] 35it [00:03, 9.78it/s] 36it [00:03, 9.79it/s] 37it [00:03, 9.81it/s] 38it [00:04, 9.77it/s] 39it [00:04, 9.79it/s] 40it [00:04, 9.82it/s] 41it [00:04, 9.79it/s] 42it [00:04, 9.81it/s] 43it [00:04, 9.77it/s] 44it [00:04, 9.78it/s] 45it [00:04, 9.50it/s] 46it [00:04, 9.61it/s] 47it [00:04, 9.67it/s] 48it [00:05, 9.71it/s] 49it [00:05, 9.76it/s] 50it [00:05, 9.75it/s]2025-05-26 03:54:14,930 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 11222.3057 | mean log_px -0.1177 | KL -3518.79 + 51it [00:05, 9.77it/s] 52it [00:05, 9.77it/s] 53it [00:05, 9.55it/s] 54it [00:05, 9.02it/s] 55it [00:05, 9.23it/s] 56it [00:05, 9.40it/s] 57it [00:06, 8.93it/s] 58it [00:06, 9.03it/s] 59it [00:06, 9.22it/s] 60it [00:06, 9.34it/s] 61it [00:06, 9.45it/s] 62it [00:06, 9.51it/s] 63it [00:06, 9.60it/s] 64it [00:06, 9.65it/s] 65it [00:06, 9.72it/s] 66it [00:06, 9.73it/s] 67it [00:07, 9.75it/s] 68it [00:07, 9.77it/s] 69it [00:07, 9.37it/s] 70it [00:07, 9.50it/s] 71it [00:07, 9.61it/s] 72it [00:07, 9.66it/s] 73it [00:07, 9.71it/s] 74it [00:07, 9.74it/s] 75it [00:07, 9.76it/s] 76it [00:07, 9.76it/s] 77it [00:08, 9.78it/s] 78it [00:08, 9.82it/s] 79it [00:08, 9.82it/s] 80it [00:08, 9.83it/s] 81it [00:08, 9.81it/s] 82it [00:08, 9.82it/s] 83it [00:08, 9.83it/s] 84it [00:08, 9.83it/s] 85it [00:08, 9.82it/s] 86it [00:08, 9.83it/s] 87it [00:09, 9.83it/s] 88it [00:09, 9.83it/s] 89it [00:09, 9.81it/s] 90it [00:09, 9.78it/s] 91it [00:09, 9.81it/s] 92it [00:09, 9.81it/s] 93it [00:09, 9.81it/s] 94it [00:09, 9.83it/s] 95it [00:09, 9.65it/s] 96it [00:10, 9.63it/s] 97it [00:10, 9.72it/s] 98it [00:10, 9.76it/s] 99it [00:10, 9.73it/s] 100it [00:10, 9.76it/s]2025-05-26 03:54:20,114 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 15323.3848 | mean log_px -0.1767 | KL -3517.25 + 101it [00:10, 9.70it/s] 102it [00:10, 9.74it/s] 103it [00:10, 9.78it/s] 104it [00:10, 9.81it/s] 105it [00:10, 9.83it/s] 106it [00:11, 9.82it/s] 107it [00:11, 9.84it/s] 108it [00:11, 9.84it/s] 109it [00:11, 9.84it/s] 110it [00:11, 9.84it/s] 111it [00:11, 9.81it/s] 112it [00:11, 9.81it/s] 113it [00:11, 9.81it/s] 114it [00:11, 9.80it/s] 115it [00:11, 9.82it/s] 116it [00:12, 9.80it/s] 117it [00:12, 9.82it/s] 118it [00:12, 9.79it/s] 119it [00:12, 9.79it/s] 120it [00:12, 9.77it/s] 121it [00:12, 9.78it/s] 122it [00:12, 9.76it/s] 123it [00:12, 9.78it/s] 124it [00:12, 9.78it/s] 125it [00:12, 9.79it/s] 126it [00:13, 9.80it/s] 127it [00:13, 9.80it/s] 128it [00:13, 9.76it/s] 129it [00:13, 9.76it/s] 130it [00:13, 9.73it/s] 131it [00:13, 9.76it/s] 132it [00:13, 9.75it/s] 133it [00:13, 9.76it/s] 134it [00:13, 9.78it/s] 135it [00:14, 9.75it/s] 136it [00:14, 9.74it/s] 137it [00:14, 9.74it/s] 138it [00:14, 9.29it/s] 139it [00:14, 9.43it/s] 140it [00:14, 9.49it/s] 141it [00:14, 9.60it/s] 142it [00:14, 9.64it/s] 143it [00:14, 9.71it/s] 144it [00:14, 9.72it/s] 145it [00:15, 9.76it/s] 146it [00:15, 9.78it/s] 147it [00:15, 9.79it/s] 148it [00:15, 9.80it/s] 149it [00:15, 9.73it/s] 150it [00:15, 9.75it/s]2025-05-26 03:54:25,244 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 19223.7129 | mean log_px -0.2297 | KL -3526.62 + 151it [00:15, 9.74it/s] 152it [00:15, 9.73it/s] 153it [00:15, 9.75it/s] 154it [00:15, 9.74it/s] 155it [00:16, 9.73it/s] 156it [00:16, 9.73it/s] 157it [00:16, 9.75it/s] 158it [00:16, 9.74it/s] 159it [00:16, 9.76it/s] 160it [00:16, 9.74it/s] 161it [00:16, 9.75it/s] 162it [00:16, 9.76it/s] 163it [00:16, 9.78it/s] 164it [00:16, 9.61it/s] 165it [00:17, 9.68it/s] 166it [00:17, 9.72it/s] 167it [00:17, 9.77it/s] 168it [00:17, 9.79it/s] 169it [00:17, 9.80it/s] 170it [00:17, 9.56it/s] 171it [00:17, 9.64it/s] 172it [00:17, 9.53it/s] 173it [00:17, 9.65it/s] 174it [00:18, 9.71it/s] 175it [00:18, 9.78it/s] 176it [00:18, 9.76it/s] 177it [00:18, 9.23it/s] 178it [00:18, 9.39it/s] 179it [00:18, 9.51it/s] 180it [00:18, 9.61it/s] 181it [00:18, 9.33it/s] 182it [00:18, 9.46it/s] 183it [00:18, 9.58it/s] 184it [00:19, 9.64it/s] 185it [00:19, 9.69it/s] 186it [00:19, 9.70it/s] 187it [00:19, 9.74it/s] 188it [00:19, 9.74it/s] 189it [00:19, 9.74it/s] 190it [00:19, 9.60it/s] 191it [00:19, 8.92it/s] 192it [00:19, 9.12it/s] 193it [00:20, 9.23it/s] 194it [00:20, 9.40it/s] 195it [00:20, 8.51it/s] 196it [00:20, 9.59it/s] +2025-05-26 03:54:30,067 - INFO - Epoch: 7, Objective: tensor([11751.9316], device='cuda:0', grad_fn=), Loss: 0.11317390948534012, KL/n: 71.94717407226562 + 0it [00:00, ?it/s]2025-05-26 03:54:30,533 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 14055.2070 | mean log_px -0.1545 | KL -3523.18 + 1it [00:00, 5.27it/s] 2it [00:00, 7.21it/s] 3it [00:00, 8.22it/s] 4it [00:00, 8.70it/s] 5it [00:00, 8.99it/s] 6it [00:00, 9.23it/s] 7it [00:00, 9.40it/s] 8it [00:00, 9.54it/s] 9it [00:01, 9.64it/s] 10it [00:01, 9.69it/s] 11it [00:01, 9.74it/s] 12it [00:01, 9.74it/s] 13it [00:01, 9.80it/s] 14it [00:01, 9.77it/s] 15it [00:01, 9.82it/s] 16it [00:01, 9.80it/s] 17it [00:01, 9.81it/s] 18it [00:01, 9.79it/s] 19it [00:02, 9.81it/s] 20it [00:02, 9.74it/s] 21it [00:02, 9.78it/s] 22it [00:02, 9.77it/s] 23it [00:02, 9.77it/s] 24it [00:02, 9.75it/s] 25it [00:02, 9.59it/s] 26it [00:02, 9.30it/s] 27it [00:02, 9.34it/s] 28it [00:02, 9.41it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.52it/s] 31it [00:03, 9.56it/s] 32it [00:03, 9.59it/s] 33it [00:03, 9.62it/s] 34it [00:03, 9.62it/s] 35it [00:03, 9.63it/s] 36it [00:03, 9.60it/s] 37it [00:03, 9.60it/s] 38it [00:04, 9.60it/s] 39it [00:04, 9.66it/s] 40it [00:04, 9.70it/s] 41it [00:04, 9.10it/s] 42it [00:04, 9.29it/s] 43it [00:04, 9.43it/s] 44it [00:04, 9.54it/s] 45it [00:04, 9.63it/s] 46it [00:04, 9.67it/s] 47it [00:04, 9.75it/s] 48it [00:05, 9.77it/s] 49it [00:05, 9.81it/s] 50it [00:05, 9.81it/s]2025-05-26 03:54:35,708 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 12810.5664 | mean log_px -0.1418 | KL -3528.74 + 51it [00:05, 9.82it/s] 52it [00:05, 9.84it/s] 53it [00:05, 9.86it/s] 54it [00:05, 9.87it/s] 55it [00:05, 9.21it/s] 56it [00:05, 9.36it/s] 57it [00:05, 9.51it/s] 58it [00:06, 9.62it/s] 59it [00:06, 9.69it/s] 60it [00:06, 9.71it/s] 61it [00:06, 9.72it/s] 62it [00:06, 9.74it/s] 63it [00:06, 9.79it/s] 64it [00:06, 9.78it/s] 65it [00:06, 9.79it/s] 66it [00:06, 9.80it/s] 67it [00:07, 9.83it/s] 68it [00:07, 9.82it/s] 69it [00:07, 9.83it/s] 70it [00:07, 9.83it/s] 71it [00:07, 9.33it/s] 72it [00:07, 9.45it/s] 73it [00:07, 9.51it/s] 74it [00:07, 9.61it/s] 75it [00:07, 9.05it/s] 76it [00:07, 9.25it/s] 77it [00:08, 9.40it/s] 78it [00:08, 9.55it/s] 79it [00:08, 9.05it/s] 80it [00:08, 9.20it/s] 81it [00:08, 9.36it/s] 82it [00:08, 9.47it/s] 83it [00:08, 9.57it/s] 84it [00:08, 9.66it/s] 85it [00:08, 9.73it/s] 86it [00:09, 9.79it/s] 87it [00:09, 9.78it/s] 88it [00:09, 9.80it/s] 89it [00:09, 9.83it/s] 90it [00:09, 9.82it/s] 91it [00:09, 9.84it/s] 92it [00:09, 9.72it/s] 93it [00:09, 9.76it/s] 94it [00:09, 9.75it/s] 95it [00:09, 9.76it/s] 96it [00:10, 9.75it/s] 97it [00:10, 9.29it/s] 98it [00:10, 9.42it/s] 99it [00:10, 9.51it/s] 100it [00:10, 9.58it/s]2025-05-26 03:54:40,914 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 9847.4746 | mean log_px -0.0930 | KL -3528.36 + 101it [00:10, 9.66it/s] 102it [00:10, 9.71it/s] 103it [00:10, 9.77it/s] 104it [00:10, 9.80it/s] 105it [00:10, 9.84it/s] 106it [00:11, 9.85it/s] 107it [00:11, 9.81it/s] 108it [00:11, 9.78it/s] 109it [00:11, 9.79it/s] 110it [00:11, 9.79it/s] 111it [00:11, 9.78it/s] 112it [00:11, 9.78it/s] 113it [00:11, 9.82it/s] 114it [00:11, 9.82it/s] 115it [00:11, 9.83it/s] 116it [00:12, 9.82it/s] 117it [00:12, 9.82it/s] 118it [00:12, 9.80it/s] 119it [00:12, 9.82it/s] 120it [00:12, 9.82it/s] 121it [00:12, 9.80it/s] 122it [00:12, 9.80it/s] 123it [00:12, 9.81it/s] 124it [00:12, 9.81it/s] 125it [00:13, 9.82it/s] 126it [00:13, 9.80it/s] 127it [00:13, 9.82it/s] 128it [00:13, 9.31it/s] 129it [00:13, 9.47it/s] 130it [00:13, 9.56it/s] 131it [00:13, 9.61it/s] 132it [00:13, 9.67it/s] 133it [00:13, 9.74it/s] 134it [00:13, 9.75it/s] 135it [00:14, 9.77it/s] 136it [00:14, 9.80it/s] 137it [00:14, 9.07it/s] 138it [00:14, 9.12it/s] 139it [00:14, 9.32it/s] 140it [00:14, 9.45it/s] 141it [00:14, 9.56it/s] 142it [00:14, 9.19it/s] 143it [00:14, 9.37it/s] 144it [00:15, 9.49it/s] 145it [00:15, 9.60it/s] 146it [00:15, 9.65it/s] 147it [00:15, 9.71it/s] 148it [00:15, 9.75it/s] 149it [00:15, 9.79it/s] 150it [00:15, 9.77it/s]2025-05-26 03:54:46,076 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 11725.8896 | mean log_px -0.1225 | KL -3532.75 + 151it [00:15, 9.78it/s] 152it [00:15, 9.79it/s] 153it [00:15, 9.77it/s] 154it [00:16, 9.77it/s] 155it [00:16, 9.78it/s] 156it [00:16, 9.80it/s] 157it [00:16, 9.80it/s] 158it [00:16, 9.79it/s] 159it [00:16, 9.68it/s] 160it [00:16, 9.72it/s] 161it [00:16, 9.77it/s] 162it [00:16, 9.79it/s] 163it [00:16, 9.80it/s] 164it [00:17, 9.79it/s] 165it [00:17, 9.83it/s] 166it [00:17, 9.83it/s] 167it [00:17, 9.32it/s] 168it [00:17, 9.42it/s] 169it [00:17, 9.54it/s] 170it [00:17, 9.09it/s] 171it [00:17, 9.31it/s] 172it [00:17, 9.44it/s] 173it [00:18, 9.04it/s] 174it [00:18, 9.24it/s] 175it [00:18, 9.43it/s] 176it [00:18, 9.44it/s] 177it [00:18, 9.56it/s] 178it [00:18, 9.64it/s] 179it [00:18, 9.72it/s] 180it [00:18, 9.77it/s] 181it [00:18, 9.82it/s] 182it [00:18, 9.77it/s] 183it [00:19, 9.79it/s] 184it [00:19, 9.79it/s] 185it [00:19, 9.77it/s] 186it [00:19, 9.81it/s] 187it [00:19, 9.83it/s] 188it [00:19, 9.80it/s] 189it [00:19, 9.78it/s] 190it [00:19, 9.47it/s] 191it [00:19, 8.94it/s] 192it [00:20, 9.19it/s] 193it [00:20, 9.39it/s] 194it [00:20, 9.49it/s] 195it [00:20, 8.61it/s] 196it [00:20, 9.55it/s] +2025-05-26 03:54:50,907 - INFO - Epoch: 8, Objective: tensor([19531.0215], device='cuda:0', grad_fn=), Loss: 0.22876138985157013, KL/n: 72.13713073730469 + 0it [00:00, ?it/s]2025-05-26 03:54:51,182 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 15139.6064 | mean log_px -0.1711 | KL -3532.32 + 1it [00:00, 5.38it/s] 2it [00:00, 7.25it/s] 3it [00:00, 8.27it/s] 4it [00:00, 8.84it/s] 5it [00:00, 9.18it/s] 6it [00:00, 9.37it/s] 7it [00:00, 9.54it/s] 8it [00:00, 9.62it/s] 9it [00:01, 9.68it/s] 10it [00:01, 9.74it/s] 11it [00:01, 9.78it/s] 12it [00:01, 9.77it/s] 13it [00:01, 9.77it/s] 14it [00:01, 9.78it/s] 15it [00:01, 9.79it/s] 16it [00:01, 9.77it/s] 17it [00:01, 9.29it/s] 18it [00:01, 9.41it/s] 19it [00:02, 9.55it/s] 20it [00:02, 9.60it/s] 21it [00:02, 9.69it/s] 22it [00:02, 9.70it/s] 23it [00:02, 9.73it/s] 24it [00:02, 9.76it/s] 25it [00:02, 9.76it/s] 26it [00:02, 9.26it/s] 27it [00:02, 9.42it/s] 28it [00:02, 9.55it/s] 29it [00:03, 9.63it/s] 30it [00:03, 9.68it/s] 31it [00:03, 9.72it/s] 32it [00:03, 9.74it/s] 33it [00:03, 9.78it/s] 34it [00:03, 9.30it/s] 35it [00:03, 9.43it/s] 36it [00:03, 9.54it/s] 37it [00:03, 9.64it/s] 38it [00:04, 9.15it/s] 39it [00:04, 8.90it/s] 40it [00:04, 9.13it/s] 41it [00:04, 9.31it/s] 42it [00:04, 9.48it/s] 43it [00:04, 9.62it/s] 44it [00:04, 9.67it/s] 45it [00:04, 9.75it/s] 46it [00:04, 9.11it/s] 47it [00:04, 9.34it/s] 48it [00:05, 9.50it/s] 49it [00:05, 9.62it/s] 50it [00:05, 9.69it/s]2025-05-26 03:54:56,392 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 10535.8184 | mean log_px -0.1103 | KL -3535.26 + 51it [00:05, 9.74it/s] 52it [00:05, 9.77it/s] 53it [00:05, 9.83it/s] 54it [00:05, 9.85it/s] 55it [00:05, 9.82it/s] 56it [00:05, 9.82it/s] 57it [00:06, 9.78it/s] 58it [00:06, 9.82it/s] 59it [00:06, 9.85it/s] 60it [00:06, 9.83it/s] 61it [00:06, 9.86it/s] 62it [00:06, 9.87it/s] 63it [00:06, 9.37it/s] 64it [00:06, 9.49it/s] 65it [00:06, 9.52it/s] 66it [00:06, 9.64it/s] 67it [00:07, 9.71it/s] 68it [00:07, 9.72it/s] 69it [00:07, 9.73it/s] 70it [00:07, 9.73it/s] 71it [00:07, 9.12it/s] 72it [00:07, 9.31it/s] 73it [00:07, 9.47it/s] 74it [00:07, 9.58it/s] 75it [00:07, 9.65it/s] 76it [00:07, 9.72it/s] 77it [00:08, 9.78it/s] 78it [00:08, 9.77it/s] 79it [00:08, 9.77it/s] 80it [00:08, 9.79it/s] 81it [00:08, 9.83it/s] 82it [00:08, 9.85it/s] 83it [00:08, 9.85it/s] 84it [00:08, 9.86it/s] 85it [00:08, 9.84it/s] 86it [00:08, 9.82it/s] 87it [00:09, 9.83it/s] 88it [00:09, 9.82it/s] 89it [00:09, 9.84it/s] 90it [00:09, 9.84it/s] 91it [00:09, 9.79it/s] 92it [00:09, 9.09it/s] 93it [00:09, 8.84it/s] 94it [00:09, 8.50it/s] 95it [00:09, 8.85it/s] 96it [00:10, 9.10it/s] 97it [00:10, 9.28it/s] 98it [00:10, 8.92it/s] 99it [00:10, 9.12it/s] 100it [00:10, 9.23it/s]2025-05-26 03:55:01,623 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 12649.1650 | mean log_px -0.1434 | KL -3534.93 + 101it [00:10, 9.25it/s] 102it [00:10, 9.30it/s] 103it [00:10, 9.40it/s] 104it [00:10, 9.52it/s] 105it [00:11, 9.61it/s] 106it [00:11, 9.66it/s] 107it [00:11, 9.54it/s] 108it [00:11, 9.61it/s] 109it [00:11, 9.26it/s] 110it [00:11, 9.30it/s] 111it [00:11, 9.22it/s] 112it [00:11, 8.71it/s] 113it [00:11, 8.83it/s] 114it [00:12, 9.10it/s] 115it [00:12, 9.30it/s] 116it [00:12, 8.97it/s] 117it [00:12, 9.22it/s] 118it [00:12, 9.34it/s] 119it [00:12, 8.97it/s] 120it [00:12, 9.20it/s] 121it [00:12, 9.40it/s] 122it [00:12, 9.46it/s] 123it [00:12, 9.58it/s] 124it [00:13, 9.65it/s] 125it [00:13, 9.14it/s] 126it [00:13, 9.33it/s] 127it [00:13, 9.49it/s] 128it [00:13, 9.59it/s] 129it [00:13, 9.68it/s] 130it [00:13, 9.72it/s] 131it [00:13, 9.76it/s] 132it [00:13, 9.78it/s] 133it [00:14, 9.81it/s] 134it [00:14, 9.81it/s] 135it [00:14, 9.84it/s] 136it [00:14, 9.83it/s] 137it [00:14, 9.84it/s] 138it [00:14, 9.84it/s] 139it [00:14, 9.26it/s] 140it [00:14, 9.39it/s] 141it [00:14, 9.51it/s] 142it [00:14, 9.60it/s] 143it [00:15, 9.13it/s] 144it [00:15, 9.32it/s] 145it [00:15, 9.49it/s] 146it [00:15, 9.58it/s] 147it [00:15, 9.65it/s] 148it [00:15, 9.70it/s] 149it [00:15, 9.75it/s] 150it [00:15, 9.76it/s]2025-05-26 03:55:06,897 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 14599.3418 | mean log_px -0.1665 | KL -3540.62 + 151it [00:15, 9.19it/s] 152it [00:16, 9.37it/s] 153it [00:16, 9.48it/s] 154it [00:16, 9.58it/s] 155it [00:16, 9.66it/s] 156it [00:16, 9.71it/s] 157it [00:16, 9.75it/s] 158it [00:16, 9.76it/s] 159it [00:16, 9.79it/s] 160it [00:16, 9.80it/s] 161it [00:16, 9.81it/s] 162it [00:17, 9.81it/s] 163it [00:17, 9.82it/s] 164it [00:17, 9.82it/s] 165it [00:17, 9.83it/s] 166it [00:17, 9.81it/s] 167it [00:17, 9.82it/s] 168it [00:17, 9.81it/s] 169it [00:17, 9.83it/s] 170it [00:17, 9.83it/s] 171it [00:17, 9.28it/s] 172it [00:18, 9.43it/s] 173it [00:18, 9.55it/s] 174it [00:18, 9.63it/s] 175it [00:18, 9.70it/s] 176it [00:18, 9.73it/s] 177it [00:18, 9.54it/s] 178it [00:18, 9.62it/s] 179it [00:18, 9.27it/s] 180it [00:18, 9.41it/s] 181it [00:19, 8.96it/s] 182it [00:19, 9.12it/s] 183it [00:19, 9.30it/s] 184it [00:19, 9.43it/s] 185it [00:19, 9.44it/s] 186it [00:19, 8.89it/s] 187it [00:19, 9.16it/s] 188it [00:19, 9.35it/s] 189it [00:19, 9.48it/s] 190it [00:19, 9.62it/s] 191it [00:20, 9.09it/s] 192it [00:20, 9.15it/s] 193it [00:20, 9.37it/s] 194it [00:20, 9.51it/s] 195it [00:20, 9.13it/s] 196it [00:20, 9.48it/s] +2025-05-26 03:55:11,724 - INFO - Epoch: 9, Objective: tensor([12982.9697], device='cuda:0', grad_fn=), Loss: 0.14898112416267395, KL/n: 72.30970001220703 + 0it [00:00, ?it/s]2025-05-26 03:55:12,182 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 13698.6484 | mean log_px -0.1451 | KL -3541.10 + 1it [00:00, 4.63it/s] 2it [00:00, 6.71it/s] 4it [00:00, 8.46it/s] 6it [00:00, 9.14it/s] 8it [00:00, 9.09it/s] 10it [00:01, 9.42it/s] 12it [00:01, 9.63it/s] 14it [00:01, 9.76it/s] 15it [00:01, 9.74it/s] 16it [00:01, 9.76it/s] 17it [00:01, 9.80it/s] 18it [00:01, 9.84it/s] 19it [00:02, 9.34it/s] 20it [00:02, 9.50it/s] 21it [00:02, 9.61it/s] 22it [00:02, 9.71it/s] 23it [00:02, 9.20it/s] 24it [00:02, 9.39it/s] 25it [00:02, 9.56it/s] 26it [00:02, 9.68it/s] 27it [00:02, 9.19it/s] 29it [00:03, 9.59it/s] 30it [00:03, 9.67it/s] 32it [00:03, 9.83it/s] 34it [00:03, 9.60it/s] 36it [00:03, 9.76it/s] 38it [00:04, 9.85it/s] 40it [00:04, 9.92it/s] 42it [00:04, 9.96it/s] 44it [00:04, 10.00it/s] 46it [00:04, 10.01it/s] 48it [00:05, 10.03it/s] 50it [00:05, 10.01it/s]2025-05-26 03:55:17,313 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 15355.1699 | mean log_px -0.1796 | KL -3543.84 + 52it [00:05, 10.00it/s] 53it [00:05, 9.99it/s] 55it [00:05, 10.02it/s] 57it [00:05, 10.01it/s] 59it [00:06, 10.03it/s] 61it [00:06, 9.75it/s] 62it [00:06, 9.77it/s] 63it [00:06, 9.81it/s] 64it [00:06, 9.79it/s] 65it [00:06, 9.84it/s] 66it [00:06, 9.86it/s] 67it [00:06, 9.86it/s] 69it [00:07, 9.96it/s] 70it [00:07, 9.95it/s] 71it [00:07, 9.94it/s] 72it [00:07, 9.89it/s] 73it [00:07, 9.41it/s] 74it [00:07, 9.51it/s] 75it [00:07, 9.64it/s] 76it [00:07, 9.73it/s] 78it [00:08, 9.87it/s] 79it [00:08, 9.89it/s] 80it [00:08, 9.90it/s] 81it [00:08, 9.91it/s] 82it [00:08, 9.91it/s] 84it [00:08, 9.95it/s] 85it [00:08, 9.53it/s] 86it [00:08, 9.62it/s] 87it [00:08, 9.69it/s] 89it [00:09, 9.84it/s] 90it [00:09, 9.86it/s] 91it [00:09, 9.89it/s] 92it [00:09, 9.92it/s] 94it [00:09, 9.98it/s] 95it [00:09, 9.98it/s] 96it [00:09, 9.98it/s] 97it [00:09, 9.97it/s] 98it [00:10, 9.98it/s] 100it [00:10, 10.02it/s]2025-05-26 03:55:22,383 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 10181.3457 | mean log_px -0.1026 | KL -3547.27 + 102it [00:10, 9.98it/s] 104it [00:10, 10.00it/s] 105it [00:10, 9.99it/s] 106it [00:10, 9.99it/s] 107it [00:10, 9.95it/s] 109it [00:11, 9.99it/s] 110it [00:11, 9.94it/s] 111it [00:11, 9.93it/s] 113it [00:11, 9.99it/s] 114it [00:11, 9.98it/s] 116it [00:11, 10.03it/s] 118it [00:12, 10.05it/s] 120it [00:12, 9.67it/s] 122it [00:12, 9.81it/s] 124it [00:12, 9.90it/s] 126it [00:12, 9.94it/s] 128it [00:13, 9.91it/s] 129it [00:13, 9.86it/s] 130it [00:13, 9.89it/s] 131it [00:13, 9.64it/s] 132it [00:13, 9.69it/s] 133it [00:13, 9.73it/s] 134it [00:13, 9.79it/s] 135it [00:13, 9.79it/s] 136it [00:13, 9.79it/s] 137it [00:14, 9.84it/s] 138it [00:14, 9.79it/s] 139it [00:14, 9.80it/s] 140it [00:14, 9.75it/s] 141it [00:14, 9.82it/s] 142it [00:14, 9.74it/s] 143it [00:14, 9.26it/s] 144it [00:14, 9.41it/s] 145it [00:14, 9.57it/s] 146it [00:14, 9.61it/s] 147it [00:15, 9.64it/s] 148it [00:15, 9.05it/s] 149it [00:15, 9.21it/s] 150it [00:15, 9.36it/s]2025-05-26 03:55:27,507 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 12556.6738 | mean log_px -0.1344 | KL -3543.33 + 151it [00:15, 9.45it/s] 152it [00:15, 9.55it/s] 153it [00:15, 9.62it/s] 154it [00:15, 9.66it/s] 155it [00:15, 9.71it/s] 156it [00:16, 9.77it/s] 157it [00:16, 9.69it/s] 158it [00:16, 9.67it/s] 159it [00:16, 9.69it/s] 160it [00:16, 9.60it/s] 161it [00:16, 9.62it/s] 162it [00:16, 9.62it/s] 163it [00:16, 9.70it/s] 164it [00:16, 9.77it/s] 165it [00:16, 9.78it/s] 166it [00:17, 9.79it/s] 167it [00:17, 9.83it/s] 168it [00:17, 9.82it/s] 169it [00:17, 9.84it/s] 170it [00:17, 9.86it/s] 172it [00:17, 9.93it/s] 173it [00:17, 9.84it/s] 174it [00:17, 9.85it/s] 175it [00:17, 9.85it/s] 176it [00:18, 9.88it/s] 177it [00:18, 9.88it/s] 178it [00:18, 9.86it/s] 179it [00:18, 9.89it/s] 180it [00:18, 9.91it/s] 181it [00:18, 9.93it/s] 182it [00:18, 9.41it/s] 183it [00:18, 9.53it/s] 184it [00:18, 9.61it/s] 185it [00:18, 9.68it/s] 186it [00:19, 9.71it/s] 187it [00:19, 9.73it/s] 188it [00:19, 9.78it/s] 189it [00:19, 9.78it/s] 190it [00:19, 9.82it/s] 191it [00:19, 9.86it/s] 192it [00:19, 9.84it/s] 193it [00:19, 9.80it/s] 194it [00:19, 9.78it/s] 195it [00:20, 8.68it/s] 196it [00:20, 8.84it/s] 196it [00:20, 9.69it/s] +2025-05-26 03:55:32,265 - INFO - Epoch: 10, Objective: tensor([15107.3916], device='cuda:0', grad_fn=), Loss: 0.16303861141204834, KL/n: 72.43524169921875 + 0it [00:00, ?it/s]2025-05-26 03:55:32,556 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 10246.0049 | mean log_px -0.1013 | KL -3548.55 + 1it [00:00, 5.04it/s] 2it [00:00, 6.50it/s] 3it [00:00, 7.68it/s] 4it [00:00, 8.37it/s] 5it [00:00, 8.35it/s] 6it [00:00, 8.74it/s] 7it [00:00, 8.99it/s] 8it [00:00, 8.62it/s] 9it [00:01, 8.95it/s] 10it [00:01, 9.19it/s] 11it [00:01, 9.41it/s] 12it [00:01, 9.56it/s] 13it [00:01, 9.68it/s] 14it [00:01, 9.70it/s] 15it [00:01, 9.78it/s] 16it [00:01, 9.82it/s] 17it [00:01, 9.85it/s] 18it [00:01, 9.86it/s] 19it [00:02, 9.85it/s] 20it [00:02, 9.80it/s] 21it [00:02, 9.21it/s] 22it [00:02, 9.35it/s] 23it [00:02, 9.46it/s] 24it [00:02, 9.57it/s] 26it [00:02, 9.79it/s] 27it [00:02, 9.82it/s] 28it [00:03, 9.87it/s] 30it [00:03, 9.94it/s] 31it [00:03, 9.94it/s] 32it [00:03, 9.92it/s] 33it [00:03, 9.93it/s] 34it [00:03, 9.90it/s] 35it [00:03, 9.90it/s] 36it [00:03, 9.92it/s] 37it [00:03, 9.92it/s] 38it [00:04, 9.87it/s] 39it [00:04, 9.75it/s] 40it [00:04, 9.73it/s] 41it [00:04, 9.78it/s] 42it [00:04, 9.82it/s] 43it [00:04, 9.87it/s] 44it [00:04, 9.89it/s] 45it [00:04, 9.88it/s] 46it [00:04, 9.89it/s] 47it [00:04, 9.92it/s] 48it [00:05, 9.89it/s] 49it [00:05, 9.90it/s] 50it [00:05, 9.40it/s]2025-05-26 03:55:37,736 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 13919.8701 | mean log_px -0.1529 | KL -3551.17 + 51it [00:05, 9.49it/s] 52it [00:05, 9.60it/s] 53it [00:05, 9.69it/s] 54it [00:05, 9.72it/s] 55it [00:05, 9.27it/s] 56it [00:05, 9.40it/s] 57it [00:06, 9.54it/s] 58it [00:06, 9.63it/s] 59it [00:06, 9.70it/s] 60it [00:06, 9.74it/s] 61it [00:06, 9.78it/s] 62it [00:06, 9.80it/s] 63it [00:06, 9.84it/s] 64it [00:06, 9.85it/s] 65it [00:06, 9.88it/s] 66it [00:06, 9.86it/s] 67it [00:07, 9.87it/s] 68it [00:07, 9.83it/s] 69it [00:07, 9.87it/s] 70it [00:07, 9.87it/s] 72it [00:07, 9.89it/s] 73it [00:07, 9.88it/s] 74it [00:07, 9.88it/s] 75it [00:07, 9.84it/s] 76it [00:07, 9.86it/s] 77it [00:08, 9.50it/s] 78it [00:08, 9.62it/s] 79it [00:08, 9.69it/s] 80it [00:08, 9.72it/s] 81it [00:08, 9.74it/s] 82it [00:08, 9.79it/s] 83it [00:08, 9.80it/s] 84it [00:08, 9.81it/s] 85it [00:08, 9.21it/s] 86it [00:08, 9.38it/s] 87it [00:09, 9.45it/s] 88it [00:09, 9.53it/s] 89it [00:09, 9.03it/s] 90it [00:09, 9.27it/s] 91it [00:09, 9.46it/s] 92it [00:09, 9.55it/s] 93it [00:09, 9.08it/s] 94it [00:09, 9.27it/s] 95it [00:09, 9.44it/s] 96it [00:10, 9.56it/s] 97it [00:10, 9.07it/s] 98it [00:10, 9.25it/s] 99it [00:10, 9.45it/s] 100it [00:10, 9.56it/s]2025-05-26 03:55:42,936 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 11395.6230 | mean log_px -0.1321 | KL -3551.43 + 101it [00:10, 9.03it/s] 102it [00:10, 9.24it/s] 103it [00:10, 9.40it/s] 104it [00:10, 9.49it/s] 105it [00:11, 8.97it/s] 106it [00:11, 9.15it/s] 107it [00:11, 9.36it/s] 108it [00:11, 9.49it/s] 109it [00:11, 9.04it/s] 110it [00:11, 9.23it/s] 111it [00:11, 9.42it/s] 112it [00:11, 9.56it/s] 113it [00:11, 9.07it/s] 114it [00:11, 9.27it/s] 115it [00:12, 9.44it/s] 116it [00:12, 9.47it/s] 117it [00:12, 8.99it/s] 118it [00:12, 9.17it/s] 119it [00:12, 9.31it/s] 120it [00:12, 9.47it/s] 121it [00:12, 9.62it/s] 122it [00:12, 9.72it/s] 123it [00:12, 9.76it/s] 124it [00:13, 9.81it/s] 125it [00:13, 9.18it/s] 126it [00:13, 9.28it/s] 127it [00:13, 9.46it/s] 128it [00:13, 9.61it/s] 129it [00:13, 9.70it/s] 131it [00:13, 9.85it/s] 132it [00:13, 9.84it/s] 133it [00:13, 9.26it/s] 134it [00:14, 9.41it/s] 135it [00:14, 9.54it/s] 136it [00:14, 9.63it/s] 137it [00:14, 9.14it/s] 138it [00:14, 9.30it/s] 139it [00:14, 9.45it/s] 140it [00:14, 9.57it/s] 141it [00:14, 9.04it/s] 142it [00:14, 9.25it/s] 143it [00:15, 9.43it/s] 144it [00:15, 9.50it/s] 145it [00:15, 9.00it/s] 146it [00:15, 9.19it/s] 147it [00:15, 9.41it/s] 148it [00:15, 9.39it/s] 149it [00:15, 9.56it/s]2025-05-26 03:55:48,255 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 14350.5879 | mean log_px -0.1595 | KL -3548.78 + 151it [00:15, 9.77it/s] 153it [00:16, 9.88it/s] 155it [00:16, 9.95it/s] 156it [00:16, 9.96it/s] 158it [00:16, 10.01it/s] 160it [00:16, 10.02it/s] 162it [00:16, 10.02it/s] 164it [00:17, 9.68it/s] 166it [00:17, 9.80it/s] 167it [00:17, 9.82it/s] 169it [00:17, 9.90it/s] 170it [00:17, 9.90it/s] 172it [00:18, 9.96it/s] 174it [00:18, 9.99it/s] 176it [00:18, 9.59it/s] 178it [00:18, 9.73it/s] 180it [00:18, 9.84it/s] 182it [00:19, 9.91it/s] 183it [00:19, 9.62it/s] 184it [00:19, 9.69it/s] 186it [00:19, 9.41it/s] 188it [00:19, 9.65it/s] 190it [00:19, 9.79it/s] 191it [00:19, 9.38it/s] 192it [00:20, 9.50it/s] 194it [00:20, 9.72it/s] 195it [00:20, 9.03it/s] 196it [00:20, 9.52it/s] +2025-05-26 03:55:52,984 - INFO - Epoch: 11, Objective: tensor([10451.8135], device='cuda:0', grad_fn=), Loss: 0.1001165509223938, KL/n: 72.5517807006836 + 0it [00:00, ?it/s]2025-05-26 03:55:53,430 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 8402.5049 | mean log_px -0.0712 | KL -3554.51 + 1it [00:00, 5.55it/s] 2it [00:00, 7.46it/s] 4it [00:00, 8.48it/s] 6it [00:00, 9.18it/s] 8it [00:00, 9.14it/s] 9it [00:01, 9.05it/s] 10it [00:01, 9.26it/s] 11it [00:01, 9.43it/s] 12it [00:01, 9.14it/s] 13it [00:01, 9.29it/s] 15it [00:01, 9.64it/s] 16it [00:01, 9.59it/s] 17it [00:01, 9.60it/s] 18it [00:01, 9.68it/s] 19it [00:02, 9.57it/s] 20it [00:02, 9.09it/s] 21it [00:02, 9.22it/s] 22it [00:02, 9.35it/s] 23it [00:02, 9.48it/s] 24it [00:02, 9.60it/s] 25it [00:02, 9.69it/s] 26it [00:02, 9.74it/s] 27it [00:02, 9.82it/s] 28it [00:03, 9.20it/s] 30it [00:03, 9.59it/s] 31it [00:03, 9.67it/s] 33it [00:03, 9.84it/s] 35it [00:03, 9.94it/s] 36it [00:03, 9.48it/s] 38it [00:04, 9.69it/s] 40it [00:04, 9.83it/s] 41it [00:04, 9.53it/s] 43it [00:04, 9.73it/s] 44it [00:04, 9.45it/s] 45it [00:04, 9.56it/s] 47it [00:04, 9.43it/s] 49it [00:05, 9.66it/s] 50it [00:05, 9.30it/s]2025-05-26 03:55:58,671 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 10922.4316 | mean log_px -0.1087 | KL -3553.06 + 51it [00:05, 9.43it/s] 53it [00:05, 9.68it/s] 54it [00:05, 9.38it/s] 56it [00:05, 9.64it/s] 57it [00:06, 9.25it/s] 59it [00:06, 9.56it/s] 61it [00:06, 9.65it/s] 62it [00:06, 9.67it/s] 64it [00:06, 9.82it/s] 65it [00:06, 9.42it/s] 67it [00:07, 9.66it/s] 68it [00:07, 9.72it/s] 69it [00:07, 9.33it/s] 70it [00:07, 9.47it/s] 71it [00:07, 9.60it/s] 72it [00:07, 9.70it/s] 73it [00:07, 9.22it/s] 75it [00:07, 9.59it/s] 76it [00:08, 9.68it/s] 77it [00:08, 9.17it/s] 78it [00:08, 9.31it/s] 79it [00:08, 9.43it/s] 80it [00:08, 9.50it/s] 81it [00:08, 9.42it/s] 82it [00:08, 9.36it/s] 83it [00:08, 9.32it/s] 84it [00:08, 8.79it/s] 85it [00:09, 8.94it/s] 86it [00:09, 9.03it/s] 87it [00:09, 9.19it/s] 88it [00:09, 8.84it/s] 90it [00:09, 9.39it/s] 92it [00:09, 9.66it/s] 93it [00:09, 9.28it/s] 95it [00:10, 9.47it/s] 96it [00:10, 9.48it/s] 97it [00:10, 9.48it/s] 98it [00:10, 9.54it/s] 99it [00:10, 9.61it/s] 100it [00:10, 9.13it/s]2025-05-26 03:56:03,973 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 11670.1055 | mean log_px -0.1183 | KL -3560.71 + 101it [00:10, 9.27it/s] 102it [00:10, 9.39it/s] 103it [00:10, 9.49it/s] 104it [00:11, 8.99it/s] 105it [00:11, 9.23it/s] 106it [00:11, 9.40it/s] 107it [00:11, 9.43it/s] 108it [00:11, 8.94it/s] 110it [00:11, 9.43it/s] 112it [00:11, 9.25it/s] 114it [00:12, 9.54it/s] 115it [00:12, 9.63it/s] 116it [00:12, 9.25it/s] 118it [00:12, 9.57it/s] 119it [00:12, 9.65it/s] 120it [00:12, 9.25it/s] 122it [00:12, 9.57it/s] 124it [00:13, 9.76it/s] 126it [00:13, 9.87it/s] 128it [00:13, 9.92it/s] 130it [00:13, 9.98it/s] 131it [00:13, 9.59it/s] 133it [00:14, 9.74it/s] 135it [00:14, 9.85it/s] 136it [00:14, 9.88it/s] 138it [00:14, 9.94it/s] 140it [00:14, 9.99it/s] 141it [00:14, 9.99it/s] 142it [00:14, 9.50it/s] 144it [00:15, 9.71it/s] 146it [00:15, 9.47it/s] 148it [00:15, 9.67it/s] 150it [00:15, 9.81it/s]2025-05-26 03:56:09,151 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 9823.7705 | mean log_px -0.0984 | KL -3558.63 + 151it [00:15, 9.45it/s] 153it [00:16, 9.66it/s] 155it [00:16, 9.80it/s] 156it [00:16, 9.43it/s] 158it [00:16, 9.65it/s] 159it [00:16, 9.68it/s] 161it [00:16, 9.81it/s] 163it [00:17, 9.53it/s] 164it [00:17, 9.62it/s] 165it [00:17, 9.60it/s] 166it [00:17, 9.69it/s] 167it [00:17, 9.25it/s] 168it [00:17, 9.42it/s] 170it [00:17, 9.67it/s] 171it [00:18, 9.27it/s] 172it [00:18, 9.43it/s] 174it [00:18, 9.70it/s] 176it [00:18, 9.83it/s] 178it [00:18, 9.90it/s] 180it [00:18, 9.95it/s] 182it [00:19, 9.98it/s] 183it [00:19, 9.98it/s] 184it [00:19, 9.98it/s] 186it [00:19, 9.99it/s] 188it [00:19, 10.02it/s] 190it [00:19, 10.03it/s] 192it [00:20, 10.04it/s] 194it [00:20, 10.04it/s] 196it [00:20, 9.77it/s] 196it [00:20, 9.52it/s] +2025-05-26 03:56:13,878 - INFO - Epoch: 12, Objective: tensor([11959.2480], device='cuda:0', grad_fn=), Loss: 0.12528853118419647, KL/n: 72.63204193115234 + 0it [00:00, ?it/s]2025-05-26 03:56:14,160 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 10673.3086 | mean log_px -0.1125 | KL -3559.28 + 1it [00:00, 4.72it/s] 2it [00:00, 6.80it/s] 4it [00:00, 8.03it/s] 6it [00:00, 8.86it/s] 8it [00:00, 9.31it/s] 10it [00:01, 9.59it/s] 11it [00:01, 9.67it/s] 12it [00:01, 9.73it/s] 14it [00:01, 9.87it/s] 16it [00:01, 9.95it/s] 18it [00:01, 10.00it/s] 20it [00:02, 10.03it/s] 22it [00:02, 10.06it/s] 24it [00:02, 10.07it/s] 26it [00:02, 10.09it/s] 28it [00:02, 10.08it/s] 30it [00:03, 9.74it/s] 32it [00:03, 9.86it/s] 34it [00:03, 9.92it/s] 36it [00:03, 9.97it/s] 38it [00:03, 10.00it/s] 40it [00:04, 10.03it/s] 42it [00:04, 10.05it/s] 44it [00:04, 10.06it/s] 46it [00:04, 10.07it/s] 48it [00:04, 10.09it/s] 50it [00:05, 10.09it/s]2025-05-26 03:56:19,194 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 14811.1055 | mean log_px -0.1740 | KL -3564.73 + 52it [00:05, 10.08it/s] 54it [00:05, 10.08it/s] 56it [00:05, 10.09it/s] 58it [00:05, 10.09it/s] 60it [00:06, 10.10it/s] 62it [00:06, 10.08it/s] 64it [00:06, 10.07it/s] 66it [00:06, 9.74it/s] 68it [00:06, 9.83it/s] 70it [00:07, 9.58it/s] 72it [00:07, 9.72it/s] 74it [00:07, 9.83it/s] 75it [00:07, 9.48it/s] 77it [00:07, 9.68it/s] 79it [00:08, 9.75it/s] 80it [00:08, 9.80it/s] 82it [00:08, 9.55it/s] 83it [00:08, 9.63it/s] 84it [00:08, 9.71it/s] 85it [00:08, 9.27it/s] 86it [00:08, 9.37it/s] 88it [00:09, 9.64it/s] 90it [00:09, 9.80it/s] 92it [00:09, 9.89it/s] 93it [00:09, 9.89it/s] 94it [00:09, 9.83it/s] 95it [00:09, 9.82it/s] 96it [00:09, 9.82it/s] 97it [00:09, 9.84it/s] 98it [00:10, 9.85it/s] 99it [00:10, 9.88it/s] 100it [00:10, 9.80it/s]2025-05-26 03:56:24,307 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 11084.1914 | mean log_px -0.1101 | KL -3557.34 + 101it [00:10, 9.46it/s] 102it [00:10, 9.32it/s] 103it [00:10, 9.50it/s] 104it [00:10, 9.44it/s] 105it [00:10, 9.48it/s] 106it [00:10, 9.60it/s] 107it [00:10, 9.70it/s] 108it [00:11, 9.73it/s] 109it [00:11, 9.56it/s] 110it [00:11, 9.67it/s] 111it [00:11, 9.73it/s] 112it [00:11, 9.78it/s] 113it [00:11, 9.81it/s] 114it [00:11, 9.80it/s] 115it [00:11, 9.84it/s] 116it [00:11, 9.86it/s] 117it [00:11, 9.90it/s] 118it [00:12, 9.90it/s] 119it [00:12, 9.92it/s] 120it [00:12, 9.42it/s] 121it [00:12, 9.57it/s] 122it [00:12, 9.67it/s] 123it [00:12, 9.76it/s] 124it [00:12, 9.80it/s] 125it [00:12, 9.85it/s] 126it [00:12, 9.86it/s] 127it [00:13, 9.90it/s] 128it [00:13, 9.90it/s] 129it [00:13, 9.92it/s] 130it [00:13, 9.92it/s] 131it [00:13, 9.93it/s] 132it [00:13, 9.93it/s] 133it [00:13, 9.94it/s] 134it [00:13, 9.94it/s] 135it [00:13, 9.95it/s] 136it [00:13, 9.95it/s] 137it [00:14, 9.96it/s] 138it [00:14, 9.95it/s] 139it [00:14, 9.94it/s] 140it [00:14, 9.94it/s] 141it [00:14, 9.92it/s] 142it [00:14, 9.94it/s] 143it [00:14, 9.95it/s] 144it [00:14, 9.94it/s] 145it [00:14, 9.87it/s] 146it [00:14, 9.36it/s] 147it [00:15, 9.52it/s] 148it [00:15, 9.64it/s] 149it [00:15, 9.72it/s] 150it [00:15, 9.76it/s]2025-05-26 03:56:29,425 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 8056.9863 | mean log_px -0.0642 | KL -3562.25 + 151it [00:15, 9.16it/s] 152it [00:15, 9.37it/s] 153it [00:15, 9.44it/s] 154it [00:15, 9.57it/s] 155it [00:15, 9.66it/s] 156it [00:15, 9.73it/s] 157it [00:16, 9.79it/s] 158it [00:16, 9.26it/s] 159it [00:16, 9.44it/s] 160it [00:16, 9.56it/s] 161it [00:16, 9.65it/s] 162it [00:16, 9.72it/s] 163it [00:16, 9.78it/s] 164it [00:16, 9.80it/s] 165it [00:16, 9.81it/s] 166it [00:17, 9.84it/s] 167it [00:17, 9.88it/s] 168it [00:17, 9.87it/s] 169it [00:17, 9.87it/s] 170it [00:17, 9.88it/s] 171it [00:17, 9.91it/s] 172it [00:17, 9.90it/s] 173it [00:17, 9.91it/s] 174it [00:17, 9.91it/s] 175it [00:17, 9.91it/s] 176it [00:18, 9.90it/s] 177it [00:18, 9.91it/s] 178it [00:18, 9.90it/s] 179it [00:18, 9.90it/s] 180it [00:18, 9.88it/s] 181it [00:18, 9.91it/s] 182it [00:18, 9.89it/s] 183it [00:18, 9.91it/s] 184it [00:18, 9.90it/s] 185it [00:18, 9.90it/s] 186it [00:19, 9.90it/s] 187it [00:19, 9.90it/s] 188it [00:19, 9.91it/s] 189it [00:19, 9.93it/s] 190it [00:19, 9.91it/s] 191it [00:19, 9.80it/s] 192it [00:19, 9.32it/s] 193it [00:19, 9.49it/s] 194it [00:19, 9.61it/s] 195it [00:19, 8.83it/s] 196it [00:20, 9.73it/s] +2025-05-26 03:56:34,168 - INFO - Epoch: 13, Objective: tensor([13255.1807], device='cuda:0', grad_fn=), Loss: 0.15383651852607727, KL/n: 72.70011138916016 + 0it [00:00, ?it/s]2025-05-26 03:56:34,618 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 11022.1055 | mean log_px -0.1185 | KL -3559.76 + 1it [00:00, 5.62it/s] 2it [00:00, 6.94it/s] 3it [00:00, 7.92it/s] 4it [00:00, 8.49it/s] 5it [00:00, 8.95it/s] 6it [00:00, 9.26it/s] 7it [00:00, 8.89it/s] 8it [00:00, 9.17it/s] 9it [00:01, 9.40it/s] 10it [00:01, 9.52it/s] 11it [00:01, 9.61it/s] 12it [00:01, 9.70it/s] 13it [00:01, 9.75it/s] 14it [00:01, 9.64it/s] 15it [00:01, 9.71it/s] 17it [00:01, 9.89it/s] 19it [00:02, 9.98it/s] 21it [00:02, 10.02it/s] 23it [00:02, 10.05it/s] 25it [00:02, 10.05it/s] 27it [00:02, 10.06it/s] 29it [00:03, 10.08it/s] 31it [00:03, 10.09it/s] 33it [00:03, 10.11it/s] 35it [00:03, 10.11it/s] 37it [00:03, 9.76it/s] 39it [00:04, 9.86it/s] 41it [00:04, 9.94it/s] 42it [00:04, 9.87it/s] 44it [00:04, 9.92it/s] 46it [00:04, 9.97it/s] 48it [00:04, 10.03it/s] 50it [00:05, 10.05it/s]2025-05-26 03:56:39,683 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 8267.6357 | mean log_px -0.0700 | KL -3559.77 + 52it [00:05, 9.71it/s] 54it [00:05, 9.79it/s] 55it [00:05, 9.82it/s] 56it [00:05, 9.81it/s] 57it [00:05, 9.36it/s] 58it [00:05, 9.48it/s] 59it [00:06, 9.56it/s] 60it [00:06, 9.63it/s] 61it [00:06, 9.70it/s] 62it [00:06, 9.19it/s] 63it [00:06, 9.39it/s] 64it [00:06, 9.49it/s] 65it [00:06, 9.61it/s] 66it [00:06, 9.68it/s] 67it [00:06, 9.74it/s] 68it [00:07, 9.77it/s] 69it [00:07, 9.76it/s] 70it [00:07, 9.79it/s] 71it [00:07, 9.81it/s] 72it [00:07, 9.83it/s] 73it [00:07, 9.85it/s] 74it [00:07, 9.86it/s] 75it [00:07, 9.87it/s] 76it [00:07, 9.30it/s] 77it [00:07, 9.48it/s] 78it [00:08, 9.59it/s] 79it [00:08, 9.68it/s] 80it [00:08, 9.74it/s] 81it [00:08, 9.80it/s] 82it [00:08, 9.82it/s] 83it [00:08, 9.85it/s] 84it [00:08, 9.28it/s] 85it [00:08, 9.45it/s] 86it [00:08, 9.58it/s] 87it [00:08, 9.68it/s] 88it [00:09, 9.73it/s] 89it [00:09, 9.78it/s] 90it [00:09, 9.81it/s] 91it [00:09, 9.83it/s] 92it [00:09, 9.85it/s] 93it [00:09, 9.86it/s] 94it [00:09, 9.88it/s] 95it [00:09, 9.90it/s] 96it [00:09, 9.89it/s] 97it [00:10, 9.87it/s] 98it [00:10, 9.87it/s] 99it [00:10, 9.88it/s] 100it [00:10, 9.88it/s]2025-05-26 03:56:44,853 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 13712.4199 | mean log_px -0.1565 | KL -3561.90 + 101it [00:10, 9.06it/s] 102it [00:10, 9.26it/s] 103it [00:10, 9.43it/s] 104it [00:10, 9.57it/s] 105it [00:10, 9.67it/s] 106it [00:10, 9.74it/s] 107it [00:11, 9.15it/s] 108it [00:11, 9.35it/s] 109it [00:11, 9.50it/s] 110it [00:11, 9.59it/s] 111it [00:11, 9.15it/s] 112it [00:11, 9.33it/s] 113it [00:11, 9.48it/s] 114it [00:11, 9.04it/s] 115it [00:11, 9.28it/s] 116it [00:12, 9.45it/s] 117it [00:12, 9.59it/s] 118it [00:12, 9.67it/s] 119it [00:12, 9.75it/s] 120it [00:12, 9.21it/s] 121it [00:12, 9.40it/s] 122it [00:12, 9.53it/s] 123it [00:12, 9.65it/s] 124it [00:12, 9.70it/s] 125it [00:12, 9.77it/s] 126it [00:13, 9.79it/s] 127it [00:13, 9.83it/s] 128it [00:13, 9.84it/s] 129it [00:13, 9.87it/s] 130it [00:13, 9.88it/s] 131it [00:13, 9.89it/s] 132it [00:13, 9.89it/s] 133it [00:13, 9.91it/s] 134it [00:13, 9.90it/s] 135it [00:13, 9.89it/s] 136it [00:14, 9.88it/s] 137it [00:14, 9.88it/s] 138it [00:14, 9.89it/s] 139it [00:14, 9.89it/s] 140it [00:14, 9.39it/s] 141it [00:14, 9.54it/s] 142it [00:14, 9.51it/s] 143it [00:14, 9.59it/s] 144it [00:14, 9.66it/s] 145it [00:15, 9.71it/s] 146it [00:15, 9.35it/s] 147it [00:15, 9.43it/s] 148it [00:15, 9.43it/s] 149it [00:15, 9.49it/s] 150it [00:15, 9.34it/s]2025-05-26 03:56:50,093 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 13030.7373 | mean log_px -0.1424 | KL -3557.82 + 151it [00:15, 9.18it/s] 152it [00:15, 9.16it/s] 153it [00:15, 9.25it/s] 154it [00:15, 9.36it/s] 155it [00:16, 8.93it/s] 156it [00:16, 9.14it/s] 157it [00:16, 9.32it/s] 158it [00:16, 9.33it/s] 159it [00:16, 9.17it/s] 160it [00:16, 9.19it/s] 161it [00:16, 9.16it/s] 162it [00:16, 8.68it/s] 163it [00:16, 8.87it/s] 164it [00:17, 9.02it/s] 165it [00:17, 9.12it/s] 166it [00:17, 9.19it/s] 167it [00:17, 9.29it/s] 168it [00:17, 9.23it/s] 169it [00:17, 9.26it/s] 170it [00:17, 9.27it/s] 171it [00:17, 9.28it/s] 172it [00:17, 9.41it/s] 173it [00:18, 9.46it/s] 174it [00:18, 9.40it/s] 175it [00:18, 9.40it/s] 176it [00:18, 9.39it/s] 177it [00:18, 9.39it/s] 178it [00:18, 9.43it/s] 179it [00:18, 9.41it/s] 180it [00:18, 9.46it/s] 181it [00:18, 9.38it/s] 182it [00:19, 9.37it/s] 183it [00:19, 9.35it/s] 184it [00:19, 9.29it/s] 185it [00:19, 9.28it/s] 186it [00:19, 9.30it/s] 187it [00:19, 9.34it/s] 188it [00:19, 9.37it/s] 189it [00:19, 8.91it/s] 190it [00:19, 9.05it/s] 191it [00:19, 9.14it/s] 192it [00:20, 9.21it/s] 193it [00:20, 8.78it/s] 194it [00:20, 8.99it/s] 195it [00:20, 8.61it/s] 196it [00:20, 8.80it/s] 196it [00:20, 9.50it/s] +2025-05-26 03:56:55,109 - INFO - Epoch: 14, Objective: tensor([11565.9922], device='cuda:0', grad_fn=), Loss: 0.11370649188756943, KL/n: 72.74580383300781 + 0it [00:00, ?it/s]2025-05-26 03:56:55,390 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 10721.7217 | mean log_px -0.1022 | KL -3567.32 + 1it [00:00, 5.27it/s] 2it [00:00, 7.15it/s] 3it [00:00, 8.12it/s] 4it [00:00, 8.63it/s] 5it [00:00, 8.95it/s] 6it [00:00, 9.15it/s] 7it [00:00, 8.65it/s] 8it [00:00, 8.89it/s] 9it [00:01, 8.99it/s] 10it [00:01, 9.02it/s] 11it [00:01, 9.18it/s] 12it [00:01, 8.81it/s] 13it [00:01, 9.02it/s] 14it [00:01, 9.06it/s] 15it [00:01, 8.71it/s] 16it [00:01, 8.96it/s] 17it [00:01, 9.05it/s] 18it [00:02, 9.23it/s] 19it [00:02, 9.37it/s] 20it [00:02, 9.42it/s] 21it [00:02, 9.44it/s] 22it [00:02, 8.96it/s] 23it [00:02, 9.12it/s] 24it [00:02, 9.26it/s] 25it [00:02, 9.40it/s] 26it [00:02, 9.36it/s] 27it [00:03, 9.44it/s] 28it [00:03, 9.09it/s] 29it [00:03, 9.25it/s] 30it [00:03, 9.34it/s] 31it [00:03, 9.44it/s] 32it [00:03, 9.49it/s] 33it [00:03, 9.57it/s] 34it [00:03, 9.59it/s] 35it [00:03, 9.62it/s] 36it [00:03, 9.60it/s] 37it [00:04, 9.61it/s] 38it [00:04, 9.58it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.63it/s] 41it [00:04, 9.60it/s] 42it [00:04, 9.53it/s] 43it [00:04, 9.58it/s] 44it [00:04, 9.55it/s] 45it [00:04, 9.59it/s] 46it [00:05, 9.59it/s] 47it [00:05, 9.64it/s] 48it [00:05, 9.62it/s] 49it [00:05, 9.05it/s] 50it [00:05, 9.20it/s]2025-05-26 03:57:00,745 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 11714.7119 | mean log_px -0.1263 | KL -3566.29 + 51it [00:05, 9.32it/s] 52it [00:05, 9.39it/s] 53it [00:05, 9.40it/s] 54it [00:05, 9.34it/s] 55it [00:05, 9.48it/s] 56it [00:06, 9.49it/s] 57it [00:06, 9.51it/s] 58it [00:06, 9.53it/s] 59it [00:06, 9.59it/s] 60it [00:06, 9.57it/s] 61it [00:06, 9.57it/s] 62it [00:06, 9.57it/s] 63it [00:06, 9.57it/s] 64it [00:06, 9.57it/s] 65it [00:07, 9.55it/s] 66it [00:07, 9.55it/s] 67it [00:07, 9.56it/s] 68it [00:07, 9.56it/s] 69it [00:07, 9.57it/s] 70it [00:07, 9.60it/s] 71it [00:07, 9.59it/s] 72it [00:07, 9.59it/s] 73it [00:07, 9.57it/s] 74it [00:07, 9.56it/s] 75it [00:08, 9.48it/s] 76it [00:08, 9.49it/s] 77it [00:08, 9.46it/s] 78it [00:08, 9.50it/s] 79it [00:08, 9.48it/s] 80it [00:08, 9.53it/s] 81it [00:08, 9.41it/s] 82it [00:08, 9.43it/s] 83it [00:08, 9.41it/s] 84it [00:09, 9.42it/s] 85it [00:09, 9.42it/s] 86it [00:09, 9.49it/s] 87it [00:09, 9.50it/s] 88it [00:09, 9.47it/s] 89it [00:09, 9.49it/s] 90it [00:09, 9.47it/s] 91it [00:09, 9.49it/s] 92it [00:09, 9.52it/s] 93it [00:09, 9.52it/s] 94it [00:10, 9.51it/s] 95it [00:10, 9.53it/s] 96it [00:10, 9.53it/s] 97it [00:10, 9.53it/s] 98it [00:10, 9.55it/s] 99it [00:10, 9.55it/s] 100it [00:10, 9.49it/s]2025-05-26 03:57:05,999 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 10056.2070 | mean log_px -0.1000 | KL -3566.32 + 101it [00:10, 9.51it/s] 102it [00:10, 9.39it/s] 103it [00:11, 9.34it/s] 104it [00:11, 8.72it/s] 105it [00:11, 9.00it/s] 106it [00:11, 9.19it/s] 107it [00:11, 9.32it/s] 108it [00:11, 9.42it/s] 109it [00:11, 9.51it/s] 110it [00:11, 9.04it/s] 111it [00:11, 9.24it/s] 112it [00:11, 9.37it/s] 113it [00:12, 9.47it/s] 114it [00:12, 8.86it/s] 115it [00:12, 9.08it/s] 116it [00:12, 9.20it/s] 117it [00:12, 9.22it/s] 118it [00:12, 8.69it/s] 119it [00:12, 8.97it/s] 120it [00:12, 9.17it/s] 121it [00:12, 9.33it/s] 122it [00:13, 9.38it/s] 123it [00:13, 9.45it/s] 124it [00:13, 9.47it/s] 125it [00:13, 9.50it/s] 126it [00:13, 9.52it/s] 127it [00:13, 9.54it/s] 128it [00:13, 9.55it/s] 129it [00:13, 9.55it/s] 130it [00:13, 9.52it/s] 131it [00:14, 9.54it/s] 132it [00:14, 9.56it/s] 133it [00:14, 9.55it/s] 134it [00:14, 9.57it/s] 135it [00:14, 9.57it/s] 136it [00:14, 9.57it/s] 137it [00:14, 9.57it/s] 138it [00:14, 9.59it/s] 139it [00:14, 9.64it/s] 140it [00:14, 9.56it/s] 141it [00:15, 9.53it/s] 142it [00:15, 9.54it/s] 143it [00:15, 9.55it/s] 144it [00:15, 9.50it/s] 145it [00:15, 9.48it/s] 146it [00:15, 9.49it/s] 147it [00:15, 9.52it/s] 148it [00:15, 9.52it/s] 149it [00:15, 9.54it/s] 150it [00:16, 9.53it/s]2025-05-26 03:57:11,325 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 9198.8525 | mean log_px -0.0873 | KL -3561.38 + 151it [00:16, 9.57it/s] 152it [00:16, 9.59it/s] 153it [00:16, 9.56it/s] 154it [00:16, 9.56it/s] 155it [00:16, 9.52it/s] 156it [00:16, 9.56it/s] 157it [00:16, 9.51it/s] 158it [00:16, 9.49it/s] 159it [00:16, 9.55it/s] 160it [00:17, 9.57it/s] 161it [00:17, 9.54it/s] 162it [00:17, 9.17it/s] 163it [00:17, 9.27it/s] 164it [00:17, 9.31it/s] 165it [00:17, 9.38it/s] 166it [00:17, 9.40it/s] 167it [00:17, 9.47it/s] 168it [00:17, 9.46it/s] 169it [00:18, 9.54it/s] 170it [00:18, 9.35it/s] 171it [00:18, 9.05it/s] 172it [00:18, 9.14it/s] 173it [00:18, 9.24it/s] 174it [00:18, 9.33it/s] 175it [00:18, 9.39it/s] 176it [00:18, 9.40it/s] 177it [00:18, 9.46it/s] 178it [00:18, 9.49it/s] 179it [00:19, 9.53it/s] 180it [00:19, 9.53it/s] 181it [00:19, 9.53it/s] 182it [00:19, 9.47it/s] 183it [00:19, 9.45it/s] 184it [00:19, 9.53it/s] 185it [00:19, 9.53it/s] 186it [00:19, 9.51it/s] 187it [00:19, 9.28it/s] 188it [00:20, 9.04it/s] 189it [00:20, 9.19it/s] 190it [00:20, 9.27it/s] 191it [00:20, 9.39it/s] 192it [00:20, 8.94it/s] 193it [00:20, 9.08it/s] 194it [00:20, 9.21it/s] 195it [00:20, 8.80it/s] 196it [00:20, 9.09it/s] 196it [00:20, 9.34it/s] +2025-05-26 03:57:16,239 - INFO - Epoch: 15, Objective: tensor([12319.4551], device='cuda:0', grad_fn=), Loss: 0.13309964537620544, KL/n: 72.79181671142578 + 0it [00:00, ?it/s]2025-05-26 03:57:16,695 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 7340.2905 | mean log_px -0.0581 | KL -3566.00 + 1it [00:00, 4.92it/s] 2it [00:00, 6.81it/s] 3it [00:00, 7.87it/s] 4it [00:00, 7.87it/s] 5it [00:00, 8.43it/s] 6it [00:00, 8.80it/s] 7it [00:00, 9.04it/s] 8it [00:00, 9.24it/s] 9it [00:01, 9.39it/s] 10it [00:01, 9.49it/s] 11it [00:01, 9.52it/s] 12it [00:01, 9.52it/s] 13it [00:01, 9.55it/s] 14it [00:01, 9.57it/s] 15it [00:01, 9.58it/s] 16it [00:01, 9.59it/s] 17it [00:01, 9.56it/s] 18it [00:01, 9.55it/s] 19it [00:02, 9.50it/s] 20it [00:02, 9.06it/s] 21it [00:02, 9.22it/s] 22it [00:02, 9.30it/s] 23it [00:02, 9.33it/s] 24it [00:02, 8.74it/s] 25it [00:02, 8.98it/s] 26it [00:02, 9.03it/s] 27it [00:02, 9.19it/s] 28it [00:03, 9.28it/s] 29it [00:03, 9.28it/s] 30it [00:03, 9.32it/s] 31it [00:03, 9.35it/s] 32it [00:03, 9.42it/s] 33it [00:03, 8.95it/s] 34it [00:03, 9.09it/s] 35it [00:03, 9.24it/s] 36it [00:03, 9.30it/s] 37it [00:04, 9.45it/s] 38it [00:04, 9.44it/s] 39it [00:04, 9.45it/s] 40it [00:04, 9.44it/s] 41it [00:04, 9.45it/s] 42it [00:04, 9.41it/s] 43it [00:04, 9.49it/s] 44it [00:04, 9.51it/s] 45it [00:04, 9.55it/s] 46it [00:05, 9.54it/s] 47it [00:05, 9.57it/s] 48it [00:05, 9.58it/s] 49it [00:05, 9.58it/s] 50it [00:05, 9.60it/s]2025-05-26 03:57:22,044 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 9277.7939 | mean log_px -0.0837 | KL -3565.87 + 51it [00:05, 9.01it/s] 52it [00:05, 9.12it/s] 53it [00:05, 9.25it/s] 54it [00:05, 9.35it/s] 55it [00:05, 9.43it/s] 56it [00:06, 9.32it/s] 57it [00:06, 9.39it/s] 58it [00:06, 9.46it/s] 59it [00:06, 9.46it/s] 60it [00:06, 9.47it/s] 61it [00:06, 9.50it/s] 62it [00:06, 9.55it/s] 63it [00:06, 9.53it/s] 64it [00:06, 9.51it/s] 65it [00:07, 9.58it/s] 66it [00:07, 9.61it/s] 67it [00:07, 9.60it/s] 68it [00:07, 9.59it/s] 69it [00:07, 9.04it/s] 70it [00:07, 9.15it/s] 71it [00:07, 9.22it/s] 72it [00:07, 9.34it/s] 73it [00:07, 9.00it/s] 74it [00:08, 9.19it/s] 75it [00:08, 9.25it/s] 76it [00:08, 8.86it/s] 77it [00:08, 9.04it/s] 78it [00:08, 9.16it/s] 79it [00:08, 9.29it/s] 80it [00:08, 9.28it/s] 81it [00:08, 9.39it/s] 82it [00:08, 9.44it/s] 83it [00:08, 9.53it/s] 84it [00:09, 9.55it/s] 85it [00:09, 9.52it/s] 86it [00:09, 9.54it/s] 87it [00:09, 9.00it/s] 88it [00:09, 9.11it/s] 89it [00:09, 9.28it/s] 90it [00:09, 9.36it/s] 91it [00:09, 9.39it/s] 92it [00:09, 9.43it/s] 93it [00:10, 9.48it/s] 94it [00:10, 9.51it/s] 95it [00:10, 9.52it/s] 96it [00:10, 9.49it/s] 97it [00:10, 9.52it/s] 98it [00:10, 9.52it/s] 99it [00:10, 9.53it/s] 100it [00:10, 9.50it/s]2025-05-26 03:57:27,389 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 11751.0801 | mean log_px -0.1212 | KL -3566.18 + 101it [00:10, 9.54it/s] 102it [00:10, 9.55it/s] 103it [00:11, 9.59it/s] 104it [00:11, 9.60it/s] 105it [00:11, 9.63it/s] 106it [00:11, 9.58it/s] 107it [00:11, 9.56it/s] 108it [00:11, 9.49it/s] 109it [00:11, 9.52it/s] 110it [00:11, 9.53it/s] 111it [00:11, 9.56it/s] 112it [00:12, 9.58it/s] 113it [00:12, 9.62it/s] 114it [00:12, 9.54it/s] 115it [00:12, 9.54it/s] 116it [00:12, 9.54it/s] 117it [00:12, 8.97it/s] 118it [00:12, 9.16it/s] 119it [00:12, 9.29it/s] 120it [00:12, 9.35it/s] 121it [00:12, 9.41it/s] 122it [00:13, 9.46it/s] 123it [00:13, 9.52it/s] 124it [00:13, 9.53it/s] 125it [00:13, 9.60it/s] 126it [00:13, 9.54it/s] 127it [00:13, 9.18it/s] 128it [00:13, 9.27it/s] 129it [00:13, 9.33it/s] 130it [00:13, 8.71it/s] 131it [00:14, 8.99it/s] 132it [00:14, 9.19it/s] 133it [00:14, 9.31it/s] 134it [00:14, 9.38it/s] 135it [00:14, 8.90it/s] 136it [00:14, 9.08it/s] 137it [00:14, 9.23it/s] 138it [00:14, 9.31it/s] 139it [00:14, 9.39it/s] 140it [00:15, 9.45it/s] 141it [00:15, 8.93it/s] 142it [00:15, 9.07it/s] 143it [00:15, 9.21it/s] 144it [00:15, 9.30it/s] 145it [00:15, 8.86it/s] 146it [00:15, 9.06it/s] 147it [00:15, 9.22it/s] 148it [00:15, 9.33it/s] 149it [00:16, 9.37it/s] 150it [00:16, 9.42it/s]2025-05-26 03:57:32,744 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 10209.6055 | mean log_px -0.0996 | KL -3564.47 + 151it [00:16, 9.44it/s] 152it [00:16, 9.48it/s] 153it [00:16, 8.94it/s] 154it [00:16, 9.11it/s] 155it [00:16, 9.22it/s] 156it [00:16, 9.30it/s] 157it [00:16, 9.38it/s] 158it [00:16, 9.39it/s] 159it [00:17, 9.43it/s] 160it [00:17, 9.04it/s] 161it [00:17, 9.20it/s] 162it [00:17, 9.31it/s] 163it [00:17, 9.36it/s] 164it [00:17, 9.45it/s] 165it [00:17, 9.48it/s] 166it [00:17, 9.53it/s] 167it [00:17, 9.52it/s] 168it [00:18, 9.53it/s] 169it [00:18, 9.60it/s] 170it [00:18, 9.56it/s] 171it [00:18, 9.58it/s] 172it [00:18, 9.54it/s] 173it [00:18, 9.53it/s] 174it [00:18, 9.51it/s] 175it [00:18, 9.00it/s] 176it [00:18, 9.19it/s] 177it [00:19, 9.35it/s] 178it [00:19, 9.43it/s] 179it [00:19, 8.90it/s] 180it [00:19, 9.05it/s] 181it [00:19, 9.20it/s] 182it [00:19, 9.27it/s] 183it [00:19, 9.35it/s] 184it [00:19, 9.44it/s] 185it [00:19, 9.50it/s] 186it [00:19, 9.49it/s] 187it [00:20, 9.51it/s] 188it [00:20, 9.55it/s] 189it [00:20, 9.60it/s] 190it [00:20, 9.64it/s] 191it [00:20, 9.56it/s] 192it [00:20, 9.55it/s] 193it [00:20, 9.57it/s] 194it [00:20, 9.57it/s] 195it [00:20, 8.99it/s] 196it [00:21, 8.61it/s] 196it [00:21, 9.28it/s] +2025-05-26 03:57:37,673 - INFO - Epoch: 16, Objective: tensor([10027.8145], device='cuda:0', grad_fn=), Loss: 0.09540171176195145, KL/n: 72.8223648071289 + 0it [00:00, ?it/s]2025-05-26 03:57:37,967 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 10231.7510 | mean log_px -0.0985 | KL -3565.85 + 1it [00:00, 5.26it/s] 2it [00:00, 7.13it/s] 3it [00:00, 7.49it/s] 4it [00:00, 8.17it/s] 5it [00:00, 8.64it/s] 6it [00:00, 8.91it/s] 7it [00:00, 9.11it/s] 8it [00:00, 9.18it/s] 9it [00:01, 9.30it/s] 10it [00:01, 9.40it/s] 11it [00:01, 9.52it/s] 12it [00:01, 9.60it/s] 13it [00:01, 9.65it/s] 14it [00:01, 9.66it/s] 15it [00:01, 9.27it/s] 16it [00:01, 9.19it/s] 17it [00:01, 9.38it/s] 18it [00:01, 9.49it/s] 19it [00:02, 9.57it/s] 20it [00:02, 9.62it/s] 21it [00:02, 9.67it/s] 22it [00:02, 9.64it/s] 23it [00:02, 9.69it/s] 24it [00:02, 9.69it/s] 25it [00:02, 9.32it/s] 26it [00:02, 9.41it/s] 27it [00:02, 9.52it/s] 28it [00:03, 8.98it/s] 29it [00:03, 9.19it/s] 30it [00:03, 9.33it/s] 31it [00:03, 9.44it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.60it/s] 34it [00:03, 9.24it/s] 35it [00:03, 9.39it/s] 36it [00:03, 9.49it/s] 37it [00:04, 9.24it/s] 38it [00:04, 8.62it/s] 39it [00:04, 8.82it/s] 40it [00:04, 9.00it/s] 41it [00:04, 9.11it/s] 42it [00:04, 9.17it/s] 43it [00:04, 9.27it/s] 44it [00:04, 9.36it/s] 45it [00:04, 8.90it/s] 46it [00:05, 9.01it/s] 47it [00:05, 9.15it/s] 48it [00:05, 8.68it/s] 49it [00:05, 8.96it/s] 50it [00:05, 9.12it/s]2025-05-26 03:57:43,346 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 8144.4380 | mean log_px -0.0670 | KL -3562.43 + 51it [00:05, 9.24it/s] 52it [00:05, 8.78it/s] 53it [00:05, 8.98it/s] 54it [00:05, 9.18it/s] 55it [00:06, 9.29it/s] 56it [00:06, 9.34it/s] 57it [00:06, 9.33it/s] 58it [00:06, 9.33it/s] 59it [00:06, 9.41it/s] 60it [00:06, 9.40it/s] 61it [00:06, 9.43it/s] 62it [00:06, 9.41it/s] 63it [00:06, 9.46it/s] 64it [00:06, 9.52it/s] 65it [00:07, 9.55it/s] 66it [00:07, 9.53it/s] 67it [00:07, 8.98it/s] 68it [00:07, 9.16it/s] 69it [00:07, 9.27it/s] 70it [00:07, 9.31it/s] 71it [00:07, 9.40it/s] 72it [00:07, 9.44it/s] 73it [00:07, 9.52it/s] 74it [00:08, 9.48it/s] 75it [00:08, 8.80it/s] 76it [00:08, 8.46it/s] 77it [00:08, 8.42it/s] 78it [00:08, 8.71it/s] 79it [00:08, 9.00it/s] 80it [00:08, 9.14it/s] 81it [00:08, 9.23it/s] 82it [00:08, 9.33it/s] 83it [00:09, 9.02it/s] 84it [00:09, 9.18it/s] 85it [00:09, 9.29it/s] 86it [00:09, 8.97it/s] 87it [00:09, 9.15it/s] 88it [00:09, 9.26it/s] 89it [00:09, 9.34it/s] 90it [00:09, 9.43it/s] 91it [00:09, 9.41it/s] 92it [00:10, 8.97it/s] 93it [00:10, 9.10it/s] 94it [00:10, 9.23it/s] 95it [00:10, 9.33it/s] 96it [00:10, 9.41it/s] 97it [00:10, 9.48it/s] 98it [00:10, 9.56it/s] 99it [00:10, 9.54it/s] 100it [00:10, 9.57it/s]2025-05-26 03:57:48,749 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 8396.8623 | mean log_px -0.0690 | KL -3563.99 + 101it [00:10, 9.51it/s] 102it [00:11, 8.97it/s] 103it [00:11, 9.09it/s] 104it [00:11, 9.17it/s] 105it [00:11, 9.32it/s] 106it [00:11, 9.40it/s] 107it [00:11, 9.41it/s] 108it [00:11, 8.90it/s] 109it [00:11, 8.63it/s] 110it [00:11, 8.89it/s] 111it [00:12, 9.08it/s] 112it [00:12, 9.22it/s] 113it [00:12, 9.34it/s] 114it [00:12, 9.38it/s] 115it [00:12, 9.44it/s] 116it [00:12, 9.43it/s] 117it [00:12, 9.44it/s] 118it [00:12, 8.93it/s] 119it [00:12, 9.07it/s] 120it [00:13, 9.16it/s] 121it [00:13, 9.27it/s] 122it [00:13, 9.34it/s] 123it [00:13, 9.29it/s] 124it [00:13, 8.92it/s] 125it [00:13, 8.97it/s] 126it [00:13, 9.11it/s] 127it [00:13, 8.77it/s] 128it [00:13, 8.89it/s] 129it [00:14, 9.15it/s] 130it [00:14, 9.33it/s] 131it [00:14, 9.47it/s] 132it [00:14, 9.57it/s] 133it [00:14, 9.12it/s] 134it [00:14, 9.34it/s] 135it [00:14, 9.51it/s] 136it [00:14, 9.58it/s] 137it [00:14, 9.12it/s] 138it [00:15, 9.21it/s] 139it [00:15, 9.30it/s] 140it [00:15, 9.38it/s] 141it [00:15, 9.44it/s] 142it [00:15, 9.38it/s] 143it [00:15, 9.35it/s] 144it [00:15, 9.32it/s] 145it [00:15, 9.39it/s] 146it [00:15, 9.41it/s] 147it [00:15, 9.44it/s] 148it [00:16, 9.47it/s] 149it [00:16, 9.47it/s] 150it [00:16, 9.43it/s]2025-05-26 03:57:54,160 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 9258.7881 | mean log_px -0.0835 | KL -3569.38 + 151it [00:16, 9.48it/s] 152it [00:16, 9.48it/s] 153it [00:16, 9.47it/s] 154it [00:16, 8.99it/s] 155it [00:16, 9.12it/s] 156it [00:16, 9.24it/s] 157it [00:17, 9.32it/s] 158it [00:17, 9.38it/s] 159it [00:17, 9.36it/s] 160it [00:17, 9.22it/s] 161it [00:17, 9.00it/s] 162it [00:17, 9.11it/s] 163it [00:17, 9.28it/s] 164it [00:17, 9.32it/s] 165it [00:17, 9.37it/s] 166it [00:18, 9.07it/s] 167it [00:18, 9.17it/s] 168it [00:18, 9.26it/s] 169it [00:18, 9.41it/s] 170it [00:18, 9.10it/s] 171it [00:18, 9.21it/s] 172it [00:18, 9.28it/s] 173it [00:18, 9.36it/s] 174it [00:18, 9.44it/s] 175it [00:18, 9.53it/s] 176it [00:19, 9.50it/s] 177it [00:19, 8.94it/s] 178it [00:19, 9.14it/s] 179it [00:19, 9.28it/s] 180it [00:19, 9.35it/s] 181it [00:19, 9.42it/s] 182it [00:19, 9.40it/s] 183it [00:19, 8.92it/s] 184it [00:19, 9.04it/s] 185it [00:20, 9.15it/s] 186it [00:20, 9.22it/s] 187it [00:20, 9.30it/s] 188it [00:20, 8.88it/s] 189it [00:20, 9.07it/s] 190it [00:20, 9.22it/s] 191it [00:20, 9.30it/s] 192it [00:20, 9.34it/s] 193it [00:20, 9.38it/s] 194it [00:21, 9.45it/s] 195it [00:21, 8.87it/s] 196it [00:21, 8.52it/s] 196it [00:21, 9.18it/s] +2025-05-26 03:57:59,167 - INFO - Epoch: 17, Objective: tensor([9598.7822], device='cuda:0', grad_fn=), Loss: 0.08933060616254807, KL/n: 72.83203125 + 0it [00:00, ?it/s]2025-05-26 03:57:59,638 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 12348.8164 | mean log_px -0.1254 | KL -3569.31 + 1it [00:00, 2.61it/s] 2it [00:00, 4.56it/s] 3it [00:00, 6.00it/s] 4it [00:00, 6.66it/s] 5it [00:00, 7.47it/s] 6it [00:00, 8.04it/s] 7it [00:01, 8.48it/s] 8it [00:01, 8.50it/s] 9it [00:01, 8.82it/s] 10it [00:01, 9.03it/s] 11it [00:01, 9.19it/s] 12it [00:01, 9.29it/s] 13it [00:01, 9.41it/s] 14it [00:01, 9.41it/s] 15it [00:01, 9.09it/s] 16it [00:02, 9.22it/s] 17it [00:02, 9.33it/s] 18it [00:02, 9.37it/s] 19it [00:02, 9.02it/s] 20it [00:02, 9.17it/s] 21it [00:02, 9.29it/s] 22it [00:02, 9.35it/s] 23it [00:02, 9.33it/s] 24it [00:02, 9.43it/s] 25it [00:02, 9.43it/s] 26it [00:03, 9.47it/s] 27it [00:03, 9.54it/s] 28it [00:03, 9.58it/s] 29it [00:03, 9.56it/s] 30it [00:03, 9.56it/s] 31it [00:03, 9.57it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.57it/s] 34it [00:03, 9.50it/s] 35it [00:04, 8.98it/s] 36it [00:04, 9.11it/s] 37it [00:04, 9.30it/s] 38it [00:04, 9.31it/s] 39it [00:04, 9.45it/s] 40it [00:04, 9.46it/s] 41it [00:04, 9.45it/s] 42it [00:04, 9.42it/s] 43it [00:04, 9.40it/s] 44it [00:04, 9.43it/s] 45it [00:05, 9.50it/s] 46it [00:05, 9.56it/s] 47it [00:05, 9.06it/s] 48it [00:05, 9.08it/s] 49it [00:05, 9.12it/s] 50it [00:05, 9.15it/s]2025-05-26 03:58:04,998 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 8044.7241 | mean log_px -0.0678 | KL -3567.06 + 51it [00:05, 9.26it/s] 52it [00:05, 8.94it/s] 53it [00:05, 9.13it/s] 54it [00:06, 9.27it/s] 55it [00:06, 9.29it/s] 56it [00:06, 9.25it/s] 57it [00:06, 8.81it/s] 58it [00:06, 8.88it/s] 59it [00:06, 9.05it/s] 60it [00:06, 9.17it/s] 61it [00:06, 9.26it/s] 62it [00:06, 9.33it/s] 63it [00:07, 9.37it/s] 64it [00:07, 9.37it/s] 65it [00:07, 8.80it/s] 66it [00:07, 8.96it/s] 67it [00:07, 9.07it/s] 68it [00:07, 9.19it/s] 69it [00:07, 9.29it/s] 70it [00:07, 9.05it/s] 71it [00:07, 9.15it/s] 72it [00:08, 9.25it/s] 73it [00:08, 9.32it/s] 74it [00:08, 9.27it/s] 75it [00:08, 8.91it/s] 76it [00:08, 8.99it/s] 77it [00:08, 9.19it/s] 78it [00:08, 9.27it/s] 79it [00:08, 9.22it/s] 80it [00:08, 9.27it/s] 81it [00:09, 8.95it/s] 82it [00:09, 9.11it/s] 83it [00:09, 9.20it/s] 84it [00:09, 9.23it/s] 85it [00:09, 8.71it/s] 86it [00:09, 8.86it/s] 87it [00:09, 8.90it/s] 88it [00:09, 8.68it/s] 89it [00:09, 8.94it/s] 90it [00:10, 9.16it/s] 91it [00:10, 9.35it/s] 92it [00:10, 8.86it/s] 93it [00:10, 9.14it/s] 94it [00:10, 9.33it/s] 95it [00:10, 9.49it/s] 96it [00:10, 9.59it/s] 97it [00:10, 9.67it/s] 98it [00:10, 9.49it/s] 99it [00:10, 9.14it/s] 100it [00:11, 9.35it/s]2025-05-26 03:58:10,456 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 8123.0947 | mean log_px -0.0684 | KL -3570.99 + 101it [00:11, 8.91it/s] 102it [00:11, 9.13it/s] 103it [00:11, 9.25it/s] 104it [00:11, 9.37it/s] 105it [00:11, 8.87it/s] 106it [00:11, 9.04it/s] 107it [00:11, 9.17it/s] 108it [00:11, 9.27it/s] 109it [00:12, 9.36it/s] 110it [00:12, 9.40it/s] 111it [00:12, 9.43it/s] 112it [00:12, 9.48it/s] 113it [00:12, 9.11it/s] 114it [00:12, 9.20it/s] 115it [00:12, 9.31it/s] 116it [00:12, 9.40it/s] 117it [00:12, 9.43it/s] 118it [00:13, 9.02it/s] 119it [00:13, 9.16it/s] 120it [00:13, 9.27it/s] 121it [00:13, 9.37it/s] 122it [00:13, 9.41it/s] 123it [00:13, 9.49it/s] 124it [00:13, 9.52it/s] 125it [00:13, 9.56it/s] 126it [00:13, 9.55it/s] 127it [00:14, 9.15it/s] 128it [00:14, 9.14it/s] 129it [00:14, 9.20it/s] 130it [00:14, 9.30it/s] 131it [00:14, 9.36it/s] 132it [00:14, 9.34it/s] 133it [00:14, 9.36it/s] 134it [00:14, 9.30it/s] 135it [00:14, 9.33it/s] 136it [00:14, 8.78it/s] 137it [00:15, 9.00it/s] 138it [00:15, 9.17it/s] 139it [00:15, 9.19it/s] 140it [00:15, 9.16it/s] 141it [00:15, 9.22it/s] 142it [00:15, 9.31it/s] 143it [00:15, 9.28it/s] 144it [00:15, 9.26it/s] 145it [00:15, 9.28it/s] 146it [00:16, 9.25it/s] 147it [00:16, 9.22it/s] 148it [00:16, 9.23it/s] 149it [00:16, 8.73it/s] 150it [00:16, 8.71it/s]2025-05-26 03:58:15,893 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 6793.8252 | mean log_px -0.0610 | KL -3563.42 + 151it [00:16, 8.94it/s] 152it [00:16, 9.15it/s] 153it [00:16, 9.29it/s] 154it [00:16, 8.73it/s] 155it [00:17, 8.90it/s] 156it [00:17, 9.07it/s] 157it [00:17, 9.15it/s] 158it [00:17, 8.82it/s] 159it [00:17, 9.02it/s] 160it [00:17, 9.22it/s] 161it [00:17, 8.81it/s] 162it [00:17, 9.04it/s] 163it [00:17, 9.26it/s] 164it [00:18, 9.41it/s] 165it [00:18, 8.91it/s] 166it [00:18, 9.15it/s] 167it [00:18, 9.34it/s] 168it [00:18, 9.42it/s] 169it [00:18, 8.97it/s] 170it [00:18, 9.23it/s] 171it [00:18, 9.43it/s] 172it [00:18, 9.55it/s] 173it [00:19, 9.08it/s] 174it [00:19, 9.30it/s] 175it [00:19, 9.48it/s] 176it [00:19, 9.59it/s] 177it [00:19, 9.09it/s] 178it [00:19, 9.30it/s] 179it [00:19, 9.48it/s] 180it [00:19, 9.58it/s] 181it [00:19, 9.07it/s] 182it [00:19, 9.31it/s] 183it [00:20, 9.48it/s] 184it [00:20, 9.58it/s] 185it [00:20, 9.09it/s] 186it [00:20, 9.30it/s] 187it [00:20, 9.48it/s] 188it [00:20, 9.58it/s] 189it [00:20, 9.09it/s] 190it [00:20, 9.29it/s] 191it [00:20, 9.45it/s] 192it [00:21, 9.57it/s] 193it [00:21, 9.08it/s] 194it [00:21, 9.30it/s] 195it [00:21, 8.95it/s] 196it [00:21, 8.73it/s] 196it [00:21, 9.08it/s] +2025-05-26 03:58:20,887 - INFO - Epoch: 18, Objective: tensor([8188.5557], device='cuda:0', grad_fn=), Loss: 0.07669003307819366, KL/n: 72.82756805419922 + 0it [00:00, ?it/s]2025-05-26 03:58:21,166 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 6962.9434 | mean log_px -0.0530 | KL -3566.80 + 1it [00:00, 5.48it/s] 2it [00:00, 7.43it/s] 3it [00:00, 7.77it/s] 5it [00:00, 8.89it/s] 7it [00:00, 8.94it/s] 8it [00:00, 9.17it/s] 9it [00:01, 9.34it/s] 10it [00:01, 9.49it/s] 11it [00:01, 9.07it/s] 12it [00:01, 9.32it/s] 14it [00:01, 9.60it/s] 15it [00:01, 9.20it/s] 17it [00:01, 9.54it/s] 19it [00:02, 9.74it/s] 21it [00:02, 9.85it/s] 22it [00:02, 9.88it/s] 23it [00:02, 9.43it/s] 25it [00:02, 9.67it/s] 27it [00:02, 9.80it/s] 29it [00:03, 9.89it/s] 30it [00:03, 9.90it/s] 31it [00:03, 9.45it/s] 33it [00:03, 9.66it/s] 35it [00:03, 9.81it/s] 36it [00:03, 9.85it/s] 38it [00:04, 9.91it/s] 40it [00:04, 9.93it/s] 42it [00:04, 9.96it/s] 43it [00:04, 9.64it/s] 44it [00:04, 9.63it/s] 46it [00:04, 9.73it/s] 47it [00:04, 9.44it/s] 49it [00:05, 9.65it/s] 50it [00:05, 9.66it/s]2025-05-26 03:58:26,343 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 11381.5762 | mean log_px -0.1166 | KL -3569.48 + 51it [00:05, 9.28it/s] 52it [00:05, 9.40it/s] 54it [00:05, 9.66it/s] 56it [00:05, 9.82it/s] 57it [00:05, 9.43it/s] 59it [00:06, 9.66it/s] 61it [00:06, 9.79it/s] 62it [00:06, 9.83it/s] 63it [00:06, 9.80it/s] 64it [00:06, 9.74it/s] 65it [00:06, 9.81it/s] 66it [00:06, 9.85it/s] 67it [00:07, 9.89it/s] 68it [00:07, 9.32it/s] 69it [00:07, 9.51it/s] 70it [00:07, 9.64it/s] 71it [00:07, 9.74it/s] 72it [00:07, 9.81it/s] 74it [00:07, 9.92it/s] 76it [00:07, 9.95it/s] 78it [00:08, 9.97it/s] 79it [00:08, 9.98it/s] 81it [00:08, 10.00it/s] 82it [00:08, 9.53it/s] 83it [00:08, 9.48it/s] 84it [00:08, 9.58it/s] 86it [00:08, 9.74it/s] 88it [00:09, 9.83it/s] 90it [00:09, 9.89it/s] 92it [00:09, 9.95it/s] 94it [00:09, 9.97it/s] 96it [00:09, 10.00it/s] 97it [00:10, 9.98it/s] 98it [00:10, 9.98it/s] 100it [00:10, 10.01it/s]2025-05-26 03:58:31,443 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 8565.3213 | mean log_px -0.0776 | KL -3569.59 + 101it [00:10, 9.55it/s] 102it [00:10, 9.65it/s] 104it [00:10, 9.79it/s] 106it [00:10, 9.88it/s] 107it [00:11, 9.45it/s] 108it [00:11, 9.56it/s] 110it [00:11, 9.73it/s] 112it [00:11, 9.83it/s] 113it [00:11, 9.84it/s] 115it [00:11, 9.90it/s] 116it [00:12, 9.92it/s] 118it [00:12, 9.57it/s] 120it [00:12, 9.73it/s] 121it [00:12, 9.75it/s] 122it [00:12, 9.33it/s] 123it [00:12, 9.19it/s] 124it [00:12, 9.26it/s] 125it [00:12, 9.07it/s] 126it [00:13, 8.91it/s] 127it [00:13, 8.50it/s] 128it [00:13, 8.75it/s] 129it [00:13, 8.97it/s] 130it [00:13, 9.09it/s] 131it [00:13, 9.22it/s] 132it [00:13, 9.29it/s] 133it [00:13, 9.31it/s] 134it [00:13, 9.37it/s] 135it [00:14, 9.42it/s] 136it [00:14, 9.42it/s] 137it [00:14, 9.46it/s] 138it [00:14, 9.48it/s] 139it [00:14, 9.47it/s] 140it [00:14, 9.48it/s] 141it [00:14, 9.45it/s] 142it [00:14, 9.50it/s] 143it [00:14, 9.52it/s] 144it [00:15, 9.46it/s] 145it [00:15, 9.49it/s] 146it [00:15, 8.98it/s] 147it [00:15, 9.15it/s] 148it [00:15, 9.25it/s] 149it [00:15, 9.33it/s] 150it [00:15, 9.43it/s]2025-05-26 03:58:36,764 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 7441.7295 | mean log_px -0.0628 | KL -3567.16 + 151it [00:15, 8.93it/s] 152it [00:15, 9.08it/s] 153it [00:16, 9.14it/s] 154it [00:16, 9.20it/s] 155it [00:16, 9.24it/s] 156it [00:16, 9.30it/s] 157it [00:16, 9.35it/s] 158it [00:16, 9.16it/s] 159it [00:16, 9.26it/s] 160it [00:16, 9.32it/s] 161it [00:16, 9.34it/s] 162it [00:16, 9.41it/s] 163it [00:17, 9.44it/s] 164it [00:17, 9.44it/s] 165it [00:17, 9.48it/s] 166it [00:17, 9.52it/s] 167it [00:17, 9.48it/s] 168it [00:17, 9.44it/s] 169it [00:17, 9.45it/s] 170it [00:17, 9.48it/s] 171it [00:17, 9.54it/s] 172it [00:18, 9.52it/s] 173it [00:18, 9.29it/s] 174it [00:18, 9.40it/s] 175it [00:18, 8.92it/s] 176it [00:18, 9.07it/s] 177it [00:18, 9.19it/s] 178it [00:18, 9.24it/s] 179it [00:18, 9.29it/s] 180it [00:18, 9.34it/s] 181it [00:19, 9.40it/s] 182it [00:19, 9.40it/s] 183it [00:19, 9.39it/s] 184it [00:19, 9.34it/s] 185it [00:19, 9.24it/s] 186it [00:19, 8.67it/s] 187it [00:19, 8.90it/s] 188it [00:19, 9.09it/s] 189it [00:19, 9.21it/s] 190it [00:19, 9.31it/s] 191it [00:20, 9.40it/s] 192it [00:20, 9.43it/s] 193it [00:20, 9.47it/s] 194it [00:20, 9.50it/s] 195it [00:20, 9.00it/s] 196it [00:20, 8.85it/s] 196it [00:20, 9.46it/s] +2025-05-26 03:58:41,735 - INFO - Epoch: 19, Objective: tensor([7893.3765], device='cuda:0', grad_fn=), Loss: 0.061493679881095886, KL/n: 72.83820343017578 + 0it [00:00, ?it/s]2025-05-26 03:58:42,213 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 6628.0117 | mean log_px -0.0495 | KL -3568.11 + 1it [00:00, 2.62it/s] 2it [00:00, 4.37it/s] 3it [00:00, 5.83it/s] 4it [00:00, 6.86it/s] 5it [00:00, 7.65it/s] 6it [00:00, 8.22it/s] 7it [00:01, 8.63it/s] 8it [00:01, 8.94it/s] 9it [00:01, 9.14it/s] 10it [00:01, 9.22it/s] 11it [00:01, 9.33it/s] 12it [00:01, 9.43it/s] 13it [00:01, 9.46it/s] 14it [00:01, 9.49it/s] 15it [00:01, 9.52it/s] 16it [00:01, 9.54it/s] 17it [00:02, 9.45it/s] 18it [00:02, 9.45it/s] 19it [00:02, 9.49it/s] 20it [00:02, 9.32it/s] 21it [00:02, 9.24it/s] 22it [00:02, 8.57it/s] 23it [00:02, 8.85it/s] 24it [00:02, 9.00it/s] 25it [00:02, 9.17it/s] 26it [00:03, 9.28it/s] 27it [00:03, 9.39it/s] 28it [00:03, 9.43it/s] 29it [00:03, 9.45it/s] 30it [00:03, 9.47it/s] 31it [00:03, 9.55it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.37it/s] 34it [00:03, 8.66it/s] 35it [00:04, 8.90it/s] 36it [00:04, 9.00it/s] 37it [00:04, 9.16it/s] 38it [00:04, 9.27it/s] 39it [00:04, 9.35it/s] 40it [00:04, 9.41it/s] 41it [00:04, 9.44it/s] 42it [00:04, 9.49it/s] 43it [00:04, 9.44it/s] 44it [00:04, 9.39it/s] 45it [00:05, 9.35it/s] 46it [00:05, 8.86it/s] 47it [00:05, 9.04it/s] 48it [00:05, 9.16it/s] 49it [00:05, 9.28it/s] 50it [00:05, 9.35it/s]2025-05-26 03:58:47,585 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 7019.3750 | mean log_px -0.0534 | KL -3567.79 + 51it [00:05, 8.90it/s] 52it [00:05, 9.09it/s] 53it [00:05, 9.20it/s] 54it [00:06, 9.27it/s] 55it [00:06, 9.31it/s] 56it [00:06, 9.37it/s] 57it [00:06, 9.37it/s] 58it [00:06, 9.09it/s] 59it [00:06, 9.24it/s] 60it [00:06, 9.29it/s] 61it [00:06, 9.23it/s] 62it [00:06, 9.29it/s] 63it [00:07, 9.37it/s] 64it [00:07, 8.88it/s] 65it [00:07, 8.99it/s] 66it [00:07, 9.11it/s] 67it [00:07, 9.22it/s] 68it [00:07, 9.27it/s] 69it [00:07, 9.34it/s] 70it [00:07, 8.85it/s] 71it [00:07, 9.10it/s] 72it [00:08, 9.24it/s] 73it [00:08, 9.30it/s] 74it [00:08, 9.34it/s] 75it [00:08, 9.32it/s] 76it [00:08, 9.23it/s] 77it [00:08, 9.34it/s] 78it [00:08, 9.43it/s] 79it [00:08, 9.46it/s] 80it [00:08, 9.24it/s] 81it [00:09, 9.35it/s] 82it [00:09, 9.39it/s] 83it [00:09, 9.48it/s] 84it [00:09, 9.47it/s] 85it [00:09, 9.49it/s] 86it [00:09, 9.53it/s] 87it [00:09, 9.54it/s] 88it [00:09, 8.89it/s] 89it [00:09, 9.03it/s] 90it [00:09, 9.16it/s] 91it [00:10, 9.24it/s] 92it [00:10, 8.46it/s] 93it [00:10, 8.85it/s] 94it [00:10, 9.14it/s] 95it [00:10, 8.84it/s] 96it [00:10, 9.15it/s] 98it [00:10, 9.47it/s] 100it [00:11, 9.70it/s]2025-05-26 03:58:52,986 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 9756.4814 | mean log_px -0.0918 | KL -3565.89 + 101it [00:11, 9.31it/s] 102it [00:11, 9.46it/s] 104it [00:11, 9.69it/s] 106it [00:11, 9.83it/s] 108it [00:11, 9.92it/s] 110it [00:12, 9.97it/s] 112it [00:12, 10.00it/s] 113it [00:12, 9.61it/s] 115it [00:12, 9.75it/s] 117it [00:12, 9.44it/s] 119it [00:13, 9.64it/s] 121it [00:13, 9.77it/s] 122it [00:13, 9.45it/s] 124it [00:13, 9.65it/s] 126it [00:13, 9.79it/s] 128it [00:13, 9.89it/s] 130it [00:14, 9.91it/s] 132it [00:14, 9.98it/s] 134it [00:14, 10.01it/s] 136it [00:14, 10.04it/s] 138it [00:14, 10.06it/s] 140it [00:15, 10.07it/s] 142it [00:15, 10.07it/s] 144it [00:15, 10.07it/s] 146it [00:15, 9.73it/s] 148it [00:15, 9.83it/s] 150it [00:16, 9.91it/s]2025-05-26 03:58:58,069 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 6741.2627 | mean log_px -0.0465 | KL -3565.47 + 151it [00:16, 9.54it/s] 153it [00:16, 9.71it/s] 155it [00:16, 9.82it/s] 156it [00:16, 9.85it/s] 158it [00:16, 9.92it/s] 160it [00:17, 9.98it/s] 162it [00:17, 10.00it/s] 164it [00:17, 9.67it/s] 165it [00:17, 9.73it/s] 166it [00:17, 9.74it/s] 168it [00:17, 9.85it/s] 170it [00:18, 9.61it/s] 171it [00:18, 9.54it/s] 172it [00:18, 9.29it/s] 173it [00:18, 9.43it/s] 175it [00:18, 9.68it/s] 176it [00:18, 9.75it/s] 178it [00:19, 9.88it/s] 180it [00:19, 9.54it/s] 182it [00:19, 9.70it/s] 184it [00:19, 9.79it/s] 186it [00:19, 9.88it/s] 188it [00:20, 9.60it/s] 189it [00:20, 9.66it/s] 190it [00:20, 9.73it/s] 191it [00:20, 9.71it/s] 192it [00:20, 9.69it/s] 193it [00:20, 9.73it/s] 194it [00:20, 9.80it/s] 195it [00:20, 9.36it/s] 196it [00:20, 9.15it/s] 196it [00:20, 9.35it/s] +2025-05-26 03:59:02,840 - INFO - Epoch: 20, Objective: tensor([5954.1396], device='cuda:0', grad_fn=), Loss: 0.034850478172302246, KL/n: 72.82156372070312 + 0it [00:00, ?it/s]2025-05-26 03:59:03,123 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 7638.6367 | mean log_px -0.0598 | KL -3567.85 + 1it [00:00, 5.01it/s] 2it [00:00, 7.03it/s] 3it [00:00, 8.09it/s] 4it [00:00, 8.67it/s] 5it [00:00, 9.07it/s] 6it [00:00, 9.29it/s] 7it [00:00, 9.23it/s] 8it [00:00, 9.40it/s] 9it [00:01, 9.55it/s] 10it [00:01, 9.59it/s] 11it [00:01, 9.67it/s] 12it [00:01, 9.71it/s] 13it [00:01, 9.77it/s] 14it [00:01, 9.77it/s] 15it [00:01, 9.72it/s] 16it [00:01, 9.63it/s] 17it [00:01, 9.69it/s] 18it [00:01, 9.69it/s] 19it [00:02, 9.71it/s] 20it [00:02, 9.72it/s] 21it [00:02, 9.74it/s] 22it [00:02, 9.77it/s] 23it [00:02, 9.77it/s] 24it [00:02, 9.79it/s] 25it [00:02, 9.80it/s] 26it [00:02, 9.80it/s] 27it [00:02, 9.79it/s] 28it [00:02, 9.80it/s] 29it [00:03, 9.79it/s] 30it [00:03, 9.79it/s] 31it [00:03, 9.78it/s] 32it [00:03, 9.75it/s] 33it [00:03, 9.77it/s] 34it [00:03, 9.76it/s] 35it [00:03, 9.78it/s] 36it [00:03, 9.80it/s] 37it [00:03, 9.82it/s] 38it [00:03, 9.80it/s] 39it [00:04, 9.80it/s] 40it [00:04, 9.80it/s] 41it [00:04, 9.81it/s] 42it [00:04, 9.82it/s] 43it [00:04, 9.79it/s] 44it [00:04, 9.74it/s] 45it [00:04, 9.76it/s] 46it [00:04, 9.73it/s] 47it [00:04, 9.74it/s] 48it [00:05, 9.74it/s] 49it [00:05, 9.76it/s] 50it [00:05, 9.76it/s]2025-05-26 03:59:08,251 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 12824.7617 | mean log_px -0.1392 | KL -3568.71 + 51it [00:05, 9.73it/s] 52it [00:05, 9.73it/s] 53it [00:05, 9.73it/s] 54it [00:05, 9.74it/s] 55it [00:05, 9.75it/s] 56it [00:05, 9.75it/s] 57it [00:05, 9.76it/s] 58it [00:06, 9.72it/s] 59it [00:06, 9.73it/s] 60it [00:06, 9.74it/s] 61it [00:06, 9.75it/s] 62it [00:06, 9.76it/s] 63it [00:06, 9.77it/s] 64it [00:06, 9.77it/s] 65it [00:06, 9.80it/s] 66it [00:06, 9.79it/s] 67it [00:06, 9.79it/s] 68it [00:07, 9.75it/s] 69it [00:07, 9.78it/s] 70it [00:07, 9.74it/s] 71it [00:07, 9.76it/s] 72it [00:07, 9.79it/s] 74it [00:07, 9.48it/s] 76it [00:07, 9.67it/s] 77it [00:08, 9.29it/s] 79it [00:08, 9.56it/s] 80it [00:08, 9.63it/s] 81it [00:08, 9.20it/s] 82it [00:08, 9.32it/s] 83it [00:08, 9.42it/s] 84it [00:08, 9.45it/s] 85it [00:08, 8.90it/s] 86it [00:08, 8.94it/s] 87it [00:09, 9.09it/s] 88it [00:09, 9.21it/s] 89it [00:09, 8.85it/s] 90it [00:09, 9.05it/s] 91it [00:09, 9.24it/s] 92it [00:09, 9.27it/s] 93it [00:09, 8.82it/s] 94it [00:09, 9.03it/s] 95it [00:09, 9.24it/s] 96it [00:10, 8.78it/s] 97it [00:10, 9.05it/s] 98it [00:10, 9.29it/s] 99it [00:10, 9.43it/s] 100it [00:10, 8.97it/s]2025-05-26 03:59:13,563 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 9816.6523 | mean log_px -0.1053 | KL -3570.17 + 101it [00:10, 9.09it/s] 102it [00:10, 9.25it/s] 103it [00:10, 9.43it/s] 104it [00:10, 8.95it/s] 105it [00:11, 9.08it/s] 106it [00:11, 9.29it/s] 107it [00:11, 9.45it/s] 108it [00:11, 8.97it/s] 109it [00:11, 9.21it/s] 110it [00:11, 9.38it/s] 111it [00:11, 9.48it/s] 112it [00:11, 8.99it/s] 113it [00:11, 9.24it/s] 114it [00:12, 9.36it/s] 115it [00:12, 9.43it/s] 116it [00:12, 9.11it/s] 118it [00:12, 9.56it/s] 120it [00:12, 9.79it/s] 121it [00:12, 9.40it/s] 123it [00:12, 9.66it/s] 125it [00:13, 9.50it/s] 126it [00:13, 9.58it/s] 128it [00:13, 9.77it/s] 130it [00:13, 9.89it/s] 131it [00:13, 9.59it/s] 132it [00:13, 9.67it/s] 134it [00:14, 9.42it/s] 136it [00:14, 9.67it/s] 138it [00:14, 9.81it/s] 140it [00:14, 9.92it/s] 142it [00:14, 10.00it/s] 144it [00:15, 10.04it/s] 146it [00:15, 9.71it/s] 148it [00:15, 9.84it/s] 150it [00:15, 9.92it/s]2025-05-26 03:59:18,756 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 6365.2271 | mean log_px -0.0422 | KL -3569.45 + 151it [00:15, 9.94it/s] 153it [00:16, 10.01it/s] 155it [00:16, 9.65it/s] 157it [00:16, 9.81it/s] 159it [00:16, 9.91it/s] 160it [00:16, 9.85it/s] 162it [00:16, 9.94it/s] 164it [00:17, 10.00it/s] 166it [00:17, 9.69it/s] 167it [00:17, 9.73it/s] 168it [00:17, 9.76it/s] 169it [00:17, 9.78it/s] 170it [00:17, 9.80it/s] 171it [00:17, 9.80it/s] 172it [00:17, 9.84it/s] 173it [00:18, 9.33it/s] 175it [00:18, 9.67it/s] 177it [00:18, 9.86it/s] 179it [00:18, 9.96it/s] 180it [00:18, 9.55it/s] 182it [00:18, 9.77it/s] 184it [00:19, 9.89it/s] 186it [00:19, 9.97it/s] 188it [00:19, 10.03it/s] 190it [00:19, 10.07it/s] 192it [00:19, 10.09it/s] 194it [00:20, 10.10it/s] 196it [00:20, 9.89it/s] 196it [00:20, 9.59it/s] +2025-05-26 03:59:23,415 - INFO - Epoch: 21, Objective: tensor([6160.0498], device='cuda:0', grad_fn=), Loss: 0.040021877735853195, KL/n: 72.79065704345703 + 0it [00:00, ?it/s]2025-05-26 03:59:23,875 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 9817.3037 | mean log_px -0.0940 | KL -3564.62 + 1it [00:00, 2.55it/s] 3it [00:00, 5.73it/s] 5it [00:00, 7.13it/s] 7it [00:01, 8.15it/s] 9it [00:01, 8.80it/s] 11it [00:01, 8.86it/s] 12it [00:01, 9.02it/s] 14it [00:01, 9.38it/s] 16it [00:01, 9.62it/s] 18it [00:02, 9.76it/s] 20it [00:02, 9.88it/s] 22it [00:02, 9.96it/s] 24it [00:02, 10.01it/s] 26it [00:02, 9.71it/s] 28it [00:03, 9.83it/s] 30it [00:03, 9.92it/s] 32it [00:03, 9.65it/s] 34it [00:03, 9.78it/s] 36it [00:03, 9.55it/s] 38it [00:04, 9.72it/s] 40it [00:04, 9.84it/s] 42it [00:04, 9.94it/s] 44it [00:04, 9.66it/s] 46it [00:04, 9.80it/s] 48it [00:05, 9.90it/s] 50it [00:05, 9.97it/s]2025-05-26 03:59:28,980 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 8459.5879 | mean log_px -0.0763 | KL -3567.08 + 51it [00:05, 9.60it/s] 53it [00:05, 9.77it/s] 55it [00:05, 9.89it/s] 57it [00:06, 9.98it/s] 59it [00:06, 10.04it/s] 61it [00:06, 10.07it/s] 63it [00:06, 10.08it/s] 65it [00:06, 9.75it/s] 67it [00:07, 9.84it/s] 69it [00:07, 9.93it/s] 71it [00:07, 9.98it/s] 73it [00:07, 10.04it/s] 75it [00:07, 10.08it/s] 77it [00:08, 10.11it/s] 79it [00:08, 10.13it/s] 81it [00:08, 10.15it/s] 83it [00:08, 10.15it/s] 85it [00:08, 10.13it/s] 87it [00:09, 10.13it/s] 89it [00:09, 10.11it/s] 91it [00:09, 10.07it/s] 93it [00:09, 10.10it/s] 95it [00:09, 10.08it/s] 97it [00:10, 10.10it/s] 99it [00:10, 10.10it/s]2025-05-26 03:59:33,963 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 9265.9893 | mean log_px -0.0819 | KL -3570.15 + 101it [00:10, 10.12it/s] 103it [00:10, 10.05it/s] 105it [00:10, 10.03it/s] 107it [00:11, 10.08it/s] 109it [00:11, 10.09it/s] 111it [00:11, 10.07it/s] 113it [00:11, 10.04it/s] 115it [00:11, 10.08it/s] 117it [00:12, 10.11it/s] 119it [00:12, 10.11it/s] 121it [00:12, 10.10it/s] 123it [00:12, 10.13it/s] 125it [00:12, 10.03it/s] 127it [00:13, 10.04it/s] 129it [00:13, 10.08it/s] 131it [00:13, 10.08it/s] 133it [00:13, 10.10it/s] 135it [00:13, 10.11it/s] 137it [00:14, 10.12it/s] 139it [00:14, 10.13it/s] 141it [00:14, 10.13it/s] 143it [00:14, 10.10it/s] 145it [00:14, 10.10it/s] 147it [00:15, 10.10it/s] 149it [00:15, 10.12it/s]2025-05-26 03:59:38,918 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 8519.6299 | mean log_px -0.0768 | KL -3566.00 + 151it [00:15, 10.11it/s] 153it [00:15, 10.12it/s] 155it [00:15, 10.12it/s] 157it [00:15, 10.13it/s] 159it [00:16, 10.12it/s] 161it [00:16, 10.11it/s] 163it [00:16, 10.09it/s] 165it [00:16, 10.07it/s] 167it [00:17, 9.87it/s] 169it [00:17, 9.93it/s] 170it [00:17, 9.94it/s] 172it [00:17, 9.97it/s] 174it [00:17, 10.00it/s] 176it [00:17, 10.04it/s] 178it [00:18, 9.79it/s] 180it [00:18, 9.56it/s] 182it [00:18, 9.68it/s] 184it [00:18, 9.48it/s] 186it [00:18, 9.64it/s] 187it [00:19, 9.70it/s] 188it [00:19, 9.41it/s] 190it [00:19, 9.65it/s] 191it [00:19, 9.31it/s] 192it [00:19, 9.32it/s] 193it [00:19, 9.24it/s] 194it [00:19, 8.98it/s] 195it [00:19, 8.88it/s] 196it [00:20, 9.74it/s] +2025-05-26 03:59:43,664 - INFO - Epoch: 22, Objective: tensor([8000.1289], device='cuda:0', grad_fn=), Loss: 0.06485095620155334, KL/n: 72.75353240966797 + 0it [00:00, ?it/s]2025-05-26 03:59:43,914 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 10706.0791 | mean log_px -0.1055 | KL -3565.08 + 1it [00:00, 5.31it/s] 2it [00:00, 7.33it/s] 4it [00:00, 8.81it/s] 5it [00:00, 9.08it/s] 6it [00:00, 9.26it/s] 8it [00:00, 9.61it/s] 9it [00:00, 9.61it/s] 10it [00:01, 9.64it/s] 12it [00:01, 9.08it/s] 13it [00:01, 8.96it/s] 14it [00:01, 9.14it/s] 15it [00:01, 9.02it/s] 16it [00:01, 9.25it/s] 18it [00:01, 9.58it/s] 20it [00:02, 9.75it/s] 22it [00:02, 9.85it/s] 24it [00:02, 9.62it/s] 25it [00:02, 9.67it/s] 26it [00:02, 9.71it/s] 27it [00:02, 9.77it/s] 28it [00:02, 9.83it/s] 30it [00:03, 9.93it/s] 32it [00:03, 9.96it/s] 34it [00:03, 9.99it/s] 35it [00:03, 9.99it/s] 36it [00:03, 9.96it/s] 37it [00:03, 9.87it/s] 38it [00:03, 9.90it/s] 39it [00:04, 9.47it/s] 40it [00:04, 9.59it/s] 41it [00:04, 9.69it/s] 42it [00:04, 9.77it/s] 43it [00:04, 9.24it/s] 44it [00:04, 9.43it/s] 46it [00:04, 9.69it/s] 48it [00:05, 9.83it/s] 49it [00:05, 9.86it/s] 50it [00:05, 9.89it/s]2025-05-26 03:59:49,090 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 6445.8760 | mean log_px -0.0427 | KL -3562.69 + 51it [00:05, 9.92it/s] 52it [00:05, 9.92it/s] 53it [00:05, 9.31it/s] 54it [00:05, 9.50it/s] 56it [00:05, 9.74it/s] 58it [00:06, 9.86it/s] 60it [00:06, 9.91it/s] 61it [00:06, 9.92it/s] 62it [00:06, 9.59it/s] 63it [00:06, 9.67it/s] 64it [00:06, 9.71it/s] 66it [00:06, 9.84it/s] 68it [00:07, 9.92it/s] 70it [00:07, 9.90it/s] 71it [00:07, 9.92it/s] 73it [00:07, 9.97it/s] 74it [00:07, 9.96it/s] 76it [00:07, 9.98it/s] 77it [00:07, 9.98it/s] 78it [00:08, 9.98it/s] 79it [00:08, 9.96it/s] 80it [00:08, 9.96it/s] 82it [00:08, 10.02it/s] 84it [00:08, 10.04it/s] 86it [00:08, 10.04it/s] 88it [00:09, 10.03it/s] 90it [00:09, 10.03it/s] 92it [00:09, 10.03it/s] 94it [00:09, 10.04it/s] 96it [00:09, 10.04it/s] 98it [00:10, 10.04it/s] 100it [00:10, 10.04it/s]2025-05-26 03:59:54,126 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 9278.5117 | mean log_px -0.0849 | KL -3567.39 + 102it [00:10, 10.02it/s] 104it [00:10, 10.02it/s] 106it [00:10, 10.03it/s] 108it [00:11, 10.04it/s] 110it [00:11, 10.02it/s] 112it [00:11, 10.01it/s] 114it [00:11, 10.01it/s] 116it [00:11, 9.66it/s] 117it [00:11, 9.69it/s] 118it [00:12, 9.74it/s] 119it [00:12, 9.33it/s] 120it [00:12, 9.46it/s] 122it [00:12, 9.32it/s] 123it [00:12, 9.43it/s] 124it [00:12, 9.52it/s] 125it [00:12, 9.56it/s] 126it [00:12, 9.64it/s] 127it [00:13, 9.68it/s] 128it [00:13, 9.68it/s] 129it [00:13, 9.73it/s] 130it [00:13, 9.78it/s] 131it [00:13, 9.79it/s] 132it [00:13, 9.84it/s] 133it [00:13, 9.88it/s] 134it [00:13, 9.27it/s] 135it [00:13, 9.47it/s] 137it [00:14, 9.73it/s] 138it [00:14, 9.79it/s] 140it [00:14, 9.89it/s] 142it [00:14, 9.62it/s] 143it [00:14, 9.68it/s] 144it [00:14, 9.72it/s] 145it [00:14, 9.79it/s] 147it [00:15, 9.89it/s] 149it [00:15, 9.86it/s] 150it [00:15, 9.86it/s]2025-05-26 03:59:59,259 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 9398.9590 | mean log_px -0.0833 | KL -3566.49 + 151it [00:15, 9.88it/s] 153it [00:15, 9.93it/s] 154it [00:15, 9.94it/s] 156it [00:16, 9.98it/s] 157it [00:16, 9.99it/s] 159it [00:16, 10.01it/s] 161it [00:16, 9.61it/s] 163it [00:16, 9.75it/s] 165it [00:16, 9.84it/s] 166it [00:17, 9.87it/s] 168it [00:17, 9.93it/s] 169it [00:17, 9.80it/s] 170it [00:17, 9.80it/s] 171it [00:17, 9.71it/s] 172it [00:17, 9.73it/s] 173it [00:17, 9.80it/s] 175it [00:17, 9.90it/s] 177it [00:18, 9.90it/s] 178it [00:18, 9.22it/s] 179it [00:18, 9.36it/s] 180it [00:18, 9.45it/s] 181it [00:18, 9.53it/s] 182it [00:18, 9.55it/s] 183it [00:18, 9.57it/s] 184it [00:18, 9.57it/s] 185it [00:18, 9.67it/s] 186it [00:19, 9.72it/s] 187it [00:19, 9.75it/s] 189it [00:19, 9.85it/s] 190it [00:19, 9.85it/s] 191it [00:19, 9.68it/s] 192it [00:19, 9.61it/s] 193it [00:19, 9.54it/s] 194it [00:19, 8.96it/s] 195it [00:20, 8.71it/s] 196it [00:20, 8.93it/s] 196it [00:20, 9.68it/s] +2025-05-26 04:00:04,036 - INFO - Epoch: 23, Objective: tensor([7036.1016], device='cuda:0', grad_fn=), Loss: 0.05605386570096016, KL/n: 72.70604705810547 + 0it [00:00, ?it/s]2025-05-26 04:00:04,503 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 10053.7881 | mean log_px -0.0965 | KL -3562.36 + 1it [00:00, 5.24it/s] 2it [00:00, 6.59it/s] 3it [00:00, 7.67it/s] 4it [00:00, 8.32it/s] 5it [00:00, 8.18it/s] 6it [00:00, 8.56it/s] 7it [00:00, 8.86it/s] 8it [00:00, 8.99it/s] 9it [00:01, 8.65it/s] 10it [00:01, 8.86it/s] 11it [00:01, 8.99it/s] 12it [00:01, 9.15it/s] 13it [00:01, 8.75it/s] 14it [00:01, 8.90it/s] 15it [00:01, 9.02it/s] 16it [00:01, 9.13it/s] 17it [00:01, 8.78it/s] 18it [00:02, 8.91it/s] 19it [00:02, 9.10it/s] 20it [00:02, 9.25it/s] 21it [00:02, 8.84it/s] 22it [00:02, 9.03it/s] 23it [00:02, 9.12it/s] 24it [00:02, 9.20it/s] 25it [00:02, 8.84it/s] 26it [00:02, 9.04it/s] 27it [00:03, 9.16it/s] 28it [00:03, 8.79it/s] 29it [00:03, 8.95it/s] 30it [00:03, 9.11it/s] 31it [00:03, 9.19it/s] 32it [00:03, 8.76it/s] 33it [00:03, 8.80it/s] 34it [00:03, 9.10it/s] 35it [00:03, 9.32it/s] 36it [00:04, 9.45it/s] 37it [00:04, 9.52it/s] 38it [00:04, 9.60it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.68it/s] 41it [00:04, 9.75it/s] 42it [00:04, 9.77it/s] 43it [00:04, 9.80it/s] 44it [00:04, 9.81it/s] 45it [00:04, 9.82it/s] 46it [00:05, 9.81it/s] 47it [00:05, 9.65it/s] 48it [00:05, 9.60it/s] 49it [00:05, 9.64it/s] 50it [00:05, 9.66it/s]2025-05-26 04:00:09,922 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 7944.3613 | mean log_px -0.0672 | KL -3565.10 + 51it [00:05, 9.69it/s] 52it [00:05, 9.71it/s] 53it [00:05, 9.52it/s] 54it [00:05, 9.61it/s] 55it [00:06, 9.68it/s] 56it [00:06, 9.73it/s] 57it [00:06, 9.63it/s] 58it [00:06, 9.65it/s] 59it [00:06, 9.69it/s] 60it [00:06, 9.71it/s] 61it [00:06, 9.75it/s] 62it [00:06, 9.78it/s] 63it [00:06, 9.80it/s] 64it [00:06, 9.78it/s] 65it [00:07, 9.80it/s] 66it [00:07, 9.81it/s] 67it [00:07, 9.84it/s] 68it [00:07, 9.84it/s] 69it [00:07, 9.85it/s] 70it [00:07, 9.85it/s] 71it [00:07, 9.85it/s] 72it [00:07, 9.82it/s] 73it [00:07, 9.82it/s] 74it [00:07, 9.80it/s] 75it [00:08, 9.82it/s] 76it [00:08, 9.82it/s] 77it [00:08, 9.84it/s] 78it [00:08, 9.82it/s] 79it [00:08, 9.85it/s] 80it [00:08, 9.83it/s] 81it [00:08, 9.84it/s] 82it [00:08, 9.83it/s] 83it [00:08, 9.83it/s] 84it [00:08, 9.84it/s] 85it [00:09, 9.85it/s] 86it [00:09, 9.86it/s] 87it [00:09, 9.87it/s] 88it [00:09, 9.86it/s] 89it [00:09, 9.87it/s] 90it [00:09, 9.87it/s] 91it [00:09, 9.87it/s] 92it [00:09, 9.87it/s] 93it [00:09, 9.87it/s] 94it [00:09, 9.84it/s] 95it [00:10, 9.83it/s] 96it [00:10, 9.83it/s] 97it [00:10, 9.70it/s] 98it [00:10, 9.53it/s] 99it [00:10, 9.39it/s] 100it [00:10, 9.50it/s]2025-05-26 04:00:15,042 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 6554.0537 | mean log_px -0.0452 | KL -3559.28 + 101it [00:10, 9.58it/s] 102it [00:10, 9.64it/s] 103it [00:10, 9.71it/s] 104it [00:11, 9.73it/s] 105it [00:11, 9.76it/s] 106it [00:11, 9.78it/s] 107it [00:11, 9.80it/s] 108it [00:11, 9.79it/s] 109it [00:11, 9.52it/s] 110it [00:11, 9.61it/s] 111it [00:11, 9.67it/s] 112it [00:11, 9.70it/s] 113it [00:11, 9.72it/s] 114it [00:12, 9.71it/s] 115it [00:12, 9.72it/s] 116it [00:12, 9.75it/s] 117it [00:12, 9.76it/s] 118it [00:12, 9.77it/s] 119it [00:12, 9.80it/s] 120it [00:12, 9.77it/s] 121it [00:12, 9.79it/s] 122it [00:12, 9.79it/s] 123it [00:12, 9.77it/s] 124it [00:13, 9.78it/s] 125it [00:13, 9.82it/s] 126it [00:13, 9.79it/s] 127it [00:13, 9.81it/s] 128it [00:13, 9.79it/s] 129it [00:13, 9.64it/s] 130it [00:13, 9.63it/s] 131it [00:13, 9.69it/s] 132it [00:13, 9.71it/s] 133it [00:14, 9.75it/s] 134it [00:14, 9.74it/s] 135it [00:14, 9.76it/s] 136it [00:14, 9.76it/s] 137it [00:14, 9.68it/s] 138it [00:14, 9.71it/s] 139it [00:14, 9.75it/s] 140it [00:14, 9.75it/s] 141it [00:14, 9.76it/s] 142it [00:14, 9.76it/s] 143it [00:15, 9.77it/s] 144it [00:15, 9.76it/s] 145it [00:15, 9.79it/s] 146it [00:15, 9.75it/s] 147it [00:15, 9.79it/s] 148it [00:15, 9.79it/s] 149it [00:15, 9.80it/s] 150it [00:15, 9.79it/s]2025-05-26 04:00:20,169 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 11166.3877 | mean log_px -0.1161 | KL -3563.05 + 151it [00:15, 9.77it/s] 152it [00:15, 9.79it/s] 153it [00:16, 9.80it/s] 154it [00:16, 9.78it/s] 155it [00:16, 9.81it/s] 156it [00:16, 9.81it/s] 157it [00:16, 9.81it/s] 158it [00:16, 9.78it/s] 159it [00:16, 9.80it/s] 160it [00:16, 9.81it/s] 161it [00:16, 9.84it/s] 162it [00:16, 9.82it/s] 163it [00:17, 9.83it/s] 164it [00:17, 9.82it/s] 165it [00:17, 9.82it/s] 166it [00:17, 9.80it/s] 167it [00:17, 9.83it/s] 168it [00:17, 9.79it/s] 169it [00:17, 9.68it/s] 170it [00:17, 9.70it/s] 171it [00:17, 9.74it/s] 172it [00:17, 9.76it/s] 173it [00:18, 9.79it/s] 174it [00:18, 9.81it/s] 175it [00:18, 9.84it/s] 176it [00:18, 9.82it/s] 177it [00:18, 9.84it/s] 178it [00:18, 9.83it/s] 179it [00:18, 9.71it/s] 180it [00:18, 9.73it/s] 181it [00:18, 9.76it/s] 182it [00:19, 9.73it/s] 183it [00:19, 9.73it/s] 184it [00:19, 9.70it/s] 185it [00:19, 9.74it/s] 186it [00:19, 9.76it/s] 187it [00:19, 9.74it/s] 188it [00:19, 9.75it/s] 189it [00:19, 9.70it/s] 190it [00:19, 9.71it/s] 191it [00:19, 9.73it/s] 192it [00:20, 9.73it/s] 193it [00:20, 9.75it/s] 194it [00:20, 9.60it/s] 195it [00:20, 9.22it/s] 196it [00:20, 9.54it/s] +2025-05-26 04:00:24,900 - INFO - Epoch: 24, Objective: tensor([7781.2070], device='cuda:0', grad_fn=), Loss: 0.06895510107278824, KL/n: 72.64373779296875 + 0it [00:00, ?it/s]2025-05-26 04:00:25,147 - INFO - [Epoch 025 | Batch 0000] IWAE-loss 5908.9863 | mean log_px -0.0345 | KL -3553.46 + 1it [00:00, 6.23it/s] 2it [00:00, 7.98it/s] 3it [00:00, 8.77it/s] 4it [00:00, 9.16it/s] 5it [00:00, 9.44it/s] 6it [00:00, 9.52it/s] 7it [00:00, 9.62it/s] 8it [00:00, 9.68it/s] 9it [00:00, 9.73it/s] 10it [00:01, 9.73it/s] 11it [00:01, 9.77it/s] 12it [00:01, 9.78it/s] 13it [00:01, 9.27it/s] 14it [00:01, 9.46it/s] 15it [00:01, 9.61it/s] 16it [00:01, 9.71it/s] 18it [00:01, 9.46it/s] 19it [00:02, 9.54it/s] 20it [00:02, 9.65it/s] 22it [00:02, 9.82it/s] 24it [00:02, 9.91it/s] 26it [00:02, 9.96it/s] 27it [00:02, 9.96it/s] 29it [00:03, 9.95it/s] 30it [00:03, 9.95it/s] 32it [00:03, 9.99it/s] 34it [00:03, 10.00it/s] 35it [00:03, 9.98it/s] 37it [00:03, 9.98it/s] 38it [00:03, 9.98it/s] 40it [00:04, 10.00it/s] 42it [00:04, 10.02it/s] 44it [00:04, 10.04it/s] 46it [00:04, 10.05it/s] 48it [00:04, 10.06it/s] 50it [00:05, 10.03it/s]2025-05-26 04:00:30,203 - INFO - [Epoch 025 | Batch 0050] IWAE-loss 5141.8364 | mean log_px -0.0226 | KL -3558.55 + 52it [00:05, 10.01it/s] 54it [00:05, 10.03it/s] 56it [00:05, 10.04it/s] 58it [00:05, 10.06it/s] 60it [00:06, 10.06it/s] 62it [00:06, 10.06it/s] 64it [00:06, 10.07it/s] 66it [00:06, 10.06it/s] 68it [00:06, 10.06it/s] 70it [00:07, 10.04it/s] 72it [00:07, 9.77it/s] 73it [00:07, 9.81it/s] 75it [00:07, 9.88it/s] 77it [00:07, 9.94it/s] 78it [00:07, 9.95it/s] 80it [00:08, 10.00it/s] 82it [00:08, 9.99it/s] 83it [00:08, 9.90it/s] 84it [00:08, 9.85it/s] 85it [00:08, 9.39it/s] 86it [00:08, 9.52it/s] 88it [00:08, 9.75it/s] 90it [00:09, 9.87it/s] 92it [00:09, 9.93it/s] 93it [00:09, 9.94it/s] 95it [00:09, 9.96it/s] 96it [00:09, 9.88it/s] 97it [00:09, 9.41it/s] 98it [00:09, 9.55it/s] 100it [00:10, 9.75it/s]2025-05-26 04:00:35,262 - INFO - [Epoch 025 | Batch 0100] IWAE-loss 6209.9375 | mean log_px -0.0399 | KL -3555.98 + 101it [00:10, 9.79it/s] 102it [00:10, 9.84it/s] 104it [00:10, 9.94it/s] 106it [00:10, 9.98it/s] 108it [00:10, 10.01it/s] 110it [00:11, 10.02it/s] 112it [00:11, 10.03it/s] 114it [00:11, 9.69it/s] 115it [00:11, 9.74it/s] 116it [00:11, 9.79it/s] 118it [00:11, 9.88it/s] 119it [00:12, 9.48it/s] 120it [00:12, 9.59it/s] 122it [00:12, 9.77it/s] 124it [00:12, 9.88it/s] 125it [00:12, 9.89it/s] 127it [00:12, 9.97it/s] 128it [00:13, 9.97it/s] 130it [00:13, 10.01it/s] 132it [00:13, 10.02it/s] 134it [00:13, 10.03it/s] 136it [00:13, 10.04it/s] 138it [00:14, 10.02it/s] 140it [00:14, 10.03it/s] 142it [00:14, 10.04it/s] 144it [00:14, 10.04it/s] 146it [00:14, 10.05it/s] 148it [00:14, 10.04it/s] 150it [00:15, 10.01it/s]2025-05-26 04:00:40,287 - INFO - [Epoch 025 | Batch 0150] IWAE-loss 8218.2256 | mean log_px -0.0712 | KL -3553.84 + 152it [00:15, 10.01it/s] 154it [00:15, 9.67it/s] 155it [00:15, 9.73it/s] 156it [00:15, 9.75it/s] 157it [00:15, 9.80it/s] 159it [00:16, 9.89it/s] 160it [00:16, 9.90it/s] 161it [00:16, 9.92it/s] 162it [00:16, 9.51it/s] 164it [00:16, 9.75it/s] 165it [00:16, 9.34it/s] 166it [00:16, 9.47it/s] 167it [00:16, 9.60it/s] 168it [00:17, 9.66it/s] 170it [00:17, 9.83it/s] 171it [00:17, 9.45it/s] 172it [00:17, 9.56it/s] 173it [00:17, 9.67it/s] 174it [00:17, 9.73it/s] 176it [00:17, 9.88it/s] 178it [00:18, 9.94it/s] 179it [00:18, 9.95it/s] 180it [00:18, 9.54it/s] 181it [00:18, 9.65it/s] 182it [00:18, 9.74it/s] 184it [00:18, 9.88it/s] 186it [00:18, 9.97it/s] 188it [00:19, 10.00it/s] 190it [00:19, 10.01it/s] 192it [00:19, 10.02it/s] 194it [00:19, 10.03it/s] 196it [00:19, 9.71it/s] 196it [00:19, 9.82it/s] +2025-05-26 04:00:44,986 - INFO - Epoch: 25, Objective: tensor([8688.2051], device='cuda:0', grad_fn=), Loss: 0.08251015841960907, KL/n: 72.58772277832031 + 0it [00:00, ?it/s]2025-05-26 04:00:45,437 - INFO - [Epoch 026 | Batch 0000] IWAE-loss 7151.1875 | mean log_px -0.0637 | KL -3554.05 + 1it [00:00, 4.76it/s] 2it [00:00, 6.88it/s] 4it [00:00, 8.58it/s] 6it [00:00, 9.15it/s] 7it [00:00, 9.14it/s] 8it [00:00, 9.18it/s] 9it [00:01, 8.85it/s] 10it [00:01, 9.13it/s] 11it [00:01, 9.35it/s] 12it [00:01, 9.50it/s] 14it [00:01, 9.24it/s] 16it [00:01, 9.54it/s] 17it [00:01, 9.61it/s] 18it [00:02, 9.20it/s] 19it [00:02, 9.37it/s] 20it [00:02, 9.51it/s] 21it [00:02, 9.64it/s] 23it [00:02, 9.80it/s] 24it [00:02, 9.43it/s] 26it [00:02, 9.66it/s] 28it [00:03, 9.80it/s] 30it [00:03, 9.89it/s] 32it [00:03, 9.94it/s] 34it [00:03, 9.98it/s] 36it [00:03, 10.00it/s] 38it [00:04, 10.01it/s] 39it [00:04, 9.62it/s] 40it [00:04, 9.67it/s] 42it [00:04, 9.81it/s] 44it [00:04, 9.89it/s] 46it [00:04, 9.95it/s] 47it [00:04, 9.94it/s] 48it [00:05, 9.95it/s] 50it [00:05, 9.57it/s]2025-05-26 04:00:50,615 - INFO - [Epoch 026 | Batch 0050] IWAE-loss 8084.2090 | mean log_px -0.0655 | KL -3553.26 + 51it [00:05, 9.65it/s] 53it [00:05, 9.81it/s] 54it [00:05, 9.83it/s] 56it [00:05, 9.91it/s] 58it [00:06, 9.96it/s] 60it [00:06, 9.99it/s] 62it [00:06, 10.01it/s] 64it [00:06, 9.73it/s] 66it [00:06, 9.83it/s] 68it [00:07, 9.88it/s] 69it [00:07, 9.51it/s] 70it [00:07, 9.60it/s] 72it [00:07, 9.76it/s] 73it [00:07, 9.80it/s] 74it [00:07, 9.84it/s] 76it [00:07, 9.91it/s] 78it [00:08, 9.96it/s] 80it [00:08, 9.96it/s] 81it [00:08, 9.97it/s] 82it [00:08, 9.97it/s] 84it [00:08, 10.01it/s] 86it [00:08, 10.01it/s] 88it [00:09, 10.00it/s] 89it [00:09, 9.99it/s] 90it [00:09, 9.99it/s] 91it [00:09, 9.97it/s] 93it [00:09, 9.96it/s] 94it [00:09, 9.97it/s] 95it [00:09, 9.46it/s] 96it [00:09, 9.57it/s] 97it [00:10, 9.68it/s] 98it [00:10, 9.19it/s] 99it [00:10, 9.41it/s] 100it [00:10, 9.56it/s]2025-05-26 04:00:55,699 - INFO - [Epoch 026 | Batch 0100] IWAE-loss 6382.7183 | mean log_px -0.0501 | KL -3556.70 + 101it [00:10, 9.65it/s] 102it [00:10, 9.73it/s] 103it [00:10, 9.18it/s] 104it [00:10, 9.37it/s] 105it [00:10, 9.47it/s] 106it [00:10, 9.03it/s] 108it [00:11, 9.12it/s] 109it [00:11, 9.31it/s] 110it [00:11, 9.48it/s] 112it [00:11, 9.26it/s] 113it [00:11, 9.42it/s] 114it [00:11, 9.56it/s] 116it [00:12, 9.76it/s] 118it [00:12, 9.86it/s] 119it [00:12, 9.88it/s] 120it [00:12, 9.91it/s] 121it [00:12, 9.93it/s] 123it [00:12, 9.98it/s] 124it [00:12, 9.98it/s] 126it [00:13, 10.01it/s] 128it [00:13, 9.62it/s] 129it [00:13, 9.69it/s] 130it [00:13, 9.75it/s] 132it [00:13, 9.87it/s] 134it [00:13, 9.94it/s] 136it [00:14, 9.98it/s] 137it [00:14, 9.65it/s] 138it [00:14, 9.62it/s] 140it [00:14, 9.78it/s] 142it [00:14, 9.86it/s] 144it [00:14, 9.80it/s] 145it [00:14, 9.52it/s] 146it [00:15, 9.61it/s] 147it [00:15, 9.66it/s] 148it [00:15, 9.20it/s] 149it [00:15, 9.35it/s] 150it [00:15, 9.50it/s]2025-05-26 04:01:00,884 - INFO - [Epoch 026 | Batch 0150] IWAE-loss 8474.0977 | mean log_px -0.0783 | KL -3551.70 + 151it [00:15, 9.55it/s] 152it [00:15, 9.65it/s] 153it [00:15, 9.74it/s] 154it [00:15, 9.79it/s] 156it [00:16, 9.90it/s] 158it [00:16, 9.97it/s] 160it [00:16, 9.92it/s] 162it [00:16, 9.58it/s] 164it [00:16, 9.71it/s] 166it [00:17, 9.82it/s] 167it [00:17, 9.46it/s] 168it [00:17, 9.56it/s] 169it [00:17, 9.65it/s] 170it [00:17, 9.73it/s] 171it [00:17, 9.79it/s] 172it [00:17, 9.77it/s] 173it [00:17, 9.82it/s] 174it [00:17, 9.87it/s] 176it [00:18, 9.95it/s] 178it [00:18, 9.99it/s] 179it [00:18, 9.49it/s] 180it [00:18, 9.59it/s] 182it [00:18, 9.76it/s] 184it [00:19, 9.87it/s] 185it [00:19, 9.55it/s] 186it [00:19, 9.64it/s] 188it [00:19, 9.79it/s] 189it [00:19, 9.82it/s] 190it [00:19, 9.86it/s] 191it [00:19, 9.87it/s] 192it [00:19, 9.87it/s] 193it [00:19, 9.90it/s] 194it [00:20, 9.29it/s] 195it [00:20, 9.10it/s] 196it [00:20, 9.64it/s] +2025-05-26 04:01:05,621 - INFO - Epoch: 26, Objective: tensor([10124.8457], device='cuda:0', grad_fn=), Loss: 0.10262526571750641, KL/n: 72.52192687988281 + 0it [00:00, ?it/s]2025-05-26 04:01:05,891 - INFO - [Epoch 027 | Batch 0000] IWAE-loss 5660.2915 | mean log_px -0.0403 | KL -3550.19 + 1it [00:00, 4.81it/s] 3it [00:00, 7.85it/s] 4it [00:00, 8.45it/s] 6it [00:00, 9.20it/s] 8it [00:00, 9.56it/s] 10it [00:01, 9.76it/s] 12it [00:01, 9.87it/s] 14it [00:01, 9.96it/s] 15it [00:01, 9.56it/s] 16it [00:01, 9.54it/s] 17it [00:01, 9.60it/s] 18it [00:01, 9.65it/s] 20it [00:02, 9.39it/s] 22it [00:02, 9.65it/s] 24it [00:02, 9.80it/s] 26it [00:02, 9.92it/s] 27it [00:02, 9.61it/s] 29it [00:03, 9.79it/s] 30it [00:03, 9.81it/s] 31it [00:03, 9.81it/s] 33it [00:03, 9.93it/s] 35it [00:03, 10.01it/s] 37it [00:03, 10.04it/s] 39it [00:04, 10.08it/s] 41it [00:04, 10.06it/s] 43it [00:04, 9.75it/s] 45it [00:04, 9.85it/s] 46it [00:04, 9.50it/s] 47it [00:04, 9.58it/s] 49it [00:05, 9.37it/s] 50it [00:05, 9.49it/s]2025-05-26 04:01:11,020 - INFO - [Epoch 027 | Batch 0050] IWAE-loss 7041.8789 | mean log_px -0.0514 | KL -3547.65 + 51it [00:05, 9.59it/s] 53it [00:05, 9.80it/s] 55it [00:05, 9.91it/s] 57it [00:05, 9.97it/s] 59it [00:06, 10.02it/s] 61it [00:06, 10.04it/s] 63it [00:06, 10.03it/s] 65it [00:06, 9.70it/s] 67it [00:06, 9.82it/s] 68it [00:07, 9.83it/s] 70it [00:07, 9.91it/s] 71it [00:07, 9.89it/s] 72it [00:07, 9.47it/s] 73it [00:07, 9.58it/s] 74it [00:07, 9.68it/s] 76it [00:07, 9.84it/s] 77it [00:07, 9.41it/s] 79it [00:08, 9.68it/s] 81it [00:08, 9.83it/s] 83it [00:08, 9.53it/s] 84it [00:08, 9.58it/s] 86it [00:08, 9.76it/s] 87it [00:08, 9.78it/s] 88it [00:09, 9.80it/s] 90it [00:09, 9.90it/s] 92it [00:09, 9.98it/s] 94it [00:09, 10.02it/s] 96it [00:09, 10.00it/s] 98it [00:10, 10.03it/s] 100it [00:10, 10.06it/s]2025-05-26 04:01:16,086 - INFO - [Epoch 027 | Batch 0100] IWAE-loss 7957.1924 | mean log_px -0.0696 | KL -3551.78 + 102it [00:10, 9.69it/s] 103it [00:10, 9.73it/s] 105it [00:10, 9.48it/s] 106it [00:10, 9.55it/s] 108it [00:11, 9.74it/s] 109it [00:11, 9.77it/s] 111it [00:11, 9.90it/s] 113it [00:11, 9.59it/s] 114it [00:11, 9.63it/s] 115it [00:11, 9.51it/s] 116it [00:11, 9.42it/s] 117it [00:12, 9.47it/s] 119it [00:12, 9.72it/s] 120it [00:12, 9.78it/s] 122it [00:12, 9.89it/s] 123it [00:12, 9.54it/s] 124it [00:12, 9.64it/s] 125it [00:12, 9.73it/s] 126it [00:12, 9.79it/s] 127it [00:13, 9.79it/s] 129it [00:13, 9.92it/s] 131it [00:13, 9.89it/s] 132it [00:13, 9.88it/s] 133it [00:13, 9.90it/s] 134it [00:13, 9.92it/s] 136it [00:13, 9.98it/s] 137it [00:14, 9.94it/s] 139it [00:14, 10.00it/s] 141it [00:14, 10.02it/s] 143it [00:14, 9.66it/s] 145it [00:14, 9.79it/s] 146it [00:15, 9.79it/s] 147it [00:15, 9.81it/s] 149it [00:15, 9.91it/s] 150it [00:15, 9.88it/s]2025-05-26 04:01:21,219 - INFO - [Epoch 027 | Batch 0150] IWAE-loss 7002.5981 | mean log_px -0.0568 | KL -3547.20 + 151it [00:15, 9.41it/s] 153it [00:15, 9.69it/s] 155it [00:15, 9.82it/s] 157it [00:16, 9.92it/s] 158it [00:16, 9.93it/s] 160it [00:16, 9.97it/s] 162it [00:16, 9.96it/s] 163it [00:16, 9.89it/s] 164it [00:16, 9.88it/s] 165it [00:16, 9.87it/s] 166it [00:17, 9.86it/s] 167it [00:17, 9.86it/s] 168it [00:17, 9.74it/s] 169it [00:17, 9.55it/s] 170it [00:17, 8.87it/s] 171it [00:17, 8.31it/s] 172it [00:17, 8.50it/s] 173it [00:17, 8.76it/s] 174it [00:17, 9.05it/s] 175it [00:18, 9.27it/s] 176it [00:18, 8.95it/s] 177it [00:18, 9.17it/s] 178it [00:18, 9.38it/s] 179it [00:18, 9.49it/s] 180it [00:18, 9.00it/s] 181it [00:18, 9.26it/s] 182it [00:18, 9.38it/s] 183it [00:18, 9.45it/s] 184it [00:19, 9.49it/s] 185it [00:19, 9.60it/s] 186it [00:19, 9.60it/s] 187it [00:19, 9.61it/s] 188it [00:19, 9.66it/s] 190it [00:19, 9.88it/s] 191it [00:19, 9.44it/s] 192it [00:19, 9.45it/s] 193it [00:19, 9.49it/s] 194it [00:20, 9.52it/s] 195it [00:20, 9.19it/s] 196it [00:20, 8.95it/s] 196it [00:20, 9.63it/s] +2025-05-26 04:01:26,095 - INFO - Epoch: 27, Objective: tensor([5026.2368], device='cuda:0', grad_fn=), Loss: 0.021482713520526886, KL/n: 72.46076965332031 + 0it [00:00, ?it/s]2025-05-26 04:01:26,558 - INFO - [Epoch 028 | Batch 0000] IWAE-loss 6144.6147 | mean log_px -0.0405 | KL -3548.91 + 1it [00:00, 5.19it/s] 2it [00:00, 6.69it/s] 3it [00:00, 7.75it/s] 4it [00:00, 8.47it/s] 5it [00:00, 8.93it/s] 6it [00:00, 9.18it/s] 7it [00:00, 9.39it/s] 8it [00:00, 9.53it/s] 9it [00:01, 9.64it/s] 10it [00:01, 9.70it/s] 11it [00:01, 9.79it/s] 13it [00:01, 9.91it/s] 14it [00:01, 9.91it/s] 16it [00:01, 9.95it/s] 17it [00:01, 9.94it/s] 18it [00:01, 9.37it/s] 20it [00:02, 9.64it/s] 21it [00:02, 9.68it/s] 22it [00:02, 9.72it/s] 23it [00:02, 9.74it/s] 24it [00:02, 9.75it/s] 25it [00:02, 9.79it/s] 26it [00:02, 9.84it/s] 28it [00:02, 9.94it/s] 29it [00:03, 9.92it/s] 31it [00:03, 9.99it/s] 32it [00:03, 9.95it/s] 33it [00:03, 9.94it/s] 34it [00:03, 9.88it/s] 35it [00:03, 9.89it/s] 36it [00:03, 9.46it/s] 37it [00:03, 9.57it/s] 38it [00:03, 9.65it/s] 39it [00:04, 9.13it/s] 40it [00:04, 9.17it/s] 41it [00:04, 9.33it/s] 42it [00:04, 9.51it/s] 44it [00:04, 9.74it/s] 45it [00:04, 9.39it/s] 46it [00:04, 9.52it/s] 47it [00:04, 9.62it/s] 48it [00:05, 9.14it/s] 50it [00:05, 9.52it/s]2025-05-26 04:01:31,733 - INFO - [Epoch 028 | Batch 0050] IWAE-loss 7022.5996 | mean log_px -0.0538 | KL -3548.01 + 51it [00:05, 9.60it/s] 52it [00:05, 9.28it/s] 53it [00:05, 9.38it/s] 54it [00:05, 9.50it/s] 55it [00:05, 9.09it/s] 57it [00:06, 9.52it/s] 59it [00:06, 9.73it/s] 61it [00:06, 9.48it/s] 62it [00:06, 9.56it/s] 64it [00:06, 9.73it/s] 65it [00:06, 9.36it/s] 66it [00:06, 9.50it/s] 67it [00:07, 9.61it/s] 68it [00:07, 9.70it/s] 69it [00:07, 9.24it/s] 70it [00:07, 9.43it/s] 72it [00:07, 9.67it/s] 73it [00:07, 9.27it/s] 74it [00:07, 9.43it/s] 76it [00:07, 9.68it/s] 77it [00:08, 9.31it/s] 78it [00:08, 9.45it/s] 79it [00:08, 9.59it/s] 80it [00:08, 9.68it/s] 81it [00:08, 9.22it/s] 82it [00:08, 9.41it/s] 83it [00:08, 9.58it/s] 84it [00:08, 9.68it/s] 85it [00:08, 9.20it/s] 86it [00:09, 9.41it/s] 88it [00:09, 9.70it/s] 90it [00:09, 9.86it/s] 92it [00:09, 9.94it/s] 94it [00:09, 10.00it/s] 96it [00:10, 10.03it/s] 98it [00:10, 10.04it/s] 100it [00:10, 10.06it/s]2025-05-26 04:01:36,919 - INFO - [Epoch 028 | Batch 0100] IWAE-loss 7795.5220 | mean log_px -0.0668 | KL -3546.89 + 102it [00:10, 9.71it/s] 104it [00:10, 9.82it/s] 106it [00:11, 9.91it/s] 108it [00:11, 9.97it/s] 110it [00:11, 10.01it/s] 112it [00:11, 9.69it/s] 114it [00:11, 9.53it/s] 116it [00:12, 9.67it/s] 117it [00:12, 9.42it/s] 119it [00:12, 9.65it/s] 121it [00:12, 9.79it/s] 122it [00:12, 9.83it/s] 124it [00:12, 9.91it/s] 126it [00:13, 9.97it/s] 127it [00:13, 9.57it/s] 129it [00:13, 9.75it/s] 131it [00:13, 9.83it/s] 133it [00:13, 9.89it/s] 135it [00:14, 9.94it/s] 136it [00:14, 9.57it/s] 138it [00:14, 9.72it/s] 140it [00:14, 9.48it/s] 142it [00:14, 9.64it/s] 144it [00:14, 9.78it/s] 146it [00:15, 9.88it/s] 148it [00:15, 9.61it/s] 150it [00:15, 9.72it/s]2025-05-26 04:01:42,066 - INFO - [Epoch 028 | Batch 0150] IWAE-loss 6129.2549 | mean log_px -0.0445 | KL -3552.00 + 151it [00:15, 9.68it/s] 153it [00:15, 9.81it/s] 154it [00:16, 9.59it/s] 156it [00:16, 9.76it/s] 158it [00:16, 9.87it/s] 159it [00:16, 9.88it/s] 161it [00:16, 9.97it/s] 162it [00:16, 9.97it/s] 164it [00:17, 10.01it/s] 166it [00:17, 10.04it/s] 168it [00:17, 10.03it/s] 170it [00:17, 10.05it/s] 172it [00:17, 10.04it/s] 174it [00:18, 9.72it/s] 176it [00:18, 9.82it/s] 177it [00:18, 9.49it/s] 179it [00:18, 9.66it/s] 181it [00:18, 9.80it/s] 183it [00:18, 9.62it/s] 184it [00:19, 9.67it/s] 185it [00:19, 9.67it/s] 186it [00:19, 9.24it/s] 188it [00:19, 9.57it/s] 190it [00:19, 9.74it/s] 192it [00:19, 9.83it/s] 193it [00:20, 9.44it/s] 195it [00:20, 9.39it/s] 196it [00:20, 9.62it/s] +2025-05-26 04:01:46,789 - INFO - Epoch: 28, Objective: tensor([7316.0479], device='cuda:0', grad_fn=), Loss: 0.06041298806667328, KL/n: 72.37413787841797 + 0it [00:00, ?it/s]2025-05-26 04:01:47,075 - INFO - [Epoch 029 | Batch 0000] IWAE-loss 5790.9482 | mean log_px -0.0366 | KL -3544.11 + 1it [00:00, 4.45it/s] 3it [00:00, 7.63it/s] 5it [00:00, 8.75it/s] 7it [00:00, 9.29it/s] 9it [00:01, 9.61it/s] 11it [00:01, 9.80it/s] 13it [00:01, 9.56it/s] 15it [00:01, 9.75it/s] 17it [00:01, 9.89it/s] 19it [00:02, 9.93it/s] 20it [00:02, 9.45it/s] 21it [00:02, 9.42it/s] 22it [00:02, 9.55it/s] 24it [00:02, 9.79it/s] 26it [00:02, 9.93it/s] 28it [00:02, 10.01it/s] 30it [00:03, 10.08it/s] 32it [00:03, 10.07it/s] 34it [00:03, 10.09it/s] 36it [00:03, 9.69it/s] 38it [00:03, 9.78it/s] 40it [00:04, 9.90it/s] 42it [00:04, 9.99it/s] 44it [00:04, 9.76it/s] 46it [00:04, 9.85it/s] 48it [00:04, 9.95it/s] 50it [00:05, 10.00it/s]2025-05-26 04:01:52,141 - INFO - [Epoch 029 | Batch 0050] IWAE-loss 8045.6401 | mean log_px -0.0730 | KL -3546.79 + 52it [00:05, 9.71it/s] 54it [00:05, 9.83it/s] 56it [00:05, 9.93it/s] 57it [00:05, 9.58it/s] 59it [00:06, 9.78it/s] 61it [00:06, 9.91it/s] 63it [00:06, 9.95it/s] 64it [00:06, 9.91it/s] 65it [00:06, 9.58it/s] 67it [00:06, 9.80it/s] 69it [00:07, 9.93it/s] 71it [00:07, 10.00it/s] 72it [00:07, 9.60it/s] 74it [00:07, 9.80it/s] 76it [00:07, 9.63it/s] 78it [00:08, 9.81it/s] 80it [00:08, 9.54it/s] 82it [00:08, 9.68it/s] 83it [00:08, 9.73it/s] 84it [00:08, 9.73it/s] 85it [00:08, 9.77it/s] 87it [00:08, 9.59it/s] 89it [00:09, 9.79it/s] 91it [00:09, 9.92it/s] 93it [00:09, 10.01it/s] 95it [00:09, 9.73it/s] 97it [00:09, 9.86it/s] 99it [00:10, 9.96it/s]2025-05-26 04:01:57,245 - INFO - [Epoch 029 | Batch 0100] IWAE-loss 7717.3555 | mean log_px -0.0658 | KL -3546.15 + 101it [00:10, 9.69it/s] 103it [00:10, 9.83it/s] 105it [00:10, 9.94it/s] 107it [00:10, 10.02it/s] 109it [00:11, 10.07it/s] 111it [00:11, 10.10it/s] 113it [00:11, 10.11it/s] 115it [00:11, 10.13it/s] 117it [00:11, 10.11it/s] 119it [00:12, 10.10it/s] 121it [00:12, 10.14it/s] 123it [00:12, 10.13it/s] 125it [00:12, 10.16it/s] 127it [00:12, 10.18it/s] 129it [00:13, 9.83it/s] 130it [00:13, 9.54it/s] 132it [00:13, 9.41it/s] 134it [00:13, 9.64it/s] 135it [00:13, 9.70it/s] 136it [00:13, 9.34it/s] 138it [00:14, 9.64it/s] 140it [00:14, 9.83it/s] 142it [00:14, 9.93it/s] 144it [00:14, 10.01it/s] 146it [00:14, 10.08it/s] 148it [00:15, 10.06it/s] 150it [00:15, 9.78it/s]2025-05-26 04:02:02,298 - INFO - [Epoch 029 | Batch 0150] IWAE-loss 9115.5293 | mean log_px -0.0874 | KL -3541.34 + 152it [00:15, 9.85it/s] 154it [00:15, 9.93it/s] 156it [00:15, 10.02it/s] 158it [00:16, 10.06it/s] 160it [00:16, 9.73it/s] 162it [00:16, 9.87it/s] 164it [00:16, 9.92it/s] 166it [00:16, 10.00it/s] 168it [00:17, 10.06it/s] 170it [00:17, 9.82it/s] 172it [00:17, 9.91it/s] 173it [00:17, 9.57it/s] 175it [00:17, 9.69it/s] 177it [00:18, 9.85it/s] 179it [00:18, 9.66it/s] 181it [00:18, 9.81it/s] 183it [00:18, 9.91it/s] 185it [00:18, 10.00it/s] 186it [00:18, 9.99it/s] 187it [00:19, 9.67it/s] 189it [00:19, 9.82it/s] 191it [00:19, 9.94it/s] 193it [00:19, 9.98it/s] 195it [00:19, 9.78it/s] 196it [00:19, 9.54it/s] 196it [00:20, 9.77it/s] +2025-05-26 04:02:06,972 - INFO - Epoch: 29, Objective: tensor([7595.7744], device='cuda:0', grad_fn=), Loss: 0.06281988322734833, KL/n: 72.2783432006836 + 0it [00:00, ?it/s]2025-05-26 04:02:07,244 - INFO - [Epoch 030 | Batch 0000] IWAE-loss 7184.0381 | mean log_px -0.0520 | KL -3540.00 + 1it [00:00, 5.41it/s] 2it [00:00, 6.77it/s] 4it [00:00, 8.58it/s] 6it [00:00, 8.90it/s] 8it [00:00, 9.34it/s] 10it [00:01, 9.61it/s] 12it [00:01, 9.80it/s] 13it [00:01, 9.43it/s] 15it [00:01, 9.69it/s] 17it [00:01, 9.86it/s] 19it [00:02, 9.97it/s] 20it [00:02, 7.44it/s] 21it [00:02, 7.64it/s] 23it [00:02, 8.43it/s] 24it [00:02, 8.39it/s] 26it [00:02, 8.98it/s] 27it [00:03, 9.16it/s] 28it [00:03, 9.33it/s] 30it [00:03, 9.34it/s] 32it [00:03, 9.59it/s] 33it [00:03, 9.28it/s] 35it [00:03, 9.57it/s] 36it [00:03, 9.66it/s] 37it [00:04, 9.30it/s] 39it [00:04, 9.62it/s] 41it [00:04, 9.81it/s] 43it [00:04, 9.53it/s] 45it [00:04, 9.73it/s] 47it [00:05, 9.87it/s] 48it [00:05, 9.53it/s] 50it [00:05, 9.74it/s]2025-05-26 04:02:12,575 - INFO - [Epoch 030 | Batch 0050] IWAE-loss 5986.0142 | mean log_px -0.0354 | KL -3537.95 + 51it [00:05, 9.40it/s] 53it [00:05, 9.67it/s] 55it [00:05, 9.84it/s] 56it [00:06, 9.48it/s] 58it [00:06, 9.72it/s] 60it [00:06, 9.86it/s] 61it [00:06, 9.87it/s] 63it [00:06, 9.97it/s] 65it [00:06, 10.04it/s] 67it [00:07, 10.07it/s] 69it [00:07, 9.71it/s] 70it [00:07, 9.71it/s] 71it [00:07, 9.62it/s] 72it [00:07, 9.68it/s] 73it [00:07, 9.75it/s] 75it [00:07, 9.93it/s] 77it [00:08, 10.02it/s] 79it [00:08, 10.07it/s] 81it [00:08, 10.07it/s] 83it [00:08, 10.09it/s] 85it [00:08, 10.03it/s] 87it [00:09, 10.06it/s] 89it [00:09, 9.81it/s] 91it [00:09, 9.89it/s] 93it [00:09, 9.97it/s] 94it [00:09, 9.98it/s] 96it [00:10, 9.65it/s] 98it [00:10, 9.80it/s] 100it [00:10, 9.91it/s]2025-05-26 04:02:17,641 - INFO - [Epoch 030 | Batch 0100] IWAE-loss 5398.5059 | mean log_px -0.0280 | KL -3539.20 + 101it [00:10, 9.53it/s] 102it [00:10, 9.60it/s] 104it [00:10, 9.77it/s] 105it [00:11, 9.81it/s] 107it [00:11, 9.94it/s] 109it [00:11, 10.01it/s] 110it [00:11, 9.60it/s] 112it [00:11, 9.79it/s] 114it [00:11, 9.52it/s] 115it [00:12, 9.57it/s] 117it [00:12, 9.77it/s] 119it [00:12, 9.89it/s] 121it [00:12, 9.96it/s] 122it [00:12, 9.64it/s] 124it [00:12, 9.83it/s] 126it [00:13, 9.90it/s] 127it [00:13, 9.81it/s] 128it [00:13, 9.66it/s] 129it [00:13, 9.21it/s] 131it [00:13, 9.57it/s] 133it [00:13, 9.79it/s] 135it [00:14, 9.91it/s] 137it [00:14, 10.01it/s] 138it [00:14, 9.62it/s] 140it [00:14, 9.79it/s] 141it [00:14, 9.43it/s] 143it [00:14, 9.68it/s] 145it [00:15, 9.84it/s] 147it [00:15, 9.94it/s] 149it [00:15, 10.00it/s]2025-05-26 04:02:22,758 - INFO - [Epoch 030 | Batch 0150] IWAE-loss 8095.3145 | mean log_px -0.0698 | KL -3535.73 + 151it [00:15, 9.68it/s] 153it [00:15, 9.82it/s] 154it [00:16, 9.82it/s] 156it [00:16, 9.93it/s] 157it [00:16, 9.94it/s] 159it [00:16, 10.00it/s] 161it [00:16, 10.05it/s] 163it [00:16, 10.04it/s] 165it [00:17, 9.70it/s] 167it [00:17, 9.83it/s] 168it [00:17, 9.48it/s] 170it [00:17, 9.71it/s] 172it [00:17, 9.86it/s] 173it [00:17, 9.45it/s] 175it [00:18, 9.69it/s] 177it [00:18, 9.82it/s] 178it [00:18, 9.82it/s] 180it [00:18, 9.63it/s] 182it [00:18, 9.79it/s] 184it [00:19, 9.91it/s] 185it [00:19, 9.55it/s] 187it [00:19, 9.76it/s] 189it [00:19, 9.87it/s] 191it [00:19, 9.97it/s] 193it [00:19, 10.03it/s] 195it [00:20, 9.81it/s] 196it [00:20, 9.59it/s] 196it [00:20, 9.62it/s] +2025-05-26 04:02:27,471 - INFO - Epoch: 30, Objective: tensor([8346.3223], device='cuda:0', grad_fn=), Loss: 0.08652433753013611, KL/n: 72.18109130859375 + 0it [00:00, ?it/s]2025-05-26 04:02:27,724 - INFO - [Epoch 031 | Batch 0000] IWAE-loss 7981.7705 | mean log_px -0.0697 | KL -3537.61 + 1it [00:00, 5.44it/s] 3it [00:00, 8.25it/s] 4it [00:00, 8.78it/s] 6it [00:00, 9.38it/s] 8it [00:00, 9.64it/s] 9it [00:00, 9.35it/s] 10it [00:01, 9.48it/s] 11it [00:01, 9.59it/s] 12it [00:01, 9.66it/s] 14it [00:01, 9.81it/s] 15it [00:01, 9.85it/s] 16it [00:01, 9.88it/s] 17it [00:01, 9.69it/s] 18it [00:01, 9.67it/s] 20it [00:02, 9.79it/s] 22it [00:02, 9.91it/s] 23it [00:02, 9.47it/s] 24it [00:02, 9.56it/s] 25it [00:02, 9.63it/s] 27it [00:02, 9.37it/s] 28it [00:02, 9.50it/s] 30it [00:03, 9.66it/s] 31it [00:03, 9.71it/s] 33it [00:03, 9.85it/s] 34it [00:03, 9.88it/s] 36it [00:03, 9.95it/s] 38it [00:03, 9.60it/s] 40it [00:04, 9.71it/s] 42it [00:04, 9.82it/s] 43it [00:04, 9.83it/s] 45it [00:04, 9.91it/s] 46it [00:04, 9.93it/s] 47it [00:04, 9.47it/s] 48it [00:05, 9.59it/s] 50it [00:05, 9.78it/s]2025-05-26 04:02:32,867 - INFO - [Epoch 031 | Batch 0050] IWAE-loss 7131.4248 | mean log_px -0.0549 | KL -3539.47 + 51it [00:05, 9.36it/s] 53it [00:05, 9.63it/s] 55it [00:05, 9.78it/s] 56it [00:05, 9.82it/s] 58it [00:06, 9.91it/s] 60it [00:06, 9.96it/s] 62it [00:06, 10.00it/s] 63it [00:06, 9.99it/s] 64it [00:06, 9.99it/s] 65it [00:06, 9.98it/s] 66it [00:06, 9.43it/s] 67it [00:06, 9.53it/s] 68it [00:07, 9.63it/s] 69it [00:07, 9.73it/s] 70it [00:07, 9.79it/s] 72it [00:07, 9.89it/s] 74it [00:07, 9.95it/s] 75it [00:07, 9.96it/s] 76it [00:07, 9.94it/s] 78it [00:08, 9.97it/s] 79it [00:08, 9.97it/s] 80it [00:08, 9.98it/s] 82it [00:08, 10.00it/s] 83it [00:08, 9.99it/s] 84it [00:08, 9.99it/s] 86it [00:08, 10.02it/s] 88it [00:09, 10.04it/s] 90it [00:09, 10.06it/s] 92it [00:09, 10.06it/s] 94it [00:09, 10.01it/s] 96it [00:09, 10.00it/s] 98it [00:10, 10.04it/s] 100it [00:10, 10.05it/s]2025-05-26 04:02:37,904 - INFO - [Epoch 031 | Batch 0100] IWAE-loss 6414.5449 | mean log_px -0.0424 | KL -3538.34 + 102it [00:10, 9.98it/s] 103it [00:10, 9.98it/s] 105it [00:10, 10.01it/s] 107it [00:10, 9.77it/s] 108it [00:11, 9.16it/s] 109it [00:11, 9.18it/s] 110it [00:11, 9.21it/s] 111it [00:11, 9.25it/s] 112it [00:11, 9.24it/s] 113it [00:11, 9.30it/s] 114it [00:11, 9.27it/s] 115it [00:11, 9.27it/s] 116it [00:11, 9.23it/s] 117it [00:12, 9.23it/s] 118it [00:12, 9.25it/s] 119it [00:12, 9.29it/s] 120it [00:12, 9.23it/s] 121it [00:12, 9.30it/s] 122it [00:12, 9.29it/s] 123it [00:12, 9.31it/s] 124it [00:12, 8.74it/s] 125it [00:12, 9.01it/s] 126it [00:13, 9.13it/s] 127it [00:13, 9.21it/s] 128it [00:13, 9.24it/s] 129it [00:13, 9.36it/s] 130it [00:13, 9.37it/s] 131it [00:13, 8.88it/s] 132it [00:13, 9.08it/s] 133it [00:13, 9.22it/s] 134it [00:13, 9.28it/s] 135it [00:14, 9.39it/s] 136it [00:14, 9.39it/s] 137it [00:14, 9.44it/s] 138it [00:14, 9.45it/s] 139it [00:14, 9.46it/s] 140it [00:14, 9.43it/s] 141it [00:14, 9.45it/s] 142it [00:14, 9.43it/s] 143it [00:14, 9.46it/s] 144it [00:14, 9.44it/s] 145it [00:15, 9.47it/s] 146it [00:15, 9.47it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.47it/s] 149it [00:15, 9.51it/s] 150it [00:15, 9.55it/s]2025-05-26 04:02:43,267 - INFO - [Epoch 031 | Batch 0150] IWAE-loss 7563.3599 | mean log_px -0.0640 | KL -3531.75 + 151it [00:15, 9.47it/s] 152it [00:15, 9.44it/s] 153it [00:15, 9.46it/s] 154it [00:16, 9.45it/s] 155it [00:16, 9.47it/s] 156it [00:16, 9.46it/s] 157it [00:16, 9.48it/s] 158it [00:16, 9.48it/s] 159it [00:16, 9.50it/s] 160it [00:16, 9.50it/s] 161it [00:16, 9.46it/s] 162it [00:16, 9.46it/s] 163it [00:16, 9.44it/s] 164it [00:17, 9.46it/s] 165it [00:17, 9.48it/s] 166it [00:17, 9.50it/s] 167it [00:17, 9.49it/s] 168it [00:17, 9.52it/s] 169it [00:17, 9.53it/s] 170it [00:17, 9.50it/s] 171it [00:17, 9.50it/s] 172it [00:17, 9.53it/s] 173it [00:18, 9.38it/s] 174it [00:18, 9.02it/s] 175it [00:18, 9.09it/s] 176it [00:18, 9.18it/s] 177it [00:18, 9.27it/s] 178it [00:18, 9.38it/s] 179it [00:18, 9.11it/s] 180it [00:18, 9.19it/s] 181it [00:18, 9.21it/s] 182it [00:19, 9.28it/s] 183it [00:19, 9.34it/s] 184it [00:19, 8.79it/s] 185it [00:19, 8.99it/s] 186it [00:19, 9.10it/s] 187it [00:19, 9.21it/s] 188it [00:19, 9.29it/s] 189it [00:19, 9.34it/s] 190it [00:19, 9.40it/s] 191it [00:19, 9.44it/s] 192it [00:20, 9.45it/s] 193it [00:20, 9.44it/s] 194it [00:20, 9.43it/s] 195it [00:20, 8.90it/s] 196it [00:20, 9.10it/s] 196it [00:20, 9.52it/s] +2025-05-26 04:02:48,197 - INFO - Epoch: 31, Objective: tensor([6049.7988], device='cuda:0', grad_fn=), Loss: 0.03925026208162308, KL/n: 72.08685302734375 + 0it [00:00, ?it/s]2025-05-26 04:02:48,477 - INFO - [Epoch 032 | Batch 0000] IWAE-loss 5750.3301 | mean log_px -0.0349 | KL -3535.57 + 1it [00:00, 4.61it/s] 2it [00:00, 6.60it/s] 3it [00:00, 7.74it/s] 4it [00:00, 7.83it/s] 5it [00:00, 8.41it/s] 6it [00:00, 8.77it/s] 7it [00:00, 8.99it/s] 8it [00:00, 9.15it/s] 9it [00:01, 9.25it/s] 10it [00:01, 5.85it/s] 11it [00:01, 6.65it/s] 12it [00:01, 7.26it/s] 13it [00:01, 7.81it/s] 14it [00:01, 8.24it/s] 15it [00:01, 8.55it/s] 16it [00:02, 8.80it/s] 17it [00:02, 8.49it/s] 18it [00:02, 8.75it/s] 19it [00:02, 8.96it/s] 20it [00:02, 9.10it/s] 21it [00:02, 9.23it/s] 22it [00:02, 9.30it/s] 23it [00:02, 9.37it/s] 24it [00:02, 9.33it/s] 25it [00:02, 9.34it/s] 26it [00:03, 9.40it/s] 27it [00:03, 9.43it/s] 28it [00:03, 9.35it/s] 29it [00:03, 8.79it/s] 30it [00:03, 8.85it/s] 31it [00:03, 8.95it/s] 32it [00:03, 9.06it/s] 33it [00:03, 8.97it/s] 34it [00:04, 8.91it/s] 35it [00:04, 8.88it/s] 36it [00:04, 8.83it/s] 37it [00:04, 8.83it/s] 38it [00:04, 8.82it/s] 39it [00:04, 9.05it/s] 40it [00:04, 9.06it/s] 41it [00:04, 9.16it/s] 42it [00:04, 9.26it/s] 43it [00:04, 9.35it/s] 44it [00:05, 9.38it/s] 45it [00:05, 9.41it/s] 46it [00:05, 9.43it/s] 47it [00:05, 9.45it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.50it/s] 50it [00:05, 9.49it/s]2025-05-26 04:02:54,118 - INFO - [Epoch 032 | Batch 0050] IWAE-loss 5072.8218 | mean log_px -0.0260 | KL -3529.07 + 51it [00:05, 9.51it/s] 52it [00:05, 9.55it/s] 53it [00:06, 9.47it/s] 54it [00:06, 9.44it/s] 55it [00:06, 9.49it/s] 56it [00:06, 9.47it/s] 57it [00:06, 9.44it/s] 58it [00:06, 9.49it/s] 59it [00:06, 9.49it/s] 60it [00:06, 9.45it/s] 61it [00:06, 9.39it/s] 62it [00:07, 8.87it/s] 63it [00:07, 9.04it/s] 64it [00:07, 9.08it/s] 65it [00:07, 9.09it/s] 66it [00:07, 9.04it/s] 67it [00:07, 9.17it/s] 68it [00:07, 9.28it/s] 69it [00:07, 9.37it/s] 70it [00:07, 9.41it/s] 71it [00:07, 9.46it/s] 72it [00:08, 9.49it/s] 73it [00:08, 9.52it/s] 74it [00:08, 9.07it/s] 75it [00:08, 9.20it/s] 76it [00:08, 9.26it/s] 77it [00:08, 9.37it/s] 78it [00:08, 9.37it/s] 79it [00:08, 9.42it/s] 80it [00:08, 9.45it/s] 81it [00:09, 9.42it/s] 82it [00:09, 9.39it/s] 83it [00:09, 9.42it/s] 84it [00:09, 9.43it/s] 85it [00:09, 9.42it/s] 86it [00:09, 9.36it/s] 87it [00:09, 9.37it/s] 88it [00:09, 9.38it/s] 89it [00:09, 9.38it/s] 90it [00:10, 8.88it/s] 91it [00:10, 9.04it/s] 92it [00:10, 9.15it/s] 93it [00:10, 9.28it/s] 94it [00:10, 9.31it/s] 95it [00:10, 9.38it/s] 96it [00:10, 9.43it/s] 97it [00:10, 9.48it/s] 98it [00:10, 9.41it/s] 99it [00:10, 9.43it/s] 100it [00:11, 8.93it/s]2025-05-26 04:02:59,495 - INFO - [Epoch 032 | Batch 0100] IWAE-loss 6324.5918 | mean log_px -0.0521 | KL -3526.06 + 101it [00:11, 9.03it/s] 102it [00:11, 9.20it/s] 103it [00:11, 9.29it/s] 104it [00:11, 9.33it/s] 105it [00:11, 9.39it/s] 106it [00:11, 9.39it/s] 107it [00:11, 9.44it/s] 108it [00:11, 9.50it/s] 109it [00:12, 9.47it/s] 110it [00:12, 9.47it/s] 111it [00:12, 9.05it/s] 112it [00:12, 9.18it/s] 113it [00:12, 9.26it/s] 114it [00:12, 9.32it/s] 115it [00:12, 9.42it/s] 116it [00:12, 8.98it/s] 117it [00:12, 9.11it/s] 118it [00:13, 9.23it/s] 119it [00:13, 9.32it/s] 120it [00:13, 9.33it/s] 121it [00:13, 9.35it/s] 122it [00:13, 8.87it/s] 123it [00:13, 9.06it/s] 124it [00:13, 9.21it/s] 125it [00:13, 9.30it/s] 126it [00:13, 8.81it/s] 127it [00:14, 8.99it/s] 128it [00:14, 9.10it/s] 129it [00:14, 9.20it/s] 130it [00:14, 8.63it/s] 131it [00:14, 8.92it/s] 132it [00:14, 9.05it/s] 133it [00:14, 9.23it/s] 134it [00:14, 8.80it/s] 135it [00:14, 8.98it/s] 136it [00:15, 9.12it/s] 137it [00:15, 9.21it/s] 138it [00:15, 9.29it/s] 139it [00:15, 9.32it/s] 140it [00:15, 9.31it/s] 141it [00:15, 9.42it/s] 142it [00:15, 9.44it/s] 143it [00:15, 9.46it/s] 144it [00:15, 9.44it/s] 145it [00:15, 9.04it/s] 146it [00:16, 9.18it/s] 147it [00:16, 9.32it/s] 148it [00:16, 8.88it/s] 149it [00:16, 8.93it/s] 150it [00:16, 9.05it/s]2025-05-26 04:03:04,934 - INFO - [Epoch 032 | Batch 0150] IWAE-loss 7815.7627 | mean log_px -0.0678 | KL -3526.52 + 151it [00:16, 9.17it/s] 152it [00:16, 9.25it/s] 153it [00:16, 9.31it/s] 154it [00:16, 8.95it/s] 155it [00:17, 9.09it/s] 156it [00:17, 9.22it/s] 157it [00:17, 9.32it/s] 158it [00:17, 9.39it/s] 159it [00:17, 9.47it/s] 160it [00:17, 8.92it/s] 161it [00:17, 9.10it/s] 162it [00:17, 9.17it/s] 163it [00:17, 9.31it/s] 164it [00:18, 9.01it/s] 165it [00:18, 9.11it/s] 166it [00:18, 9.23it/s] 167it [00:18, 9.30it/s] 168it [00:18, 9.38it/s] 169it [00:18, 9.45it/s] 170it [00:18, 9.46it/s] 171it [00:18, 9.45it/s] 172it [00:18, 9.48it/s] 173it [00:19, 9.53it/s] 174it [00:19, 9.51it/s] 175it [00:19, 9.53it/s] 176it [00:19, 9.57it/s] 177it [00:19, 9.55it/s] 178it [00:19, 9.53it/s] 179it [00:19, 9.51it/s] 180it [00:19, 9.51it/s] 181it [00:19, 9.53it/s] 182it [00:19, 9.01it/s] 183it [00:20, 9.18it/s] 184it [00:20, 9.26it/s] 185it [00:20, 9.35it/s] 186it [00:20, 9.39it/s] 187it [00:20, 8.91it/s] 188it [00:20, 9.12it/s] 189it [00:20, 9.22it/s] 190it [00:20, 9.28it/s] 191it [00:20, 9.41it/s] 192it [00:21, 9.46it/s] 193it [00:21, 9.43it/s] 194it [00:21, 9.47it/s] 195it [00:21, 8.89it/s] 196it [00:21, 8.69it/s] 196it [00:21, 9.09it/s] +2025-05-26 04:03:09,899 - INFO - Epoch: 32, Objective: tensor([5291.6196], device='cuda:0', grad_fn=), Loss: 0.03124961443245411, KL/n: 71.98877716064453 + 0it [00:00, ?it/s]2025-05-26 04:03:10,185 - INFO - [Epoch 033 | Batch 0000] IWAE-loss 5486.5654 | mean log_px -0.0308 | KL -3528.38 + 1it [00:00, 5.25it/s] 2it [00:00, 7.17it/s] 3it [00:00, 7.49it/s] 4it [00:00, 8.22it/s] 5it [00:00, 8.60it/s] 6it [00:00, 8.90it/s] 7it [00:00, 8.57it/s] 8it [00:00, 8.82it/s] 9it [00:01, 9.06it/s] 10it [00:01, 9.22it/s] 11it [00:01, 9.35it/s] 12it [00:01, 9.42it/s] 13it [00:01, 9.52it/s] 14it [00:01, 8.95it/s] 15it [00:01, 9.13it/s] 16it [00:01, 9.25it/s] 17it [00:01, 9.35it/s] 18it [00:02, 9.38it/s] 19it [00:02, 9.41it/s] 20it [00:02, 9.43it/s] 21it [00:02, 9.43it/s] 22it [00:02, 9.42it/s] 23it [00:02, 8.89it/s] 24it [00:02, 9.05it/s] 25it [00:02, 9.18it/s] 26it [00:02, 9.25it/s] 27it [00:03, 9.42it/s] 28it [00:03, 9.46it/s] 29it [00:03, 9.31it/s] 30it [00:03, 9.42it/s] 31it [00:03, 9.46it/s] 32it [00:03, 9.49it/s] 33it [00:03, 9.57it/s] 34it [00:03, 9.56it/s] 35it [00:03, 9.66it/s] 36it [00:03, 9.65it/s] 37it [00:04, 9.38it/s] 38it [00:04, 9.38it/s] 39it [00:04, 8.92it/s] 40it [00:04, 9.11it/s] 41it [00:04, 9.31it/s] 42it [00:04, 9.42it/s] 43it [00:04, 9.10it/s] 44it [00:04, 9.20it/s] 45it [00:04, 9.30it/s] 46it [00:05, 9.35it/s] 47it [00:05, 9.41it/s] 48it [00:05, 9.43it/s] 49it [00:05, 9.50it/s] 50it [00:05, 9.55it/s]2025-05-26 04:03:15,548 - INFO - [Epoch 033 | Batch 0050] IWAE-loss 5826.6826 | mean log_px -0.0356 | KL -3525.49 + 51it [00:05, 9.58it/s] 52it [00:05, 9.56it/s] 53it [00:05, 9.57it/s] 54it [00:05, 9.52it/s] 55it [00:05, 9.50it/s] 56it [00:06, 9.53it/s] 57it [00:06, 9.56it/s] 58it [00:06, 9.53it/s] 59it [00:06, 9.50it/s] 60it [00:06, 9.57it/s] 61it [00:06, 8.97it/s] 62it [00:06, 9.12it/s] 63it [00:06, 9.28it/s] 64it [00:06, 9.35it/s] 65it [00:07, 9.43it/s] 66it [00:07, 9.51it/s] 67it [00:07, 9.55it/s] 68it [00:07, 9.55it/s] 69it [00:07, 9.57it/s] 70it [00:07, 9.61it/s] 71it [00:07, 9.56it/s] 72it [00:07, 9.55it/s] 73it [00:07, 9.60it/s] 74it [00:07, 9.62it/s] 75it [00:08, 9.57it/s] 76it [00:08, 8.97it/s] 77it [00:08, 9.13it/s] 78it [00:08, 9.30it/s] 79it [00:08, 9.33it/s] 80it [00:08, 9.39it/s] 81it [00:08, 9.45it/s] 82it [00:08, 9.43it/s] 83it [00:08, 9.46it/s] 84it [00:09, 9.54it/s] 85it [00:09, 9.58it/s] 86it [00:09, 9.63it/s] 87it [00:09, 9.05it/s] 88it [00:09, 9.20it/s] 89it [00:09, 9.27it/s] 90it [00:09, 9.33it/s] 91it [00:09, 9.42it/s] 92it [00:09, 9.38it/s] 93it [00:10, 9.44it/s] 94it [00:10, 9.52it/s] 95it [00:10, 9.49it/s] 96it [00:10, 9.49it/s] 97it [00:10, 8.87it/s] 98it [00:10, 9.07it/s] 99it [00:10, 9.23it/s] 100it [00:10, 9.30it/s]2025-05-26 04:03:20,873 - INFO - [Epoch 033 | Batch 0100] IWAE-loss 7603.5825 | mean log_px -0.0618 | KL -3521.97 + 101it [00:10, 9.32it/s] 102it [00:10, 9.35it/s] 103it [00:11, 9.41it/s] 104it [00:11, 9.47it/s] 105it [00:11, 9.47it/s] 106it [00:11, 9.17it/s] 107it [00:11, 8.83it/s] 108it [00:11, 8.99it/s] 109it [00:11, 9.15it/s] 110it [00:11, 9.24it/s] 111it [00:11, 9.35it/s] 112it [00:12, 9.43it/s] 113it [00:12, 9.49it/s] 114it [00:12, 9.51it/s] 115it [00:12, 9.46it/s] 116it [00:12, 9.54it/s] 117it [00:12, 9.52it/s] 118it [00:12, 9.50it/s] 119it [00:12, 9.50it/s] 120it [00:12, 9.50it/s] 121it [00:13, 9.48it/s] 122it [00:13, 9.38it/s] 123it [00:13, 9.22it/s] 124it [00:13, 8.52it/s] 125it [00:13, 8.83it/s] 126it [00:13, 9.02it/s] 127it [00:13, 9.20it/s] 128it [00:13, 9.34it/s] 129it [00:13, 9.44it/s] 130it [00:13, 9.48it/s] 131it [00:14, 9.55it/s] 132it [00:14, 9.59it/s] 133it [00:14, 9.62it/s] 134it [00:14, 9.00it/s] 135it [00:14, 9.18it/s] 136it [00:14, 9.24it/s] 137it [00:14, 9.32it/s] 138it [00:14, 9.37it/s] 139it [00:14, 9.38it/s] 140it [00:15, 9.32it/s] 141it [00:15, 9.38it/s] 142it [00:15, 9.41it/s] 143it [00:15, 8.81it/s] 144it [00:15, 9.00it/s] 145it [00:15, 9.15it/s] 146it [00:15, 9.28it/s] 147it [00:15, 9.32it/s] 148it [00:15, 9.40it/s] 149it [00:16, 9.47it/s] 150it [00:16, 9.07it/s]2025-05-26 04:03:26,257 - INFO - [Epoch 033 | Batch 0150] IWAE-loss 5245.3364 | mean log_px -0.0273 | KL -3525.40 + 151it [00:16, 9.16it/s] 152it [00:16, 9.25it/s] 153it [00:16, 9.24it/s] 154it [00:16, 9.29it/s] 155it [00:16, 9.35it/s] 156it [00:16, 9.41it/s] 157it [00:16, 9.46it/s] 158it [00:17, 9.47it/s] 159it [00:17, 9.47it/s] 160it [00:17, 9.47it/s] 161it [00:17, 9.53it/s] 162it [00:17, 9.50it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.54it/s] 165it [00:17, 9.53it/s] 166it [00:17, 9.60it/s] 167it [00:17, 9.61it/s] 168it [00:18, 9.59it/s] 169it [00:18, 9.55it/s] 170it [00:18, 9.56it/s] 171it [00:18, 9.55it/s] 172it [00:18, 9.57it/s] 173it [00:18, 9.53it/s] 174it [00:18, 9.56it/s] 175it [00:18, 9.54it/s] 176it [00:18, 9.47it/s] 177it [00:19, 8.92it/s] 178it [00:19, 9.09it/s] 179it [00:19, 9.17it/s] 180it [00:19, 9.23it/s] 181it [00:19, 8.92it/s] 182it [00:19, 9.06it/s] 183it [00:19, 9.15it/s] 184it [00:19, 8.84it/s] 185it [00:19, 9.04it/s] 186it [00:20, 9.21it/s] 187it [00:20, 9.35it/s] 188it [00:20, 9.38it/s] 189it [00:20, 9.43it/s] 190it [00:20, 9.43it/s] 191it [00:20, 9.44it/s] 192it [00:20, 9.50it/s] 193it [00:20, 9.57it/s] 194it [00:20, 9.02it/s] 195it [00:20, 8.66it/s] 196it [00:21, 8.93it/s] 196it [00:21, 9.27it/s] +2025-05-26 04:03:31,184 - INFO - Epoch: 33, Objective: tensor([9180.2832], device='cuda:0', grad_fn=), Loss: 0.08810441941022873, KL/n: 71.89595794677734 + 0it [00:00, ?it/s]2025-05-26 04:03:31,647 - INFO - [Epoch 034 | Batch 0000] IWAE-loss 7107.1201 | mean log_px -0.0598 | KL -3525.40 + 1it [00:00, 2.69it/s] 2it [00:00, 4.64it/s] 3it [00:00, 6.06it/s] 4it [00:00, 6.76it/s] 5it [00:00, 7.51it/s] 6it [00:00, 8.04it/s] 7it [00:01, 8.48it/s] 8it [00:01, 8.28it/s] 9it [00:01, 8.60it/s] 10it [00:01, 8.88it/s] 11it [00:01, 9.06it/s] 12it [00:01, 9.15it/s] 13it [00:01, 8.77it/s] 14it [00:01, 8.94it/s] 15it [00:01, 9.03it/s] 16it [00:02, 9.13it/s] 17it [00:02, 9.22it/s] 18it [00:02, 9.28it/s] 19it [00:02, 9.35it/s] 20it [00:02, 9.41it/s] 21it [00:02, 9.39it/s] 22it [00:02, 9.45it/s] 23it [00:02, 9.46it/s] 24it [00:02, 9.04it/s] 25it [00:02, 9.18it/s] 26it [00:03, 9.26it/s] 27it [00:03, 9.27it/s] 28it [00:03, 9.39it/s] 29it [00:03, 9.40it/s] 30it [00:03, 9.35it/s] 31it [00:03, 9.37it/s] 32it [00:03, 9.36it/s] 33it [00:03, 9.40it/s] 34it [00:03, 9.41it/s] 35it [00:04, 9.45it/s] 36it [00:04, 9.42it/s] 37it [00:04, 9.49it/s] 38it [00:04, 9.50it/s] 39it [00:04, 9.52it/s] 40it [00:04, 9.56it/s] 41it [00:04, 9.59it/s] 42it [00:04, 9.56it/s] 43it [00:04, 9.61it/s] 44it [00:04, 9.53it/s] 45it [00:05, 9.02it/s] 46it [00:05, 9.16it/s] 47it [00:05, 9.26it/s] 48it [00:05, 8.63it/s] 49it [00:05, 8.80it/s] 50it [00:05, 8.97it/s]2025-05-26 04:03:37,052 - INFO - [Epoch 034 | Batch 0050] IWAE-loss 5209.7563 | mean log_px -0.0287 | KL -3518.90 + 51it [00:05, 9.13it/s] 52it [00:05, 9.21it/s] 53it [00:05, 9.33it/s] 54it [00:06, 9.38it/s] 55it [00:06, 9.46it/s] 56it [00:06, 9.46it/s] 57it [00:06, 9.51it/s] 58it [00:06, 9.45it/s] 59it [00:06, 9.50it/s] 60it [00:06, 9.48it/s] 61it [00:06, 9.46it/s] 62it [00:06, 9.52it/s] 63it [00:07, 9.55it/s] 64it [00:07, 9.56it/s] 65it [00:07, 9.52it/s] 66it [00:07, 9.51it/s] 67it [00:07, 9.52it/s] 68it [00:07, 9.50it/s] 69it [00:07, 9.47it/s] 70it [00:07, 9.05it/s] 71it [00:07, 9.17it/s] 72it [00:08, 9.25it/s] 73it [00:08, 9.35it/s] 74it [00:08, 9.41it/s] 75it [00:08, 9.42it/s] 76it [00:08, 9.40it/s] 77it [00:08, 9.41it/s] 78it [00:08, 9.43it/s] 79it [00:08, 9.50it/s] 80it [00:08, 9.53it/s] 81it [00:08, 9.59it/s] 82it [00:09, 9.58it/s] 83it [00:09, 9.62it/s] 84it [00:09, 9.51it/s] 85it [00:09, 9.43it/s] 86it [00:09, 9.42it/s] 87it [00:09, 9.42it/s] 88it [00:09, 8.87it/s] 89it [00:09, 9.00it/s] 90it [00:09, 9.10it/s] 91it [00:10, 9.20it/s] 92it [00:10, 9.28it/s] 93it [00:10, 9.32it/s] 94it [00:10, 9.36it/s] 95it [00:10, 9.44it/s] 96it [00:10, 9.42it/s] 97it [00:10, 9.44it/s] 98it [00:10, 9.42it/s] 99it [00:10, 9.02it/s] 100it [00:11, 9.08it/s]2025-05-26 04:03:42,383 - INFO - [Epoch 034 | Batch 0100] IWAE-loss 6808.0835 | mean log_px -0.0500 | KL -3514.93 + 101it [00:11, 9.15it/s] 102it [00:11, 9.25it/s] 103it [00:11, 9.29it/s] 104it [00:11, 9.32it/s] 105it [00:11, 9.34it/s] 106it [00:11, 9.37it/s] 107it [00:11, 9.37it/s] 108it [00:11, 9.35it/s] 109it [00:11, 9.38it/s] 110it [00:12, 9.46it/s] 111it [00:12, 9.51it/s] 112it [00:12, 9.49it/s] 113it [00:12, 9.48it/s] 114it [00:12, 9.46it/s] 115it [00:12, 9.47it/s] 116it [00:12, 9.45it/s] 117it [00:12, 9.47it/s] 118it [00:12, 9.45it/s] 119it [00:13, 9.43it/s] 120it [00:13, 9.41it/s] 121it [00:13, 8.90it/s] 122it [00:13, 9.08it/s] 123it [00:13, 9.14it/s] 124it [00:13, 9.21it/s] 125it [00:13, 9.32it/s] 126it [00:13, 9.33it/s] 127it [00:13, 9.38it/s] 128it [00:13, 9.41it/s] 129it [00:14, 9.40it/s] 130it [00:14, 9.42it/s] 131it [00:14, 9.47it/s] 132it [00:14, 9.44it/s] 133it [00:14, 9.46it/s] 134it [00:14, 9.45it/s] 135it [00:14, 9.43it/s] 136it [00:14, 9.45it/s] 137it [00:14, 9.47it/s] 138it [00:15, 9.45it/s] 139it [00:15, 8.95it/s] 140it [00:15, 9.07it/s] 141it [00:15, 9.16it/s] 142it [00:15, 9.28it/s] 143it [00:15, 8.92it/s] 144it [00:15, 9.06it/s] 145it [00:15, 9.23it/s] 146it [00:15, 9.28it/s] 147it [00:16, 9.39it/s] 148it [00:16, 9.42it/s] 149it [00:16, 9.44it/s] 150it [00:16, 9.44it/s]2025-05-26 04:03:47,730 - INFO - [Epoch 034 | Batch 0150] IWAE-loss 7905.4756 | mean log_px -0.0700 | KL -3521.38 + 151it [00:16, 9.49it/s] 152it [00:16, 9.46it/s] 153it [00:16, 9.40it/s] 154it [00:16, 9.40it/s] 155it [00:16, 9.26it/s] 156it [00:16, 9.35it/s] 157it [00:17, 8.96it/s] 158it [00:17, 9.14it/s] 159it [00:17, 9.23it/s] 160it [00:17, 9.34it/s] 161it [00:17, 8.97it/s] 162it [00:17, 9.15it/s] 163it [00:17, 9.23it/s] 164it [00:17, 8.91it/s] 165it [00:17, 9.08it/s] 166it [00:18, 9.17it/s] 167it [00:18, 9.32it/s] 168it [00:18, 9.36it/s] 169it [00:18, 9.38it/s] 170it [00:18, 9.41it/s] 171it [00:18, 9.42it/s] 172it [00:18, 8.84it/s] 173it [00:18, 9.03it/s] 174it [00:18, 9.18it/s] 175it [00:19, 8.75it/s] 176it [00:19, 8.89it/s] 177it [00:19, 9.04it/s] 178it [00:19, 9.13it/s] 179it [00:19, 8.71it/s] 180it [00:19, 8.89it/s] 181it [00:19, 9.08it/s] 182it [00:19, 9.15it/s] 183it [00:19, 9.29it/s] 184it [00:20, 8.75it/s] 185it [00:20, 8.94it/s] 186it [00:20, 9.09it/s] 187it [00:20, 9.22it/s] 188it [00:20, 8.78it/s] 189it [00:20, 8.97it/s] 190it [00:20, 9.11it/s] 191it [00:20, 9.25it/s] 192it [00:20, 9.30it/s] 193it [00:21, 9.42it/s] 194it [00:21, 9.44it/s] 195it [00:21, 8.91it/s] 196it [00:21, 9.13it/s] 196it [00:21, 9.13it/s] +2025-05-26 04:03:52,774 - INFO - Epoch: 34, Objective: tensor([7032.6973], device='cuda:0', grad_fn=), Loss: 0.05743390694260597, KL/n: 71.76044464111328 + 0it [00:00, ?it/s]2025-05-26 04:03:53,055 - INFO - [Epoch 035 | Batch 0000] IWAE-loss 5518.7554 | mean log_px -0.0321 | KL -3518.21 + 1it [00:00, 5.19it/s] 2it [00:00, 7.10it/s] 3it [00:00, 8.06it/s] 4it [00:00, 8.53it/s] 5it [00:00, 8.87it/s] 6it [00:00, 9.03it/s] 7it [00:00, 9.11it/s] 8it [00:00, 9.25it/s] 9it [00:01, 9.37it/s] 10it [00:01, 9.40it/s] 11it [00:01, 9.42it/s] 12it [00:01, 9.47it/s] 13it [00:01, 9.54it/s] 14it [00:01, 9.46it/s] 15it [00:01, 9.33it/s] 16it [00:01, 9.17it/s] 17it [00:01, 9.31it/s] 18it [00:01, 9.39it/s] 19it [00:02, 9.44it/s] 20it [00:02, 9.39it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.22it/s] 23it [00:02, 9.31it/s] 24it [00:02, 9.41it/s] 25it [00:02, 9.47it/s] 26it [00:02, 8.88it/s] 27it [00:02, 9.08it/s] 28it [00:03, 9.18it/s] 29it [00:03, 9.27it/s] 30it [00:03, 9.31it/s] 31it [00:03, 9.39it/s] 32it [00:03, 9.42it/s] 33it [00:03, 9.43it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.48it/s] 36it [00:03, 9.55it/s] 37it [00:04, 9.53it/s] 38it [00:04, 9.47it/s] 39it [00:04, 9.52it/s] 40it [00:04, 9.49it/s] 41it [00:04, 9.51it/s] 42it [00:04, 9.54it/s] 43it [00:04, 9.59it/s] 44it [00:04, 9.58it/s] 45it [00:04, 9.56it/s] 46it [00:04, 9.54it/s] 47it [00:05, 9.55it/s] 48it [00:05, 9.54it/s] 49it [00:05, 9.54it/s] 50it [00:05, 9.50it/s]2025-05-26 04:03:58,359 - INFO - [Epoch 035 | Batch 0050] IWAE-loss 10205.3838 | mean log_px -0.0955 | KL -3515.78 + 51it [00:05, 9.47it/s] 52it [00:05, 9.50it/s] 53it [00:05, 9.51it/s] 54it [00:05, 9.53it/s] 55it [00:05, 8.98it/s] 56it [00:06, 9.12it/s] 57it [00:06, 9.25it/s] 58it [00:06, 9.30it/s] 59it [00:06, 8.84it/s] 60it [00:06, 9.02it/s] 61it [00:06, 9.19it/s] 62it [00:06, 9.13it/s] 63it [00:06, 9.29it/s] 64it [00:06, 9.34it/s] 65it [00:07, 9.34it/s] 66it [00:07, 9.38it/s] 67it [00:07, 9.43it/s] 68it [00:07, 9.43it/s] 69it [00:07, 9.41it/s] 70it [00:07, 8.91it/s] 71it [00:07, 9.14it/s] 72it [00:07, 9.20it/s] 73it [00:07, 9.34it/s] 74it [00:07, 9.38it/s] 75it [00:08, 9.47it/s] 76it [00:08, 8.86it/s] 77it [00:08, 9.04it/s] 78it [00:08, 9.18it/s] 79it [00:08, 9.20it/s] 80it [00:08, 8.79it/s] 81it [00:08, 8.98it/s] 82it [00:08, 9.16it/s] 83it [00:08, 9.28it/s] 84it [00:09, 9.36it/s] 85it [00:09, 9.43it/s] 86it [00:09, 9.48it/s] 87it [00:09, 9.51it/s] 88it [00:09, 9.09it/s] 89it [00:09, 9.22it/s] 90it [00:09, 9.28it/s] 91it [00:09, 9.40it/s] 92it [00:09, 9.41it/s] 93it [00:10, 9.45it/s] 94it [00:10, 9.47it/s] 95it [00:10, 9.48it/s] 96it [00:10, 8.88it/s] 97it [00:10, 9.06it/s] 98it [00:10, 9.16it/s] 99it [00:10, 9.31it/s] 100it [00:10, 9.37it/s]2025-05-26 04:04:03,766 - INFO - [Epoch 035 | Batch 0100] IWAE-loss 7475.6548 | mean log_px -0.0570 | KL -3514.94 + 101it [00:10, 9.43it/s] 102it [00:11, 9.51it/s] 103it [00:11, 9.51it/s] 104it [00:11, 9.48it/s] 105it [00:11, 9.44it/s] 106it [00:11, 9.41it/s] 107it [00:11, 9.43it/s] 108it [00:11, 9.49it/s] 109it [00:11, 9.56it/s] 110it [00:11, 9.50it/s] 111it [00:11, 9.50it/s] 112it [00:12, 9.49it/s] 113it [00:12, 9.42it/s] 114it [00:12, 8.95it/s] 115it [00:12, 9.07it/s] 116it [00:12, 9.22it/s] 117it [00:12, 9.38it/s] 118it [00:12, 9.48it/s] 119it [00:12, 9.55it/s] 120it [00:12, 9.52it/s] 121it [00:13, 9.51it/s] 122it [00:13, 9.56it/s] 123it [00:13, 9.50it/s] 124it [00:13, 9.48it/s] 125it [00:13, 9.46it/s] 126it [00:13, 8.92it/s] 127it [00:13, 9.07it/s] 128it [00:13, 9.20it/s] 129it [00:13, 9.23it/s] 130it [00:13, 9.26it/s] 131it [00:14, 9.33it/s] 132it [00:14, 9.37it/s] 133it [00:14, 8.86it/s] 134it [00:14, 9.00it/s] 135it [00:14, 9.17it/s] 136it [00:14, 9.21it/s] 137it [00:14, 9.34it/s] 138it [00:14, 9.43it/s] 139it [00:14, 8.90it/s] 140it [00:15, 9.09it/s] 141it [00:15, 9.25it/s] 142it [00:15, 9.33it/s] 143it [00:15, 8.85it/s] 144it [00:15, 9.07it/s] 145it [00:15, 9.21it/s] 146it [00:15, 9.34it/s] 147it [00:15, 8.99it/s] 148it [00:15, 9.16it/s] 149it [00:16, 9.30it/s] 150it [00:16, 9.39it/s]2025-05-26 04:04:09,141 - INFO - [Epoch 035 | Batch 0150] IWAE-loss 5995.6523 | mean log_px -0.0361 | KL -3514.44 + 151it [00:16, 9.41it/s] 152it [00:16, 9.37it/s] 153it [00:16, 9.43it/s] 154it [00:16, 9.45it/s] 155it [00:16, 9.49it/s] 156it [00:16, 9.49it/s] 157it [00:16, 9.52it/s] 158it [00:17, 9.48it/s] 159it [00:17, 9.40it/s] 160it [00:17, 9.35it/s] 161it [00:17, 9.30it/s] 162it [00:17, 9.41it/s] 163it [00:17, 9.44it/s] 164it [00:17, 9.04it/s] 165it [00:17, 9.18it/s] 166it [00:17, 9.25it/s] 167it [00:17, 9.28it/s] 168it [00:18, 8.92it/s] 169it [00:18, 8.93it/s] 170it [00:18, 9.00it/s] 171it [00:18, 9.20it/s] 172it [00:18, 9.34it/s] 173it [00:18, 9.40it/s] 174it [00:18, 9.43it/s] 175it [00:18, 9.52it/s] 176it [00:18, 9.08it/s] 177it [00:19, 9.21it/s] 178it [00:19, 9.33it/s] 179it [00:19, 9.38it/s] 180it [00:19, 9.43it/s] 181it [00:19, 9.47it/s] 182it [00:19, 9.49it/s] 183it [00:19, 9.52it/s] 184it [00:19, 9.11it/s] 185it [00:19, 9.23it/s] 186it [00:20, 9.29it/s] 187it [00:20, 9.36it/s] 188it [00:20, 9.38it/s] 189it [00:20, 9.46it/s] 190it [00:20, 9.48it/s] 191it [00:20, 9.49it/s] 192it [00:20, 9.53it/s] 193it [00:20, 9.60it/s] 194it [00:20, 9.58it/s] 195it [00:21, 8.98it/s] 196it [00:21, 9.17it/s] 196it [00:21, 9.26it/s] +2025-05-26 04:04:14,072 - INFO - Epoch: 35, Objective: tensor([5837.2930], device='cuda:0', grad_fn=), Loss: 0.03758452087640762, KL/n: 71.64217376708984 + 0it [00:00, ?it/s]2025-05-26 04:04:14,535 - INFO - [Epoch 036 | Batch 0000] IWAE-loss 5874.6455 | mean log_px -0.0372 | KL -3509.21 + 1it [00:00, 2.52it/s] 2it [00:00, 4.45it/s] 3it [00:00, 5.91it/s] 4it [00:00, 6.98it/s] 5it [00:00, 7.78it/s] 6it [00:00, 8.35it/s] 7it [00:01, 8.78it/s] 8it [00:01, 8.84it/s] 9it [00:01, 9.07it/s] 10it [00:01, 9.18it/s] 11it [00:01, 9.29it/s] 12it [00:01, 9.28it/s] 13it [00:01, 9.36it/s] 14it [00:01, 9.42it/s] 15it [00:01, 9.49it/s] 16it [00:01, 9.40it/s] 17it [00:02, 9.22it/s] 18it [00:02, 9.31it/s] 19it [00:02, 9.29it/s] 20it [00:02, 9.34it/s] 21it [00:02, 9.40it/s] 22it [00:02, 9.39it/s] 23it [00:02, 9.44it/s] 24it [00:02, 9.43it/s] 25it [00:02, 9.47it/s] 26it [00:03, 9.41it/s] 27it [00:03, 9.40it/s] 28it [00:03, 9.42it/s] 29it [00:03, 9.47it/s] 30it [00:03, 9.52it/s] 31it [00:03, 9.55it/s] 32it [00:03, 9.57it/s] 33it [00:03, 9.59it/s] 34it [00:03, 9.63it/s] 35it [00:03, 9.64it/s] 36it [00:04, 9.62it/s] 37it [00:04, 9.62it/s] 38it [00:04, 9.61it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.64it/s] 41it [00:04, 9.65it/s] 42it [00:04, 9.62it/s] 43it [00:04, 9.61it/s] 44it [00:04, 9.58it/s] 45it [00:05, 9.59it/s] 46it [00:05, 9.56it/s] 47it [00:05, 9.57it/s] 48it [00:05, 8.98it/s] 49it [00:05, 9.17it/s] 50it [00:05, 9.30it/s]2025-05-26 04:04:19,829 - INFO - [Epoch 036 | Batch 0050] IWAE-loss 5224.4829 | mean log_px -0.0283 | KL -3501.39 + 51it [00:05, 9.42it/s] 52it [00:05, 9.45it/s] 53it [00:05, 9.49it/s] 54it [00:05, 9.03it/s] 55it [00:06, 9.18it/s] 56it [00:06, 9.29it/s] 57it [00:06, 8.93it/s] 58it [00:06, 9.17it/s] 59it [00:06, 9.29it/s] 60it [00:06, 9.35it/s] 61it [00:06, 9.38it/s] 62it [00:06, 9.43it/s] 63it [00:06, 8.95it/s] 64it [00:07, 9.12it/s] 65it [00:07, 9.24it/s] 66it [00:07, 9.33it/s] 67it [00:07, 9.38it/s] 68it [00:07, 9.44it/s] 69it [00:07, 9.50it/s] 70it [00:07, 9.53it/s] 71it [00:07, 9.55it/s] 72it [00:07, 9.55it/s] 73it [00:08, 9.56it/s] 74it [00:08, 9.52it/s] 75it [00:08, 9.41it/s] 76it [00:08, 9.49it/s] 77it [00:08, 9.03it/s] 78it [00:08, 9.16it/s] 79it [00:08, 9.13it/s] 80it [00:08, 9.23it/s] 81it [00:08, 9.32it/s] 82it [00:08, 9.37it/s] 83it [00:09, 8.94it/s] 84it [00:09, 9.11it/s] 85it [00:09, 9.24it/s] 86it [00:09, 9.25it/s] 87it [00:09, 9.36it/s] 88it [00:09, 9.44it/s] 89it [00:09, 9.45it/s] 90it [00:09, 9.54it/s] 91it [00:09, 9.53it/s] 92it [00:10, 9.54it/s] 93it [00:10, 9.48it/s] 94it [00:10, 9.48it/s] 95it [00:10, 9.48it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.57it/s] 98it [00:10, 9.58it/s] 99it [00:10, 9.60it/s] 100it [00:10, 9.59it/s]2025-05-26 04:04:25,167 - INFO - [Epoch 036 | Batch 0100] IWAE-loss 8589.2041 | mean log_px -0.0804 | KL -3509.35 + 101it [00:11, 9.38it/s] 102it [00:11, 9.46it/s] 103it [00:11, 9.48it/s] 104it [00:11, 9.50it/s] 105it [00:11, 9.52it/s] 106it [00:11, 9.51it/s] 107it [00:11, 9.52it/s] 108it [00:11, 9.39it/s] 109it [00:11, 8.97it/s] 110it [00:11, 9.11it/s] 111it [00:12, 9.21it/s] 112it [00:12, 9.28it/s] 113it [00:12, 9.31it/s] 114it [00:12, 9.34it/s] 115it [00:12, 9.41it/s] 116it [00:12, 9.43it/s] 117it [00:12, 9.46it/s] 118it [00:12, 9.44it/s] 119it [00:12, 9.30it/s] 120it [00:13, 9.38it/s] 121it [00:13, 9.44it/s] 122it [00:13, 9.49it/s] 123it [00:13, 9.53it/s] 124it [00:13, 9.56it/s] 125it [00:13, 9.55it/s] 126it [00:13, 9.60it/s] 127it [00:13, 9.59it/s] 128it [00:13, 9.58it/s] 129it [00:13, 9.59it/s] 130it [00:14, 9.59it/s] 131it [00:14, 9.60it/s] 132it [00:14, 9.57it/s] 133it [00:14, 9.61it/s] 134it [00:14, 9.59it/s] 135it [00:14, 9.59it/s] 136it [00:14, 9.54it/s] 137it [00:14, 9.55it/s] 138it [00:14, 9.56it/s] 139it [00:15, 9.58it/s] 140it [00:15, 9.06it/s] 141it [00:15, 9.21it/s] 142it [00:15, 9.33it/s] 143it [00:15, 9.40it/s] 144it [00:15, 9.42it/s] 145it [00:15, 9.48it/s] 146it [00:15, 9.53it/s] 147it [00:15, 9.52it/s] 148it [00:15, 9.20it/s] 149it [00:16, 9.29it/s] 150it [00:16, 9.33it/s]2025-05-26 04:04:30,473 - INFO - [Epoch 036 | Batch 0150] IWAE-loss 5136.7231 | mean log_px -0.0261 | KL -3499.86 + 151it [00:16, 9.42it/s] 152it [00:16, 9.43it/s] 153it [00:16, 9.47it/s] 154it [00:16, 9.44it/s] 155it [00:16, 9.47it/s] 156it [00:16, 9.48it/s] 157it [00:16, 9.48it/s] 158it [00:17, 9.51it/s] 159it [00:17, 9.57it/s] 160it [00:17, 9.58it/s] 161it [00:17, 9.54it/s] 162it [00:17, 9.54it/s] 163it [00:17, 9.55it/s] 164it [00:17, 9.57it/s] 165it [00:17, 9.58it/s] 166it [00:17, 9.57it/s] 167it [00:17, 9.59it/s] 168it [00:18, 9.53it/s] 169it [00:18, 9.55it/s] 170it [00:18, 9.56it/s] 171it [00:18, 9.54it/s] 172it [00:18, 9.58it/s] 173it [00:18, 9.28it/s] 174it [00:18, 9.37it/s] 175it [00:18, 9.44it/s] 176it [00:18, 9.29it/s] 177it [00:19, 9.34it/s] 178it [00:19, 9.42it/s] 179it [00:19, 9.44it/s] 180it [00:19, 9.46it/s] 181it [00:19, 9.45it/s] 182it [00:19, 9.46it/s] 183it [00:19, 9.54it/s] 184it [00:19, 9.58it/s] 185it [00:19, 9.62it/s] 186it [00:19, 9.43it/s] 187it [00:20, 9.48it/s] 188it [00:20, 9.47it/s] 189it [00:20, 9.48it/s] 190it [00:20, 9.54it/s] 191it [00:20, 9.56it/s] 192it [00:20, 9.21it/s] 193it [00:20, 9.29it/s] 194it [00:20, 9.38it/s] 195it [00:20, 8.83it/s] 196it [00:21, 8.74it/s] 196it [00:21, 9.26it/s] +2025-05-26 04:04:35,363 - INFO - Epoch: 36, Objective: tensor([6148.1465], device='cuda:0', grad_fn=), Loss: 0.04331137239933014, KL/n: 71.53656005859375 + 0it [00:00, ?it/s]2025-05-26 04:04:35,621 - INFO - [Epoch 037 | Batch 0000] IWAE-loss 5157.5024 | mean log_px -0.0263 | KL -3506.90 + 1it [00:00, 5.87it/s] 2it [00:00, 7.05it/s] 4it [00:00, 8.70it/s] 6it [00:00, 9.33it/s] 8it [00:00, 9.63it/s] 9it [00:00, 9.71it/s] 11it [00:01, 9.87it/s] 13it [00:01, 9.97it/s] 15it [00:01, 10.03it/s] 17it [00:01, 10.06it/s] 19it [00:01, 10.08it/s] 21it [00:02, 10.10it/s] 23it [00:02, 10.11it/s] 25it [00:02, 10.12it/s] 27it [00:02, 10.12it/s] 29it [00:02, 10.13it/s] 31it [00:03, 10.14it/s] 33it [00:03, 10.01it/s] 35it [00:03, 10.04it/s] 37it [00:03, 10.07it/s] 39it [00:03, 10.09it/s] 41it [00:04, 10.09it/s] 43it [00:04, 10.04it/s] 45it [00:04, 10.06it/s] 47it [00:04, 10.03it/s] 49it [00:04, 9.98it/s]2025-05-26 04:04:40,605 - INFO - [Epoch 037 | Batch 0050] IWAE-loss 6418.6987 | mean log_px -0.0469 | KL -3502.43 + 51it [00:05, 9.69it/s] 52it [00:05, 9.69it/s] 53it [00:05, 9.65it/s] 54it [00:05, 9.69it/s] 56it [00:05, 9.84it/s] 58it [00:05, 9.94it/s] 60it [00:06, 10.01it/s] 62it [00:06, 10.03it/s] 64it [00:06, 10.08it/s] 66it [00:06, 10.09it/s] 68it [00:06, 9.77it/s] 70it [00:07, 9.88it/s] 72it [00:07, 9.95it/s] 74it [00:07, 10.00it/s] 76it [00:07, 10.04it/s] 78it [00:07, 10.07it/s] 80it [00:08, 10.10it/s] 82it [00:08, 10.11it/s] 84it [00:08, 10.12it/s] 86it [00:08, 10.13it/s] 88it [00:08, 10.14it/s] 90it [00:09, 10.13it/s] 92it [00:09, 9.78it/s] 94it [00:09, 9.55it/s] 95it [00:09, 9.53it/s] 96it [00:09, 9.58it/s] 97it [00:09, 9.67it/s] 98it [00:09, 9.73it/s] 100it [00:10, 9.88it/s]2025-05-26 04:04:45,662 - INFO - [Epoch 037 | Batch 0100] IWAE-loss 5038.2764 | mean log_px -0.0247 | KL -3498.83 + 101it [00:10, 9.36it/s] 103it [00:10, 9.63it/s] 104it [00:10, 9.71it/s] 105it [00:10, 9.77it/s] 107it [00:10, 9.88it/s] 109it [00:11, 9.96it/s] 110it [00:11, 9.92it/s] 112it [00:11, 9.58it/s] 114it [00:11, 9.77it/s] 116it [00:11, 9.88it/s] 118it [00:11, 9.96it/s] 120it [00:12, 9.99it/s] 122it [00:12, 10.04it/s] 124it [00:12, 10.07it/s] 126it [00:12, 10.08it/s] 128it [00:12, 10.04it/s] 130it [00:13, 10.05it/s] 132it [00:13, 9.79it/s] 134it [00:13, 9.88it/s] 135it [00:13, 9.62it/s] 137it [00:13, 9.77it/s] 138it [00:13, 9.42it/s] 140it [00:14, 9.64it/s] 141it [00:14, 9.70it/s] 142it [00:14, 9.32it/s] 144it [00:14, 9.60it/s] 145it [00:14, 9.68it/s] 147it [00:14, 9.84it/s] 149it [00:15, 9.93it/s] 150it [00:15, 9.60it/s]2025-05-26 04:04:50,774 - INFO - [Epoch 037 | Batch 0150] IWAE-loss 6093.8408 | mean log_px -0.0371 | KL -3496.12 + 151it [00:15, 9.67it/s] 153it [00:15, 9.83it/s] 155it [00:15, 9.93it/s] 157it [00:15, 9.98it/s] 159it [00:16, 10.02it/s] 161it [00:16, 10.03it/s] 163it [00:16, 10.06it/s] 165it [00:16, 10.06it/s] 167it [00:16, 9.70it/s] 168it [00:17, 9.73it/s] 169it [00:17, 9.75it/s] 170it [00:17, 9.77it/s] 171it [00:17, 9.79it/s] 173it [00:17, 9.92it/s] 175it [00:17, 9.95it/s] 177it [00:17, 10.00it/s] 179it [00:18, 10.04it/s] 181it [00:18, 10.07it/s] 183it [00:18, 10.08it/s] 185it [00:18, 9.72it/s] 186it [00:18, 9.77it/s] 187it [00:18, 9.80it/s] 189it [00:19, 9.48it/s] 190it [00:19, 9.58it/s] 191it [00:19, 9.64it/s] 193it [00:19, 9.77it/s] 194it [00:19, 9.36it/s] 195it [00:19, 9.18it/s] 196it [00:19, 9.81it/s] +2025-05-26 04:04:55,463 - INFO - Epoch: 37, Objective: tensor([7495.4062], device='cuda:0', grad_fn=), Loss: 0.06337570399045944, KL/n: 71.414794921875 + 0it [00:00, ?it/s]2025-05-26 04:04:55,929 - INFO - [Epoch 038 | Batch 0000] IWAE-loss 8049.1758 | mean log_px -0.0730 | KL -3499.70 + 1it [00:00, 2.48it/s] 2it [00:00, 4.44it/s] 3it [00:00, 5.92it/s] 4it [00:00, 6.96it/s] 5it [00:00, 7.31it/s] 7it [00:01, 8.50it/s] 8it [00:01, 8.84it/s] 9it [00:01, 8.64it/s] 10it [00:01, 8.97it/s] 12it [00:01, 9.42it/s] 13it [00:01, 9.04it/s] 14it [00:01, 9.08it/s] 15it [00:01, 9.12it/s] 16it [00:02, 9.25it/s] 17it [00:02, 9.44it/s] 18it [00:02, 9.53it/s] 19it [00:02, 9.66it/s] 20it [00:02, 9.74it/s] 21it [00:02, 9.80it/s] 22it [00:02, 9.78it/s] 23it [00:02, 9.33it/s] 24it [00:02, 9.45it/s] 25it [00:02, 9.53it/s] 26it [00:03, 9.03it/s] 27it [00:03, 9.25it/s] 29it [00:03, 9.61it/s] 30it [00:03, 9.70it/s] 32it [00:03, 9.81it/s] 34it [00:03, 9.91it/s] 36it [00:04, 9.64it/s] 38it [00:04, 9.77it/s] 39it [00:04, 9.81it/s] 40it [00:04, 9.83it/s] 41it [00:04, 9.33it/s] 42it [00:04, 8.93it/s] 43it [00:04, 8.62it/s] 44it [00:04, 8.89it/s] 46it [00:05, 9.38it/s] 48it [00:05, 9.62it/s] 49it [00:05, 9.70it/s] 50it [00:05, 9.72it/s]2025-05-26 04:05:01,214 - INFO - [Epoch 038 | Batch 0050] IWAE-loss 5952.2158 | mean log_px -0.0410 | KL -3503.08 + 51it [00:05, 9.23it/s] 52it [00:05, 9.28it/s] 53it [00:05, 9.45it/s] 54it [00:05, 9.58it/s] 56it [00:06, 9.34it/s] 57it [00:06, 9.49it/s] 58it [00:06, 9.61it/s] 60it [00:06, 9.77it/s] 61it [00:06, 9.21it/s] 62it [00:06, 9.37it/s] 63it [00:06, 9.45it/s] 65it [00:07, 9.29it/s] 66it [00:07, 9.43it/s] 68it [00:07, 9.69it/s] 69it [00:07, 9.31it/s] 70it [00:07, 9.42it/s] 72it [00:07, 9.63it/s] 73it [00:07, 9.61it/s] 74it [00:08, 9.23it/s] 75it [00:08, 9.39it/s] 77it [00:08, 9.67it/s] 78it [00:08, 9.69it/s] 79it [00:08, 9.22it/s] 80it [00:08, 9.40it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.66it/s] 83it [00:09, 9.19it/s] 84it [00:09, 9.36it/s] 86it [00:09, 9.67it/s] 88it [00:09, 9.83it/s] 89it [00:09, 9.50it/s] 90it [00:09, 9.60it/s] 92it [00:09, 9.79it/s] 94it [00:10, 9.89it/s] 95it [00:10, 9.45it/s] 97it [00:10, 9.67it/s] 98it [00:10, 9.73it/s] 100it [00:10, 9.86it/s]2025-05-26 04:05:06,457 - INFO - [Epoch 038 | Batch 0100] IWAE-loss 7382.7646 | mean log_px -0.0584 | KL -3494.08 + 101it [00:10, 9.37it/s] 102it [00:11, 9.49it/s] 103it [00:11, 9.58it/s] 104it [00:11, 9.68it/s] 105it [00:11, 9.21it/s] 106it [00:11, 9.38it/s] 107it [00:11, 9.49it/s] 108it [00:11, 9.62it/s] 109it [00:11, 9.15it/s] 111it [00:11, 9.52it/s] 112it [00:12, 9.60it/s] 113it [00:12, 9.19it/s] 114it [00:12, 9.35it/s] 115it [00:12, 9.46it/s] 116it [00:12, 9.60it/s] 118it [00:12, 9.81it/s] 120it [00:12, 9.91it/s] 121it [00:13, 9.49it/s] 123it [00:13, 9.72it/s] 125it [00:13, 9.85it/s] 127it [00:13, 9.94it/s] 129it [00:13, 9.99it/s] 130it [00:13, 9.98it/s] 131it [00:14, 9.91it/s] 133it [00:14, 9.98it/s] 135it [00:14, 10.03it/s] 137it [00:14, 9.67it/s] 139it [00:14, 9.81it/s] 140it [00:14, 9.47it/s] 141it [00:15, 9.53it/s] 142it [00:15, 9.62it/s] 143it [00:15, 9.64it/s] 144it [00:15, 9.18it/s] 145it [00:15, 9.31it/s] 146it [00:15, 9.48it/s] 147it [00:15, 9.60it/s] 148it [00:15, 9.68it/s] 149it [00:15, 9.75it/s] 150it [00:16, 9.30it/s]2025-05-26 04:05:11,669 - INFO - [Epoch 038 | Batch 0150] IWAE-loss 5241.9893 | mean log_px -0.0268 | KL -3495.52 + 151it [00:16, 9.46it/s] 153it [00:16, 9.77it/s] 155it [00:16, 9.89it/s] 156it [00:16, 9.44it/s] 158it [00:16, 9.68it/s] 160it [00:17, 9.47it/s] 162it [00:17, 9.68it/s] 163it [00:17, 9.73it/s] 164it [00:17, 9.78it/s] 165it [00:17, 9.79it/s] 167it [00:17, 9.94it/s] 168it [00:17, 9.49it/s] 170it [00:18, 9.71it/s] 172it [00:18, 9.49it/s] 174it [00:18, 9.66it/s] 176it [00:18, 9.46it/s] 178it [00:18, 9.63it/s] 179it [00:19, 9.70it/s] 180it [00:19, 9.35it/s] 181it [00:19, 9.49it/s] 183it [00:19, 9.74it/s] 184it [00:19, 9.76it/s] 185it [00:19, 9.33it/s] 187it [00:19, 9.65it/s] 189it [00:20, 9.84it/s] 191it [00:20, 9.95it/s] 193it [00:20, 10.01it/s] 195it [00:20, 9.79it/s] 196it [00:20, 9.56it/s] 196it [00:20, 9.41it/s] +2025-05-26 04:05:16,428 - INFO - Epoch: 38, Objective: tensor([6876.5137], device='cuda:0', grad_fn=), Loss: 0.05297667905688286, KL/n: 71.28185272216797 + 0it [00:00, ?it/s]2025-05-26 04:05:16,702 - INFO - [Epoch 039 | Batch 0000] IWAE-loss 6343.7041 | mean log_px -0.0524 | KL -3491.50 + 1it [00:00, 5.56it/s] 2it [00:00, 6.90it/s] 3it [00:00, 7.97it/s] 4it [00:00, 8.67it/s] 5it [00:00, 9.08it/s] 6it [00:00, 8.68it/s] 7it [00:00, 9.02it/s] 8it [00:00, 9.25it/s] 9it [00:01, 9.43it/s] 10it [00:01, 9.54it/s] 11it [00:01, 9.63it/s] 12it [00:01, 9.68it/s] 13it [00:01, 9.71it/s] 14it [00:01, 9.73it/s] 15it [00:01, 9.72it/s] 16it [00:01, 9.70it/s] 17it [00:01, 9.78it/s] 19it [00:02, 9.93it/s] 20it [00:02, 9.93it/s] 22it [00:02, 9.98it/s] 24it [00:02, 10.01it/s] 26it [00:02, 10.03it/s] 28it [00:02, 9.95it/s] 30it [00:03, 9.72it/s] 32it [00:03, 9.83it/s] 33it [00:03, 9.54it/s] 35it [00:03, 9.69it/s] 36it [00:03, 9.34it/s] 38it [00:04, 9.60it/s] 40it [00:04, 9.73it/s] 41it [00:04, 9.41it/s] 42it [00:04, 9.48it/s] 43it [00:04, 9.55it/s] 45it [00:04, 9.76it/s] 47it [00:04, 9.87it/s] 48it [00:05, 9.87it/s] 49it [00:05, 9.50it/s] 50it [00:05, 9.59it/s]2025-05-26 04:05:21,873 - INFO - [Epoch 039 | Batch 0050] IWAE-loss 5679.2578 | mean log_px -0.0351 | KL -3490.73 + 51it [00:05, 9.69it/s] 52it [00:05, 9.69it/s] 53it [00:05, 9.72it/s] 54it [00:05, 9.76it/s] 55it [00:05, 9.15it/s] 56it [00:05, 9.29it/s] 57it [00:05, 9.49it/s] 58it [00:06, 9.52it/s] 59it [00:06, 9.59it/s] 60it [00:06, 9.63it/s] 61it [00:06, 9.66it/s] 62it [00:06, 9.70it/s] 63it [00:06, 9.73it/s] 64it [00:06, 9.13it/s] 65it [00:06, 9.37it/s] 66it [00:06, 9.53it/s] 67it [00:07, 9.66it/s] 68it [00:07, 9.75it/s] 70it [00:07, 9.90it/s] 71it [00:07, 9.40it/s] 72it [00:07, 9.55it/s] 74it [00:07, 9.76it/s] 76it [00:07, 9.83it/s] 77it [00:08, 9.86it/s] 78it [00:08, 9.74it/s] 79it [00:08, 9.80it/s] 80it [00:08, 9.31it/s] 81it [00:08, 9.48it/s] 82it [00:08, 9.54it/s] 83it [00:08, 9.59it/s] 85it [00:08, 9.77it/s] 86it [00:08, 9.78it/s] 87it [00:09, 9.76it/s] 88it [00:09, 9.81it/s] 90it [00:09, 9.91it/s] 92it [00:09, 9.97it/s] 93it [00:09, 9.97it/s] 94it [00:09, 9.98it/s] 95it [00:09, 9.98it/s] 96it [00:09, 9.97it/s] 98it [00:10, 9.95it/s] 99it [00:10, 9.45it/s]2025-05-26 04:05:27,038 - INFO - [Epoch 039 | Batch 0100] IWAE-loss 5635.9746 | mean log_px -0.0364 | KL -3484.96 + 101it [00:10, 9.67it/s] 103it [00:10, 9.50it/s] 104it [00:10, 9.59it/s] 106it [00:11, 9.76it/s] 107it [00:11, 9.81it/s] 108it [00:11, 9.83it/s] 110it [00:11, 9.89it/s] 112it [00:11, 9.95it/s] 114it [00:11, 9.99it/s] 116it [00:12, 10.01it/s] 117it [00:12, 9.59it/s] 118it [00:12, 9.55it/s] 119it [00:12, 9.46it/s] 120it [00:12, 9.56it/s] 122it [00:12, 9.34it/s] 124it [00:12, 9.60it/s] 125it [00:12, 9.68it/s] 126it [00:13, 9.71it/s] 128it [00:13, 9.86it/s] 130it [00:13, 9.90it/s] 131it [00:13, 9.88it/s] 132it [00:13, 9.88it/s] 134it [00:13, 9.94it/s] 136it [00:14, 9.99it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.55it/s] 140it [00:14, 9.74it/s] 141it [00:14, 9.80it/s] 142it [00:14, 9.35it/s] 144it [00:14, 9.63it/s] 146it [00:15, 9.80it/s] 147it [00:15, 9.81it/s] 148it [00:15, 9.29it/s] 149it [00:15, 9.08it/s] 150it [00:15, 9.20it/s]2025-05-26 04:05:32,211 - INFO - [Epoch 039 | Batch 0150] IWAE-loss 6551.1885 | mean log_px -0.0438 | KL -3480.69 + 151it [00:15, 9.36it/s] 152it [00:15, 9.51it/s] 153it [00:15, 9.06it/s] 154it [00:16, 9.29it/s] 155it [00:16, 9.46it/s] 156it [00:16, 9.57it/s] 157it [00:16, 9.67it/s] 158it [00:16, 9.72it/s] 159it [00:16, 9.69it/s] 160it [00:16, 9.27it/s] 161it [00:16, 9.47it/s] 162it [00:16, 9.59it/s] 163it [00:16, 9.69it/s] 164it [00:17, 9.17it/s] 165it [00:17, 9.39it/s] 167it [00:17, 9.69it/s] 168it [00:17, 9.73it/s] 169it [00:17, 9.79it/s] 170it [00:17, 9.81it/s] 171it [00:17, 9.29it/s] 172it [00:17, 9.47it/s] 173it [00:17, 9.57it/s] 174it [00:18, 9.64it/s] 175it [00:18, 9.15it/s] 176it [00:18, 9.37it/s] 178it [00:18, 9.70it/s] 180it [00:18, 9.50it/s] 182it [00:18, 9.68it/s] 183it [00:19, 9.70it/s] 184it [00:19, 9.30it/s] 186it [00:19, 9.59it/s] 187it [00:19, 9.66it/s] 188it [00:19, 9.71it/s] 190it [00:19, 9.85it/s] 192it [00:19, 9.94it/s] 193it [00:20, 9.95it/s] 195it [00:20, 9.69it/s] 196it [00:20, 9.60it/s] +2025-05-26 04:05:36,988 - INFO - Epoch: 39, Objective: tensor([6474.6235], device='cuda:0', grad_fn=), Loss: 0.045537568628787994, KL/n: 71.1382827758789 + 0it [00:00, ?it/s]2025-05-26 04:05:37,451 - INFO - [Epoch 040 | Batch 0000] IWAE-loss 7672.9946 | mean log_px -0.0628 | KL -3483.29 + 1it [00:00, 4.57it/s] 2it [00:00, 6.70it/s] 4it [00:00, 7.98it/s] 6it [00:00, 8.83it/s] 7it [00:00, 8.68it/s] 9it [00:01, 9.21it/s] 11it [00:01, 9.14it/s] 12it [00:01, 9.30it/s] 14it [00:01, 9.57it/s] 15it [00:01, 9.24it/s] 17it [00:01, 9.54it/s] 18it [00:02, 9.20it/s] 20it [00:02, 9.48it/s] 22it [00:02, 9.66it/s] 23it [00:02, 9.31it/s] 24it [00:02, 9.44it/s] 25it [00:02, 9.56it/s] 26it [00:02, 9.65it/s] 27it [00:02, 9.70it/s] 28it [00:03, 9.32it/s] 29it [00:03, 9.50it/s] 30it [00:03, 9.56it/s] 31it [00:03, 9.05it/s] 32it [00:03, 9.30it/s] 33it [00:03, 9.49it/s] 34it [00:03, 9.61it/s] 36it [00:03, 9.41it/s] 38it [00:04, 9.63it/s] 39it [00:04, 9.25it/s] 40it [00:04, 9.40it/s] 42it [00:04, 9.67it/s] 44it [00:04, 9.41it/s] 45it [00:04, 9.52it/s] 46it [00:04, 9.45it/s] 47it [00:05, 9.57it/s] 48it [00:05, 9.67it/s] 49it [00:05, 9.31it/s] 50it [00:05, 9.45it/s]2025-05-26 04:05:42,753 - INFO - [Epoch 040 | Batch 0050] IWAE-loss 5287.8018 | mean log_px -0.0307 | KL -3482.75 + 51it [00:05, 9.55it/s] 53it [00:05, 9.32it/s] 54it [00:05, 9.47it/s] 55it [00:05, 9.60it/s] 57it [00:06, 9.79it/s] 59it [00:06, 9.89it/s] 61it [00:06, 9.53it/s] 62it [00:06, 9.61it/s] 64it [00:06, 9.77it/s] 65it [00:06, 9.39it/s] 66it [00:07, 9.52it/s] 68it [00:07, 9.30it/s] 69it [00:07, 9.44it/s] 70it [00:07, 9.55it/s] 71it [00:07, 9.64it/s] 72it [00:07, 9.22it/s] 74it [00:07, 9.55it/s] 76it [00:08, 9.74it/s] 77it [00:08, 9.42it/s] 78it [00:08, 9.53it/s] 79it [00:08, 9.63it/s] 81it [00:08, 9.37it/s] 82it [00:08, 9.51it/s] 84it [00:08, 9.72it/s] 86it [00:09, 9.48it/s] 88it [00:09, 9.66it/s] 90it [00:09, 9.79it/s] 91it [00:09, 9.43it/s] 92it [00:09, 9.54it/s] 93it [00:09, 9.64it/s] 94it [00:09, 9.68it/s] 95it [00:10, 9.75it/s] 97it [00:10, 9.88it/s] 98it [00:10, 9.40it/s] 100it [00:10, 9.63it/s]2025-05-26 04:05:47,970 - INFO - [Epoch 040 | Batch 0100] IWAE-loss 6247.6255 | mean log_px -0.0492 | KL -3478.28 + 101it [00:10, 9.71it/s] 103it [00:10, 9.42it/s] 105it [00:11, 9.64it/s] 106it [00:11, 9.70it/s] 107it [00:11, 9.29it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.59it/s] 111it [00:11, 9.78it/s] 112it [00:11, 9.36it/s] 114it [00:12, 9.60it/s] 116it [00:12, 9.38it/s] 118it [00:12, 9.60it/s] 119it [00:12, 9.67it/s] 121it [00:12, 9.42it/s] 122it [00:12, 9.52it/s] 123it [00:13, 9.62it/s] 124it [00:13, 9.71it/s] 125it [00:13, 9.26it/s] 127it [00:13, 9.59it/s] 128it [00:13, 9.66it/s] 129it [00:13, 9.74it/s] 130it [00:13, 9.81it/s] 131it [00:13, 9.40it/s] 133it [00:14, 9.67it/s] 135it [00:14, 9.82it/s] 137it [00:14, 9.53it/s] 138it [00:14, 9.60it/s] 139it [00:14, 9.69it/s] 140it [00:14, 9.26it/s] 141it [00:14, 9.43it/s] 142it [00:15, 9.56it/s] 144it [00:15, 9.33it/s] 145it [00:15, 9.48it/s] 147it [00:15, 9.29it/s] 148it [00:15, 9.43it/s] 149it [00:15, 9.54it/s] 150it [00:15, 9.63it/s]2025-05-26 04:05:53,210 - INFO - [Epoch 040 | Batch 0150] IWAE-loss 6392.1655 | mean log_px -0.0420 | KL -3472.99 + 151it [00:15, 9.69it/s] 152it [00:16, 9.31it/s] 154it [00:16, 9.61it/s] 155it [00:16, 9.69it/s] 156it [00:16, 9.17it/s] 158it [00:16, 9.51it/s] 159it [00:16, 9.60it/s] 160it [00:16, 9.69it/s] 161it [00:17, 9.26it/s] 162it [00:17, 9.45it/s] 163it [00:17, 9.59it/s] 165it [00:17, 9.33it/s] 166it [00:17, 9.48it/s] 168it [00:17, 9.28it/s] 169it [00:17, 9.43it/s] 170it [00:17, 9.54it/s] 172it [00:18, 9.31it/s] 174it [00:18, 9.58it/s] 175it [00:18, 9.65it/s] 177it [00:18, 9.41it/s] 179it [00:18, 9.62it/s] 181it [00:19, 9.78it/s] 182it [00:19, 9.47it/s] 183it [00:19, 9.57it/s] 184it [00:19, 9.65it/s] 185it [00:19, 9.24it/s] 186it [00:19, 9.40it/s] 188it [00:19, 9.67it/s] 189it [00:19, 9.27it/s] 191it [00:20, 9.58it/s] 193it [00:20, 9.76it/s] 194it [00:20, 9.47it/s] 195it [00:20, 9.28it/s] 196it [00:20, 9.44it/s] +2025-05-26 04:05:58,058 - INFO - Epoch: 40, Objective: tensor([5746.3809], device='cuda:0', grad_fn=), Loss: 0.034290388226509094, KL/n: 70.98202514648438 + 0it [00:00, ?it/s]2025-05-26 04:05:58,332 - INFO - [Epoch 041 | Batch 0000] IWAE-loss 5749.5537 | mean log_px -0.0346 | KL -3479.12 + 1it [00:00, 4.67it/s] 2it [00:00, 6.80it/s] 4it [00:00, 8.07it/s] 6it [00:00, 8.95it/s] 7it [00:00, 9.19it/s] 9it [00:01, 9.15it/s] 11it [00:01, 9.49it/s] 12it [00:01, 9.57it/s] 13it [00:01, 9.63it/s] 15it [00:01, 9.81it/s] 16it [00:01, 9.42it/s] 18it [00:01, 9.68it/s] 19it [00:02, 9.47it/s] 20it [00:02, 8.85it/s] 21it [00:02, 9.09it/s] 22it [00:02, 9.30it/s] 23it [00:02, 9.48it/s] 24it [00:02, 9.59it/s] 25it [00:02, 9.12it/s] 26it [00:02, 9.34it/s] 27it [00:02, 9.50it/s] 28it [00:03, 9.63it/s] 29it [00:03, 9.73it/s] 30it [00:03, 9.16it/s] 31it [00:03, 9.36it/s] 32it [00:03, 9.41it/s] 34it [00:03, 9.73it/s] 36it [00:03, 9.88it/s] 37it [00:03, 9.46it/s] 39it [00:04, 9.71it/s] 41it [00:04, 9.88it/s] 42it [00:04, 9.49it/s] 44it [00:04, 9.71it/s] 46it [00:04, 9.86it/s] 47it [00:05, 9.45it/s] 49it [00:05, 9.69it/s]2025-05-26 04:06:03,568 - INFO - [Epoch 041 | Batch 0050] IWAE-loss 5837.0518 | mean log_px -0.0380 | KL -3473.68 + 51it [00:05, 9.49it/s] 53it [00:05, 9.69it/s] 55it [00:05, 9.84it/s] 56it [00:05, 9.49it/s] 58it [00:06, 9.71it/s] 60it [00:06, 9.85it/s] 61it [00:06, 9.57it/s] 63it [00:06, 9.75it/s] 65it [00:06, 9.44it/s] 67it [00:07, 9.66it/s] 69it [00:07, 9.82it/s] 70it [00:07, 9.47it/s] 72it [00:07, 9.67it/s] 74it [00:07, 9.83it/s] 75it [00:07, 9.46it/s] 77it [00:08, 9.67it/s] 79it [00:08, 9.82it/s] 80it [00:08, 9.72it/s] 81it [00:08, 9.65it/s] 82it [00:08, 9.54it/s] 83it [00:08, 9.60it/s] 84it [00:08, 9.68it/s] 85it [00:08, 9.75it/s] 86it [00:09, 9.80it/s] 87it [00:09, 9.46it/s] 88it [00:09, 9.59it/s] 89it [00:09, 9.69it/s] 90it [00:09, 9.36it/s] 91it [00:09, 9.42it/s] 92it [00:09, 9.43it/s] 93it [00:09, 9.54it/s] 94it [00:09, 9.63it/s] 95it [00:09, 9.69it/s] 96it [00:10, 9.72it/s] 97it [00:10, 9.70it/s] 98it [00:10, 9.68it/s] 99it [00:10, 9.60it/s] 100it [00:10, 9.68it/s]2025-05-26 04:06:08,762 - INFO - [Epoch 041 | Batch 0100] IWAE-loss 5281.2070 | mean log_px -0.0259 | KL -3478.21 + 101it [00:10, 9.71it/s] 102it [00:10, 9.12it/s] 103it [00:10, 9.26it/s] 104it [00:10, 9.36it/s] 105it [00:11, 8.91it/s] 106it [00:11, 9.15it/s] 107it [00:11, 9.35it/s] 108it [00:11, 9.47it/s] 109it [00:11, 9.58it/s] 110it [00:11, 9.63it/s] 111it [00:11, 9.69it/s] 112it [00:11, 9.74it/s] 113it [00:11, 9.72it/s] 114it [00:12, 9.47it/s] 115it [00:12, 9.23it/s] 116it [00:12, 9.41it/s] 117it [00:12, 9.57it/s] 118it [00:12, 9.65it/s] 119it [00:12, 9.16it/s] 120it [00:12, 9.35it/s] 121it [00:12, 9.52it/s] 122it [00:12, 9.64it/s] 123it [00:12, 9.72it/s] 124it [00:13, 9.20it/s] 125it [00:13, 9.42it/s] 126it [00:13, 9.55it/s] 127it [00:13, 9.66it/s] 128it [00:13, 9.73it/s] 129it [00:13, 9.22it/s] 130it [00:13, 9.40it/s] 131it [00:13, 9.55it/s] 132it [00:13, 9.66it/s] 133it [00:13, 9.75it/s] 134it [00:14, 9.23it/s] 135it [00:14, 9.43it/s] 136it [00:14, 9.57it/s] 137it [00:14, 9.68it/s] 138it [00:14, 9.19it/s] 139it [00:14, 9.40it/s] 140it [00:14, 9.54it/s] 141it [00:14, 9.65it/s] 142it [00:14, 9.72it/s] 143it [00:15, 9.79it/s] 144it [00:15, 9.81it/s] 145it [00:15, 9.85it/s] 146it [00:15, 9.85it/s] 147it [00:15, 9.87it/s] 148it [00:15, 9.87it/s] 149it [00:15, 9.90it/s] 150it [00:15, 9.91it/s]2025-05-26 04:06:14,002 - INFO - [Epoch 041 | Batch 0150] IWAE-loss 5604.3018 | mean log_px -0.0409 | KL -3472.15 + 151it [00:15, 9.91it/s] 152it [00:15, 9.92it/s] 153it [00:16, 9.92it/s] 154it [00:16, 9.87it/s] 155it [00:16, 9.89it/s] 156it [00:16, 9.89it/s] 157it [00:16, 9.33it/s] 158it [00:16, 9.34it/s] 159it [00:16, 9.47it/s] 160it [00:16, 9.58it/s] 161it [00:16, 9.64it/s] 162it [00:17, 9.59it/s] 163it [00:17, 9.66it/s] 164it [00:17, 9.68it/s] 165it [00:17, 9.73it/s] 166it [00:17, 9.33it/s] 167it [00:17, 9.47it/s] 168it [00:17, 9.59it/s] 169it [00:17, 9.10it/s] 170it [00:17, 9.22it/s] 171it [00:17, 9.43it/s] 172it [00:18, 9.48it/s] 173it [00:18, 9.55it/s] 174it [00:18, 9.54it/s] 175it [00:18, 9.26it/s] 176it [00:18, 9.44it/s] 177it [00:18, 9.58it/s] 178it [00:18, 9.67it/s] 179it [00:18, 9.77it/s] 180it [00:18, 9.81it/s] 181it [00:18, 9.84it/s] 182it [00:19, 9.85it/s] 183it [00:19, 9.87it/s] 184it [00:19, 9.88it/s] 185it [00:19, 9.90it/s] 186it [00:19, 9.33it/s] 187it [00:19, 9.51it/s] 188it [00:19, 9.63it/s] 189it [00:19, 9.73it/s] 190it [00:19, 9.79it/s] 191it [00:20, 9.82it/s] 192it [00:20, 9.28it/s] 193it [00:20, 9.45it/s] 194it [00:20, 9.56it/s] 195it [00:20, 9.10it/s] 196it [00:20, 9.51it/s] +2025-05-26 04:06:18,806 - INFO - Epoch: 41, Objective: tensor([4431.4009], device='cuda:0', grad_fn=), Loss: 0.017086666077375412, KL/n: 70.84024810791016 + 0it [00:00, ?it/s]2025-05-26 04:06:19,262 - INFO - [Epoch 042 | Batch 0000] IWAE-loss 7730.5332 | mean log_px -0.0675 | KL -3471.14 + 1it [00:00, 5.38it/s] 2it [00:00, 7.32it/s] 3it [00:00, 8.27it/s] 4it [00:00, 8.78it/s] 5it [00:00, 9.16it/s] 6it [00:00, 9.36it/s] 7it [00:00, 9.51it/s] 8it [00:00, 9.59it/s] 9it [00:01, 9.67it/s] 10it [00:01, 9.65it/s] 11it [00:01, 9.67it/s] 12it [00:01, 9.69it/s] 13it [00:01, 9.74it/s] 14it [00:01, 9.76it/s] 15it [00:01, 9.75it/s] 16it [00:01, 9.74it/s] 17it [00:01, 9.75it/s] 18it [00:01, 9.73it/s] 19it [00:02, 9.77it/s] 20it [00:02, 9.79it/s] 21it [00:02, 9.82it/s] 22it [00:02, 9.82it/s] 23it [00:02, 9.81it/s] 24it [00:02, 9.80it/s] 25it [00:02, 9.53it/s] 26it [00:02, 9.62it/s] 27it [00:02, 9.71it/s] 28it [00:02, 9.74it/s] 29it [00:03, 9.78it/s] 30it [00:03, 9.76it/s] 31it [00:03, 9.79it/s] 32it [00:03, 9.78it/s] 33it [00:03, 9.80it/s] 34it [00:03, 9.78it/s] 35it [00:03, 9.82it/s] 36it [00:03, 9.82it/s] 37it [00:03, 9.83it/s] 38it [00:03, 9.84it/s] 39it [00:04, 9.54it/s] 40it [00:04, 9.61it/s] 41it [00:04, 9.66it/s] 42it [00:04, 9.68it/s] 43it [00:04, 9.72it/s] 44it [00:04, 9.73it/s] 45it [00:04, 9.76it/s] 46it [00:04, 9.74it/s] 47it [00:04, 9.76it/s] 48it [00:05, 9.80it/s] 49it [00:05, 9.76it/s] 50it [00:05, 9.75it/s]2025-05-26 04:06:24,389 - INFO - [Epoch 042 | Batch 0050] IWAE-loss 6543.3037 | mean log_px -0.0493 | KL -3464.77 + 51it [00:05, 9.74it/s] 52it [00:05, 9.73it/s] 53it [00:05, 9.56it/s] 54it [00:05, 9.57it/s] 55it [00:05, 9.62it/s] 56it [00:05, 9.45it/s] 57it [00:05, 9.56it/s] 58it [00:06, 9.62it/s] 59it [00:06, 9.66it/s] 60it [00:06, 9.70it/s] 61it [00:06, 9.71it/s] 62it [00:06, 9.72it/s] 63it [00:06, 9.71it/s] 64it [00:06, 9.72it/s] 65it [00:06, 9.76it/s] 66it [00:06, 9.74it/s] 67it [00:06, 9.77it/s] 68it [00:07, 9.76it/s] 69it [00:07, 9.78it/s] 70it [00:07, 9.77it/s] 71it [00:07, 9.76it/s] 72it [00:07, 9.78it/s] 73it [00:07, 9.81it/s] 74it [00:07, 9.81it/s] 75it [00:07, 9.83it/s] 76it [00:07, 9.80it/s] 77it [00:07, 9.82it/s] 78it [00:08, 9.79it/s] 79it [00:08, 9.83it/s] 80it [00:08, 9.84it/s] 81it [00:08, 9.83it/s] 82it [00:08, 9.80it/s] 83it [00:08, 9.83it/s] 84it [00:08, 9.80it/s] 85it [00:08, 9.68it/s] 86it [00:08, 9.71it/s] 87it [00:09, 9.17it/s] 88it [00:09, 9.34it/s] 89it [00:09, 9.47it/s] 90it [00:09, 9.57it/s] 91it [00:09, 9.64it/s] 92it [00:09, 9.08it/s] 93it [00:09, 9.29it/s] 94it [00:09, 9.35it/s] 95it [00:09, 9.41it/s] 96it [00:09, 9.51it/s] 97it [00:10, 9.61it/s] 98it [00:10, 9.46it/s] 99it [00:10, 9.56it/s] 100it [00:10, 9.60it/s]2025-05-26 04:06:29,577 - INFO - [Epoch 042 | Batch 0100] IWAE-loss 4768.8535 | mean log_px -0.0224 | KL -3467.10 + 101it [00:10, 9.61it/s] 102it [00:10, 9.67it/s] 103it [00:10, 9.74it/s] 104it [00:10, 9.77it/s] 105it [00:10, 9.78it/s] 106it [00:11, 9.80it/s] 107it [00:11, 9.81it/s] 108it [00:11, 9.58it/s] 109it [00:11, 9.66it/s] 110it [00:11, 9.69it/s] 111it [00:11, 9.51it/s] 112it [00:11, 9.56it/s] 113it [00:11, 9.60it/s] 114it [00:11, 9.66it/s] 115it [00:11, 9.71it/s] 116it [00:12, 9.74it/s] 117it [00:12, 9.73it/s] 118it [00:12, 9.77it/s] 119it [00:12, 9.81it/s] 120it [00:12, 9.78it/s] 121it [00:12, 9.54it/s] 122it [00:12, 9.25it/s] 123it [00:12, 9.22it/s] 124it [00:12, 9.33it/s] 125it [00:13, 9.37it/s] 126it [00:13, 9.43it/s] 127it [00:13, 9.49it/s] 128it [00:13, 9.51it/s] 129it [00:13, 9.55it/s] 130it [00:13, 9.55it/s] 131it [00:13, 9.59it/s] 132it [00:13, 9.57it/s] 133it [00:13, 9.50it/s] 134it [00:13, 9.46it/s] 135it [00:14, 9.58it/s] 136it [00:14, 9.58it/s] 137it [00:14, 9.67it/s] 138it [00:14, 9.68it/s] 139it [00:14, 9.65it/s] 140it [00:14, 9.69it/s] 141it [00:14, 9.73it/s] 142it [00:14, 9.74it/s] 143it [00:14, 9.77it/s] 144it [00:14, 9.77it/s] 145it [00:15, 9.74it/s] 146it [00:15, 9.74it/s] 147it [00:15, 9.78it/s] 148it [00:15, 9.76it/s] 149it [00:15, 9.76it/s] 150it [00:15, 9.77it/s]2025-05-26 04:06:34,764 - INFO - [Epoch 042 | Batch 0150] IWAE-loss 5339.9580 | mean log_px -0.0337 | KL -3464.08 + 151it [00:15, 9.65it/s] 152it [00:15, 9.60it/s] 153it [00:15, 9.67it/s] 154it [00:15, 9.70it/s] 155it [00:16, 9.72it/s] 156it [00:16, 9.47it/s] 157it [00:16, 9.57it/s] 158it [00:16, 9.62it/s] 159it [00:16, 9.68it/s] 160it [00:16, 9.70it/s] 161it [00:16, 9.73it/s] 162it [00:16, 9.73it/s] 163it [00:16, 9.78it/s] 164it [00:17, 9.78it/s] 165it [00:17, 9.77it/s] 166it [00:17, 9.80it/s] 167it [00:17, 9.80it/s] 168it [00:17, 9.74it/s] 169it [00:17, 9.54it/s] 170it [00:17, 9.58it/s] 171it [00:17, 9.61it/s] 172it [00:17, 9.66it/s] 173it [00:17, 9.69it/s] 174it [00:18, 9.71it/s] 175it [00:18, 9.75it/s] 176it [00:18, 9.75it/s] 177it [00:18, 9.76it/s] 178it [00:18, 9.75it/s] 179it [00:18, 9.70it/s] 180it [00:18, 9.71it/s] 181it [00:18, 9.73it/s] 182it [00:18, 9.73it/s] 183it [00:18, 9.77it/s] 184it [00:19, 9.75it/s] 185it [00:19, 9.79it/s] 186it [00:19, 9.80it/s] 187it [00:19, 9.80it/s] 188it [00:19, 9.81it/s] 189it [00:19, 9.82it/s] 190it [00:19, 9.82it/s] 191it [00:19, 9.83it/s] 192it [00:19, 9.83it/s] 193it [00:20, 9.85it/s] 194it [00:20, 9.84it/s] 195it [00:20, 9.09it/s] 196it [00:20, 8.80it/s] 196it [00:20, 9.60it/s] +2025-05-26 04:06:39,541 - INFO - Epoch: 42, Objective: tensor([5298.1240], device='cuda:0', grad_fn=), Loss: 0.0280563123524189, KL/n: 70.67806243896484 + 0it [00:00, ?it/s]2025-05-26 04:06:39,813 - INFO - [Epoch 043 | Batch 0000] IWAE-loss 4510.7559 | mean log_px -0.0216 | KL -3460.82 + 1it [00:00, 5.26it/s] 2it [00:00, 7.23it/s] 3it [00:00, 7.54it/s] 4it [00:00, 7.82it/s] 5it [00:00, 8.46it/s] 6it [00:00, 8.86it/s] 7it [00:00, 9.14it/s] 8it [00:00, 9.34it/s] 9it [00:01, 8.91it/s] 10it [00:01, 9.14it/s] 11it [00:01, 9.27it/s] 12it [00:01, 9.43it/s] 13it [00:01, 9.16it/s] 14it [00:01, 9.35it/s] 15it [00:01, 9.49it/s] 16it [00:01, 9.59it/s] 17it [00:01, 9.12it/s] 18it [00:02, 9.33it/s] 19it [00:02, 9.48it/s] 20it [00:02, 9.60it/s] 21it [00:02, 9.66it/s] 22it [00:02, 9.69it/s] 23it [00:02, 9.74it/s] 24it [00:02, 9.76it/s] 25it [00:02, 9.78it/s] 26it [00:02, 9.80it/s] 27it [00:02, 9.82it/s] 28it [00:03, 9.23it/s] 29it [00:03, 9.41it/s] 30it [00:03, 9.54it/s] 31it [00:03, 9.64it/s] 32it [00:03, 9.68it/s] 33it [00:03, 9.68it/s] 34it [00:03, 9.72it/s] 35it [00:03, 9.76it/s] 36it [00:03, 9.78it/s] 37it [00:03, 9.79it/s] 38it [00:04, 9.69it/s] 39it [00:04, 9.73it/s] 40it [00:04, 9.76it/s] 41it [00:04, 9.78it/s] 42it [00:04, 9.77it/s] 43it [00:04, 9.79it/s] 44it [00:04, 9.79it/s] 45it [00:04, 9.81it/s] 46it [00:04, 9.82it/s] 47it [00:05, 9.26it/s] 48it [00:05, 9.36it/s] 49it [00:05, 9.51it/s] 50it [00:05, 9.58it/s]2025-05-26 04:06:45,062 - INFO - [Epoch 043 | Batch 0050] IWAE-loss 4645.6123 | mean log_px -0.0196 | KL -3460.41 + 51it [00:05, 9.61it/s] 52it [00:05, 9.68it/s] 53it [00:05, 9.74it/s] 54it [00:05, 9.75it/s] 55it [00:05, 9.79it/s] 56it [00:05, 9.80it/s] 57it [00:06, 9.83it/s] 58it [00:06, 9.75it/s] 59it [00:06, 9.80it/s] 60it [00:06, 9.80it/s] 61it [00:06, 9.82it/s] 62it [00:06, 9.76it/s] 63it [00:06, 9.21it/s] 64it [00:06, 9.39it/s] 65it [00:06, 9.51it/s] 66it [00:06, 9.59it/s] 67it [00:07, 9.64it/s] 68it [00:07, 9.68it/s] 69it [00:07, 9.35it/s] 70it [00:07, 9.49it/s] 71it [00:07, 9.60it/s] 72it [00:07, 9.65it/s] 73it [00:07, 9.69it/s] 74it [00:07, 9.63it/s] 75it [00:07, 9.54it/s] 76it [00:08, 9.53it/s] 77it [00:08, 9.51it/s] 78it [00:08, 9.53it/s] 79it [00:08, 9.53it/s] 80it [00:08, 9.57it/s] 81it [00:08, 9.49it/s] 82it [00:08, 9.15it/s] 83it [00:08, 9.23it/s] 84it [00:08, 9.32it/s] 85it [00:08, 9.41it/s] 86it [00:09, 9.41it/s] 87it [00:09, 9.47it/s] 88it [00:09, 9.44it/s] 89it [00:09, 9.51it/s] 90it [00:09, 9.56it/s] 91it [00:09, 9.56it/s] 92it [00:09, 9.52it/s] 93it [00:09, 9.56it/s] 94it [00:09, 9.41it/s] 95it [00:10, 9.45it/s] 96it [00:10, 9.49it/s] 97it [00:10, 9.47it/s] 98it [00:10, 9.49it/s] 99it [00:10, 9.53it/s] 100it [00:10, 9.52it/s]2025-05-26 04:06:50,297 - INFO - [Epoch 043 | Batch 0100] IWAE-loss 7542.3433 | mean log_px -0.0583 | KL -3461.22 + 101it [00:10, 9.19it/s] 102it [00:10, 9.31it/s] 103it [00:10, 9.37it/s] 104it [00:10, 9.39it/s] 105it [00:11, 9.44it/s] 106it [00:11, 8.75it/s] 107it [00:11, 9.01it/s] 108it [00:11, 9.15it/s] 109it [00:11, 9.33it/s] 110it [00:11, 9.37it/s] 111it [00:11, 9.40it/s] 112it [00:11, 9.47it/s] 113it [00:11, 9.47it/s] 114it [00:12, 9.48it/s] 115it [00:12, 9.50it/s] 116it [00:12, 9.52it/s] 117it [00:12, 9.57it/s] 118it [00:12, 9.58it/s] 119it [00:12, 9.46it/s] 120it [00:12, 9.40it/s] 121it [00:12, 9.50it/s] 122it [00:12, 9.52it/s] 123it [00:13, 9.46it/s] 124it [00:13, 9.55it/s] 125it [00:13, 9.62it/s] 126it [00:13, 9.24it/s] 127it [00:13, 9.40it/s] 128it [00:13, 9.51it/s] 129it [00:13, 9.60it/s] 130it [00:13, 9.65it/s] 131it [00:13, 9.65it/s] 132it [00:13, 9.67it/s] 133it [00:14, 9.69it/s] 134it [00:14, 9.70it/s] 135it [00:14, 9.72it/s] 136it [00:14, 9.71it/s] 137it [00:14, 9.17it/s] 138it [00:14, 9.33it/s] 139it [00:14, 9.44it/s] 140it [00:14, 9.55it/s] 141it [00:14, 9.63it/s] 142it [00:15, 9.67it/s] 143it [00:15, 9.70it/s] 144it [00:15, 9.73it/s] 145it [00:15, 9.75it/s] 146it [00:15, 9.71it/s] 147it [00:15, 9.33it/s] 148it [00:15, 9.46it/s] 149it [00:15, 9.56it/s] 150it [00:15, 9.01it/s]2025-05-26 04:06:55,594 - INFO - [Epoch 043 | Batch 0150] IWAE-loss 4443.6572 | mean log_px -0.0191 | KL -3451.98 + 151it [00:15, 9.19it/s] 152it [00:16, 9.33it/s] 153it [00:16, 9.44it/s] 154it [00:16, 9.32it/s] 155it [00:16, 9.34it/s] 156it [00:16, 9.37it/s] 157it [00:16, 9.38it/s] 158it [00:16, 8.95it/s] 159it [00:16, 9.05it/s] 160it [00:16, 9.18it/s] 161it [00:17, 9.33it/s] 162it [00:17, 9.42it/s] 163it [00:17, 9.50it/s] 164it [00:17, 9.58it/s] 165it [00:17, 9.65it/s] 166it [00:17, 9.69it/s] 167it [00:17, 9.21it/s] 168it [00:17, 9.38it/s] 169it [00:17, 9.50it/s] 170it [00:17, 9.55it/s] 171it [00:18, 9.61it/s] 172it [00:18, 9.65it/s] 173it [00:18, 9.70it/s] 174it [00:18, 9.71it/s] 175it [00:18, 9.70it/s] 176it [00:18, 9.72it/s] 177it [00:18, 9.74it/s] 178it [00:18, 9.72it/s] 179it [00:18, 9.75it/s] 180it [00:19, 9.75it/s] 181it [00:19, 9.77it/s] 182it [00:19, 9.76it/s] 183it [00:19, 9.78it/s] 184it [00:19, 9.74it/s] 185it [00:19, 9.71it/s] 186it [00:19, 9.10it/s] 187it [00:19, 9.29it/s] 188it [00:19, 9.42it/s] 189it [00:19, 9.48it/s] 190it [00:20, 9.54it/s] 191it [00:20, 9.60it/s] 192it [00:20, 9.61it/s] 193it [00:20, 9.63it/s] 194it [00:20, 9.64it/s] 195it [00:20, 9.05it/s] 196it [00:20, 9.29it/s] 196it [00:20, 9.44it/s] +2025-05-26 04:07:00,429 - INFO - Epoch: 43, Objective: tensor([4990.5254], device='cuda:0', grad_fn=), Loss: 0.022801268845796585, KL/n: 70.53202056884766 + 0it [00:00, ?it/s]2025-05-26 04:07:00,879 - INFO - [Epoch 044 | Batch 0000] IWAE-loss 8241.9609 | mean log_px -0.0746 | KL -3451.67 + 1it [00:00, 4.72it/s] 2it [00:00, 6.78it/s] 3it [00:00, 7.90it/s] 4it [00:00, 8.53it/s] 5it [00:00, 8.33it/s] 6it [00:00, 8.74it/s] 7it [00:00, 9.05it/s] 8it [00:00, 9.21it/s] 9it [00:01, 8.70it/s] 10it [00:01, 8.97it/s] 11it [00:01, 9.14it/s] 12it [00:01, 9.26it/s] 13it [00:01, 9.40it/s] 14it [00:01, 9.27it/s] 15it [00:01, 9.40it/s] 16it [00:01, 9.47it/s] 17it [00:01, 9.54it/s] 18it [00:02, 9.46it/s] 19it [00:02, 9.53it/s] 20it [00:02, 9.50it/s] 21it [00:02, 8.70it/s] 22it [00:02, 8.57it/s] 23it [00:02, 8.70it/s] 24it [00:02, 8.43it/s] 25it [00:02, 8.76it/s] 26it [00:02, 9.01it/s] 27it [00:03, 9.18it/s] 28it [00:03, 9.27it/s] 29it [00:03, 9.37it/s] 30it [00:03, 9.44it/s] 31it [00:03, 9.51it/s] 32it [00:03, 9.30it/s] 33it [00:03, 9.32it/s] 34it [00:03, 9.40it/s] 35it [00:03, 9.16it/s] 36it [00:04, 9.29it/s] 37it [00:04, 9.39it/s] 38it [00:04, 9.46it/s] 39it [00:04, 9.54it/s] 40it [00:04, 9.55it/s] 41it [00:04, 9.58it/s] 42it [00:04, 9.61it/s] 43it [00:04, 9.63it/s] 44it [00:04, 9.65it/s] 45it [00:04, 9.67it/s] 46it [00:05, 9.28it/s] 47it [00:05, 9.40it/s] 48it [00:05, 9.47it/s] 49it [00:05, 9.53it/s] 50it [00:05, 9.56it/s]2025-05-26 04:07:06,269 - INFO - [Epoch 044 | Batch 0050] IWAE-loss 8636.9531 | mean log_px -0.0781 | KL -3454.60 + 51it [00:05, 9.57it/s] 52it [00:05, 9.57it/s] 53it [00:05, 9.45it/s] 54it [00:05, 9.50it/s] 55it [00:05, 9.51it/s] 56it [00:06, 8.99it/s] 57it [00:06, 9.18it/s] 58it [00:06, 9.18it/s] 59it [00:06, 9.13it/s] 60it [00:06, 8.49it/s] 61it [00:06, 8.81it/s] 62it [00:06, 9.03it/s] 63it [00:06, 9.21it/s] 64it [00:06, 9.33it/s] 65it [00:07, 9.43it/s] 66it [00:07, 9.48it/s] 67it [00:07, 9.48it/s] 68it [00:07, 9.39it/s] 69it [00:07, 9.11it/s] 70it [00:07, 9.15it/s] 71it [00:07, 9.29it/s] 72it [00:07, 9.38it/s] 73it [00:07, 9.42it/s] 74it [00:08, 9.47it/s] 75it [00:08, 9.52it/s] 76it [00:08, 9.54it/s] 77it [00:08, 9.57it/s] 78it [00:08, 9.60it/s] 79it [00:08, 9.55it/s] 80it [00:08, 9.57it/s] 81it [00:08, 9.49it/s] 82it [00:08, 9.52it/s] 83it [00:09, 9.54it/s] 84it [00:09, 9.43it/s] 85it [00:09, 9.50it/s] 86it [00:09, 9.38it/s] 87it [00:09, 8.85it/s] 88it [00:09, 9.08it/s] 89it [00:09, 9.19it/s] 90it [00:09, 8.79it/s] 91it [00:09, 8.99it/s] 92it [00:09, 9.17it/s] 93it [00:10, 9.30it/s] 94it [00:10, 9.02it/s] 95it [00:10, 9.08it/s] 96it [00:10, 9.23it/s] 97it [00:10, 9.34it/s] 98it [00:10, 9.41it/s] 99it [00:10, 9.48it/s] 100it [00:10, 9.53it/s]2025-05-26 04:07:11,654 - INFO - [Epoch 044 | Batch 0100] IWAE-loss 4468.0703 | mean log_px -0.0182 | KL -3448.35 + 101it [00:10, 9.40it/s] 102it [00:11, 9.45it/s] 103it [00:11, 9.49it/s] 104it [00:11, 9.54it/s] 105it [00:11, 9.57it/s] 106it [00:11, 9.59it/s] 107it [00:11, 9.60it/s] 108it [00:11, 9.58it/s] 109it [00:11, 9.61it/s] 110it [00:11, 9.61it/s] 111it [00:11, 9.64it/s] 112it [00:12, 9.65it/s] 113it [00:12, 9.63it/s] 114it [00:12, 9.64it/s] 115it [00:12, 9.64it/s] 116it [00:12, 9.64it/s] 117it [00:12, 9.63it/s] 118it [00:12, 9.64it/s] 119it [00:12, 9.64it/s] 120it [00:12, 9.64it/s] 121it [00:13, 9.52it/s] 122it [00:13, 9.40it/s] 123it [00:13, 9.33it/s] 124it [00:13, 9.42it/s] 125it [00:13, 9.50it/s] 126it [00:13, 9.48it/s] 127it [00:13, 9.53it/s] 128it [00:13, 9.50it/s] 129it [00:13, 9.42it/s] 130it [00:14, 8.92it/s] 131it [00:14, 9.12it/s] 132it [00:14, 9.26it/s] 133it [00:14, 9.37it/s] 134it [00:14, 9.44it/s] 135it [00:14, 9.51it/s] 136it [00:14, 9.54it/s] 137it [00:14, 9.57it/s] 138it [00:14, 9.59it/s] 139it [00:14, 9.62it/s] 140it [00:15, 9.62it/s] 141it [00:15, 9.64it/s] 142it [00:15, 8.95it/s] 143it [00:15, 9.14it/s] 144it [00:15, 9.28it/s] 145it [00:15, 9.39it/s] 146it [00:15, 9.45it/s] 147it [00:15, 8.97it/s] 148it [00:15, 9.16it/s] 149it [00:16, 9.32it/s] 150it [00:16, 9.31it/s]2025-05-26 04:07:16,944 - INFO - [Epoch 044 | Batch 0150] IWAE-loss 5638.1201 | mean log_px -0.0363 | KL -3448.95 + 151it [00:16, 9.28it/s] 152it [00:16, 9.30it/s] 153it [00:16, 9.33it/s] 154it [00:16, 9.39it/s] 155it [00:16, 9.42it/s] 156it [00:16, 9.45it/s] 157it [00:16, 9.48it/s] 158it [00:16, 9.50it/s] 159it [00:17, 9.51it/s] 160it [00:17, 9.49it/s] 161it [00:17, 9.54it/s] 162it [00:17, 9.56it/s] 163it [00:17, 9.45it/s] 164it [00:17, 9.48it/s] 165it [00:17, 9.48it/s] 166it [00:17, 9.48it/s] 167it [00:17, 9.33it/s] 168it [00:18, 9.36it/s] 169it [00:18, 9.51it/s] 170it [00:18, 9.59it/s] 171it [00:18, 9.67it/s] 172it [00:18, 9.73it/s] 173it [00:18, 9.78it/s] 174it [00:18, 9.80it/s] 175it [00:18, 9.80it/s] 176it [00:18, 9.79it/s] 177it [00:18, 9.80it/s] 178it [00:19, 9.81it/s] 179it [00:19, 9.82it/s] 180it [00:19, 9.75it/s] 181it [00:19, 9.76it/s] 182it [00:19, 9.76it/s] 183it [00:19, 9.77it/s] 184it [00:19, 9.79it/s] 185it [00:19, 9.80it/s] 186it [00:19, 9.80it/s] 187it [00:19, 9.80it/s] 188it [00:20, 9.79it/s] 189it [00:20, 9.78it/s] 190it [00:20, 9.80it/s] 191it [00:20, 9.82it/s] 192it [00:20, 9.81it/s] 193it [00:20, 9.81it/s] 194it [00:20, 9.81it/s] 195it [00:20, 9.27it/s] 196it [00:20, 9.35it/s] +2025-05-26 04:07:21,704 - INFO - Epoch: 44, Objective: tensor([5709.1240], device='cuda:0', grad_fn=), Loss: 0.03686925023794174, KL/n: 70.38143920898438 + 0it [00:00, ?it/s]2025-05-26 04:07:21,978 - INFO - [Epoch 045 | Batch 0000] IWAE-loss 6154.7354 | mean log_px -0.0426 | KL -3452.68 + 1it [00:00, 4.82it/s] 2it [00:00, 6.90it/s] 3it [00:00, 8.03it/s] 4it [00:00, 8.17it/s] 5it [00:00, 8.73it/s] 6it [00:00, 9.09it/s] 7it [00:00, 9.36it/s] 8it [00:00, 9.53it/s] 9it [00:01, 9.65it/s] 10it [00:01, 9.74it/s] 11it [00:01, 9.80it/s] 12it [00:01, 9.82it/s] 13it [00:01, 9.86it/s] 14it [00:01, 9.86it/s] 15it [00:01, 9.89it/s] 16it [00:01, 9.89it/s] 17it [00:01, 9.89it/s] 18it [00:01, 9.88it/s] 19it [00:02, 9.88it/s] 20it [00:02, 9.88it/s] 21it [00:02, 9.88it/s] 22it [00:02, 9.89it/s] 23it [00:02, 9.89it/s] 24it [00:02, 9.88it/s] 25it [00:02, 9.90it/s] 26it [00:02, 9.90it/s] 27it [00:02, 9.90it/s] 28it [00:02, 9.89it/s] 29it [00:03, 9.90it/s] 30it [00:03, 9.85it/s] 31it [00:03, 9.11it/s] 32it [00:03, 9.27it/s] 33it [00:03, 9.45it/s] 34it [00:03, 8.97it/s] 35it [00:03, 9.24it/s] 36it [00:03, 9.33it/s] 37it [00:03, 9.50it/s] 38it [00:04, 9.59it/s] 39it [00:04, 9.69it/s] 40it [00:04, 9.26it/s] 41it [00:04, 9.42it/s] 42it [00:04, 9.53it/s] 43it [00:04, 8.95it/s] 44it [00:04, 9.15it/s] 45it [00:04, 9.32it/s] 46it [00:04, 9.44it/s] 47it [00:04, 9.56it/s] 48it [00:05, 9.64it/s] 49it [00:05, 9.71it/s] 50it [00:05, 9.77it/s]2025-05-26 04:07:27,186 - INFO - [Epoch 045 | Batch 0050] IWAE-loss 4413.5903 | mean log_px -0.0159 | KL -3443.76 + 51it [00:05, 9.79it/s] 52it [00:05, 9.21it/s] 53it [00:05, 9.41it/s] 54it [00:05, 9.53it/s] 55it [00:05, 9.64it/s] 56it [00:05, 9.71it/s] 57it [00:06, 9.78it/s] 58it [00:06, 9.83it/s] 59it [00:06, 9.86it/s] 60it [00:06, 9.87it/s] 61it [00:06, 9.88it/s] 62it [00:06, 9.88it/s] 63it [00:06, 9.86it/s] 64it [00:06, 9.88it/s] 65it [00:06, 9.88it/s] 66it [00:06, 9.90it/s] 67it [00:07, 9.89it/s] 68it [00:07, 9.90it/s] 69it [00:07, 9.91it/s] 70it [00:07, 9.91it/s] 71it [00:07, 9.90it/s] 72it [00:07, 9.28it/s] 73it [00:07, 9.46it/s] 74it [00:07, 9.59it/s] 75it [00:07, 9.69it/s] 76it [00:07, 9.75it/s] 77it [00:08, 9.81it/s] 78it [00:08, 9.85it/s] 79it [00:08, 9.87it/s] 80it [00:08, 9.87it/s] 81it [00:08, 9.87it/s] 82it [00:08, 9.87it/s] 83it [00:08, 9.88it/s] 84it [00:08, 9.90it/s] 85it [00:08, 9.91it/s] 86it [00:08, 9.64it/s] 87it [00:09, 9.25it/s] 88it [00:09, 9.40it/s] 89it [00:09, 9.55it/s] 90it [00:09, 9.64it/s] 91it [00:09, 9.01it/s] 92it [00:09, 9.20it/s] 93it [00:09, 9.33it/s] 94it [00:09, 9.43it/s] 95it [00:09, 9.55it/s] 96it [00:10, 9.65it/s] 97it [00:10, 9.72it/s] 98it [00:10, 9.64it/s] 99it [00:10, 9.64it/s] 100it [00:10, 9.65it/s]2025-05-26 04:07:32,356 - INFO - [Epoch 045 | Batch 0100] IWAE-loss 5534.2393 | mean log_px -0.0361 | KL -3439.78 + 101it [00:10, 9.64it/s] 102it [00:10, 9.66it/s] 103it [00:10, 9.74it/s] 104it [00:10, 9.18it/s] 105it [00:10, 9.38it/s] 106it [00:11, 9.53it/s] 107it [00:11, 9.64it/s] 108it [00:11, 9.71it/s] 109it [00:11, 9.78it/s] 110it [00:11, 9.82it/s] 111it [00:11, 9.86it/s] 112it [00:11, 9.89it/s] 113it [00:11, 9.91it/s] 114it [00:11, 9.41it/s] 115it [00:12, 9.56it/s] 116it [00:12, 9.64it/s] 117it [00:12, 9.72it/s] 118it [00:12, 9.73it/s] 119it [00:12, 9.79it/s] 120it [00:12, 9.81it/s] 121it [00:12, 9.78it/s] 122it [00:12, 9.64it/s] 123it [00:12, 9.50it/s] 124it [00:12, 9.50it/s] 125it [00:13, 9.62it/s] 126it [00:13, 9.68it/s] 127it [00:13, 9.77it/s] 128it [00:13, 9.82it/s] 129it [00:13, 9.86it/s] 130it [00:13, 9.86it/s] 131it [00:13, 9.88it/s] 132it [00:13, 9.87it/s] 133it [00:13, 9.25it/s] 134it [00:13, 9.41it/s] 135it [00:14, 9.56it/s] 136it [00:14, 9.64it/s] 137it [00:14, 9.70it/s] 138it [00:14, 9.66it/s] 139it [00:14, 9.73it/s] 140it [00:14, 9.15it/s] 141it [00:14, 9.38it/s] 142it [00:14, 9.39it/s] 143it [00:14, 9.48it/s] 144it [00:15, 9.54it/s] 145it [00:15, 9.66it/s] 146it [00:15, 9.73it/s] 147it [00:15, 9.76it/s] 148it [00:15, 9.78it/s] 149it [00:15, 9.18it/s] 150it [00:15, 9.36it/s]2025-05-26 04:07:37,559 - INFO - [Epoch 045 | Batch 0150] IWAE-loss 5436.4814 | mean log_px -0.0340 | KL -3438.98 + 151it [00:15, 9.42it/s] 152it [00:15, 9.46it/s] 153it [00:15, 9.51it/s] 154it [00:16, 9.54it/s] 155it [00:16, 9.53it/s] 156it [00:16, 9.53it/s] 157it [00:16, 9.48it/s] 158it [00:16, 9.46it/s] 159it [00:16, 9.48it/s] 160it [00:16, 9.46it/s] 161it [00:16, 9.49it/s] 162it [00:16, 9.46it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.53it/s] 165it [00:17, 9.51it/s] 166it [00:17, 9.53it/s] 167it [00:17, 9.53it/s] 168it [00:17, 9.48it/s] 169it [00:17, 9.44it/s] 170it [00:17, 9.48it/s] 171it [00:17, 9.41it/s] 172it [00:17, 9.46it/s] 173it [00:18, 9.50it/s] 174it [00:18, 9.51it/s] 175it [00:18, 9.57it/s] 176it [00:18, 9.48it/s] 177it [00:18, 9.30it/s] 178it [00:18, 9.35it/s] 179it [00:18, 9.42it/s] 180it [00:18, 9.44it/s] 181it [00:18, 9.44it/s] 182it [00:19, 9.44it/s] 183it [00:19, 9.44it/s] 184it [00:19, 9.46it/s] 185it [00:19, 9.51it/s] 186it [00:19, 9.57it/s] 187it [00:19, 9.53it/s] 188it [00:19, 9.52it/s] 189it [00:19, 9.51it/s] 190it [00:19, 9.49it/s] 191it [00:19, 9.43it/s] 192it [00:20, 9.45it/s] 193it [00:20, 9.44it/s] 194it [00:20, 9.42it/s] 195it [00:20, 8.91it/s] 196it [00:20, 9.17it/s] 196it [00:20, 9.52it/s] +2025-05-26 04:07:42,423 - INFO - Epoch: 45, Objective: tensor([5079.6650], device='cuda:0', grad_fn=), Loss: 0.031979966908693314, KL/n: 70.21158599853516 + 0it [00:00, ?it/s]2025-05-26 04:07:42,712 - INFO - [Epoch 046 | Batch 0000] IWAE-loss 4801.6733 | mean log_px -0.0225 | KL -3436.86 + 1it [00:00, 4.40it/s] 2it [00:00, 6.46it/s] 3it [00:00, 7.59it/s] 4it [00:00, 8.26it/s] 5it [00:00, 8.70it/s] 6it [00:00, 8.97it/s] 7it [00:00, 9.16it/s] 8it [00:00, 9.30it/s] 9it [00:01, 9.38it/s] 10it [00:01, 9.39it/s] 11it [00:01, 9.47it/s] 12it [00:01, 9.54it/s] 13it [00:01, 9.53it/s] 14it [00:01, 9.53it/s] 15it [00:01, 9.56it/s] 16it [00:01, 9.59it/s] 17it [00:01, 9.64it/s] 18it [00:01, 9.65it/s] 19it [00:02, 9.54it/s] 20it [00:02, 6.16it/s] 21it [00:02, 6.90it/s] 22it [00:02, 7.52it/s] 23it [00:02, 8.03it/s] 24it [00:02, 8.40it/s] 25it [00:02, 8.73it/s] 26it [00:03, 8.96it/s] 27it [00:03, 8.62it/s] 28it [00:03, 8.81it/s] 29it [00:03, 9.00it/s] 30it [00:03, 9.10it/s] 31it [00:03, 9.25it/s] 32it [00:03, 9.37it/s] 33it [00:03, 9.42it/s] 34it [00:03, 9.43it/s] 35it [00:04, 9.05it/s] 36it [00:04, 9.10it/s] 37it [00:04, 9.24it/s] 38it [00:04, 9.32it/s] 39it [00:04, 9.38it/s] 40it [00:04, 9.40it/s] 41it [00:04, 9.43it/s] 42it [00:04, 9.46it/s] 43it [00:04, 9.53it/s] 44it [00:04, 9.56it/s] 45it [00:05, 9.56it/s] 46it [00:05, 9.53it/s] 47it [00:05, 9.53it/s] 48it [00:05, 9.54it/s] 49it [00:05, 9.56it/s] 50it [00:05, 8.84it/s]2025-05-26 04:07:48,235 - INFO - [Epoch 046 | Batch 0050] IWAE-loss 4658.3813 | mean log_px -0.0175 | KL -3431.65 + 51it [00:05, 9.01it/s] 52it [00:05, 9.17it/s] 53it [00:05, 9.28it/s] 54it [00:06, 9.37it/s] 55it [00:06, 9.41it/s] 56it [00:06, 9.45it/s] 57it [00:06, 9.44it/s] 58it [00:06, 9.42it/s] 59it [00:06, 9.44it/s] 60it [00:06, 9.47it/s] 61it [00:06, 9.48it/s] 62it [00:06, 9.49it/s] 63it [00:06, 9.54it/s] 64it [00:07, 9.61it/s] 65it [00:07, 9.58it/s] 66it [00:07, 9.62it/s] 67it [00:07, 9.60it/s] 68it [00:07, 9.60it/s] 69it [00:07, 9.60it/s] 70it [00:07, 9.61it/s] 71it [00:07, 9.60it/s] 72it [00:07, 9.60it/s] 73it [00:08, 9.62it/s] 74it [00:08, 9.59it/s] 75it [00:08, 9.60it/s] 76it [00:08, 9.57it/s] 77it [00:08, 9.50it/s] 78it [00:08, 9.51it/s] 79it [00:08, 9.54it/s] 80it [00:08, 9.56it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.54it/s] 83it [00:09, 9.48it/s] 84it [00:09, 9.49it/s] 85it [00:09, 9.48it/s] 86it [00:09, 9.48it/s] 87it [00:09, 9.55it/s] 88it [00:09, 9.56it/s] 89it [00:09, 9.58it/s] 90it [00:09, 9.22it/s] 91it [00:09, 9.38it/s] 92it [00:10, 9.40it/s] 93it [00:10, 9.40it/s] 94it [00:10, 9.42it/s] 95it [00:10, 9.50it/s] 96it [00:10, 9.51it/s] 97it [00:10, 9.51it/s] 98it [00:10, 9.53it/s] 99it [00:10, 9.58it/s] 100it [00:10, 9.58it/s]2025-05-26 04:07:53,484 - INFO - [Epoch 046 | Batch 0100] IWAE-loss 5551.6338 | mean log_px -0.0332 | KL -3436.21 + 101it [00:10, 9.55it/s] 102it [00:11, 9.56it/s] 103it [00:11, 9.63it/s] 104it [00:11, 9.66it/s] 105it [00:11, 9.66it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.56it/s] 108it [00:11, 9.61it/s] 109it [00:11, 9.58it/s] 110it [00:11, 9.58it/s] 111it [00:12, 9.58it/s] 112it [00:12, 9.59it/s] 113it [00:12, 9.61it/s] 114it [00:12, 9.63it/s] 115it [00:12, 9.63it/s] 116it [00:12, 9.52it/s] 117it [00:12, 9.19it/s] 118it [00:12, 9.26it/s] 119it [00:12, 9.37it/s] 120it [00:12, 9.40it/s] 121it [00:13, 9.46it/s] 122it [00:13, 9.02it/s] 123it [00:13, 9.16it/s] 124it [00:13, 9.24it/s] 125it [00:13, 9.31it/s] 126it [00:13, 9.40it/s] 127it [00:13, 9.48it/s] 128it [00:13, 9.49it/s] 129it [00:13, 9.47it/s] 130it [00:14, 9.48it/s] 131it [00:14, 9.58it/s] 132it [00:14, 9.61it/s] 133it [00:14, 9.57it/s] 134it [00:14, 9.58it/s] 135it [00:14, 9.61it/s] 136it [00:14, 9.63it/s] 137it [00:14, 9.09it/s] 138it [00:14, 9.23it/s] 139it [00:14, 9.35it/s] 140it [00:15, 9.41it/s] 141it [00:15, 9.40it/s] 142it [00:15, 9.44it/s] 143it [00:15, 9.44it/s] 144it [00:15, 9.50it/s] 145it [00:15, 9.04it/s] 146it [00:15, 9.14it/s] 147it [00:15, 9.23it/s] 148it [00:15, 9.27it/s] 149it [00:16, 9.30it/s] 150it [00:16, 9.40it/s]2025-05-26 04:07:58,785 - INFO - [Epoch 046 | Batch 0150] IWAE-loss 5915.6621 | mean log_px -0.0405 | KL -3435.87 + 151it [00:16, 9.46it/s] 152it [00:16, 9.42it/s] 153it [00:16, 9.48it/s] 154it [00:16, 9.56it/s] 155it [00:16, 9.62it/s] 156it [00:16, 9.63it/s] 157it [00:16, 9.60it/s] 158it [00:17, 9.18it/s] 159it [00:17, 9.24it/s] 160it [00:17, 9.32it/s] 161it [00:17, 9.38it/s] 162it [00:17, 9.37it/s] 163it [00:17, 9.43it/s] 164it [00:17, 9.39it/s] 165it [00:17, 9.49it/s] 166it [00:17, 9.48it/s] 167it [00:17, 9.54it/s] 168it [00:18, 9.49it/s] 169it [00:18, 9.51it/s] 170it [00:18, 9.52it/s] 171it [00:18, 9.52it/s] 172it [00:18, 9.56it/s] 173it [00:18, 9.57it/s] 174it [00:18, 9.57it/s] 175it [00:18, 9.55it/s] 176it [00:18, 9.55it/s] 177it [00:19, 9.57it/s] 178it [00:19, 9.54it/s] 179it [00:19, 9.20it/s] 180it [00:19, 9.31it/s] 181it [00:19, 9.39it/s] 182it [00:19, 9.45it/s] 183it [00:19, 9.47it/s] 184it [00:19, 9.49it/s] 185it [00:19, 9.13it/s] 186it [00:19, 9.25it/s] 187it [00:20, 8.84it/s] 188it [00:20, 9.04it/s] 189it [00:20, 9.16it/s] 190it [00:20, 9.26it/s] 191it [00:20, 8.86it/s] 192it [00:20, 9.05it/s] 193it [00:20, 9.19it/s] 194it [00:20, 9.26it/s] 195it [00:20, 8.77it/s] 196it [00:21, 9.05it/s] 196it [00:21, 9.27it/s] +2025-05-26 04:08:03,696 - INFO - Epoch: 46, Objective: tensor([5599.3286], device='cuda:0', grad_fn=), Loss: 0.028604112565517426, KL/n: 70.04393768310547 + 0it [00:00, ?it/s]2025-05-26 04:08:03,969 - INFO - [Epoch 047 | Batch 0000] IWAE-loss 6606.0967 | mean log_px -0.0507 | KL -3426.96 + 1it [00:00, 4.83it/s] 2it [00:00, 6.88it/s] 3it [00:00, 7.85it/s] 4it [00:00, 8.47it/s] 5it [00:00, 8.76it/s] 6it [00:00, 8.40it/s] 7it [00:00, 8.52it/s] 8it [00:00, 8.73it/s] 9it [00:01, 8.97it/s] 10it [00:01, 8.57it/s] 11it [00:01, 8.88it/s] 12it [00:01, 9.05it/s] 13it [00:01, 9.18it/s] 14it [00:01, 9.28it/s] 15it [00:01, 9.36it/s] 16it [00:01, 8.87it/s] 17it [00:01, 8.96it/s] 18it [00:02, 8.89it/s] 19it [00:02, 8.85it/s] 20it [00:02, 8.96it/s] 21it [00:02, 9.13it/s] 22it [00:02, 9.27it/s] 23it [00:02, 9.37it/s] 24it [00:02, 9.40it/s] 25it [00:02, 9.44it/s] 26it [00:02, 9.47it/s] 27it [00:03, 9.48it/s] 28it [00:03, 9.51it/s] 29it [00:03, 9.49it/s] 30it [00:03, 8.95it/s] 31it [00:03, 9.10it/s] 32it [00:03, 9.22it/s] 33it [00:03, 9.25it/s] 34it [00:03, 9.33it/s] 35it [00:03, 9.45it/s] 36it [00:04, 9.46it/s] 37it [00:04, 9.52it/s] 38it [00:04, 9.48it/s] 39it [00:04, 9.50it/s] 40it [00:04, 9.43it/s] 41it [00:04, 9.46it/s] 42it [00:04, 9.49it/s] 43it [00:04, 9.46it/s] 44it [00:04, 9.44it/s] 45it [00:04, 9.41it/s] 46it [00:05, 9.46it/s] 47it [00:05, 9.46it/s] 48it [00:05, 9.47it/s] 49it [00:05, 8.90it/s] 50it [00:05, 9.04it/s]2025-05-26 04:08:09,407 - INFO - [Epoch 047 | Batch 0050] IWAE-loss 5071.6953 | mean log_px -0.0309 | KL -3429.48 + 51it [00:05, 9.12it/s] 52it [00:05, 9.16it/s] 53it [00:05, 9.29it/s] 54it [00:05, 9.38it/s] 55it [00:06, 9.39it/s] 56it [00:06, 9.36it/s] 57it [00:06, 9.31it/s] 58it [00:06, 9.08it/s] 59it [00:06, 9.23it/s] 60it [00:06, 9.33it/s] 61it [00:06, 9.41it/s] 62it [00:06, 9.45it/s] 63it [00:06, 9.40it/s] 64it [00:07, 9.40it/s] 65it [00:07, 9.39it/s] 66it [00:07, 9.33it/s] 67it [00:07, 9.39it/s] 68it [00:07, 9.25it/s] 69it [00:07, 9.15it/s] 70it [00:07, 9.26it/s] 71it [00:07, 9.35it/s] 72it [00:07, 9.40it/s] 73it [00:07, 9.39it/s] 74it [00:08, 9.37it/s] 75it [00:08, 9.34it/s] 76it [00:08, 9.32it/s] 77it [00:08, 9.37it/s] 78it [00:08, 9.37it/s] 79it [00:08, 9.38it/s] 80it [00:08, 9.44it/s] 81it [00:08, 9.44it/s] 82it [00:08, 9.43it/s] 83it [00:09, 9.40it/s] 84it [00:09, 9.42it/s] 85it [00:09, 9.45it/s] 86it [00:09, 9.39it/s] 87it [00:09, 9.39it/s] 88it [00:09, 9.41it/s] 89it [00:09, 9.44it/s] 90it [00:09, 9.38it/s] 91it [00:09, 9.42it/s] 92it [00:09, 9.46it/s] 93it [00:10, 8.94it/s] 94it [00:10, 9.03it/s] 95it [00:10, 8.98it/s] 96it [00:10, 8.84it/s] 97it [00:10, 9.07it/s] 98it [00:10, 9.21it/s] 99it [00:10, 9.33it/s] 100it [00:10, 9.43it/s]2025-05-26 04:08:14,764 - INFO - [Epoch 047 | Batch 0100] IWAE-loss 4540.6260 | mean log_px -0.0246 | KL -3428.07 + 101it [00:10, 9.47it/s] 102it [00:11, 9.46it/s] 103it [00:11, 9.45it/s] 104it [00:11, 9.51it/s] 105it [00:11, 9.58it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.59it/s] 108it [00:11, 9.62it/s] 109it [00:11, 9.62it/s] 110it [00:11, 9.62it/s] 111it [00:12, 9.65it/s] 112it [00:12, 9.68it/s] 113it [00:12, 9.67it/s] 114it [00:12, 9.64it/s] 115it [00:12, 9.58it/s] 116it [00:12, 9.59it/s] 117it [00:12, 9.64it/s] 118it [00:12, 9.66it/s] 119it [00:12, 9.69it/s] 120it [00:12, 9.49it/s] 121it [00:13, 9.55it/s] 122it [00:13, 9.53it/s] 123it [00:13, 9.56it/s] 124it [00:13, 9.59it/s] 125it [00:13, 9.60it/s] 126it [00:13, 9.54it/s] 127it [00:13, 9.27it/s] 128it [00:13, 9.33it/s] 129it [00:13, 9.39it/s] 130it [00:14, 9.43it/s] 131it [00:14, 9.48it/s] 132it [00:14, 9.53it/s] 133it [00:14, 9.55it/s] 134it [00:14, 9.55it/s] 135it [00:14, 9.54it/s] 136it [00:14, 9.57it/s] 137it [00:14, 9.57it/s] 138it [00:14, 9.58it/s] 139it [00:14, 9.58it/s] 140it [00:15, 9.58it/s] 141it [00:15, 9.57it/s] 142it [00:15, 9.57it/s] 143it [00:15, 9.56it/s] 144it [00:15, 9.57it/s] 145it [00:15, 9.56it/s] 146it [00:15, 9.52it/s] 147it [00:15, 9.56it/s] 148it [00:15, 9.58it/s] 149it [00:15, 9.58it/s] 150it [00:16, 9.47it/s]2025-05-26 04:08:20,000 - INFO - [Epoch 047 | Batch 0150] IWAE-loss 4956.0400 | mean log_px -0.0260 | KL -3420.03 + 151it [00:16, 9.20it/s] 152it [00:16, 9.30it/s] 153it [00:16, 9.38it/s] 154it [00:16, 9.43it/s] 155it [00:16, 9.24it/s] 156it [00:16, 9.33it/s] 157it [00:16, 9.43it/s] 158it [00:16, 9.27it/s] 159it [00:17, 9.36it/s] 160it [00:17, 9.46it/s] 161it [00:17, 9.51it/s] 162it [00:17, 9.54it/s] 163it [00:17, 9.59it/s] 164it [00:17, 9.60it/s] 165it [00:17, 9.61it/s] 166it [00:17, 9.62it/s] 167it [00:17, 9.53it/s] 168it [00:18, 9.54it/s] 169it [00:18, 9.58it/s] 170it [00:18, 9.57it/s] 171it [00:18, 9.52it/s] 172it [00:18, 9.50it/s] 173it [00:18, 9.48it/s] 174it [00:18, 9.45it/s] 175it [00:18, 9.34it/s] 176it [00:18, 9.40it/s] 177it [00:18, 9.43it/s] 178it [00:19, 9.50it/s] 179it [00:19, 9.53it/s] 180it [00:19, 9.52it/s] 181it [00:19, 9.53it/s] 182it [00:19, 9.54it/s] 183it [00:19, 9.57it/s] 184it [00:19, 9.57it/s] 185it [00:19, 9.58it/s] 186it [00:19, 9.57it/s] 187it [00:20, 9.57it/s] 188it [00:20, 9.56it/s] 189it [00:20, 9.58it/s] 190it [00:20, 9.59it/s] 191it [00:20, 9.58it/s] 192it [00:20, 9.54it/s] 193it [00:20, 9.56it/s] 194it [00:20, 9.33it/s] 195it [00:20, 8.96it/s] 196it [00:21, 9.32it/s] +2025-05-26 04:08:24,858 - INFO - Epoch: 47, Objective: tensor([5860.7812], device='cuda:0', grad_fn=), Loss: 0.03282099589705467, KL/n: 69.88233184814453 + 0it [00:00, ?it/s]2025-05-26 04:08:25,130 - INFO - [Epoch 048 | Batch 0000] IWAE-loss 4398.5654 | mean log_px -0.0148 | KL -3425.91 + 1it [00:00, 4.63it/s] 2it [00:00, 6.49it/s] 3it [00:00, 7.43it/s] 4it [00:00, 8.05it/s] 5it [00:00, 7.96it/s] 6it [00:00, 8.33it/s] 7it [00:00, 8.58it/s] 8it [00:01, 8.67it/s] 9it [00:01, 8.29it/s] 10it [00:01, 5.70it/s] 11it [00:01, 6.49it/s] 12it [00:01, 7.13it/s] 13it [00:01, 7.70it/s] 14it [00:01, 8.11it/s] 15it [00:01, 8.47it/s] 16it [00:02, 8.24it/s] 17it [00:02, 8.59it/s] 18it [00:02, 8.77it/s] 19it [00:02, 8.97it/s] 20it [00:02, 8.59it/s] 21it [00:02, 8.81it/s] 22it [00:02, 8.98it/s] 23it [00:02, 9.10it/s] 24it [00:02, 9.24it/s] 25it [00:03, 8.76it/s] 26it [00:03, 8.92it/s] 27it [00:03, 9.07it/s] 28it [00:03, 9.14it/s] 29it [00:03, 9.17it/s] 30it [00:03, 9.24it/s] 31it [00:03, 8.87it/s] 32it [00:03, 9.03it/s] 33it [00:03, 9.16it/s] 34it [00:04, 9.21it/s] 35it [00:04, 9.28it/s] 36it [00:04, 9.29it/s] 37it [00:04, 9.39it/s] 38it [00:04, 9.39it/s] 39it [00:04, 9.30it/s] 40it [00:04, 8.86it/s] 41it [00:04, 9.09it/s] 42it [00:04, 9.21it/s] 43it [00:05, 9.28it/s] 44it [00:05, 9.38it/s] 45it [00:05, 9.40it/s] 46it [00:05, 9.41it/s] 47it [00:05, 9.45it/s] 48it [00:05, 9.48it/s] 49it [00:05, 9.55it/s] 50it [00:05, 9.48it/s]2025-05-26 04:08:30,830 - INFO - [Epoch 048 | Batch 0050] IWAE-loss 5411.3506 | mean log_px -0.0329 | KL -3426.38 + 51it [00:05, 9.45it/s] 52it [00:05, 9.41it/s] 53it [00:06, 9.45it/s] 54it [00:06, 9.50it/s] 55it [00:06, 9.54it/s] 56it [00:06, 8.96it/s] 57it [00:06, 9.13it/s] 58it [00:06, 9.25it/s] 59it [00:06, 9.30it/s] 60it [00:06, 9.37it/s] 61it [00:06, 9.42it/s] 62it [00:07, 9.44it/s] 63it [00:07, 9.45it/s] 64it [00:07, 9.53it/s] 65it [00:07, 9.56it/s] 66it [00:07, 9.54it/s] 67it [00:07, 9.57it/s] 68it [00:07, 9.57it/s] 69it [00:07, 9.00it/s] 70it [00:07, 9.16it/s] 71it [00:08, 9.28it/s] 72it [00:08, 9.34it/s] 73it [00:08, 9.41it/s] 74it [00:08, 9.43it/s] 75it [00:08, 9.47it/s] 76it [00:08, 9.54it/s] 77it [00:08, 9.59it/s] 78it [00:08, 9.58it/s] 79it [00:08, 9.63it/s] 80it [00:08, 9.50it/s] 81it [00:09, 9.47it/s] 82it [00:09, 9.51it/s] 83it [00:09, 9.55it/s] 84it [00:09, 9.53it/s] 85it [00:09, 9.54it/s] 86it [00:09, 9.57it/s] 87it [00:09, 9.57it/s] 88it [00:09, 9.57it/s] 89it [00:09, 9.55it/s] 90it [00:10, 9.50it/s] 91it [00:10, 9.52it/s] 92it [00:10, 9.55it/s] 93it [00:10, 9.56it/s] 94it [00:10, 9.56it/s] 95it [00:10, 9.56it/s] 96it [00:10, 9.58it/s] 97it [00:10, 9.56it/s] 98it [00:10, 8.98it/s] 99it [00:10, 9.13it/s] 100it [00:11, 9.27it/s]2025-05-26 04:08:36,134 - INFO - [Epoch 048 | Batch 0100] IWAE-loss 5481.2749 | mean log_px -0.0403 | KL -3417.41 + 101it [00:11, 9.33it/s] 102it [00:11, 9.44it/s] 103it [00:11, 9.44it/s] 104it [00:11, 9.44it/s] 105it [00:11, 9.47it/s] 106it [00:11, 9.53it/s] 107it [00:11, 9.48it/s] 108it [00:11, 9.05it/s] 109it [00:12, 9.21it/s] 110it [00:12, 9.23it/s] 111it [00:12, 9.03it/s] 112it [00:12, 8.68it/s] 113it [00:12, 8.86it/s] 114it [00:12, 9.04it/s] 115it [00:12, 9.19it/s] 116it [00:12, 9.30it/s] 117it [00:12, 8.86it/s] 118it [00:13, 9.07it/s] 119it [00:13, 9.22it/s] 120it [00:13, 9.35it/s] 121it [00:13, 9.39it/s] 122it [00:13, 9.06it/s] 123it [00:13, 9.21it/s] 124it [00:13, 9.20it/s] 125it [00:13, 9.08it/s] 126it [00:13, 8.68it/s] 127it [00:14, 8.77it/s] 128it [00:14, 9.01it/s] 129it [00:14, 9.16it/s] 130it [00:14, 9.22it/s] 131it [00:14, 9.32it/s] 132it [00:14, 9.36it/s] 133it [00:14, 9.36it/s] 134it [00:14, 9.05it/s] 135it [00:14, 9.17it/s] 136it [00:15, 9.17it/s] 137it [00:15, 9.26it/s] 138it [00:15, 9.30it/s] 139it [00:15, 9.23it/s] 140it [00:15, 8.98it/s] 141it [00:15, 9.14it/s] 142it [00:15, 8.87it/s] 143it [00:15, 9.06it/s] 144it [00:15, 9.13it/s] 145it [00:16, 8.75it/s] 146it [00:16, 8.96it/s] 147it [00:16, 9.10it/s] 148it [00:16, 9.27it/s] 149it [00:16, 9.18it/s] 150it [00:16, 8.89it/s]2025-05-26 04:08:41,611 - INFO - [Epoch 048 | Batch 0150] IWAE-loss 4167.0127 | mean log_px -0.0108 | KL -3420.06 + 151it [00:16, 9.09it/s] 152it [00:16, 9.19it/s] 153it [00:16, 9.29it/s] 154it [00:16, 9.39it/s] 155it [00:17, 9.42it/s] 156it [00:17, 9.42it/s] 157it [00:17, 9.45it/s] 158it [00:17, 9.47it/s] 159it [00:17, 9.34it/s] 160it [00:17, 9.31it/s] 161it [00:17, 8.90it/s] 162it [00:17, 9.07it/s] 163it [00:17, 9.20it/s] 164it [00:18, 8.78it/s] 165it [00:18, 9.00it/s] 166it [00:18, 9.13it/s] 167it [00:18, 9.25it/s] 168it [00:18, 9.32it/s] 169it [00:18, 9.41it/s] 170it [00:18, 9.34it/s] 171it [00:18, 9.47it/s] 172it [00:18, 9.47it/s] 173it [00:19, 9.47it/s] 174it [00:19, 9.51it/s] 175it [00:19, 9.51it/s] 176it [00:19, 9.54it/s] 177it [00:19, 9.17it/s] 178it [00:19, 9.30it/s] 179it [00:19, 9.39it/s] 180it [00:19, 9.42it/s] 181it [00:19, 9.48it/s] 182it [00:19, 9.47it/s] 183it [00:20, 8.99it/s] 184it [00:20, 9.12it/s] 185it [00:20, 9.00it/s] 186it [00:20, 8.72it/s] 187it [00:20, 8.95it/s] 188it [00:20, 9.00it/s] 189it [00:20, 9.16it/s] 190it [00:20, 9.24it/s] 191it [00:20, 9.35it/s] 192it [00:21, 8.94it/s] 193it [00:21, 9.17it/s] 194it [00:21, 9.33it/s] 195it [00:21, 8.90it/s] 196it [00:21, 9.18it/s] 196it [00:21, 9.07it/s] +2025-05-26 04:08:46,584 - INFO - Epoch: 48, Objective: tensor([5577.5146], device='cuda:0', grad_fn=), Loss: 0.034665796905756, KL/n: 69.71744537353516 + 0it [00:00, ?it/s]2025-05-26 04:08:46,856 - INFO - [Epoch 049 | Batch 0000] IWAE-loss 4387.7876 | mean log_px -0.0154 | KL -3415.77 + 1it [00:00, 5.43it/s] 2it [00:00, 7.35it/s] 3it [00:00, 8.28it/s] 4it [00:00, 8.80it/s] 5it [00:00, 9.11it/s] 6it [00:00, 9.29it/s] 7it [00:00, 9.43it/s] 8it [00:00, 9.51it/s] 9it [00:01, 9.57it/s] 10it [00:01, 9.62it/s] 11it [00:01, 9.69it/s] 12it [00:01, 9.72it/s] 13it [00:01, 9.75it/s] 14it [00:01, 9.73it/s] 15it [00:01, 9.72it/s] 16it [00:01, 9.71it/s] 17it [00:01, 9.56it/s] 18it [00:01, 9.53it/s] 19it [00:02, 9.54it/s] 20it [00:02, 9.46it/s] 21it [00:02, 9.48it/s] 22it [00:02, 9.52it/s] 23it [00:02, 9.55it/s] 24it [00:02, 9.53it/s] 25it [00:02, 9.58it/s] 26it [00:02, 9.29it/s] 27it [00:02, 9.37it/s] 28it [00:02, 9.39it/s] 29it [00:03, 9.42it/s] 30it [00:03, 9.41it/s] 31it [00:03, 9.44it/s] 32it [00:03, 9.48it/s] 33it [00:03, 9.50it/s] 34it [00:03, 9.33it/s] 35it [00:03, 9.37it/s] 36it [00:03, 9.45it/s] 37it [00:03, 9.55it/s] 38it [00:04, 9.60it/s] 39it [00:04, 9.66it/s] 40it [00:04, 9.68it/s] 41it [00:04, 9.70it/s] 42it [00:04, 9.72it/s] 43it [00:04, 9.69it/s] 44it [00:04, 9.71it/s] 45it [00:04, 9.72it/s] 46it [00:04, 9.73it/s] 47it [00:04, 9.74it/s] 48it [00:05, 9.72it/s] 49it [00:05, 9.75it/s] 50it [00:05, 9.75it/s]2025-05-26 04:08:52,058 - INFO - [Epoch 049 | Batch 0050] IWAE-loss 6286.7646 | mean log_px -0.0480 | KL -3411.50 + 51it [00:05, 9.74it/s] 52it [00:05, 9.72it/s] 53it [00:05, 9.74it/s] 54it [00:05, 9.76it/s] 55it [00:05, 9.78it/s] 56it [00:05, 9.76it/s] 57it [00:06, 9.77it/s] 58it [00:06, 9.74it/s] 59it [00:06, 9.74it/s] 60it [00:06, 9.75it/s] 61it [00:06, 9.77it/s] 62it [00:06, 9.76it/s] 63it [00:06, 9.77it/s] 64it [00:06, 9.77it/s] 65it [00:06, 9.75it/s] 66it [00:06, 9.76it/s] 67it [00:07, 9.77it/s] 68it [00:07, 9.75it/s] 69it [00:07, 9.74it/s] 70it [00:07, 9.74it/s] 71it [00:07, 9.73it/s] 72it [00:07, 9.73it/s] 73it [00:07, 9.72it/s] 74it [00:07, 9.71it/s] 75it [00:07, 9.58it/s] 76it [00:07, 9.61it/s] 77it [00:08, 9.63it/s] 78it [00:08, 9.62it/s] 79it [00:08, 9.66it/s] 80it [00:08, 9.64it/s] 81it [00:08, 9.35it/s] 82it [00:08, 9.43it/s] 83it [00:08, 9.49it/s] 84it [00:08, 9.49it/s] 85it [00:08, 9.46it/s] 86it [00:09, 9.44it/s] 87it [00:09, 9.47it/s] 88it [00:09, 9.13it/s] 89it [00:09, 9.27it/s] 90it [00:09, 9.27it/s] 91it [00:09, 9.38it/s] 92it [00:09, 9.44it/s] 93it [00:09, 9.50it/s] 94it [00:09, 9.53it/s] 95it [00:09, 9.46it/s] 96it [00:10, 9.44it/s] 97it [00:10, 9.44it/s] 98it [00:10, 9.48it/s] 99it [00:10, 9.48it/s] 100it [00:10, 9.51it/s]2025-05-26 04:08:57,274 - INFO - [Epoch 049 | Batch 0100] IWAE-loss 6288.9609 | mean log_px -0.0417 | KL -3411.01 + 101it [00:10, 9.50it/s] 102it [00:10, 9.49it/s] 103it [00:10, 9.54it/s] 104it [00:10, 9.53it/s] 105it [00:11, 9.48it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.59it/s] 108it [00:11, 9.58it/s] 109it [00:11, 9.57it/s] 110it [00:11, 9.55it/s] 111it [00:11, 9.33it/s] 112it [00:11, 9.41it/s] 113it [00:11, 9.46it/s] 114it [00:11, 9.50it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.56it/s] 117it [00:12, 9.58it/s] 118it [00:12, 9.54it/s] 119it [00:12, 9.53it/s] 120it [00:12, 9.53it/s] 121it [00:12, 9.54it/s] 122it [00:12, 9.51it/s] 123it [00:12, 9.47it/s] 124it [00:13, 9.45it/s] 125it [00:13, 9.46it/s] 126it [00:13, 9.48it/s] 127it [00:13, 9.51it/s] 128it [00:13, 9.48it/s] 129it [00:13, 9.50it/s] 130it [00:13, 9.49it/s] 131it [00:13, 9.52it/s] 132it [00:13, 9.50it/s] 133it [00:13, 9.54it/s] 134it [00:14, 9.53it/s] 135it [00:14, 9.56it/s] 136it [00:14, 9.52it/s] 137it [00:14, 9.52it/s] 138it [00:14, 9.53it/s] 139it [00:14, 9.32it/s] 140it [00:14, 9.40it/s] 141it [00:14, 9.49it/s] 142it [00:14, 9.47it/s] 143it [00:15, 9.51it/s] 144it [00:15, 9.55it/s] 145it [00:15, 9.54it/s] 146it [00:15, 9.52it/s] 147it [00:15, 9.51it/s] 148it [00:15, 9.49it/s] 149it [00:15, 9.51it/s] 150it [00:15, 9.52it/s]2025-05-26 04:09:02,533 - INFO - [Epoch 049 | Batch 0150] IWAE-loss 5174.5752 | mean log_px -0.0317 | KL -3409.79 + 151it [00:15, 9.57it/s] 152it [00:15, 9.53it/s] 153it [00:16, 9.55it/s] 154it [00:16, 9.55it/s] 155it [00:16, 9.53it/s] 156it [00:16, 9.55it/s] 157it [00:16, 9.55it/s] 158it [00:16, 9.55it/s] 159it [00:16, 9.55it/s] 160it [00:16, 9.56it/s] 161it [00:16, 9.54it/s] 162it [00:17, 9.50it/s] 163it [00:17, 9.53it/s] 164it [00:17, 9.56it/s] 165it [00:17, 9.58it/s] 166it [00:17, 9.50it/s] 167it [00:17, 9.52it/s] 168it [00:17, 9.52it/s] 169it [00:17, 9.57it/s] 170it [00:17, 9.62it/s] 171it [00:17, 9.63it/s] 172it [00:18, 9.65it/s] 173it [00:18, 9.68it/s] 174it [00:18, 9.70it/s] 175it [00:18, 9.71it/s] 176it [00:18, 9.71it/s] 177it [00:18, 9.74it/s] 178it [00:18, 9.75it/s] 179it [00:18, 9.75it/s] 180it [00:18, 9.76it/s] 181it [00:18, 9.75it/s] 182it [00:19, 9.77it/s] 183it [00:19, 9.77it/s] 184it [00:19, 9.77it/s] 185it [00:19, 9.77it/s] 186it [00:19, 9.74it/s] 187it [00:19, 9.72it/s] 188it [00:19, 9.73it/s] 189it [00:19, 9.74it/s] 190it [00:19, 9.75it/s] 191it [00:20, 9.76it/s] 192it [00:20, 9.78it/s] 193it [00:20, 9.78it/s] 194it [00:20, 9.79it/s] 195it [00:20, 9.17it/s] 196it [00:20, 8.89it/s] 196it [00:20, 9.51it/s] +2025-05-26 04:09:07,327 - INFO - Epoch: 49, Objective: tensor([5592.1567], device='cuda:0', grad_fn=), Loss: 0.03624124079942703, KL/n: 69.54737854003906 + 0it [00:00, ?it/s]2025-05-26 04:09:07,773 - INFO - [Epoch 050 | Batch 0000] IWAE-loss 4820.5073 | mean log_px -0.0246 | KL -3407.40 + 1it [00:00, 2.84it/s] 2it [00:00, 4.87it/s] 3it [00:00, 6.33it/s] 4it [00:00, 7.23it/s] 5it [00:00, 7.93it/s] 6it [00:00, 8.43it/s] 7it [00:00, 8.84it/s] 8it [00:01, 8.95it/s] 9it [00:01, 8.43it/s] 10it [00:01, 8.52it/s] 11it [00:01, 8.78it/s] 12it [00:01, 8.98it/s] 13it [00:01, 9.13it/s] 14it [00:01, 9.22it/s] 15it [00:01, 9.33it/s] 16it [00:01, 9.39it/s] 17it [00:02, 9.45it/s] 18it [00:02, 9.47it/s] 19it [00:02, 9.50it/s] 20it [00:02, 9.46it/s] 21it [00:02, 9.56it/s] 22it [00:02, 9.03it/s] 23it [00:02, 9.22it/s] 24it [00:02, 9.36it/s] 25it [00:02, 9.42it/s] 26it [00:03, 9.04it/s] 27it [00:03, 9.25it/s] 28it [00:03, 9.39it/s] 29it [00:03, 9.46it/s] 30it [00:03, 9.08it/s] 31it [00:03, 9.25it/s] 32it [00:03, 9.13it/s] 33it [00:03, 9.26it/s] 34it [00:03, 9.34it/s] 35it [00:04, 9.41it/s] 36it [00:04, 9.46it/s] 37it [00:04, 9.05it/s] 38it [00:04, 9.11it/s] 39it [00:04, 9.26it/s] 40it [00:04, 9.37it/s] 41it [00:04, 9.44it/s] 42it [00:04, 8.99it/s] 43it [00:04, 9.14it/s] 44it [00:04, 9.22it/s] 45it [00:05, 9.35it/s] 46it [00:05, 9.41it/s] 47it [00:05, 9.47it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.52it/s] 50it [00:05, 9.49it/s]2025-05-26 04:09:13,136 - INFO - [Epoch 050 | Batch 0050] IWAE-loss 6266.3530 | mean log_px -0.0450 | KL -3405.55 + 51it [00:05, 9.51it/s] 52it [00:05, 9.54it/s] 53it [00:05, 9.52it/s] 54it [00:06, 9.51it/s] 55it [00:06, 9.51it/s] 56it [00:06, 9.54it/s] 57it [00:06, 9.12it/s] 58it [00:06, 9.23it/s] 59it [00:06, 9.31it/s] 60it [00:06, 9.35it/s] 61it [00:06, 9.41it/s] 62it [00:06, 9.45it/s] 63it [00:06, 9.54it/s] 64it [00:07, 9.54it/s] 65it [00:07, 9.56it/s] 66it [00:07, 9.54it/s] 67it [00:07, 9.52it/s] 68it [00:07, 9.52it/s] 69it [00:07, 9.55it/s] 70it [00:07, 9.54it/s] 71it [00:07, 9.56it/s] 72it [00:07, 9.12it/s] 73it [00:08, 9.23it/s] 74it [00:08, 9.29it/s] 75it [00:08, 9.35it/s] 76it [00:08, 9.39it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.52it/s] 79it [00:08, 9.55it/s] 80it [00:08, 9.55it/s] 81it [00:08, 9.57it/s] 82it [00:08, 9.56it/s] 83it [00:09, 9.56it/s] 84it [00:09, 9.49it/s] 85it [00:09, 9.47it/s] 86it [00:09, 9.46it/s] 87it [00:09, 9.53it/s] 88it [00:09, 9.52it/s] 89it [00:09, 9.57it/s] 90it [00:09, 9.58it/s] 91it [00:09, 9.58it/s] 92it [00:10, 9.54it/s] 93it [00:10, 9.51it/s] 94it [00:10, 9.06it/s] 95it [00:10, 9.21it/s] 96it [00:10, 9.29it/s] 97it [00:10, 9.37it/s] 98it [00:10, 9.46it/s] 99it [00:10, 9.53it/s] 100it [00:10, 9.01it/s]2025-05-26 04:09:18,447 - INFO - [Epoch 050 | Batch 0100] IWAE-loss 5081.3320 | mean log_px -0.0248 | KL -3404.80 + 101it [00:11, 9.12it/s] 102it [00:11, 9.26it/s] 103it [00:11, 9.37it/s] 104it [00:11, 9.43it/s] 105it [00:11, 8.94it/s] 106it [00:11, 9.09it/s] 107it [00:11, 9.21it/s] 108it [00:11, 9.27it/s] 109it [00:11, 9.37it/s] 110it [00:12, 8.76it/s] 111it [00:12, 9.03it/s] 112it [00:12, 9.16it/s] 113it [00:12, 9.22it/s] 114it [00:12, 9.18it/s] 115it [00:12, 8.91it/s] 116it [00:12, 9.13it/s] 117it [00:12, 9.23it/s] 118it [00:12, 9.22it/s] 119it [00:12, 9.31it/s] 120it [00:13, 9.38it/s] 121it [00:13, 9.43it/s] 122it [00:13, 9.46it/s] 123it [00:13, 9.50it/s] 124it [00:13, 9.52it/s] 125it [00:13, 9.50it/s] 126it [00:13, 9.50it/s] 127it [00:13, 9.46it/s] 128it [00:13, 9.44it/s] 129it [00:14, 9.49it/s] 130it [00:14, 9.49it/s] 131it [00:14, 9.51it/s] 132it [00:14, 9.52it/s] 133it [00:14, 9.50it/s] 134it [00:14, 9.50it/s] 135it [00:14, 9.47it/s] 136it [00:14, 9.53it/s] 137it [00:14, 9.53it/s] 138it [00:15, 8.98it/s] 139it [00:15, 9.13it/s] 140it [00:15, 9.21it/s] 141it [00:15, 9.32it/s] 142it [00:15, 9.38it/s] 143it [00:15, 9.38it/s] 144it [00:15, 9.49it/s] 145it [00:15, 9.55it/s] 146it [00:15, 9.62it/s] 147it [00:15, 9.68it/s] 148it [00:16, 9.72it/s] 149it [00:16, 9.75it/s] 150it [00:16, 9.75it/s]2025-05-26 04:09:23,770 - INFO - [Epoch 050 | Batch 0150] IWAE-loss 5562.5117 | mean log_px -0.0343 | KL -3396.77 + 151it [00:16, 9.74it/s] 152it [00:16, 9.73it/s] 153it [00:16, 9.25it/s] 154it [00:16, 9.38it/s] 155it [00:16, 9.22it/s] 156it [00:16, 9.29it/s] 157it [00:17, 9.35it/s] 158it [00:17, 9.40it/s] 159it [00:17, 9.48it/s] 160it [00:17, 9.48it/s] 161it [00:17, 9.43it/s] 162it [00:17, 9.44it/s] 163it [00:17, 9.35it/s] 164it [00:17, 8.86it/s] 165it [00:17, 9.05it/s] 166it [00:17, 9.18it/s] 167it [00:18, 9.28it/s] 168it [00:18, 9.34it/s] 169it [00:18, 8.90it/s] 170it [00:18, 9.08it/s] 171it [00:18, 9.24it/s] 172it [00:18, 9.29it/s] 173it [00:18, 9.37it/s] 174it [00:18, 9.36it/s] 175it [00:18, 9.46it/s] 176it [00:19, 9.46it/s] 177it [00:19, 9.50it/s] 178it [00:19, 9.47it/s] 179it [00:19, 9.46it/s] 180it [00:19, 9.42it/s] 181it [00:19, 9.39it/s] 182it [00:19, 9.45it/s] 183it [00:19, 9.43it/s] 184it [00:19, 8.94it/s] 185it [00:20, 9.10it/s] 186it [00:20, 9.26it/s] 187it [00:20, 9.33it/s] 188it [00:20, 9.38it/s] 189it [00:20, 9.41it/s] 190it [00:20, 9.45it/s] 191it [00:20, 9.36it/s] 192it [00:20, 9.39it/s] 193it [00:20, 9.44it/s] 194it [00:20, 9.46it/s] 195it [00:21, 8.90it/s] 196it [00:21, 9.11it/s] 196it [00:21, 9.22it/s] +2025-05-26 04:09:28,726 - INFO - Epoch: 50, Objective: tensor([5149.9160], device='cuda:0', grad_fn=), Loss: 0.02591179683804512, KL/n: 69.36389923095703 + 0it [00:00, ?it/s]2025-05-26 04:09:29,006 - INFO - [Epoch 051 | Batch 0000] IWAE-loss 4607.3794 | mean log_px -0.0298 | KL -3396.73 + 1it [00:00, 4.70it/s] 2it [00:00, 6.70it/s] 3it [00:00, 7.72it/s] 4it [00:00, 8.37it/s] 5it [00:00, 8.77it/s] 6it [00:00, 8.94it/s] 7it [00:00, 8.93it/s] 8it [00:00, 9.12it/s] 9it [00:01, 9.23it/s] 10it [00:01, 9.32it/s] 11it [00:01, 9.40it/s] 12it [00:01, 8.97it/s] 13it [00:01, 9.18it/s] 14it [00:01, 9.26it/s] 15it [00:01, 9.39it/s] 16it [00:01, 9.43it/s] 17it [00:01, 8.85it/s] 18it [00:02, 9.07it/s] 19it [00:02, 9.18it/s] 20it [00:02, 9.29it/s] 21it [00:02, 9.34it/s] 22it [00:02, 9.42it/s] 23it [00:02, 9.47it/s] 24it [00:02, 9.53it/s] 25it [00:02, 9.59it/s] 26it [00:02, 9.56it/s] 27it [00:02, 9.59it/s] 28it [00:03, 9.59it/s] 29it [00:03, 9.60it/s] 30it [00:03, 9.56it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.16it/s] 33it [00:03, 9.30it/s] 34it [00:03, 9.37it/s] 35it [00:03, 9.37it/s] 36it [00:03, 9.01it/s] 37it [00:04, 9.12it/s] 38it [00:04, 9.19it/s] 39it [00:04, 9.34it/s] 40it [00:04, 9.41it/s] 41it [00:04, 8.99it/s] 42it [00:04, 9.18it/s] 43it [00:04, 9.29it/s] 44it [00:04, 9.34it/s] 45it [00:04, 8.92it/s] 46it [00:05, 9.11it/s] 47it [00:05, 9.25it/s] 48it [00:05, 9.36it/s] 49it [00:05, 8.93it/s] 50it [00:05, 9.14it/s]2025-05-26 04:09:34,405 - INFO - [Epoch 051 | Batch 0050] IWAE-loss 4357.4595 | mean log_px -0.0165 | KL -3393.12 + 51it [00:05, 9.27it/s] 52it [00:05, 9.37it/s] 53it [00:05, 8.92it/s] 54it [00:05, 9.10it/s] 55it [00:06, 9.25it/s] 56it [00:06, 9.34it/s] 57it [00:06, 8.93it/s] 58it [00:06, 9.11it/s] 59it [00:06, 9.26it/s] 60it [00:06, 8.82it/s] 61it [00:06, 9.05it/s] 62it [00:06, 9.15it/s] 63it [00:06, 9.31it/s] 64it [00:07, 8.89it/s] 65it [00:07, 9.12it/s] 66it [00:07, 9.26it/s] 67it [00:07, 9.37it/s] 68it [00:07, 8.91it/s] 69it [00:07, 9.14it/s] 70it [00:07, 9.24it/s] 71it [00:07, 9.35it/s] 72it [00:07, 8.92it/s] 73it [00:07, 9.14it/s] 74it [00:08, 9.28it/s] 75it [00:08, 9.39it/s] 76it [00:08, 8.93it/s] 77it [00:08, 9.11it/s] 78it [00:08, 9.26it/s] 79it [00:08, 9.32it/s] 80it [00:08, 8.87it/s] 81it [00:08, 9.07it/s] 82it [00:08, 9.25it/s] 83it [00:09, 9.36it/s] 84it [00:09, 8.94it/s] 85it [00:09, 9.11it/s] 86it [00:09, 9.21it/s] 87it [00:09, 9.33it/s] 88it [00:09, 8.90it/s] 89it [00:09, 9.12it/s] 90it [00:09, 9.22it/s] 91it [00:09, 9.36it/s] 92it [00:10, 8.90it/s] 93it [00:10, 9.12it/s] 94it [00:10, 9.22it/s] 95it [00:10, 9.28it/s] 96it [00:10, 8.84it/s] 97it [00:10, 9.06it/s] 98it [00:10, 9.10it/s] 99it [00:10, 9.18it/s] 100it [00:10, 8.76it/s]2025-05-26 04:09:39,895 - INFO - [Epoch 051 | Batch 0100] IWAE-loss 4766.6494 | mean log_px -0.0259 | KL -3393.81 + 101it [00:11, 8.88it/s] 102it [00:11, 8.89it/s] 103it [00:11, 8.82it/s] 104it [00:11, 8.53it/s] 105it [00:11, 8.83it/s] 106it [00:11, 9.07it/s] 107it [00:11, 9.19it/s] 108it [00:11, 8.89it/s] 109it [00:11, 9.03it/s] 110it [00:12, 9.21it/s] 111it [00:12, 8.79it/s] 112it [00:12, 9.03it/s] 113it [00:12, 9.04it/s] 114it [00:12, 9.16it/s] 115it [00:12, 9.29it/s] 116it [00:12, 8.81it/s] 117it [00:12, 9.05it/s] 118it [00:12, 9.23it/s] 119it [00:13, 9.33it/s] 120it [00:13, 8.75it/s] 121it [00:13, 9.01it/s] 122it [00:13, 9.17it/s] 123it [00:13, 9.32it/s] 124it [00:13, 8.84it/s] 125it [00:13, 9.04it/s] 126it [00:13, 9.14it/s] 127it [00:13, 9.32it/s] 128it [00:14, 9.41it/s] 129it [00:14, 9.48it/s] 130it [00:14, 9.55it/s] 131it [00:14, 9.60it/s] 132it [00:14, 9.65it/s] 133it [00:14, 9.67it/s] 134it [00:14, 9.65it/s] 135it [00:14, 9.66it/s] 136it [00:14, 9.66it/s] 137it [00:14, 9.66it/s] 138it [00:15, 9.67it/s] 139it [00:15, 9.61it/s] 140it [00:15, 9.65it/s] 141it [00:15, 9.65it/s] 142it [00:15, 9.65it/s] 143it [00:15, 9.65it/s] 144it [00:15, 9.63it/s] 145it [00:15, 9.57it/s] 146it [00:15, 9.56it/s] 147it [00:16, 9.63it/s] 148it [00:16, 9.65it/s] 149it [00:16, 9.67it/s] 150it [00:16, 9.65it/s]2025-05-26 04:09:45,252 - INFO - [Epoch 051 | Batch 0150] IWAE-loss 5195.3750 | mean log_px -0.0258 | KL -3389.90 + 151it [00:16, 9.67it/s] 152it [00:16, 9.63it/s] 153it [00:16, 9.60it/s] 154it [00:16, 9.57it/s] 155it [00:16, 9.15it/s] 156it [00:16, 9.31it/s] 157it [00:17, 9.43it/s] 158it [00:17, 9.54it/s] 159it [00:17, 9.61it/s] 160it [00:17, 9.62it/s] 161it [00:17, 9.58it/s] 162it [00:17, 9.59it/s] 163it [00:17, 9.59it/s] 164it [00:17, 9.61it/s] 165it [00:17, 9.63it/s] 166it [00:18, 9.62it/s] 167it [00:18, 9.61it/s] 168it [00:18, 9.61it/s] 169it [00:18, 9.56it/s] 170it [00:18, 9.58it/s] 171it [00:18, 9.04it/s] 172it [00:18, 9.03it/s] 173it [00:18, 9.21it/s] 174it [00:18, 9.33it/s] 175it [00:18, 9.44it/s] 176it [00:19, 9.50it/s] 177it [00:19, 9.57it/s] 178it [00:19, 9.56it/s] 179it [00:19, 9.59it/s] 180it [00:19, 9.63it/s] 181it [00:19, 9.64it/s] 182it [00:19, 9.63it/s] 183it [00:19, 9.64it/s] 184it [00:19, 9.64it/s] 185it [00:20, 9.66it/s] 186it [00:20, 9.64it/s] 187it [00:20, 9.59it/s] 188it [00:20, 9.64it/s] 189it [00:20, 9.58it/s] 190it [00:20, 9.59it/s] 191it [00:20, 9.66it/s] 192it [00:20, 9.02it/s] 193it [00:20, 9.22it/s] 194it [00:20, 9.34it/s] 195it [00:21, 8.87it/s] 196it [00:21, 9.10it/s] 196it [00:21, 9.22it/s] +2025-05-26 04:09:50,116 - INFO - Epoch: 51, Objective: tensor([5151.0229], device='cuda:0', grad_fn=), Loss: 0.03177899122238159, KL/n: 69.16956329345703 + 0it [00:00, ?it/s]2025-05-26 04:09:50,586 - INFO - [Epoch 052 | Batch 0000] IWAE-loss 4369.1685 | mean log_px -0.0140 | KL -3385.86 + 1it [00:00, 2.52it/s] 2it [00:00, 4.43it/s] 3it [00:00, 5.88it/s] 4it [00:00, 6.57it/s] 5it [00:00, 7.40it/s] 6it [00:00, 7.99it/s] 7it [00:01, 8.43it/s] 8it [00:01, 8.36it/s] 9it [00:01, 8.68it/s] 10it [00:01, 8.91it/s] 11it [00:01, 8.62it/s] 12it [00:01, 8.87it/s] 13it [00:01, 9.08it/s] 14it [00:01, 9.19it/s] 15it [00:01, 8.80it/s] 16it [00:02, 8.93it/s] 17it [00:02, 9.09it/s] 18it [00:02, 9.21it/s] 19it [00:02, 8.81it/s] 20it [00:02, 8.99it/s] 21it [00:02, 9.13it/s] 22it [00:02, 9.21it/s] 23it [00:02, 8.81it/s] 24it [00:02, 8.96it/s] 25it [00:03, 8.63it/s] 26it [00:03, 8.77it/s] 27it [00:03, 8.95it/s] 28it [00:03, 9.09it/s] 29it [00:03, 8.75it/s] 30it [00:03, 8.95it/s] 31it [00:03, 9.10it/s] 32it [00:03, 9.18it/s] 33it [00:03, 8.79it/s] 34it [00:04, 8.95it/s] 35it [00:04, 9.13it/s] 36it [00:04, 9.19it/s] 37it [00:04, 8.81it/s] 38it [00:04, 9.00it/s] 39it [00:04, 9.15it/s] 40it [00:04, 8.77it/s] 41it [00:04, 8.94it/s] 42it [00:04, 8.65it/s] 43it [00:05, 8.88it/s] 44it [00:05, 8.60it/s] 45it [00:05, 8.83it/s] 46it [00:05, 8.99it/s] 47it [00:05, 9.13it/s] 48it [00:05, 8.76it/s] 49it [00:05, 8.95it/s] 50it [00:05, 9.10it/s]2025-05-26 04:09:56,166 - INFO - [Epoch 052 | Batch 0050] IWAE-loss 4918.5332 | mean log_px -0.0245 | KL -3388.32 + 51it [00:05, 9.19it/s] 52it [00:06, 8.82it/s] 53it [00:06, 8.97it/s] 54it [00:06, 9.13it/s] 55it [00:06, 9.13it/s] 56it [00:06, 8.76it/s] 57it [00:06, 8.97it/s] 58it [00:06, 9.11it/s] 59it [00:06, 9.20it/s] 60it [00:06, 8.80it/s] 61it [00:07, 8.98it/s] 62it [00:07, 9.09it/s] 63it [00:07, 9.20it/s] 64it [00:07, 8.81it/s] 65it [00:07, 8.99it/s] 66it [00:07, 9.13it/s] 67it [00:07, 9.24it/s] 68it [00:07, 8.82it/s] 69it [00:07, 9.01it/s] 70it [00:08, 9.09it/s] 71it [00:08, 9.21it/s] 72it [00:08, 8.81it/s] 73it [00:08, 9.01it/s] 74it [00:08, 9.18it/s] 75it [00:08, 9.28it/s] 76it [00:08, 8.86it/s] 77it [00:08, 9.04it/s] 78it [00:08, 9.13it/s] 79it [00:09, 9.21it/s] 80it [00:09, 8.79it/s] 81it [00:09, 8.95it/s] 82it [00:09, 9.10it/s] 83it [00:09, 9.23it/s] 84it [00:09, 8.81it/s] 85it [00:09, 9.01it/s] 86it [00:09, 9.13it/s] 87it [00:09, 9.22it/s] 88it [00:10, 8.80it/s] 89it [00:10, 9.02it/s] 90it [00:10, 9.15it/s] 91it [00:10, 9.27it/s] 92it [00:10, 8.84it/s] 93it [00:10, 9.01it/s] 94it [00:10, 9.15it/s] 95it [00:10, 9.20it/s] 96it [00:10, 8.69it/s] 97it [00:11, 8.77it/s] 98it [00:11, 8.94it/s] 99it [00:11, 9.11it/s] 100it [00:11, 8.71it/s]2025-05-26 04:10:01,722 - INFO - [Epoch 052 | Batch 0100] IWAE-loss 4805.5391 | mean log_px -0.0203 | KL -3385.52 + 101it [00:11, 8.91it/s] 102it [00:11, 9.10it/s] 103it [00:11, 9.17it/s] 104it [00:11, 9.13it/s] 105it [00:11, 8.69it/s] 106it [00:12, 8.85it/s] 107it [00:12, 9.03it/s] 108it [00:12, 9.17it/s] 109it [00:12, 8.69it/s] 110it [00:12, 8.98it/s] 111it [00:12, 9.22it/s] 112it [00:12, 9.44it/s] 113it [00:12, 9.59it/s] 114it [00:12, 9.09it/s] 115it [00:13, 9.30it/s] 116it [00:13, 9.47it/s] 117it [00:13, 9.61it/s] 118it [00:13, 9.70it/s] 119it [00:13, 9.30it/s] 120it [00:13, 9.46it/s] 121it [00:13, 9.59it/s] 122it [00:13, 9.68it/s] 123it [00:13, 9.77it/s] 124it [00:13, 9.81it/s] 125it [00:14, 9.22it/s] 126it [00:14, 9.44it/s] 127it [00:14, 9.60it/s] 128it [00:14, 9.68it/s] 129it [00:14, 9.77it/s] 130it [00:14, 9.14it/s] 131it [00:14, 9.05it/s] 132it [00:14, 9.22it/s] 133it [00:14, 9.43it/s] 134it [00:15, 9.57it/s] 135it [00:15, 9.67it/s] 136it [00:15, 9.74it/s] 137it [00:15, 9.80it/s] 138it [00:15, 9.84it/s] 139it [00:15, 9.87it/s] 140it [00:15, 9.88it/s] 141it [00:15, 9.28it/s] 142it [00:15, 9.47it/s] 143it [00:15, 9.60it/s] 144it [00:16, 9.69it/s] 145it [00:16, 9.77it/s] 146it [00:16, 9.19it/s] 147it [00:16, 9.36it/s] 148it [00:16, 9.46it/s] 149it [00:16, 9.59it/s] 150it [00:16, 9.65it/s]2025-05-26 04:10:07,025 - INFO - [Epoch 052 | Batch 0150] IWAE-loss 5867.5352 | mean log_px -0.0419 | KL -3378.72 + 151it [00:16, 8.69it/s] 152it [00:16, 8.80it/s] 153it [00:17, 8.99it/s] 154it [00:17, 9.09it/s] 155it [00:17, 8.74it/s] 156it [00:17, 8.93it/s] 157it [00:17, 9.01it/s] 158it [00:17, 8.90it/s] 159it [00:17, 9.03it/s] 160it [00:17, 9.16it/s] 161it [00:17, 8.96it/s] 162it [00:18, 9.15it/s] 163it [00:18, 8.71it/s] 164it [00:18, 8.97it/s] 165it [00:18, 9.09it/s] 166it [00:18, 9.15it/s] 167it [00:18, 8.89it/s] 168it [00:18, 9.06it/s] 169it [00:18, 9.19it/s] 170it [00:18, 9.30it/s] 171it [00:19, 9.35it/s] 172it [00:19, 9.38it/s] 173it [00:19, 8.85it/s] 174it [00:19, 8.95it/s] 175it [00:19, 9.14it/s] 176it [00:19, 9.24it/s] 177it [00:19, 9.33it/s] 178it [00:19, 8.86it/s] 179it [00:19, 8.94it/s] 180it [00:20, 8.65it/s] 181it [00:20, 8.86it/s] 182it [00:20, 9.00it/s] 183it [00:20, 9.17it/s] 184it [00:20, 8.80it/s] 185it [00:20, 9.02it/s] 186it [00:20, 9.17it/s] 187it [00:20, 9.29it/s] 188it [00:20, 8.88it/s] 189it [00:21, 9.08it/s] 190it [00:21, 9.20it/s] 191it [00:21, 9.00it/s] 192it [00:21, 8.43it/s] 193it [00:21, 8.76it/s] 194it [00:21, 9.02it/s] 195it [00:21, 8.22it/s] 196it [00:21, 8.63it/s] 196it [00:21, 8.94it/s] +2025-05-26 04:10:12,169 - INFO - Epoch: 52, Objective: tensor([5528.3022], device='cuda:0', grad_fn=), Loss: 0.03874513879418373, KL/n: 69.0050048828125 + 0it [00:00, ?it/s]2025-05-26 04:10:12,437 - INFO - [Epoch 053 | Batch 0000] IWAE-loss 5155.4536 | mean log_px -0.0254 | KL -3377.25 + 1it [00:00, 5.42it/s] 2it [00:00, 7.30it/s] 3it [00:00, 8.10it/s] 4it [00:00, 8.61it/s] 5it [00:00, 8.91it/s] 6it [00:00, 9.10it/s] 7it [00:00, 9.17it/s] 8it [00:00, 9.30it/s] 9it [00:01, 9.28it/s] 10it [00:01, 9.31it/s] 11it [00:01, 9.41it/s] 12it [00:01, 9.46it/s] 13it [00:01, 9.52it/s] 14it [00:01, 9.49it/s] 15it [00:01, 9.53it/s] 16it [00:01, 9.59it/s] 17it [00:01, 9.54it/s] 18it [00:01, 9.56it/s] 19it [00:02, 9.55it/s] 20it [00:02, 9.56it/s] 21it [00:02, 9.60it/s] 22it [00:02, 9.56it/s] 23it [00:02, 9.57it/s] 24it [00:02, 9.56it/s] 25it [00:02, 9.62it/s] 26it [00:02, 9.64it/s] 27it [00:02, 9.59it/s] 28it [00:03, 9.56it/s] 29it [00:03, 9.32it/s] 30it [00:03, 8.96it/s] 31it [00:03, 9.08it/s] 32it [00:03, 9.27it/s] 33it [00:03, 9.40it/s] 34it [00:03, 9.46it/s] 35it [00:03, 9.45it/s] 36it [00:03, 9.46it/s] 37it [00:04, 8.90it/s] 38it [00:04, 8.82it/s] 39it [00:04, 8.95it/s] 40it [00:04, 9.16it/s] 41it [00:04, 8.79it/s] 42it [00:04, 9.07it/s] 43it [00:04, 9.28it/s] 44it [00:04, 9.42it/s] 45it [00:04, 8.97it/s] 46it [00:04, 9.18it/s] 47it [00:05, 9.36it/s] 48it [00:05, 9.49it/s] 49it [00:05, 9.59it/s] 50it [00:05, 9.66it/s]2025-05-26 04:10:17,759 - INFO - [Epoch 053 | Batch 0050] IWAE-loss 4669.8696 | mean log_px -0.0194 | KL -3377.31 + 51it [00:05, 9.68it/s] 52it [00:05, 9.71it/s] 53it [00:05, 9.74it/s] 54it [00:05, 9.75it/s] 55it [00:05, 9.79it/s] 56it [00:06, 9.78it/s] 57it [00:06, 9.79it/s] 58it [00:06, 9.79it/s] 59it [00:06, 9.80it/s] 60it [00:06, 9.80it/s] 61it [00:06, 9.80it/s] 62it [00:06, 9.74it/s] 63it [00:06, 9.75it/s] 64it [00:06, 9.75it/s] 65it [00:06, 9.76it/s] 66it [00:07, 9.77it/s] 67it [00:07, 9.79it/s] 68it [00:07, 9.80it/s] 69it [00:07, 9.76it/s] 70it [00:07, 9.77it/s] 71it [00:07, 9.79it/s] 72it [00:07, 9.79it/s] 73it [00:07, 9.82it/s] 74it [00:07, 9.76it/s] 75it [00:07, 9.74it/s] 76it [00:08, 9.76it/s] 77it [00:08, 9.79it/s] 78it [00:08, 9.80it/s] 79it [00:08, 9.80it/s] 80it [00:08, 9.80it/s] 81it [00:08, 9.76it/s] 82it [00:08, 9.73it/s] 83it [00:08, 9.78it/s] 84it [00:08, 9.78it/s] 85it [00:08, 9.80it/s] 86it [00:09, 9.80it/s] 87it [00:09, 9.83it/s] 88it [00:09, 9.82it/s] 89it [00:09, 9.82it/s] 90it [00:09, 9.82it/s] 91it [00:09, 9.82it/s] 92it [00:09, 9.80it/s] 93it [00:09, 9.82it/s] 94it [00:09, 9.81it/s] 95it [00:09, 9.81it/s] 96it [00:10, 9.78it/s] 97it [00:10, 9.75it/s] 98it [00:10, 9.70it/s] 99it [00:10, 9.68it/s] 100it [00:10, 9.63it/s]2025-05-26 04:10:22,877 - INFO - [Epoch 053 | Batch 0100] IWAE-loss 5013.9473 | mean log_px -0.0243 | KL -3370.79 + 101it [00:10, 9.61it/s] 102it [00:10, 9.68it/s] 103it [00:10, 9.70it/s] 104it [00:10, 9.72it/s] 105it [00:11, 9.73it/s] 106it [00:11, 9.75it/s] 107it [00:11, 9.77it/s] 108it [00:11, 9.71it/s] 109it [00:11, 9.74it/s] 110it [00:11, 9.75it/s] 111it [00:11, 9.75it/s] 112it [00:11, 9.75it/s] 113it [00:11, 9.76it/s] 114it [00:11, 9.71it/s] 115it [00:12, 9.74it/s] 116it [00:12, 9.76it/s] 117it [00:12, 9.79it/s] 118it [00:12, 9.74it/s] 119it [00:12, 9.76it/s] 120it [00:12, 9.77it/s] 121it [00:12, 9.79it/s] 122it [00:12, 9.66it/s] 123it [00:12, 9.68it/s] 124it [00:12, 9.73it/s] 125it [00:13, 9.75it/s] 126it [00:13, 9.75it/s] 127it [00:13, 9.74it/s] 128it [00:13, 9.73it/s] 129it [00:13, 9.76it/s] 130it [00:13, 9.74it/s] 131it [00:13, 9.77it/s] 132it [00:13, 9.78it/s] 133it [00:13, 9.78it/s] 134it [00:14, 9.79it/s] 135it [00:14, 9.79it/s] 136it [00:14, 9.80it/s] 137it [00:14, 9.80it/s] 138it [00:14, 9.80it/s] 139it [00:14, 9.81it/s] 140it [00:14, 9.82it/s] 141it [00:14, 9.82it/s] 142it [00:14, 9.81it/s] 143it [00:14, 9.81it/s] 144it [00:15, 9.81it/s] 145it [00:15, 9.81it/s] 146it [00:15, 9.81it/s] 147it [00:15, 9.81it/s] 148it [00:15, 9.64it/s] 149it [00:15, 9.67it/s] 150it [00:15, 9.32it/s]2025-05-26 04:10:28,014 - INFO - [Epoch 053 | Batch 0150] IWAE-loss 5491.2100 | mean log_px -0.0358 | KL -3374.70 + 151it [00:15, 9.45it/s] 152it [00:15, 9.55it/s] 153it [00:15, 9.63it/s] 154it [00:16, 9.68it/s] 155it [00:16, 9.72it/s] 156it [00:16, 9.75it/s] 157it [00:16, 9.77it/s] 158it [00:16, 9.78it/s] 159it [00:16, 9.77it/s] 160it [00:16, 9.78it/s] 161it [00:16, 9.79it/s] 162it [00:16, 9.80it/s] 163it [00:16, 9.80it/s] 164it [00:17, 9.79it/s] 165it [00:17, 9.78it/s] 166it [00:17, 9.76it/s] 167it [00:17, 9.78it/s] 168it [00:17, 9.77it/s] 169it [00:17, 9.79it/s] 170it [00:17, 9.79it/s] 171it [00:17, 9.79it/s] 172it [00:17, 9.79it/s] 173it [00:18, 9.72it/s] 174it [00:18, 9.73it/s] 175it [00:18, 9.76it/s] 176it [00:18, 9.76it/s] 177it [00:18, 9.74it/s] 178it [00:18, 9.49it/s] 179it [00:18, 9.59it/s] 180it [00:18, 9.65it/s] 181it [00:18, 9.70it/s] 182it [00:18, 9.74it/s] 183it [00:19, 9.71it/s] 184it [00:19, 9.53it/s] 185it [00:19, 9.61it/s] 186it [00:19, 9.67it/s] 187it [00:19, 9.71it/s] 188it [00:19, 9.73it/s] 189it [00:19, 9.71it/s] 190it [00:19, 9.57it/s] 191it [00:19, 9.63it/s] 192it [00:19, 9.68it/s] 193it [00:20, 9.17it/s] 194it [00:20, 9.36it/s] 195it [00:20, 8.94it/s] 196it [00:20, 9.57it/s] +2025-05-26 04:10:32,774 - INFO - Epoch: 53, Objective: tensor([5285.0635], device='cuda:0', grad_fn=), Loss: 0.031190963461995125, KL/n: 68.80663299560547 + 0it [00:00, ?it/s]2025-05-26 04:10:33,211 - INFO - [Epoch 054 | Batch 0000] IWAE-loss 4559.8145 | mean log_px -0.0225 | KL -3372.25 + 1it [00:00, 2.66it/s] 2it [00:00, 4.67it/s] 3it [00:00, 6.13it/s] 4it [00:00, 7.08it/s] 5it [00:00, 7.84it/s] 6it [00:00, 8.42it/s] 7it [00:00, 8.84it/s] 8it [00:01, 9.14it/s] 9it [00:01, 9.36it/s] 10it [00:01, 9.49it/s] 11it [00:01, 9.59it/s] 12it [00:01, 9.68it/s] 13it [00:01, 9.75it/s] 14it [00:01, 9.63it/s] 15it [00:01, 9.64it/s] 16it [00:01, 9.65it/s] 17it [00:02, 9.73it/s] 18it [00:02, 9.76it/s] 19it [00:02, 9.78it/s] 20it [00:02, 9.40it/s] 21it [00:02, 9.54it/s] 22it [00:02, 9.56it/s] 23it [00:02, 9.65it/s] 24it [00:02, 9.71it/s] 25it [00:02, 9.76it/s] 26it [00:02, 9.80it/s] 27it [00:03, 9.81it/s] 28it [00:03, 9.80it/s] 29it [00:03, 9.83it/s] 30it [00:03, 9.82it/s] 31it [00:03, 9.75it/s] 32it [00:03, 9.76it/s] 33it [00:03, 9.78it/s] 34it [00:03, 9.78it/s] 35it [00:03, 9.80it/s] 36it [00:03, 9.81it/s] 37it [00:04, 9.82it/s] 38it [00:04, 9.82it/s] 39it [00:04, 9.79it/s] 40it [00:04, 9.78it/s] 41it [00:04, 9.80it/s] 42it [00:04, 9.81it/s] 43it [00:04, 9.82it/s] 44it [00:04, 9.83it/s] 45it [00:04, 9.85it/s] 46it [00:04, 9.86it/s] 47it [00:05, 9.86it/s] 48it [00:05, 9.86it/s] 49it [00:05, 9.30it/s] 50it [00:05, 9.34it/s]2025-05-26 04:10:38,380 - INFO - [Epoch 054 | Batch 0050] IWAE-loss 4990.6138 | mean log_px -0.0290 | KL -3365.03 + 51it [00:05, 9.39it/s] 52it [00:05, 9.44it/s] 53it [00:05, 9.46it/s] 54it [00:05, 9.48it/s] 55it [00:05, 9.53it/s] 56it [00:06, 9.52it/s] 57it [00:06, 8.96it/s] 58it [00:06, 9.16it/s] 59it [00:06, 9.30it/s] 60it [00:06, 9.35it/s] 61it [00:06, 9.39it/s] 62it [00:06, 9.40it/s] 63it [00:06, 9.46it/s] 64it [00:06, 9.49it/s] 65it [00:07, 9.50it/s] 66it [00:07, 9.44it/s] 67it [00:07, 9.48it/s] 68it [00:07, 9.46it/s] 69it [00:07, 9.46it/s] 70it [00:07, 9.49it/s] 71it [00:07, 8.95it/s] 72it [00:07, 9.11it/s] 73it [00:07, 9.24it/s] 74it [00:07, 9.28it/s] 75it [00:08, 9.37it/s] 76it [00:08, 9.41it/s] 77it [00:08, 9.48it/s] 78it [00:08, 9.49it/s] 79it [00:08, 9.54it/s] 80it [00:08, 9.56it/s] 81it [00:08, 9.54it/s] 82it [00:08, 9.55it/s] 83it [00:08, 9.56it/s] 84it [00:09, 9.52it/s] 85it [00:09, 9.51it/s] 86it [00:09, 9.54it/s] 87it [00:09, 9.60it/s] 88it [00:09, 9.52it/s] 89it [00:09, 9.42it/s] 90it [00:09, 9.46it/s] 91it [00:09, 9.51it/s] 92it [00:09, 9.55it/s] 93it [00:09, 9.56it/s] 94it [00:10, 9.37it/s] 95it [00:10, 8.75it/s] 96it [00:10, 8.89it/s] 97it [00:10, 9.08it/s] 98it [00:10, 9.19it/s] 99it [00:10, 9.29it/s] 100it [00:10, 9.31it/s]2025-05-26 04:10:43,710 - INFO - [Epoch 054 | Batch 0100] IWAE-loss 5274.8164 | mean log_px -0.0305 | KL -3364.53 + 101it [00:10, 9.36it/s] 102it [00:10, 9.40it/s] 103it [00:11, 9.47it/s] 104it [00:11, 9.49it/s] 105it [00:11, 9.51it/s] 106it [00:11, 9.53it/s] 107it [00:11, 9.55it/s] 108it [00:11, 9.61it/s] 109it [00:11, 9.46it/s] 110it [00:11, 9.46it/s] 111it [00:11, 9.38it/s] 112it [00:12, 9.42it/s] 113it [00:12, 8.92it/s] 114it [00:12, 8.90it/s] 115it [00:12, 9.02it/s] 116it [00:12, 9.10it/s] 117it [00:12, 9.30it/s] 118it [00:12, 9.48it/s] 119it [00:12, 9.60it/s] 120it [00:12, 9.70it/s] 121it [00:12, 9.77it/s] 122it [00:13, 9.81it/s] 123it [00:13, 9.82it/s] 124it [00:13, 9.84it/s] 125it [00:13, 9.83it/s] 126it [00:13, 9.80it/s] 127it [00:13, 9.79it/s] 128it [00:13, 9.59it/s] 129it [00:13, 9.53it/s] 130it [00:13, 9.51it/s] 131it [00:14, 9.48it/s] 132it [00:14, 9.48it/s] 133it [00:14, 9.50it/s] 134it [00:14, 9.54it/s] 135it [00:14, 9.58it/s] 136it [00:14, 9.63it/s] 137it [00:14, 9.59it/s] 138it [00:14, 9.57it/s] 139it [00:14, 9.56it/s] 140it [00:14, 9.55it/s] 141it [00:15, 9.54it/s] 142it [00:15, 9.46it/s] 143it [00:15, 9.46it/s] 144it [00:15, 9.42it/s] 145it [00:15, 9.46it/s] 146it [00:15, 9.44it/s] 147it [00:15, 9.45it/s] 148it [00:15, 9.42it/s] 149it [00:15, 9.41it/s] 150it [00:16, 9.44it/s]2025-05-26 04:10:48,975 - INFO - [Epoch 054 | Batch 0150] IWAE-loss 4747.6250 | mean log_px -0.0197 | KL -3364.11 + 151it [00:16, 9.36it/s] 152it [00:16, 9.40it/s] 153it [00:16, 9.47it/s] 154it [00:16, 9.47it/s] 155it [00:16, 9.53it/s] 156it [00:16, 8.88it/s] 157it [00:16, 9.01it/s] 158it [00:16, 9.15it/s] 159it [00:16, 9.25it/s] 160it [00:17, 9.31it/s] 161it [00:17, 9.36it/s] 162it [00:17, 9.36it/s] 163it [00:17, 9.40it/s] 164it [00:17, 9.44it/s] 165it [00:17, 9.02it/s] 166it [00:17, 9.13it/s] 167it [00:17, 9.28it/s] 168it [00:17, 9.25it/s] 169it [00:18, 9.29it/s] 170it [00:18, 9.35it/s] 171it [00:18, 8.85it/s] 172it [00:18, 9.16it/s] 173it [00:18, 9.38it/s] 174it [00:18, 9.52it/s] 176it [00:18, 9.22it/s] 178it [00:19, 9.55it/s] 180it [00:19, 9.73it/s] 181it [00:19, 9.35it/s] 182it [00:19, 9.46it/s] 183it [00:19, 9.56it/s] 185it [00:19, 9.77it/s] 187it [00:19, 9.86it/s] 189it [00:20, 9.90it/s] 190it [00:20, 9.92it/s] 192it [00:20, 9.98it/s] 194it [00:20, 10.01it/s] 195it [00:20, 9.62it/s] 196it [00:20, 9.37it/s] +2025-05-26 04:10:53,824 - INFO - Epoch: 54, Objective: tensor([5742.4844], device='cuda:0', grad_fn=), Loss: 0.04035816341638565, KL/n: 68.60377502441406 + 0it [00:00, ?it/s]2025-05-26 04:10:54,095 - INFO - [Epoch 055 | Batch 0000] IWAE-loss 4954.8682 | mean log_px -0.0264 | KL -3363.76 + 1it [00:00, 4.78it/s] 3it [00:00, 7.84it/s] 5it [00:00, 8.89it/s] 6it [00:00, 9.16it/s] 7it [00:00, 8.89it/s] 9it [00:01, 9.40it/s] 10it [00:01, 9.50it/s] 11it [00:01, 9.14it/s] 13it [00:01, 9.51it/s] 14it [00:01, 9.61it/s] 15it [00:01, 9.21it/s] 16it [00:01, 9.32it/s] 18it [00:01, 9.29it/s] 20it [00:02, 9.59it/s] 22it [00:02, 9.78it/s] 23it [00:02, 9.43it/s] 25it [00:02, 9.67it/s] 27it [00:02, 9.45it/s] 28it [00:03, 9.51it/s] 29it [00:03, 9.55it/s] 30it [00:03, 9.58it/s] 31it [00:03, 9.60it/s] 32it [00:03, 9.24it/s] 33it [00:03, 9.40it/s] 34it [00:03, 9.55it/s] 35it [00:03, 9.23it/s] 37it [00:03, 9.61it/s] 39it [00:04, 9.48it/s] 41it [00:04, 9.69it/s] 42it [00:04, 9.75it/s] 44it [00:04, 9.89it/s] 46it [00:04, 9.59it/s] 48it [00:05, 9.74it/s] 50it [00:05, 9.82it/s]2025-05-26 04:10:59,314 - INFO - [Epoch 055 | Batch 0050] IWAE-loss 5218.8096 | mean log_px -0.0286 | KL -3357.67 + 51it [00:05, 9.49it/s] 52it [00:05, 9.56it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.56it/s] 55it [00:05, 9.63it/s] 56it [00:05, 9.63it/s] 57it [00:06, 9.61it/s] 58it [00:06, 9.11it/s] 59it [00:06, 9.29it/s] 60it [00:06, 9.38it/s] 61it [00:06, 9.41it/s] 62it [00:06, 9.04it/s] 63it [00:06, 9.25it/s] 64it [00:06, 9.43it/s] 65it [00:06, 9.51it/s] 66it [00:07, 9.58it/s] 67it [00:07, 9.69it/s] 68it [00:07, 9.72it/s] 69it [00:07, 9.20it/s] 70it [00:07, 9.02it/s] 71it [00:07, 9.07it/s] 72it [00:07, 9.13it/s] 73it [00:07, 8.79it/s] 74it [00:07, 9.05it/s] 75it [00:07, 9.23it/s] 76it [00:08, 9.26it/s] 77it [00:08, 9.45it/s] 78it [00:08, 9.57it/s] 79it [00:08, 8.97it/s] 80it [00:08, 9.10it/s] 81it [00:08, 9.23it/s] 82it [00:08, 9.32it/s] 83it [00:08, 9.43it/s] 84it [00:08, 9.49it/s] 85it [00:09, 9.50it/s] 86it [00:09, 9.50it/s] 87it [00:09, 9.56it/s] 88it [00:09, 9.59it/s] 89it [00:09, 9.13it/s] 90it [00:09, 9.30it/s] 91it [00:09, 9.42it/s] 92it [00:09, 9.49it/s] 93it [00:09, 9.07it/s] 94it [00:10, 9.29it/s] 95it [00:10, 9.39it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.18it/s] 98it [00:10, 9.36it/s] 99it [00:10, 9.51it/s] 100it [00:10, 9.61it/s]2025-05-26 04:11:04,673 - INFO - [Epoch 055 | Batch 0100] IWAE-loss 5689.7671 | mean log_px -0.0453 | KL -3352.47 + 101it [00:10, 9.63it/s] 102it [00:10, 9.22it/s] 103it [00:10, 9.40it/s] 104it [00:11, 9.53it/s] 105it [00:11, 9.03it/s] 106it [00:11, 9.22it/s] 107it [00:11, 9.40it/s] 108it [00:11, 9.51it/s] 109it [00:11, 9.58it/s] 110it [00:11, 9.65it/s] 111it [00:11, 9.72it/s] 112it [00:11, 9.13it/s] 113it [00:12, 9.30it/s] 114it [00:12, 9.45it/s] 115it [00:12, 9.56it/s] 116it [00:12, 9.64it/s] 117it [00:12, 9.69it/s] 118it [00:12, 9.72it/s] 119it [00:12, 9.75it/s] 120it [00:12, 9.16it/s] 121it [00:12, 9.36it/s] 122it [00:12, 9.50it/s] 123it [00:13, 9.61it/s] 124it [00:13, 9.20it/s] 125it [00:13, 9.37it/s] 126it [00:13, 9.50it/s] 127it [00:13, 9.13it/s] 128it [00:13, 9.33it/s] 129it [00:13, 9.46it/s] 130it [00:13, 9.57it/s] 131it [00:13, 9.66it/s] 132it [00:14, 9.10it/s] 133it [00:14, 9.31it/s] 134it [00:14, 9.46it/s] 135it [00:14, 9.53it/s] 136it [00:14, 9.64it/s] 137it [00:14, 9.69it/s] 138it [00:14, 9.73it/s] 139it [00:14, 9.78it/s] 140it [00:14, 9.78it/s] 141it [00:14, 9.76it/s] 142it [00:15, 9.78it/s] 143it [00:15, 9.81it/s] 144it [00:15, 9.81it/s] 145it [00:15, 9.83it/s] 146it [00:15, 9.79it/s] 147it [00:15, 9.80it/s] 148it [00:15, 9.78it/s] 149it [00:15, 9.31it/s] 150it [00:15, 9.48it/s]2025-05-26 04:11:09,929 - INFO - [Epoch 055 | Batch 0150] IWAE-loss 5461.5342 | mean log_px -0.0355 | KL -3352.60 + 151it [00:16, 9.56it/s] 152it [00:16, 9.61it/s] 153it [00:16, 9.47it/s] 154it [00:16, 9.11it/s] 155it [00:16, 9.34it/s] 156it [00:16, 9.46it/s] 157it [00:16, 9.54it/s] 158it [00:16, 9.60it/s] 159it [00:16, 9.68it/s] 160it [00:16, 9.70it/s] 161it [00:17, 9.71it/s] 162it [00:17, 9.73it/s] 163it [00:17, 9.76it/s] 164it [00:17, 9.74it/s] 165it [00:17, 9.76it/s] 166it [00:17, 9.16it/s] 167it [00:17, 9.37it/s] 168it [00:17, 9.49it/s] 169it [00:17, 9.60it/s] 170it [00:18, 9.06it/s] 171it [00:18, 9.26it/s] 172it [00:18, 9.42it/s] 173it [00:18, 9.54it/s] 174it [00:18, 9.62it/s] 175it [00:18, 9.70it/s] 176it [00:18, 9.22it/s] 177it [00:18, 9.38it/s] 178it [00:18, 9.49it/s] 179it [00:18, 9.60it/s] 180it [00:19, 9.68it/s] 181it [00:19, 9.23it/s] 182it [00:19, 9.41it/s] 183it [00:19, 9.53it/s] 184it [00:19, 9.62it/s] 185it [00:19, 9.02it/s] 186it [00:19, 9.13it/s] 187it [00:19, 9.31it/s] 188it [00:19, 9.41it/s] 189it [00:20, 8.90it/s] 190it [00:20, 9.05it/s] 191it [00:20, 9.24it/s] 192it [00:20, 9.20it/s] 193it [00:20, 9.13it/s] 194it [00:20, 8.54it/s] 195it [00:20, 8.37it/s] 196it [00:20, 8.73it/s] 196it [00:20, 9.38it/s] +2025-05-26 04:11:14,860 - INFO - Epoch: 55, Objective: tensor([5165.6812], device='cuda:0', grad_fn=), Loss: 0.03494435176253319, KL/n: 68.38105010986328 + 0it [00:00, ?it/s]2025-05-26 04:11:15,329 - INFO - [Epoch 056 | Batch 0000] IWAE-loss 4359.5181 | mean log_px -0.0144 | KL -3346.51 + 1it [00:00, 2.67it/s] 2it [00:00, 4.53it/s] 3it [00:00, 5.77it/s] 4it [00:00, 6.87it/s] 5it [00:00, 7.58it/s] 6it [00:00, 8.18it/s] 7it [00:01, 8.50it/s] 8it [00:01, 8.78it/s] 9it [00:01, 9.06it/s] 10it [00:01, 9.16it/s] 11it [00:01, 9.31it/s] 12it [00:01, 9.44it/s] 13it [00:01, 9.50it/s] 14it [00:01, 9.35it/s] 15it [00:01, 9.36it/s] 16it [00:01, 9.48it/s] 17it [00:02, 9.47it/s] 18it [00:02, 8.88it/s] 19it [00:02, 9.11it/s] 20it [00:02, 9.21it/s] 21it [00:02, 8.77it/s] 22it [00:02, 9.02it/s] 23it [00:02, 9.20it/s] 24it [00:02, 9.31it/s] 25it [00:02, 8.76it/s] 26it [00:03, 8.95it/s] 27it [00:03, 9.12it/s] 28it [00:03, 8.75it/s] 29it [00:03, 9.01it/s] 30it [00:03, 8.96it/s] 31it [00:03, 8.73it/s] 32it [00:03, 8.39it/s] 33it [00:03, 8.78it/s] 34it [00:03, 9.07it/s] 35it [00:04, 9.28it/s] 36it [00:04, 8.86it/s] 37it [00:04, 9.13it/s] 38it [00:04, 9.32it/s] 39it [00:04, 9.45it/s] 40it [00:04, 8.97it/s] 41it [00:04, 9.19it/s] 42it [00:04, 9.37it/s] 43it [00:04, 9.53it/s] 44it [00:05, 9.02it/s] 45it [00:05, 9.09it/s] 46it [00:05, 8.60it/s] 47it [00:05, 8.75it/s] 48it [00:05, 9.03it/s] 49it [00:05, 9.24it/s] 50it [00:05, 8.86it/s]2025-05-26 04:11:20,814 - INFO - [Epoch 056 | Batch 0050] IWAE-loss 7072.4180 | mean log_px -0.0646 | KL -3344.14 + 51it [00:05, 9.11it/s] 52it [00:05, 9.31it/s] 53it [00:06, 9.45it/s] 54it [00:06, 9.00it/s] 55it [00:06, 9.24it/s] 56it [00:06, 9.36it/s] 57it [00:06, 9.45it/s] 58it [00:06, 8.93it/s] 59it [00:06, 9.16it/s] 60it [00:06, 9.32it/s] 61it [00:06, 9.46it/s] 62it [00:07, 9.00it/s] 63it [00:07, 9.23it/s] 64it [00:07, 9.38it/s] 65it [00:07, 9.48it/s] 66it [00:07, 9.01it/s] 67it [00:07, 9.23it/s] 68it [00:07, 9.37it/s] 69it [00:07, 9.49it/s] 70it [00:07, 9.00it/s] 71it [00:08, 9.24it/s] 72it [00:08, 9.36it/s] 73it [00:08, 9.49it/s] 74it [00:08, 8.97it/s] 75it [00:08, 9.19it/s] 76it [00:08, 9.34it/s] 77it [00:08, 9.42it/s] 78it [00:08, 8.92it/s] 79it [00:08, 9.11it/s] 80it [00:08, 9.24it/s] 81it [00:09, 9.37it/s] 82it [00:09, 8.91it/s] 83it [00:09, 8.88it/s] 84it [00:09, 9.06it/s] 85it [00:09, 9.19it/s] 86it [00:09, 9.17it/s] 87it [00:09, 8.74it/s] 88it [00:09, 8.89it/s] 89it [00:09, 9.04it/s] 90it [00:10, 9.13it/s] 91it [00:10, 8.73it/s] 92it [00:10, 8.93it/s] 93it [00:10, 9.13it/s] 94it [00:10, 8.78it/s] 95it [00:10, 9.07it/s] 96it [00:10, 9.30it/s] 97it [00:10, 9.48it/s] 98it [00:10, 9.04it/s] 99it [00:11, 9.29it/s] 100it [00:11, 9.46it/s]2025-05-26 04:11:26,247 - INFO - [Epoch 056 | Batch 0100] IWAE-loss 4897.2031 | mean log_px -0.0227 | KL -3343.42 + 101it [00:11, 9.59it/s] 102it [00:11, 9.11it/s] 103it [00:11, 9.36it/s] 104it [00:11, 9.51it/s] 105it [00:11, 9.63it/s] 106it [00:11, 9.13it/s] 107it [00:11, 9.36it/s] 108it [00:12, 9.54it/s] 109it [00:12, 9.66it/s] 110it [00:12, 9.15it/s] 111it [00:12, 9.37it/s] 112it [00:12, 9.52it/s] 113it [00:12, 9.66it/s] 114it [00:12, 9.14it/s] 116it [00:12, 9.52it/s] 118it [00:13, 9.30it/s] 119it [00:13, 9.44it/s] 120it [00:13, 9.54it/s] 121it [00:13, 9.65it/s] 122it [00:13, 9.19it/s] 123it [00:13, 9.39it/s] 124it [00:13, 9.53it/s] 125it [00:13, 9.64it/s] 126it [00:13, 9.17it/s] 127it [00:14, 9.39it/s] 128it [00:14, 9.53it/s] 129it [00:14, 9.65it/s] 130it [00:14, 9.14it/s] 131it [00:14, 9.37it/s] 133it [00:14, 9.68it/s] 134it [00:14, 9.75it/s] 136it [00:14, 9.86it/s] 138it [00:15, 9.71it/s] 139it [00:15, 9.76it/s] 140it [00:15, 9.81it/s] 141it [00:15, 9.32it/s] 142it [00:15, 9.39it/s] 143it [00:15, 9.44it/s] 144it [00:15, 9.44it/s] 145it [00:15, 9.02it/s] 146it [00:16, 9.23it/s] 147it [00:16, 9.40it/s] 148it [00:16, 9.52it/s] 149it [00:16, 9.05it/s] 150it [00:16, 9.25it/s]2025-05-26 04:11:31,547 - INFO - [Epoch 056 | Batch 0150] IWAE-loss 4315.8975 | mean log_px -0.0143 | KL -3342.45 + 151it [00:16, 9.36it/s] 152it [00:16, 9.47it/s] 153it [00:16, 9.01it/s] 154it [00:16, 9.25it/s] 155it [00:17, 9.43it/s] 156it [00:17, 9.56it/s] 157it [00:17, 9.10it/s] 158it [00:17, 9.33it/s] 159it [00:17, 9.51it/s] 160it [00:17, 9.64it/s] 161it [00:17, 9.15it/s] 162it [00:17, 9.36it/s] 163it [00:17, 9.53it/s] 164it [00:17, 9.66it/s] 165it [00:18, 9.16it/s] 166it [00:18, 9.38it/s] 167it [00:18, 9.00it/s] 168it [00:18, 9.27it/s] 170it [00:18, 9.60it/s] 171it [00:18, 9.22it/s] 172it [00:18, 9.39it/s] 174it [00:19, 9.65it/s] 175it [00:19, 9.26it/s] 176it [00:19, 9.41it/s] 177it [00:19, 9.54it/s] 178it [00:19, 9.66it/s] 179it [00:19, 9.18it/s] 180it [00:19, 9.37it/s] 182it [00:19, 9.65it/s] 184it [00:20, 9.80it/s] 186it [00:20, 9.57it/s] 188it [00:20, 9.71it/s] 190it [00:20, 9.47it/s] 192it [00:20, 9.64it/s] 193it [00:21, 9.70it/s] 194it [00:21, 9.41it/s] 195it [00:21, 8.99it/s] 196it [00:21, 9.14it/s] +2025-05-26 04:11:36,431 - INFO - Epoch: 56, Objective: tensor([5050.2954], device='cuda:0', grad_fn=), Loss: 0.02728617750108242, KL/n: 68.18730926513672 + 0it [00:00, ?it/s]2025-05-26 04:11:36,710 - INFO - [Epoch 057 | Batch 0000] IWAE-loss 4560.9824 | mean log_px -0.0185 | KL -3340.02 + 1it [00:00, 4.75it/s] 2it [00:00, 6.81it/s] 3it [00:00, 7.96it/s] 4it [00:00, 8.03it/s] 5it [00:00, 8.57it/s] 6it [00:00, 8.40it/s] 7it [00:00, 8.82it/s] 8it [00:00, 9.16it/s] 9it [00:01, 9.33it/s] 10it [00:01, 9.52it/s] 12it [00:01, 9.75it/s] 13it [00:01, 9.39it/s] 14it [00:01, 9.53it/s] 16it [00:01, 9.38it/s] 18it [00:02, 9.61it/s] 20it [00:02, 9.75it/s] 22it [00:02, 9.84it/s] 24it [00:02, 9.90it/s] 26it [00:02, 9.66it/s] 27it [00:02, 9.72it/s] 28it [00:03, 9.77it/s] 30it [00:03, 9.86it/s] 32it [00:03, 9.91it/s] 34it [00:03, 9.66it/s] 36it [00:03, 9.77it/s] 37it [00:03, 9.43it/s] 38it [00:04, 9.53it/s] 40it [00:04, 9.69it/s] 42it [00:04, 9.80it/s] 44it [00:04, 9.87it/s] 46it [00:04, 9.57it/s] 48it [00:05, 9.71it/s] 50it [00:05, 9.81it/s]2025-05-26 04:11:41,908 - INFO - [Epoch 057 | Batch 0050] IWAE-loss 4015.7031 | mean log_px -0.0109 | KL -3334.84 + 51it [00:05, 9.45it/s] 52it [00:05, 9.55it/s] 53it [00:05, 9.65it/s] 54it [00:05, 9.72it/s] 55it [00:05, 9.35it/s] 56it [00:05, 9.45it/s] 57it [00:06, 9.57it/s] 58it [00:06, 9.63it/s] 59it [00:06, 9.72it/s] 60it [00:06, 9.78it/s] 61it [00:06, 9.22it/s] 62it [00:06, 9.40it/s] 63it [00:06, 9.46it/s] 64it [00:06, 9.57it/s] 65it [00:06, 9.05it/s] 66it [00:06, 9.27it/s] 67it [00:07, 9.47it/s] 68it [00:07, 9.59it/s] 69it [00:07, 9.68it/s] 70it [00:07, 9.73it/s] 72it [00:07, 9.86it/s] 74it [00:07, 9.92it/s] 75it [00:07, 9.46it/s] 76it [00:08, 9.58it/s] 77it [00:08, 9.68it/s] 78it [00:08, 9.75it/s] 79it [00:08, 9.81it/s] 80it [00:08, 9.86it/s] 81it [00:08, 9.40it/s] 82it [00:08, 9.55it/s] 84it [00:08, 9.29it/s] 86it [00:09, 9.56it/s] 87it [00:09, 9.49it/s] 88it [00:09, 9.14it/s] 89it [00:09, 9.17it/s] 90it [00:09, 9.29it/s] 91it [00:09, 9.39it/s] 92it [00:09, 9.49it/s] 93it [00:09, 9.57it/s] 94it [00:09, 9.62it/s] 95it [00:10, 9.66it/s] 96it [00:10, 9.68it/s] 97it [00:10, 9.71it/s] 98it [00:10, 9.73it/s] 99it [00:10, 9.67it/s] 100it [00:10, 9.66it/s]2025-05-26 04:11:47,156 - INFO - [Epoch 057 | Batch 0100] IWAE-loss 4555.8833 | mean log_px -0.0193 | KL -3332.19 + 101it [00:10, 9.14it/s] 102it [00:10, 9.38it/s] 103it [00:10, 9.55it/s] 104it [00:10, 9.55it/s] 105it [00:11, 9.59it/s] 106it [00:11, 9.69it/s] 108it [00:11, 9.83it/s] 110it [00:11, 9.91it/s] 111it [00:11, 9.93it/s] 112it [00:11, 9.88it/s] 113it [00:11, 9.91it/s] 114it [00:11, 9.37it/s] 116it [00:12, 9.63it/s] 117it [00:12, 9.71it/s] 118it [00:12, 9.77it/s] 120it [00:12, 9.41it/s] 121it [00:12, 9.53it/s] 122it [00:12, 9.63it/s] 123it [00:12, 9.69it/s] 124it [00:13, 9.63it/s] 125it [00:13, 9.69it/s] 126it [00:13, 9.76it/s] 127it [00:13, 9.78it/s] 128it [00:13, 9.82it/s] 129it [00:13, 9.86it/s] 130it [00:13, 9.29it/s] 131it [00:13, 9.44it/s] 132it [00:13, 9.51it/s] 133it [00:13, 9.62it/s] 134it [00:14, 9.08it/s] 135it [00:14, 9.30it/s] 136it [00:14, 9.42it/s] 137it [00:14, 9.53it/s] 138it [00:14, 9.04it/s] 139it [00:14, 9.27it/s] 140it [00:14, 9.45it/s] 141it [00:14, 9.00it/s] 142it [00:14, 9.24it/s] 143it [00:15, 9.32it/s] 144it [00:15, 9.46it/s] 145it [00:15, 9.12it/s] 146it [00:15, 9.31it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.57it/s] 149it [00:15, 9.65it/s] 150it [00:15, 9.69it/s]2025-05-26 04:11:52,397 - INFO - [Epoch 057 | Batch 0150] IWAE-loss 4984.7964 | mean log_px -0.0261 | KL -3333.72 + 151it [00:15, 9.14it/s] 152it [00:15, 9.34it/s] 153it [00:16, 9.49it/s] 154it [00:16, 9.60it/s] 155it [00:16, 9.08it/s] 156it [00:16, 9.31it/s] 157it [00:16, 9.49it/s] 158it [00:16, 9.62it/s] 159it [00:16, 9.72it/s] 160it [00:16, 9.79it/s] 161it [00:16, 9.20it/s] 162it [00:17, 9.37it/s] 164it [00:17, 9.66it/s] 165it [00:17, 9.74it/s] 166it [00:17, 9.25it/s] 167it [00:17, 9.44it/s] 168it [00:17, 9.58it/s] 169it [00:17, 9.69it/s] 170it [00:17, 9.78it/s] 171it [00:17, 9.83it/s] 172it [00:18, 9.86it/s] 174it [00:18, 9.93it/s] 175it [00:18, 9.94it/s] 176it [00:18, 9.91it/s] 177it [00:18, 9.93it/s] 178it [00:18, 9.35it/s] 179it [00:18, 9.52it/s] 180it [00:18, 9.61it/s] 181it [00:19, 9.72it/s] 182it [00:19, 9.78it/s] 184it [00:19, 9.89it/s] 185it [00:19, 9.90it/s] 186it [00:19, 9.92it/s] 187it [00:19, 9.94it/s] 188it [00:19, 9.94it/s] 190it [00:19, 9.97it/s] 191it [00:20, 9.98it/s] 192it [00:20, 9.97it/s] 193it [00:20, 9.40it/s] 194it [00:20, 9.54it/s] 195it [00:20, 9.24it/s] 196it [00:20, 9.51it/s] +2025-05-26 04:11:57,167 - INFO - Epoch: 57, Objective: tensor([5603.3149], device='cuda:0', grad_fn=), Loss: 0.03557281568646431, KL/n: 67.98454284667969 + 0it [00:00, ?it/s]2025-05-26 04:11:57,613 - INFO - [Epoch 058 | Batch 0000] IWAE-loss 4603.7197 | mean log_px -0.0217 | KL -3329.28 + 1it [00:00, 4.95it/s] 2it [00:00, 7.00it/s] 4it [00:00, 8.65it/s] 6it [00:00, 9.24it/s] 7it [00:00, 9.42it/s] 8it [00:00, 9.55it/s] 10it [00:01, 9.24it/s] 12it [00:01, 9.50it/s] 13it [00:01, 9.60it/s] 14it [00:01, 9.64it/s] 15it [00:01, 9.12it/s] 16it [00:01, 9.22it/s] 17it [00:01, 9.41it/s] 18it [00:01, 9.54it/s] 19it [00:02, 9.66it/s] 20it [00:02, 9.16it/s] 21it [00:02, 9.39it/s] 22it [00:02, 9.42it/s] 23it [00:02, 9.52it/s] 24it [00:02, 9.63it/s] 25it [00:02, 9.69it/s] 26it [00:02, 9.77it/s] 28it [00:03, 9.87it/s] 30it [00:03, 9.93it/s] 31it [00:03, 9.91it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.63it/s] 34it [00:03, 9.71it/s] 36it [00:03, 9.83it/s] 37it [00:03, 9.32it/s] 38it [00:04, 9.46it/s] 39it [00:04, 9.59it/s] 40it [00:04, 9.69it/s] 41it [00:04, 9.77it/s] 42it [00:04, 9.81it/s] 43it [00:04, 9.86it/s] 44it [00:04, 9.88it/s] 45it [00:04, 9.42it/s] 46it [00:04, 9.56it/s] 47it [00:04, 9.68it/s] 48it [00:05, 9.76it/s] 49it [00:05, 9.82it/s] 50it [00:05, 9.87it/s]2025-05-26 04:12:02,809 - INFO - [Epoch 058 | Batch 0050] IWAE-loss 4924.8784 | mean log_px -0.0293 | KL -3323.80 + 51it [00:05, 9.26it/s] 52it [00:05, 9.44it/s] 53it [00:05, 9.58it/s] 54it [00:05, 9.69it/s] 55it [00:05, 9.78it/s] 56it [00:05, 9.82it/s] 57it [00:06, 9.25it/s] 58it [00:06, 9.45it/s] 59it [00:06, 9.58it/s] 60it [00:06, 9.68it/s] 61it [00:06, 9.15it/s] 62it [00:06, 9.37it/s] 63it [00:06, 9.55it/s] 64it [00:06, 9.67it/s] 65it [00:06, 9.75it/s] 66it [00:06, 9.16it/s] 67it [00:07, 9.38it/s] 68it [00:07, 9.51it/s] 69it [00:07, 9.64it/s] 70it [00:07, 9.13it/s] 71it [00:07, 9.35it/s] 72it [00:07, 9.51it/s] 73it [00:07, 9.62it/s] 74it [00:07, 9.11it/s] 75it [00:07, 9.30it/s] 76it [00:08, 9.41it/s] 77it [00:08, 9.56it/s] 78it [00:08, 9.08it/s] 79it [00:08, 9.31it/s] 80it [00:08, 9.47it/s] 81it [00:08, 9.58it/s] 82it [00:08, 9.68it/s] 83it [00:08, 9.77it/s] 84it [00:08, 9.83it/s] 86it [00:09, 9.91it/s] 87it [00:09, 9.92it/s] 88it [00:09, 9.93it/s] 89it [00:09, 9.94it/s] 90it [00:09, 9.94it/s] 91it [00:09, 9.96it/s] 92it [00:09, 9.96it/s] 93it [00:09, 9.97it/s] 94it [00:09, 9.46it/s] 95it [00:09, 9.58it/s] 96it [00:10, 9.69it/s] 97it [00:10, 9.75it/s] 98it [00:10, 9.72it/s] 99it [00:10, 9.75it/s] 100it [00:10, 9.76it/s]2025-05-26 04:12:08,030 - INFO - [Epoch 058 | Batch 0100] IWAE-loss 4599.8813 | mean log_px -0.0212 | KL -3328.67 + 101it [00:10, 9.15it/s] 102it [00:10, 9.27it/s] 103it [00:10, 9.42it/s] 104it [00:10, 9.57it/s] 105it [00:11, 9.17it/s] 106it [00:11, 9.38it/s] 107it [00:11, 9.51it/s] 108it [00:11, 9.05it/s] 109it [00:11, 9.31it/s] 110it [00:11, 9.47it/s] 111it [00:11, 9.62it/s] 112it [00:11, 9.70it/s] 113it [00:11, 9.77it/s] 114it [00:11, 9.33it/s] 115it [00:12, 9.38it/s] 116it [00:12, 9.49it/s] 117it [00:12, 9.49it/s] 118it [00:12, 9.55it/s] 119it [00:12, 9.03it/s] 120it [00:12, 9.23it/s] 121it [00:12, 9.35it/s] 122it [00:12, 9.39it/s] 123it [00:12, 8.85it/s] 124it [00:13, 9.11it/s] 125it [00:13, 9.31it/s] 126it [00:13, 9.44it/s] 127it [00:13, 9.55it/s] 128it [00:13, 9.60it/s] 129it [00:13, 9.06it/s] 130it [00:13, 9.26it/s] 131it [00:13, 9.42it/s] 132it [00:13, 9.52it/s] 133it [00:14, 9.10it/s] 134it [00:14, 9.27it/s] 135it [00:14, 9.37it/s] 136it [00:14, 9.45it/s] 137it [00:14, 9.48it/s] 138it [00:14, 9.52it/s] 139it [00:14, 8.93it/s] 140it [00:14, 9.11it/s] 141it [00:14, 9.26it/s] 142it [00:14, 9.31it/s] 143it [00:15, 9.35it/s] 144it [00:15, 9.36it/s] 145it [00:15, 9.38it/s] 146it [00:15, 9.42it/s] 147it [00:15, 9.41it/s] 148it [00:15, 8.92it/s] 149it [00:15, 9.14it/s] 150it [00:15, 9.23it/s]2025-05-26 04:12:13,404 - INFO - [Epoch 058 | Batch 0150] IWAE-loss 4261.2881 | mean log_px -0.0143 | KL -3324.48 + 151it [00:15, 9.30it/s] 152it [00:16, 9.36it/s] 153it [00:16, 9.41it/s] 154it [00:16, 9.46it/s] 155it [00:16, 9.49it/s] 156it [00:16, 9.54it/s] 157it [00:16, 9.60it/s] 158it [00:16, 8.99it/s] 159it [00:16, 9.09it/s] 160it [00:16, 9.15it/s] 161it [00:17, 9.27it/s] 162it [00:17, 9.18it/s] 163it [00:17, 9.28it/s] 164it [00:17, 9.34it/s] 165it [00:17, 8.82it/s] 166it [00:17, 9.01it/s] 167it [00:17, 9.15it/s] 168it [00:17, 9.22it/s] 169it [00:17, 8.88it/s] 170it [00:18, 9.06it/s] 171it [00:18, 9.20it/s] 172it [00:18, 8.82it/s] 173it [00:18, 8.66it/s] 174it [00:18, 8.49it/s] 175it [00:18, 8.47it/s] 176it [00:18, 8.71it/s] 177it [00:18, 8.58it/s] 178it [00:18, 8.86it/s] 179it [00:19, 9.09it/s] 180it [00:19, 8.68it/s] 181it [00:19, 8.92it/s] 182it [00:19, 9.08it/s] 183it [00:19, 8.99it/s] 184it [00:19, 8.56it/s] 185it [00:19, 8.77it/s] 186it [00:19, 9.02it/s] 187it [00:19, 9.16it/s] 188it [00:20, 9.29it/s] 189it [00:20, 9.38it/s] 190it [00:20, 9.45it/s] 191it [00:20, 9.51it/s] 192it [00:20, 9.50it/s] 193it [00:20, 8.92it/s] 194it [00:20, 9.11it/s] 195it [00:20, 8.65it/s] 196it [00:20, 8.87it/s] 196it [00:21, 9.33it/s] +2025-05-26 04:12:18,493 - INFO - Epoch: 58, Objective: tensor([4525.3076], device='cuda:0', grad_fn=), Loss: 0.021634532138705254, KL/n: 67.80258178710938 + 0it [00:00, ?it/s]2025-05-26 04:12:18,769 - INFO - [Epoch 059 | Batch 0000] IWAE-loss 4513.4170 | mean log_px -0.0270 | KL -3325.71 + 1it [00:00, 5.38it/s] 2it [00:00, 7.27it/s] 3it [00:00, 8.11it/s] 4it [00:00, 8.63it/s] 5it [00:00, 9.02it/s] 6it [00:00, 9.22it/s] 7it [00:00, 9.39it/s] 8it [00:00, 8.60it/s] 9it [00:01, 8.91it/s] 10it [00:01, 9.09it/s] 11it [00:01, 9.31it/s] 12it [00:01, 9.38it/s] 13it [00:01, 8.93it/s] 14it [00:01, 9.11it/s] 15it [00:01, 9.19it/s] 16it [00:01, 9.33it/s] 17it [00:01, 9.33it/s] 18it [00:02, 9.37it/s] 19it [00:02, 9.00it/s] 20it [00:02, 9.18it/s] 21it [00:02, 9.25it/s] 22it [00:02, 9.29it/s] 23it [00:02, 9.32it/s] 24it [00:02, 9.35it/s] 25it [00:02, 9.39it/s] 26it [00:02, 9.45it/s] 27it [00:02, 9.49it/s] 28it [00:03, 9.47it/s] 29it [00:03, 8.89it/s] 30it [00:03, 9.13it/s] 31it [00:03, 9.34it/s] 32it [00:03, 9.45it/s] 33it [00:03, 9.51it/s] 34it [00:03, 9.57it/s] 35it [00:03, 9.59it/s] 36it [00:03, 9.58it/s] 37it [00:04, 9.60it/s] 38it [00:04, 9.63it/s] 39it [00:04, 9.66it/s] 40it [00:04, 9.68it/s] 41it [00:04, 9.74it/s] 42it [00:04, 9.13it/s] 43it [00:04, 9.30it/s] 44it [00:04, 9.37it/s] 45it [00:04, 9.45it/s] 46it [00:04, 9.51it/s] 47it [00:05, 9.53it/s] 48it [00:05, 9.56it/s] 49it [00:05, 9.55it/s] 50it [00:05, 9.54it/s]2025-05-26 04:12:24,095 - INFO - [Epoch 059 | Batch 0050] IWAE-loss 4204.3833 | mean log_px -0.0140 | KL -3318.27 + 51it [00:05, 9.48it/s] 52it [00:05, 9.11it/s] 53it [00:05, 9.21it/s] 54it [00:05, 9.27it/s] 55it [00:05, 9.36it/s] 56it [00:06, 9.39it/s] 57it [00:06, 9.51it/s] 58it [00:06, 9.58it/s] 59it [00:06, 9.60it/s] 60it [00:06, 9.51it/s] 61it [00:06, 9.56it/s] 62it [00:06, 9.55it/s] 63it [00:06, 9.54it/s] 64it [00:06, 9.46it/s] 65it [00:06, 9.50it/s] 66it [00:07, 9.55it/s] 67it [00:07, 9.58it/s] 68it [00:07, 9.57it/s] 69it [00:07, 9.61it/s] 70it [00:07, 9.56it/s] 71it [00:07, 9.04it/s] 72it [00:07, 9.14it/s] 73it [00:07, 9.27it/s] 74it [00:07, 9.37it/s] 75it [00:08, 9.43it/s] 76it [00:08, 9.48it/s] 77it [00:08, 9.45it/s] 78it [00:08, 9.52it/s] 79it [00:08, 9.57it/s] 80it [00:08, 9.58it/s] 81it [00:08, 9.24it/s] 82it [00:08, 9.28it/s] 83it [00:08, 9.26it/s] 84it [00:09, 8.61it/s] 85it [00:09, 8.78it/s] 86it [00:09, 8.91it/s] 87it [00:09, 9.04it/s] 88it [00:09, 9.05it/s] 89it [00:09, 9.11it/s] 90it [00:09, 9.15it/s] 91it [00:09, 8.84it/s] 92it [00:09, 9.13it/s] 93it [00:10, 9.35it/s] 94it [00:10, 9.50it/s] 95it [00:10, 9.62it/s] 96it [00:10, 9.70it/s] 97it [00:10, 9.71it/s] 98it [00:10, 9.37it/s] 99it [00:10, 9.53it/s] 100it [00:10, 9.63it/s]2025-05-26 04:12:29,436 - INFO - [Epoch 059 | Batch 0100] IWAE-loss 4880.2090 | mean log_px -0.0276 | KL -3318.33 + 101it [00:10, 9.68it/s] 102it [00:10, 9.74it/s] 103it [00:11, 9.79it/s] 104it [00:11, 9.83it/s] 105it [00:11, 9.86it/s] 106it [00:11, 9.88it/s] 107it [00:11, 9.90it/s] 108it [00:11, 9.55it/s] 109it [00:11, 9.65it/s] 110it [00:11, 9.71it/s] 111it [00:11, 9.78it/s] 112it [00:11, 9.81it/s] 113it [00:12, 9.84it/s] 114it [00:12, 9.84it/s] 115it [00:12, 9.87it/s] 116it [00:12, 9.87it/s] 117it [00:12, 9.89it/s] 118it [00:12, 9.89it/s] 119it [00:12, 9.91it/s] 120it [00:12, 9.92it/s] 121it [00:12, 9.32it/s] 122it [00:13, 9.48it/s] 123it [00:13, 9.60it/s] 124it [00:13, 9.69it/s] 125it [00:13, 9.35it/s] 126it [00:13, 9.50it/s] 127it [00:13, 9.62it/s] 128it [00:13, 9.71it/s] 129it [00:13, 9.76it/s] 130it [00:13, 9.80it/s] 131it [00:13, 9.24it/s] 132it [00:14, 9.42it/s] 133it [00:14, 9.56it/s] 134it [00:14, 9.67it/s] 135it [00:14, 9.74it/s] 136it [00:14, 9.77it/s] 137it [00:14, 9.81it/s] 138it [00:14, 9.74it/s] 139it [00:14, 9.73it/s] 140it [00:14, 9.80it/s] 141it [00:14, 9.84it/s] 142it [00:15, 9.85it/s] 143it [00:15, 9.88it/s] 144it [00:15, 9.89it/s] 145it [00:15, 9.90it/s] 146it [00:15, 9.91it/s] 147it [00:15, 9.89it/s] 148it [00:15, 9.30it/s] 149it [00:15, 9.49it/s] 150it [00:15, 9.60it/s]2025-05-26 04:12:34,581 - INFO - [Epoch 059 | Batch 0150] IWAE-loss 4119.4390 | mean log_px -0.0125 | KL -3316.20 + 151it [00:15, 9.65it/s] 152it [00:16, 9.68it/s] 153it [00:16, 9.73it/s] 154it [00:16, 9.16it/s] 155it [00:16, 9.38it/s] 156it [00:16, 9.51it/s] 157it [00:16, 9.62it/s] 158it [00:16, 9.33it/s] 159it [00:16, 9.49it/s] 160it [00:16, 9.62it/s] 161it [00:17, 9.71it/s] 162it [00:17, 9.75it/s] 163it [00:17, 9.77it/s] 164it [00:17, 9.81it/s] 165it [00:17, 9.82it/s] 166it [00:17, 9.85it/s] 167it [00:17, 9.86it/s] 168it [00:17, 9.85it/s] 169it [00:17, 9.29it/s] 170it [00:17, 9.47it/s] 171it [00:18, 9.59it/s] 172it [00:18, 9.68it/s] 173it [00:18, 9.75it/s] 174it [00:18, 9.79it/s] 175it [00:18, 9.85it/s] 176it [00:18, 9.85it/s] 177it [00:18, 9.87it/s] 178it [00:18, 9.87it/s] 179it [00:18, 9.90it/s] 180it [00:18, 9.90it/s] 181it [00:19, 9.90it/s] 182it [00:19, 9.89it/s] 183it [00:19, 9.89it/s] 184it [00:19, 9.90it/s] 185it [00:19, 9.91it/s] 186it [00:19, 9.89it/s] 187it [00:19, 9.90it/s] 188it [00:19, 9.89it/s] 189it [00:19, 9.91it/s] 190it [00:19, 9.89it/s] 191it [00:20, 9.89it/s] 192it [00:20, 9.89it/s] 193it [00:20, 9.92it/s] 194it [00:20, 9.91it/s] 195it [00:20, 9.27it/s] 196it [00:20, 9.48it/s] +2025-05-26 04:12:39,311 - INFO - Epoch: 59, Objective: tensor([5065.8369], device='cuda:0', grad_fn=), Loss: 0.029969044029712677, KL/n: 67.60353088378906 + 0it [00:00, ?it/s]2025-05-26 04:12:39,751 - INFO - [Epoch 060 | Batch 0000] IWAE-loss 5187.5234 | mean log_px -0.0315 | KL -3310.47 + 1it [00:00, 5.39it/s] 2it [00:00, 7.37it/s] 3it [00:00, 8.32it/s] 4it [00:00, 8.86it/s] 5it [00:00, 8.58it/s] 6it [00:00, 8.98it/s] 7it [00:00, 9.20it/s] 8it [00:00, 8.95it/s] 9it [00:01, 9.20it/s] 10it [00:01, 9.36it/s] 11it [00:01, 9.45it/s] 12it [00:01, 9.53it/s] 13it [00:01, 9.62it/s] 14it [00:01, 9.66it/s] 15it [00:01, 9.70it/s] 16it [00:01, 9.73it/s] 17it [00:01, 9.78it/s] 18it [00:01, 9.81it/s] 19it [00:02, 9.26it/s] 20it [00:02, 9.43it/s] 21it [00:02, 9.52it/s] 22it [00:02, 9.62it/s] 23it [00:02, 9.68it/s] 24it [00:02, 9.75it/s] 25it [00:02, 9.37it/s] 26it [00:02, 9.52it/s] 27it [00:02, 9.18it/s] 28it [00:03, 9.37it/s] 29it [00:03, 9.53it/s] 30it [00:03, 9.62it/s] 31it [00:03, 9.72it/s] 32it [00:03, 9.76it/s] 33it [00:03, 9.21it/s] 34it [00:03, 9.40it/s] 35it [00:03, 9.49it/s] 36it [00:03, 9.60it/s] 37it [00:03, 8.98it/s] 38it [00:04, 9.25it/s] 39it [00:04, 9.46it/s] 40it [00:04, 9.59it/s] 41it [00:04, 9.66it/s] 42it [00:04, 9.72it/s] 43it [00:04, 9.77it/s] 44it [00:04, 9.79it/s] 45it [00:04, 9.82it/s] 46it [00:04, 9.81it/s] 47it [00:05, 9.59it/s] 48it [00:05, 9.66it/s] 49it [00:05, 9.68it/s] 50it [00:05, 9.72it/s]2025-05-26 04:12:45,008 - INFO - [Epoch 060 | Batch 0050] IWAE-loss 4562.0859 | mean log_px -0.0215 | KL -3308.93 + 51it [00:05, 9.69it/s] 52it [00:05, 9.72it/s] 53it [00:05, 9.77it/s] 54it [00:05, 9.40it/s] 55it [00:05, 9.55it/s] 56it [00:05, 9.56it/s] 57it [00:06, 9.66it/s] 58it [00:06, 9.73it/s] 59it [00:06, 9.77it/s] 60it [00:06, 9.78it/s] 61it [00:06, 9.83it/s] 62it [00:06, 9.80it/s] 63it [00:06, 9.84it/s] 64it [00:06, 9.44it/s] 65it [00:06, 9.58it/s] 66it [00:06, 9.68it/s] 67it [00:07, 9.76it/s] 68it [00:07, 9.80it/s] 70it [00:07, 9.88it/s] 71it [00:07, 9.89it/s] 72it [00:07, 9.53it/s] 73it [00:07, 9.63it/s] 74it [00:07, 9.71it/s] 75it [00:07, 9.22it/s] 76it [00:08, 9.41it/s] 77it [00:08, 9.55it/s] 78it [00:08, 9.65it/s] 79it [00:08, 9.72it/s] 80it [00:08, 9.75it/s] 81it [00:08, 9.78it/s] 82it [00:08, 9.80it/s] 83it [00:08, 9.19it/s] 84it [00:08, 9.20it/s] 85it [00:08, 8.99it/s] 86it [00:09, 8.84it/s] 87it [00:09, 9.13it/s] 88it [00:09, 9.34it/s] 89it [00:09, 9.51it/s] 90it [00:09, 9.62it/s] 91it [00:09, 9.71it/s] 92it [00:09, 9.76it/s] 93it [00:09, 9.81it/s] 94it [00:09, 9.26it/s] 95it [00:10, 9.44it/s] 96it [00:10, 9.54it/s] 97it [00:10, 9.63it/s] 98it [00:10, 9.71it/s] 99it [00:10, 9.78it/s] 100it [00:10, 9.81it/s]2025-05-26 04:12:50,218 - INFO - [Epoch 060 | Batch 0100] IWAE-loss 4293.2979 | mean log_px -0.0141 | KL -3304.83 + 101it [00:10, 9.41it/s] 102it [00:10, 9.53it/s] 103it [00:10, 9.65it/s] 104it [00:10, 9.71it/s] 105it [00:11, 9.78it/s] 106it [00:11, 9.23it/s] 107it [00:11, 9.41it/s] 108it [00:11, 9.55it/s] 109it [00:11, 9.60it/s] 110it [00:11, 9.13it/s] 111it [00:11, 9.36it/s] 112it [00:11, 9.51it/s] 113it [00:11, 9.63it/s] 114it [00:11, 9.70it/s] 115it [00:12, 9.75it/s] 116it [00:12, 9.79it/s] 117it [00:12, 9.82it/s] 118it [00:12, 9.83it/s] 119it [00:12, 9.87it/s] 120it [00:12, 9.28it/s] 121it [00:12, 9.45it/s] 122it [00:12, 9.58it/s] 123it [00:12, 9.66it/s] 124it [00:13, 9.73it/s] 125it [00:13, 9.79it/s] 126it [00:13, 9.84it/s] 127it [00:13, 9.86it/s] 128it [00:13, 9.79it/s] 129it [00:13, 9.83it/s] 130it [00:13, 9.85it/s] 131it [00:13, 9.86it/s] 132it [00:13, 9.87it/s] 133it [00:13, 9.88it/s] 134it [00:14, 9.88it/s] 135it [00:14, 9.89it/s] 136it [00:14, 9.89it/s] 137it [00:14, 9.91it/s] 138it [00:14, 9.91it/s] 139it [00:14, 9.92it/s] 140it [00:14, 9.91it/s] 141it [00:14, 9.49it/s] 142it [00:14, 9.60it/s] 143it [00:14, 9.66it/s] 144it [00:15, 9.73it/s] 145it [00:15, 9.78it/s] 146it [00:15, 9.81it/s] 147it [00:15, 9.81it/s] 148it [00:15, 9.80it/s] 149it [00:15, 9.82it/s] 150it [00:15, 9.84it/s]2025-05-26 04:12:55,372 - INFO - [Epoch 060 | Batch 0150] IWAE-loss 4515.0557 | mean log_px -0.0186 | KL -3300.35 + 151it [00:15, 9.84it/s] 152it [00:15, 9.25it/s] 153it [00:16, 9.39it/s] 154it [00:16, 9.52it/s] 155it [00:16, 9.63it/s] 156it [00:16, 9.72it/s] 157it [00:16, 9.75it/s] 158it [00:16, 9.17it/s] 159it [00:16, 9.38it/s] 160it [00:16, 9.53it/s] 161it [00:16, 9.65it/s] 162it [00:16, 9.72it/s] 163it [00:17, 9.78it/s] 164it [00:17, 9.81it/s] 165it [00:17, 9.85it/s] 166it [00:17, 9.87it/s] 167it [00:17, 9.88it/s] 168it [00:17, 9.89it/s] 169it [00:17, 9.89it/s] 170it [00:17, 9.86it/s] 171it [00:17, 9.27it/s] 172it [00:17, 9.45it/s] 173it [00:18, 9.59it/s] 174it [00:18, 9.66it/s] 175it [00:18, 9.74it/s] 176it [00:18, 9.79it/s] 177it [00:18, 9.83it/s] 178it [00:18, 9.84it/s] 179it [00:18, 9.86it/s] 180it [00:18, 9.87it/s] 181it [00:18, 9.89it/s] 182it [00:18, 9.89it/s] 183it [00:19, 9.91it/s] 184it [00:19, 9.91it/s] 185it [00:19, 9.32it/s] 186it [00:19, 9.44it/s] 187it [00:19, 9.57it/s] 188it [00:19, 9.61it/s] 189it [00:19, 9.66it/s] 190it [00:19, 9.72it/s] 191it [00:19, 9.75it/s] 192it [00:20, 9.73it/s] 193it [00:20, 9.71it/s] 194it [00:20, 9.76it/s] 195it [00:20, 9.21it/s] 196it [00:20, 9.55it/s] +2025-05-26 04:13:00,146 - INFO - Epoch: 60, Objective: tensor([4183.7256], device='cuda:0', grad_fn=), Loss: 0.01641184277832508, KL/n: 67.38818359375 + 0it [00:00, ?it/s]2025-05-26 04:13:00,427 - INFO - [Epoch 061 | Batch 0000] IWAE-loss 4341.6694 | mean log_px -0.0202 | KL -3302.52 + 1it [00:00, 4.66it/s] 2it [00:00, 6.73it/s] 3it [00:00, 7.86it/s] 4it [00:00, 7.93it/s] 5it [00:00, 8.49it/s] 6it [00:00, 8.87it/s] 7it [00:00, 9.16it/s] 8it [00:00, 8.82it/s] 9it [00:01, 9.10it/s] 10it [00:01, 9.27it/s] 11it [00:01, 9.35it/s] 12it [00:01, 8.96it/s] 13it [00:01, 9.20it/s] 14it [00:01, 9.36it/s] 15it [00:01, 8.96it/s] 16it [00:01, 9.19it/s] 17it [00:01, 9.37it/s] 18it [00:02, 8.97it/s] 19it [00:02, 9.22it/s] 20it [00:02, 9.39it/s] 21it [00:02, 8.93it/s] 22it [00:02, 9.18it/s] 23it [00:02, 9.35it/s] 24it [00:02, 9.46it/s] 25it [00:02, 9.05it/s] 26it [00:02, 9.26it/s] 27it [00:03, 9.43it/s] 28it [00:03, 9.01it/s] 29it [00:03, 9.22it/s] 30it [00:03, 9.38it/s] 31it [00:03, 8.99it/s] 32it [00:03, 9.22it/s] 33it [00:03, 9.39it/s] 34it [00:03, 8.99it/s] 35it [00:03, 9.22it/s] 36it [00:03, 9.39it/s] 37it [00:04, 9.01it/s] 38it [00:04, 9.20it/s] 39it [00:04, 9.36it/s] 40it [00:04, 8.71it/s] 41it [00:04, 8.98it/s] 42it [00:04, 9.20it/s] 43it [00:04, 9.35it/s] 44it [00:04, 8.95it/s] 45it [00:04, 9.20it/s] 46it [00:05, 9.35it/s] 47it [00:05, 8.95it/s] 48it [00:05, 9.18it/s] 49it [00:05, 9.35it/s] 50it [00:05, 8.98it/s]2025-05-26 04:13:05,885 - INFO - [Epoch 061 | Batch 0050] IWAE-loss 4877.6030 | mean log_px -0.0282 | KL -3295.02 + 51it [00:05, 9.18it/s] 52it [00:05, 9.34it/s] 53it [00:05, 8.97it/s] 54it [00:05, 9.20it/s] 55it [00:06, 9.33it/s] 56it [00:06, 8.95it/s] 57it [00:06, 9.20it/s] 58it [00:06, 9.37it/s] 59it [00:06, 8.96it/s] 60it [00:06, 9.19it/s] 61it [00:06, 9.38it/s] 62it [00:06, 8.96it/s] 63it [00:06, 9.20it/s] 64it [00:07, 9.35it/s] 65it [00:07, 9.48it/s] 66it [00:07, 9.40it/s] 67it [00:07, 8.98it/s] 68it [00:07, 9.20it/s] 69it [00:07, 9.35it/s] 70it [00:07, 8.92it/s] 71it [00:07, 9.16it/s] 72it [00:07, 9.34it/s] 73it [00:08, 8.89it/s] 74it [00:08, 9.12it/s] 75it [00:08, 9.31it/s] 76it [00:08, 9.44it/s] 77it [00:08, 9.04it/s] 78it [00:08, 9.24it/s] 79it [00:08, 9.41it/s] 80it [00:08, 9.52it/s] 81it [00:08, 9.08it/s] 82it [00:09, 9.28it/s] 83it [00:09, 9.42it/s] 84it [00:09, 9.51it/s] 85it [00:09, 9.07it/s] 86it [00:09, 9.26it/s] 87it [00:09, 9.40it/s] 88it [00:09, 9.50it/s] 89it [00:09, 9.07it/s] 90it [00:09, 9.23it/s] 91it [00:09, 9.37it/s] 92it [00:10, 8.92it/s] 93it [00:10, 9.14it/s] 94it [00:10, 9.24it/s] 95it [00:10, 9.38it/s] 96it [00:10, 8.96it/s] 97it [00:10, 9.16it/s] 98it [00:10, 9.35it/s] 99it [00:10, 9.47it/s] 100it [00:10, 9.04it/s]2025-05-26 04:13:11,307 - INFO - [Epoch 061 | Batch 0100] IWAE-loss 4193.9419 | mean log_px -0.0158 | KL -3287.98 + 101it [00:11, 9.15it/s] 102it [00:11, 9.28it/s] 103it [00:11, 9.40it/s] 104it [00:11, 9.00it/s] 105it [00:11, 9.22it/s] 106it [00:11, 9.37it/s] 107it [00:11, 8.97it/s] 108it [00:11, 9.19it/s] 109it [00:11, 9.38it/s] 110it [00:12, 8.97it/s] 111it [00:12, 9.21it/s] 112it [00:12, 9.40it/s] 113it [00:12, 9.52it/s] 114it [00:12, 9.08it/s] 115it [00:12, 9.24it/s] 116it [00:12, 9.39it/s] 117it [00:12, 8.99it/s] 118it [00:12, 9.21it/s] 119it [00:13, 9.37it/s] 120it [00:13, 8.95it/s] 121it [00:13, 9.10it/s] 122it [00:13, 9.30it/s] 123it [00:13, 8.91it/s] 124it [00:13, 9.15it/s] 125it [00:13, 9.33it/s] 126it [00:13, 8.94it/s] 127it [00:13, 9.18it/s] 128it [00:14, 9.35it/s] 129it [00:14, 9.46it/s] 130it [00:14, 8.97it/s] 131it [00:14, 9.19it/s] 132it [00:14, 9.35it/s] 133it [00:14, 8.95it/s] 134it [00:14, 9.18it/s] 135it [00:14, 9.24it/s] 136it [00:14, 8.84it/s] 137it [00:14, 9.10it/s] 138it [00:15, 9.28it/s] 139it [00:15, 9.39it/s] 140it [00:15, 8.98it/s] 141it [00:15, 9.21it/s] 142it [00:15, 9.37it/s] 143it [00:15, 8.98it/s] 144it [00:15, 9.19it/s] 145it [00:15, 9.36it/s] 146it [00:15, 9.46it/s] 147it [00:16, 9.02it/s] 148it [00:16, 9.14it/s] 149it [00:16, 9.33it/s] 150it [00:16, 9.46it/s]2025-05-26 04:13:16,731 - INFO - [Epoch 061 | Batch 0150] IWAE-loss 4477.5815 | mean log_px -0.0203 | KL -3289.90 + 151it [00:16, 9.00it/s] 152it [00:16, 9.21it/s] 153it [00:16, 9.37it/s] 154it [00:16, 9.47it/s] 155it [00:16, 9.05it/s] 156it [00:17, 9.25it/s] 157it [00:17, 9.42it/s] 158it [00:17, 8.98it/s] 159it [00:17, 9.20it/s] 160it [00:17, 9.35it/s] 161it [00:17, 9.48it/s] 162it [00:17, 9.01it/s] 163it [00:17, 9.23it/s] 164it [00:17, 9.36it/s] 165it [00:18, 9.46it/s] 166it [00:18, 9.01it/s] 167it [00:18, 9.23it/s] 168it [00:18, 9.39it/s] 169it [00:18, 8.98it/s] 170it [00:18, 9.06it/s] 171it [00:18, 9.14it/s] 172it [00:18, 9.32it/s] 173it [00:18, 9.45it/s] 174it [00:18, 9.53it/s] 175it [00:19, 9.61it/s] 176it [00:19, 9.06it/s] 177it [00:19, 9.20it/s] 178it [00:19, 9.37it/s] 179it [00:19, 9.50it/s] 180it [00:19, 9.51it/s] 181it [00:19, 8.83it/s] 182it [00:19, 8.84it/s] 183it [00:19, 9.04it/s] 184it [00:20, 9.20it/s] 185it [00:20, 8.79it/s] 186it [00:20, 9.04it/s] 187it [00:20, 9.22it/s] 188it [00:20, 9.36it/s] 189it [00:20, 8.91it/s] 190it [00:20, 9.10it/s] 191it [00:20, 9.26it/s] 192it [00:20, 9.29it/s] 193it [00:21, 8.92it/s] 194it [00:21, 9.14it/s] 195it [00:21, 8.82it/s] 196it [00:21, 9.13it/s] +2025-05-26 04:13:21,739 - INFO - Epoch: 61, Objective: tensor([6526.4443], device='cuda:0', grad_fn=), Loss: 0.049620795994997025, KL/n: 67.15840148925781 + 0it [00:00, ?it/s]2025-05-26 04:13:22,193 - INFO - [Epoch 062 | Batch 0000] IWAE-loss 4576.0898 | mean log_px -0.0238 | KL -3289.67 + 1it [00:00, 2.55it/s] 2it [00:00, 4.52it/s] 3it [00:00, 6.02it/s] 4it [00:00, 6.70it/s] 5it [00:00, 7.56it/s] 6it [00:00, 8.23it/s] 7it [00:01, 8.71it/s] 8it [00:01, 9.05it/s] 9it [00:01, 9.30it/s] 10it [00:01, 9.49it/s] 11it [00:01, 9.63it/s] 12it [00:01, 9.69it/s] 13it [00:01, 9.77it/s] 14it [00:01, 9.81it/s] 15it [00:01, 9.84it/s] 16it [00:01, 9.84it/s] 17it [00:02, 9.87it/s] 18it [00:02, 9.88it/s] 19it [00:02, 9.90it/s] 20it [00:02, 9.89it/s] 21it [00:02, 9.32it/s] 22it [00:02, 9.48it/s] 23it [00:02, 9.63it/s] 24it [00:02, 9.11it/s] 25it [00:02, 9.33it/s] 26it [00:02, 9.49it/s] 27it [00:03, 9.61it/s] 28it [00:03, 9.07it/s] 29it [00:03, 9.19it/s] 30it [00:03, 8.96it/s] 31it [00:03, 9.23it/s] 32it [00:03, 9.38it/s] 33it [00:03, 9.52it/s] 34it [00:03, 9.61it/s] 35it [00:03, 9.69it/s] 36it [00:04, 9.75it/s] 37it [00:04, 9.79it/s] 38it [00:04, 9.80it/s] 39it [00:04, 9.84it/s] 40it [00:04, 9.85it/s] 41it [00:04, 9.80it/s] 42it [00:04, 9.81it/s] 43it [00:04, 9.84it/s] 44it [00:04, 9.85it/s] 45it [00:04, 9.87it/s] 46it [00:05, 9.88it/s] 47it [00:05, 9.90it/s] 48it [00:05, 9.89it/s] 49it [00:05, 9.91it/s] 50it [00:05, 9.91it/s]2025-05-26 04:13:27,392 - INFO - [Epoch 062 | Batch 0050] IWAE-loss 4915.9707 | mean log_px -0.0268 | KL -3286.16 + 51it [00:05, 9.17it/s] 52it [00:05, 9.37it/s] 53it [00:05, 9.53it/s] 54it [00:05, 9.06it/s] 55it [00:06, 9.31it/s] 56it [00:06, 9.46it/s] 57it [00:06, 9.60it/s] 58it [00:06, 9.21it/s] 59it [00:06, 9.37it/s] 60it [00:06, 9.51it/s] 61it [00:06, 9.18it/s] 62it [00:06, 9.37it/s] 63it [00:06, 9.53it/s] 64it [00:06, 9.03it/s] 65it [00:07, 9.29it/s] 66it [00:07, 9.47it/s] 67it [00:07, 9.60it/s] 68it [00:07, 9.68it/s] 69it [00:07, 9.12it/s] 70it [00:07, 9.30it/s] 71it [00:07, 9.45it/s] 72it [00:07, 9.42it/s] 73it [00:07, 9.11it/s] 74it [00:08, 9.32it/s] 75it [00:08, 9.49it/s] 76it [00:08, 9.60it/s] 77it [00:08, 9.69it/s] 78it [00:08, 9.56it/s] 79it [00:08, 9.66it/s] 80it [00:08, 9.73it/s] 81it [00:08, 9.80it/s] 82it [00:08, 9.80it/s] 83it [00:08, 9.51it/s] 84it [00:09, 9.24it/s] 85it [00:09, 9.43it/s] 86it [00:09, 9.37it/s] 87it [00:09, 8.92it/s] 88it [00:09, 9.09it/s] 89it [00:09, 9.17it/s] 90it [00:09, 9.27it/s] 91it [00:09, 9.35it/s] 92it [00:09, 9.30it/s] 93it [00:10, 8.81it/s] 94it [00:10, 8.91it/s] 95it [00:10, 9.00it/s] 96it [00:10, 9.09it/s] 97it [00:10, 8.65it/s] 98it [00:10, 8.96it/s] 99it [00:10, 9.18it/s] 100it [00:10, 9.33it/s]2025-05-26 04:13:32,765 - INFO - [Epoch 062 | Batch 0100] IWAE-loss 4170.7461 | mean log_px -0.0182 | KL -3282.61 + 101it [00:10, 8.91it/s] 102it [00:11, 9.17it/s] 103it [00:11, 9.34it/s] 104it [00:11, 9.48it/s] 105it [00:11, 9.01it/s] 106it [00:11, 9.19it/s] 107it [00:11, 9.36it/s] 108it [00:11, 9.49it/s] 109it [00:11, 9.02it/s] 110it [00:11, 9.23it/s] 111it [00:12, 9.40it/s] 112it [00:12, 9.51it/s] 113it [00:12, 9.04it/s] 114it [00:12, 9.26it/s] 115it [00:12, 8.88it/s] 116it [00:12, 9.13it/s] 117it [00:12, 9.35it/s] 118it [00:12, 9.48it/s] 119it [00:12, 9.01it/s] 120it [00:13, 9.23it/s] 121it [00:13, 9.39it/s] 122it [00:13, 9.50it/s] 123it [00:13, 9.03it/s] 124it [00:13, 9.25it/s] 125it [00:13, 9.41it/s] 126it [00:13, 9.52it/s] 127it [00:13, 9.08it/s] 128it [00:13, 9.27it/s] 129it [00:13, 9.43it/s] 130it [00:14, 9.52it/s] 131it [00:14, 9.05it/s] 132it [00:14, 9.27it/s] 133it [00:14, 9.44it/s] 134it [00:14, 9.54it/s] 135it [00:14, 9.06it/s] 136it [00:14, 9.28it/s] 137it [00:14, 9.42it/s] 138it [00:14, 9.54it/s] 139it [00:15, 9.03it/s] 140it [00:15, 9.25it/s] 141it [00:15, 9.41it/s] 142it [00:15, 9.52it/s] 143it [00:15, 9.08it/s] 144it [00:15, 9.28it/s] 145it [00:15, 9.44it/s] 146it [00:15, 9.55it/s] 147it [00:15, 9.07it/s] 148it [00:16, 9.25it/s] 149it [00:16, 9.43it/s] 150it [00:16, 9.54it/s]2025-05-26 04:13:38,145 - INFO - [Epoch 062 | Batch 0150] IWAE-loss 4884.0713 | mean log_px -0.0360 | KL -3281.47 + 151it [00:16, 9.07it/s] 152it [00:16, 9.27it/s] 153it [00:16, 9.40it/s] 154it [00:16, 9.51it/s] 155it [00:16, 9.03it/s] 156it [00:16, 9.24it/s] 157it [00:16, 9.41it/s] 158it [00:17, 9.53it/s] 159it [00:17, 9.05it/s] 160it [00:17, 9.27it/s] 161it [00:17, 9.43it/s] 162it [00:17, 9.54it/s] 163it [00:17, 9.03it/s] 164it [00:17, 9.22it/s] 165it [00:17, 9.38it/s] 166it [00:17, 9.50it/s] 167it [00:18, 9.03it/s] 168it [00:18, 9.20it/s] 169it [00:18, 9.37it/s] 170it [00:18, 9.46it/s] 171it [00:18, 9.01it/s] 172it [00:18, 9.24it/s] 173it [00:18, 9.39it/s] 174it [00:18, 9.49it/s] 175it [00:18, 9.04it/s] 176it [00:19, 9.23it/s] 177it [00:19, 9.40it/s] 178it [00:19, 9.49it/s] 179it [00:19, 9.03it/s] 180it [00:19, 9.24it/s] 181it [00:19, 9.39it/s] 182it [00:19, 9.50it/s] 183it [00:19, 9.01it/s] 184it [00:19, 9.16it/s] 185it [00:19, 9.27it/s] 186it [00:20, 9.40it/s] 187it [00:20, 8.94it/s] 188it [00:20, 9.18it/s] 189it [00:20, 9.35it/s] 190it [00:20, 9.47it/s] 191it [00:20, 8.99it/s] 192it [00:20, 9.20it/s] 193it [00:20, 9.38it/s] 194it [00:20, 9.50it/s] 195it [00:21, 8.57it/s] 196it [00:21, 9.21it/s] +2025-05-26 04:13:43,138 - INFO - Epoch: 62, Objective: tensor([5284.1826], device='cuda:0', grad_fn=), Loss: 0.03511318191885948, KL/n: 66.92284393310547 + 0it [00:00, ?it/s]2025-05-26 04:13:43,406 - INFO - [Epoch 063 | Batch 0000] IWAE-loss 4192.7603 | mean log_px -0.0176 | KL -3279.23 + 1it [00:00, 5.40it/s] 2it [00:00, 7.39it/s] 3it [00:00, 8.37it/s] 4it [00:00, 8.92it/s] 5it [00:00, 9.28it/s] 6it [00:00, 9.48it/s] 7it [00:00, 9.64it/s] 8it [00:00, 9.72it/s] 9it [00:00, 9.79it/s] 10it [00:01, 9.18it/s] 11it [00:01, 9.40it/s] 12it [00:01, 9.55it/s] 13it [00:01, 9.64it/s] 14it [00:01, 9.72it/s] 15it [00:01, 9.79it/s] 16it [00:01, 9.82it/s] 17it [00:01, 9.29it/s] 18it [00:01, 9.47it/s] 19it [00:02, 9.61it/s] 20it [00:02, 9.69it/s] 21it [00:02, 9.76it/s] 22it [00:02, 9.80it/s] 23it [00:02, 9.84it/s] 24it [00:02, 9.87it/s] 25it [00:02, 9.89it/s] 26it [00:02, 9.89it/s] 27it [00:02, 9.91it/s] 28it [00:02, 9.90it/s] 29it [00:03, 9.90it/s] 30it [00:03, 9.90it/s] 31it [00:03, 9.92it/s] 32it [00:03, 9.92it/s] 33it [00:03, 9.93it/s] 34it [00:03, 9.92it/s] 35it [00:03, 9.93it/s] 36it [00:03, 9.92it/s] 37it [00:03, 9.92it/s] 38it [00:03, 9.91it/s] 39it [00:04, 9.90it/s] 40it [00:04, 9.90it/s] 41it [00:04, 9.22it/s] 42it [00:04, 9.41it/s] 43it [00:04, 9.57it/s] 44it [00:04, 9.67it/s] 45it [00:04, 9.75it/s] 46it [00:04, 9.80it/s] 47it [00:04, 9.84it/s] 48it [00:04, 9.84it/s] 49it [00:05, 9.86it/s] 50it [00:05, 9.87it/s]2025-05-26 04:13:48,519 - INFO - [Epoch 063 | Batch 0050] IWAE-loss 4688.5366 | mean log_px -0.0212 | KL -3273.02 + 51it [00:05, 9.88it/s] 52it [00:05, 9.89it/s] 53it [00:05, 9.91it/s] 54it [00:05, 9.91it/s] 55it [00:05, 9.91it/s] 56it [00:05, 9.91it/s] 57it [00:05, 9.91it/s] 58it [00:06, 9.91it/s] 59it [00:06, 9.91it/s] 60it [00:06, 9.90it/s] 61it [00:06, 9.29it/s] 62it [00:06, 9.47it/s] 63it [00:06, 9.60it/s] 64it [00:06, 9.67it/s] 65it [00:06, 9.74it/s] 66it [00:06, 9.18it/s] 67it [00:06, 9.38it/s] 68it [00:07, 9.52it/s] 69it [00:07, 9.04it/s] 70it [00:07, 9.29it/s] 71it [00:07, 9.46it/s] 72it [00:07, 9.59it/s] 73it [00:07, 9.09it/s] 74it [00:07, 9.30it/s] 75it [00:07, 9.47it/s] 76it [00:07, 9.59it/s] 77it [00:08, 9.49it/s] 78it [00:08, 8.83it/s] 79it [00:08, 8.93it/s] 80it [00:08, 9.05it/s] 81it [00:08, 9.13it/s] 82it [00:08, 9.19it/s] 83it [00:08, 9.25it/s] 84it [00:08, 9.28it/s] 85it [00:08, 9.32it/s] 86it [00:09, 9.30it/s] 87it [00:09, 9.30it/s] 88it [00:09, 9.29it/s] 89it [00:09, 9.28it/s] 90it [00:09, 9.45it/s] 91it [00:09, 9.58it/s] 92it [00:09, 9.09it/s] 93it [00:09, 9.32it/s] 94it [00:09, 9.47it/s] 95it [00:09, 9.49it/s] 96it [00:10, 9.50it/s] 97it [00:10, 9.63it/s] 98it [00:10, 9.71it/s] 99it [00:10, 9.18it/s] 100it [00:10, 9.38it/s]2025-05-26 04:13:53,821 - INFO - [Epoch 063 | Batch 0100] IWAE-loss 4749.5503 | mean log_px -0.0224 | KL -3273.87 + 101it [00:10, 9.52it/s] 102it [00:10, 9.64it/s] 103it [00:10, 9.72it/s] 104it [00:10, 9.76it/s] 105it [00:11, 9.32it/s] 106it [00:11, 9.48it/s] 107it [00:11, 9.60it/s] 108it [00:11, 9.65it/s] 109it [00:11, 9.63it/s] 110it [00:11, 9.21it/s] 111it [00:11, 9.38it/s] 112it [00:11, 9.45it/s] 113it [00:11, 9.52it/s] 114it [00:11, 9.10it/s] 115it [00:12, 9.33it/s] 116it [00:12, 9.48it/s] 117it [00:12, 9.02it/s] 118it [00:12, 9.20it/s] 119it [00:12, 9.40it/s] 120it [00:12, 9.54it/s] 121it [00:12, 9.63it/s] 122it [00:12, 9.66it/s] 123it [00:12, 9.71it/s] 124it [00:13, 9.74it/s] 125it [00:13, 9.78it/s] 126it [00:13, 9.76it/s] 127it [00:13, 9.81it/s] 128it [00:13, 9.83it/s] 129it [00:13, 9.76it/s] 130it [00:13, 9.78it/s] 131it [00:13, 9.76it/s] 132it [00:13, 9.79it/s] 133it [00:13, 9.77it/s] 134it [00:14, 9.81it/s] 135it [00:14, 9.28it/s] 136it [00:14, 9.45it/s] 137it [00:14, 9.59it/s] 138it [00:14, 9.17it/s] 139it [00:14, 9.39it/s] 140it [00:14, 9.46it/s] 141it [00:14, 8.99it/s] 142it [00:14, 9.23it/s] 143it [00:15, 9.43it/s] 144it [00:15, 9.55it/s] 145it [00:15, 9.65it/s] 146it [00:15, 9.69it/s] 147it [00:15, 9.74it/s] 148it [00:15, 9.73it/s] 149it [00:15, 9.34it/s] 150it [00:15, 9.49it/s]2025-05-26 04:13:59,065 - INFO - [Epoch 063 | Batch 0150] IWAE-loss 3977.1768 | mean log_px -0.0134 | KL -3273.26 + 151it [00:15, 9.60it/s] 152it [00:15, 9.69it/s] 153it [00:16, 9.76it/s] 154it [00:16, 9.79it/s] 155it [00:16, 9.83it/s] 156it [00:16, 9.83it/s] 157it [00:16, 9.85it/s] 158it [00:16, 9.86it/s] 159it [00:16, 9.88it/s] 160it [00:16, 9.88it/s] 161it [00:16, 9.89it/s] 162it [00:16, 9.26it/s] 163it [00:17, 9.44it/s] 164it [00:17, 8.99it/s] 165it [00:17, 9.26it/s] 166it [00:17, 9.43it/s] 167it [00:17, 9.54it/s] 168it [00:17, 9.64it/s] 169it [00:17, 9.14it/s] 170it [00:17, 9.35it/s] 171it [00:17, 9.49it/s] 172it [00:18, 9.58it/s] 173it [00:18, 9.66it/s] 174it [00:18, 9.72it/s] 175it [00:18, 9.78it/s] 176it [00:18, 9.81it/s] 177it [00:18, 9.84it/s] 178it [00:18, 9.84it/s] 179it [00:18, 9.88it/s] 180it [00:18, 9.88it/s] 181it [00:18, 9.90it/s] 182it [00:19, 9.89it/s] 183it [00:19, 9.89it/s] 184it [00:19, 9.89it/s] 185it [00:19, 9.89it/s] 186it [00:19, 9.90it/s] 187it [00:19, 9.91it/s] 188it [00:19, 9.90it/s] 189it [00:19, 9.91it/s] 190it [00:19, 9.91it/s] 191it [00:19, 9.92it/s] 192it [00:20, 9.91it/s] 193it [00:20, 9.91it/s] 194it [00:20, 9.91it/s] 195it [00:20, 8.76it/s] 196it [00:20, 9.53it/s] +2025-05-26 04:14:03,821 - INFO - Epoch: 63, Objective: tensor([5113.3408], device='cuda:0', grad_fn=), Loss: 0.03467189148068428, KL/n: 66.71068572998047 + 0it [00:00, ?it/s]2025-05-26 04:14:04,088 - INFO - [Epoch 064 | Batch 0000] IWAE-loss 4048.0391 | mean log_px -0.0111 | KL -3268.86 + 1it [00:00, 5.53it/s] 2it [00:00, 7.38it/s] 3it [00:00, 7.79it/s] 4it [00:00, 8.51it/s] 5it [00:00, 8.88it/s] 6it [00:00, 8.54it/s] 7it [00:00, 8.74it/s] 8it [00:00, 9.00it/s] 9it [00:01, 9.13it/s] 10it [00:01, 5.71it/s] 11it [00:01, 6.51it/s] 12it [00:01, 7.18it/s] 13it [00:01, 7.80it/s] 14it [00:01, 8.23it/s] 15it [00:01, 8.58it/s] 16it [00:02, 8.80it/s] 17it [00:02, 9.01it/s] 18it [00:02, 9.16it/s] 19it [00:02, 9.32it/s] 20it [00:02, 9.35it/s] 21it [00:02, 9.41it/s] 22it [00:02, 9.39it/s] 23it [00:02, 9.41it/s] 24it [00:02, 9.41it/s] 25it [00:02, 9.40it/s] 26it [00:03, 9.43it/s] 27it [00:03, 9.40it/s] 28it [00:03, 9.42it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.50it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.58it/s] 33it [00:03, 9.62it/s] 34it [00:03, 9.60it/s] 35it [00:04, 9.62it/s] 36it [00:04, 9.60it/s] 37it [00:04, 9.61it/s] 38it [00:04, 9.15it/s] 39it [00:04, 9.31it/s] 40it [00:04, 9.44it/s] 41it [00:04, 9.46it/s] 42it [00:04, 9.46it/s] 43it [00:04, 9.50it/s] 44it [00:04, 9.51it/s] 45it [00:05, 9.48it/s] 46it [00:05, 9.54it/s] 47it [00:05, 9.62it/s] 48it [00:05, 9.66it/s] 49it [00:05, 9.68it/s] 50it [00:05, 9.63it/s]2025-05-26 04:14:09,591 - INFO - [Epoch 064 | Batch 0050] IWAE-loss 4078.9944 | mean log_px -0.0116 | KL -3263.32 + 51it [00:05, 9.64it/s] 52it [00:05, 9.67it/s] 53it [00:05, 9.62it/s] 54it [00:05, 9.63it/s] 55it [00:06, 9.63it/s] 56it [00:06, 9.61it/s] 57it [00:06, 9.62it/s] 58it [00:06, 9.67it/s] 59it [00:06, 9.21it/s] 60it [00:06, 9.24it/s] 61it [00:06, 9.33it/s] 62it [00:06, 9.30it/s] 63it [00:06, 9.35it/s] 64it [00:07, 9.36it/s] 65it [00:07, 9.41it/s] 66it [00:07, 9.23it/s] 67it [00:07, 9.27it/s] 68it [00:07, 9.31it/s] 69it [00:07, 9.39it/s] 70it [00:07, 8.88it/s] 71it [00:07, 9.09it/s] 72it [00:07, 9.17it/s] 73it [00:08, 9.23it/s] 74it [00:08, 8.79it/s] 75it [00:08, 9.02it/s] 76it [00:08, 9.19it/s] 77it [00:08, 9.34it/s] 78it [00:08, 8.88it/s] 79it [00:08, 9.08it/s] 80it [00:08, 9.17it/s] 81it [00:08, 9.32it/s] 82it [00:09, 9.44it/s] 83it [00:09, 9.53it/s] 84it [00:09, 9.59it/s] 85it [00:09, 9.56it/s] 86it [00:09, 9.53it/s] 87it [00:09, 9.55it/s] 88it [00:09, 9.41it/s] 89it [00:09, 8.74it/s] 90it [00:09, 8.76it/s] 91it [00:10, 8.99it/s] 92it [00:10, 9.14it/s] 93it [00:10, 9.30it/s] 94it [00:10, 9.37it/s] 95it [00:10, 8.88it/s] 96it [00:10, 9.02it/s] 97it [00:10, 9.15it/s] 98it [00:10, 9.25it/s] 99it [00:10, 8.78it/s] 100it [00:10, 8.99it/s]2025-05-26 04:14:15,005 - INFO - [Epoch 064 | Batch 0100] IWAE-loss 4177.9673 | mean log_px -0.0192 | KL -3262.71 + 101it [00:11, 9.17it/s] 102it [00:11, 9.30it/s] 103it [00:11, 8.95it/s] 104it [00:11, 9.15it/s] 105it [00:11, 9.29it/s] 106it [00:11, 9.37it/s] 107it [00:11, 8.93it/s] 108it [00:11, 9.07it/s] 109it [00:11, 9.23it/s] 110it [00:12, 9.29it/s] 111it [00:12, 8.77it/s] 112it [00:12, 8.96it/s] 113it [00:12, 9.19it/s] 114it [00:12, 9.30it/s] 115it [00:12, 8.86it/s] 116it [00:12, 9.05it/s] 117it [00:12, 9.24it/s] 118it [00:12, 9.31it/s] 119it [00:13, 8.89it/s] 120it [00:13, 9.11it/s] 121it [00:13, 9.18it/s] 122it [00:13, 9.12it/s] 123it [00:13, 8.73it/s] 124it [00:13, 8.98it/s] 125it [00:13, 9.13it/s] 126it [00:13, 9.24it/s] 127it [00:13, 8.85it/s] 128it [00:14, 9.05it/s] 129it [00:14, 9.17it/s] 130it [00:14, 9.28it/s] 131it [00:14, 8.83it/s] 132it [00:14, 9.02it/s] 133it [00:14, 9.18it/s] 134it [00:14, 9.27it/s] 135it [00:14, 8.79it/s] 136it [00:14, 8.92it/s] 137it [00:15, 8.99it/s] 138it [00:15, 9.09it/s] 139it [00:15, 8.75it/s] 140it [00:15, 8.93it/s] 141it [00:15, 9.03it/s] 142it [00:15, 9.01it/s] 143it [00:15, 8.62it/s] 144it [00:15, 8.83it/s] 145it [00:15, 9.02it/s] 146it [00:16, 9.12it/s] 147it [00:16, 8.69it/s] 148it [00:16, 8.84it/s] 149it [00:16, 8.60it/s] 150it [00:16, 8.82it/s]2025-05-26 04:14:20,553 - INFO - [Epoch 064 | Batch 0150] IWAE-loss 4131.0303 | mean log_px -0.0125 | KL -3256.42 + 151it [00:16, 8.96it/s] 152it [00:16, 9.13it/s] 153it [00:16, 9.22it/s] 154it [00:16, 9.31it/s] 155it [00:17, 9.33it/s] 156it [00:17, 9.40it/s] 157it [00:17, 9.45it/s] 158it [00:17, 9.47it/s] 159it [00:17, 9.50it/s] 160it [00:17, 9.56it/s] 161it [00:17, 9.60it/s] 162it [00:17, 9.54it/s] 163it [00:17, 9.51it/s] 164it [00:18, 9.52it/s] 165it [00:18, 9.50it/s] 166it [00:18, 9.50it/s] 167it [00:18, 9.55it/s] 168it [00:18, 9.01it/s] 169it [00:18, 9.18it/s] 170it [00:18, 9.13it/s] 171it [00:18, 9.05it/s] 172it [00:18, 8.61it/s] 173it [00:19, 8.84it/s] 174it [00:19, 9.02it/s] 175it [00:19, 9.17it/s] 176it [00:19, 8.76it/s] 177it [00:19, 8.95it/s] 178it [00:19, 9.12it/s] 179it [00:19, 9.23it/s] 180it [00:19, 8.81it/s] 181it [00:19, 9.03it/s] 182it [00:20, 9.16it/s] 183it [00:20, 9.23it/s] 184it [00:20, 8.83it/s] 185it [00:20, 8.98it/s] 186it [00:20, 9.07it/s] 187it [00:20, 9.21it/s] 188it [00:20, 8.81it/s] 189it [00:20, 9.00it/s] 190it [00:20, 9.13it/s] 191it [00:20, 9.24it/s] 192it [00:21, 8.81it/s] 193it [00:21, 9.03it/s] 194it [00:21, 9.13it/s] 195it [00:21, 8.67it/s] 196it [00:21, 8.93it/s] 196it [00:21, 9.07it/s] +2025-05-26 04:14:25,562 - INFO - Epoch: 64, Objective: tensor([4486.4854], device='cuda:0', grad_fn=), Loss: 0.017137622460722923, KL/n: 66.45817565917969 + 0it [00:00, ?it/s]2025-05-26 04:14:25,842 - INFO - [Epoch 065 | Batch 0000] IWAE-loss 4915.1265 | mean log_px -0.0304 | KL -3253.02 + 1it [00:00, 4.64it/s] 2it [00:00, 6.63it/s] 3it [00:00, 7.69it/s] 4it [00:00, 8.28it/s] 5it [00:00, 8.17it/s] 6it [00:00, 8.50it/s] 7it [00:00, 8.80it/s] 8it [00:00, 8.99it/s] 9it [00:01, 9.12it/s] 10it [00:01, 9.20it/s] 11it [00:01, 9.30it/s] 12it [00:01, 9.33it/s] 13it [00:01, 9.35it/s] 14it [00:01, 9.38it/s] 15it [00:01, 9.29it/s] 16it [00:01, 8.80it/s] 17it [00:01, 8.98it/s] 18it [00:02, 9.15it/s] 19it [00:02, 9.30it/s] 20it [00:02, 9.39it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.44it/s] 23it [00:02, 9.48it/s] 24it [00:02, 9.55it/s] 25it [00:02, 9.49it/s] 26it [00:02, 9.51it/s] 27it [00:03, 9.51it/s] 28it [00:03, 9.46it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.49it/s] 31it [00:03, 9.47it/s] 32it [00:03, 9.48it/s] 33it [00:03, 9.49it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.47it/s] 36it [00:03, 9.49it/s] 37it [00:04, 9.55it/s] 38it [00:04, 9.59it/s] 39it [00:04, 9.55it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.49it/s] 42it [00:04, 9.51it/s] 43it [00:04, 9.50it/s] 44it [00:04, 9.53it/s] 45it [00:04, 9.40it/s] 46it [00:05, 9.33it/s] 47it [00:05, 8.84it/s] 48it [00:05, 8.97it/s] 49it [00:05, 9.13it/s] 50it [00:05, 9.22it/s]2025-05-26 04:14:31,216 - INFO - [Epoch 065 | Batch 0050] IWAE-loss 4041.6321 | mean log_px -0.0125 | KL -3247.29 + 51it [00:05, 9.28it/s] 52it [00:05, 9.32it/s] 53it [00:05, 9.40it/s] 54it [00:05, 9.47it/s] 55it [00:05, 9.46it/s] 56it [00:06, 9.52it/s] 57it [00:06, 9.50it/s] 58it [00:06, 9.52it/s] 59it [00:06, 9.47it/s] 60it [00:06, 9.48it/s] 61it [00:06, 9.52it/s] 62it [00:06, 9.55it/s] 63it [00:06, 9.53it/s] 64it [00:06, 9.52it/s] 65it [00:07, 9.57it/s] 66it [00:07, 9.50it/s] 67it [00:07, 9.49it/s] 68it [00:07, 9.48it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.43it/s] 71it [00:07, 9.52it/s] 72it [00:07, 9.46it/s] 73it [00:07, 9.50it/s] 74it [00:07, 9.51it/s] 75it [00:08, 9.55it/s] 76it [00:08, 9.58it/s] 77it [00:08, 9.55it/s] 78it [00:08, 9.52it/s] 79it [00:08, 9.51it/s] 80it [00:08, 9.51it/s] 81it [00:08, 9.52it/s] 82it [00:08, 9.53it/s] 83it [00:08, 9.51it/s] 84it [00:09, 8.96it/s] 85it [00:09, 9.12it/s] 86it [00:09, 9.24it/s] 87it [00:09, 9.28it/s] 88it [00:09, 9.39it/s] 89it [00:09, 9.45it/s] 90it [00:09, 9.46it/s] 91it [00:09, 9.49it/s] 92it [00:09, 9.49it/s] 93it [00:09, 9.52it/s] 94it [00:10, 9.54it/s] 95it [00:10, 9.58it/s] 96it [00:10, 9.57it/s] 97it [00:10, 9.60it/s] 98it [00:10, 9.58it/s] 99it [00:10, 9.03it/s] 100it [00:10, 9.18it/s]2025-05-26 04:14:36,506 - INFO - [Epoch 065 | Batch 0100] IWAE-loss 4149.1934 | mean log_px -0.0150 | KL -3245.47 + 101it [00:10, 9.27it/s] 102it [00:10, 9.36it/s] 103it [00:11, 9.41it/s] 104it [00:11, 9.49it/s] 105it [00:11, 9.50it/s] 106it [00:11, 9.08it/s] 107it [00:11, 9.20it/s] 108it [00:11, 9.27it/s] 109it [00:11, 9.33it/s] 110it [00:11, 9.33it/s] 111it [00:11, 9.43it/s] 112it [00:12, 9.45it/s] 113it [00:12, 9.49it/s] 114it [00:12, 9.49it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.54it/s] 117it [00:12, 9.54it/s] 118it [00:12, 9.53it/s] 119it [00:12, 9.59it/s] 120it [00:12, 9.56it/s] 121it [00:12, 9.54it/s] 122it [00:13, 9.54it/s] 123it [00:13, 9.39it/s] 124it [00:13, 8.82it/s] 125it [00:13, 9.05it/s] 126it [00:13, 9.18it/s] 127it [00:13, 9.28it/s] 128it [00:13, 9.42it/s] 129it [00:13, 9.50it/s] 130it [00:13, 9.56it/s] 131it [00:14, 9.62it/s] 132it [00:14, 9.57it/s] 133it [00:14, 9.57it/s] 134it [00:14, 9.58it/s] 135it [00:14, 9.55it/s] 136it [00:14, 9.52it/s] 137it [00:14, 9.27it/s] 138it [00:14, 9.35it/s] 139it [00:14, 8.89it/s] 140it [00:15, 9.07it/s] 141it [00:15, 9.17it/s] 142it [00:15, 9.25it/s] 143it [00:15, 9.31it/s] 144it [00:15, 9.36it/s] 145it [00:15, 9.45it/s] 146it [00:15, 9.51it/s] 147it [00:15, 9.50it/s] 148it [00:15, 9.42it/s] 149it [00:15, 9.04it/s] 150it [00:16, 9.19it/s]2025-05-26 04:14:41,841 - INFO - [Epoch 065 | Batch 0150] IWAE-loss 5137.2002 | mean log_px -0.0301 | KL -3244.56 + 151it [00:16, 9.29it/s] 152it [00:16, 9.26it/s] 153it [00:16, 9.34it/s] 154it [00:16, 9.43it/s] 155it [00:16, 9.44it/s] 156it [00:16, 9.48it/s] 157it [00:16, 9.52it/s] 158it [00:16, 9.09it/s] 159it [00:17, 9.17it/s] 160it [00:17, 9.31it/s] 161it [00:17, 9.42it/s] 162it [00:17, 9.41it/s] 163it [00:17, 9.45it/s] 164it [00:17, 9.47it/s] 165it [00:17, 9.46it/s] 166it [00:17, 9.44it/s] 167it [00:17, 9.49it/s] 168it [00:18, 8.96it/s] 169it [00:18, 9.12it/s] 170it [00:18, 9.24it/s] 171it [00:18, 9.35it/s] 172it [00:18, 9.43it/s] 173it [00:18, 9.54it/s] 174it [00:18, 9.57it/s] 175it [00:18, 9.56it/s] 176it [00:18, 9.33it/s] 177it [00:18, 9.44it/s] 178it [00:19, 8.96it/s] 179it [00:19, 9.14it/s] 180it [00:19, 9.21it/s] 181it [00:19, 9.30it/s] 182it [00:19, 8.86it/s] 183it [00:19, 9.08it/s] 184it [00:19, 9.20it/s] 185it [00:19, 9.26it/s] 186it [00:19, 8.84it/s] 187it [00:20, 9.03it/s] 188it [00:20, 9.21it/s] 189it [00:20, 9.38it/s] 190it [00:20, 8.92it/s] 191it [00:20, 9.10it/s] 192it [00:20, 9.25it/s] 193it [00:20, 9.35it/s] 194it [00:20, 8.88it/s] 195it [00:20, 8.54it/s] 196it [00:21, 8.88it/s] 196it [00:21, 9.28it/s] +2025-05-26 04:14:46,823 - INFO - Epoch: 65, Objective: tensor([4243.4243], device='cuda:0', grad_fn=), Loss: 0.016095492988824844, KL/n: 66.21897888183594 + 0it [00:00, ?it/s]2025-05-26 04:14:47,284 - INFO - [Epoch 066 | Batch 0000] IWAE-loss 4330.0098 | mean log_px -0.0173 | KL -3242.21 + 1it [00:00, 2.51it/s] 2it [00:00, 4.42it/s] 3it [00:00, 5.86it/s] 4it [00:00, 6.92it/s] 5it [00:00, 7.66it/s] 6it [00:00, 8.14it/s] 7it [00:01, 8.12it/s] 8it [00:01, 8.49it/s] 9it [00:01, 8.81it/s] 10it [00:01, 9.00it/s] 11it [00:01, 8.64it/s] 12it [00:01, 8.77it/s] 13it [00:01, 9.01it/s] 14it [00:01, 9.11it/s] 15it [00:01, 8.74it/s] 16it [00:02, 8.94it/s] 17it [00:02, 9.11it/s] 18it [00:02, 9.16it/s] 19it [00:02, 8.77it/s] 20it [00:02, 8.94it/s] 21it [00:02, 9.13it/s] 22it [00:02, 9.21it/s] 23it [00:02, 8.82it/s] 24it [00:02, 9.01it/s] 25it [00:03, 9.22it/s] 26it [00:03, 9.33it/s] 27it [00:03, 9.31it/s] 28it [00:03, 8.87it/s] 29it [00:03, 9.05it/s] 30it [00:03, 9.19it/s] 31it [00:03, 9.30it/s] 32it [00:03, 8.86it/s] 33it [00:03, 9.06it/s] 34it [00:04, 9.17it/s] 35it [00:04, 9.27it/s] 36it [00:04, 8.81it/s] 37it [00:04, 9.01it/s] 38it [00:04, 9.15it/s] 39it [00:04, 9.24it/s] 40it [00:04, 8.85it/s] 41it [00:04, 9.06it/s] 42it [00:04, 9.13it/s] 43it [00:05, 9.26it/s] 44it [00:05, 8.75it/s] 45it [00:05, 8.92it/s] 46it [00:05, 9.07it/s] 47it [00:05, 9.19it/s] 48it [00:05, 8.81it/s] 49it [00:05, 9.00it/s] 50it [00:05, 9.10it/s]2025-05-26 04:14:52,810 - INFO - [Epoch 066 | Batch 0050] IWAE-loss 5074.5923 | mean log_px -0.0331 | KL -3240.32 + 51it [00:05, 9.18it/s] 52it [00:06, 8.81it/s] 53it [00:06, 8.96it/s] 54it [00:06, 9.10it/s] 55it [00:06, 9.22it/s] 56it [00:06, 8.83it/s] 57it [00:06, 9.03it/s] 58it [00:06, 9.18it/s] 59it [00:06, 9.31it/s] 60it [00:06, 8.88it/s] 61it [00:07, 8.82it/s] 62it [00:07, 8.80it/s] 63it [00:07, 8.85it/s] 64it [00:07, 8.53it/s] 65it [00:07, 8.82it/s] 66it [00:07, 9.04it/s] 67it [00:07, 9.22it/s] 68it [00:07, 8.83it/s] 69it [00:07, 9.07it/s] 70it [00:08, 9.21it/s] 71it [00:08, 9.31it/s] 72it [00:08, 8.84it/s] 73it [00:08, 9.07it/s] 74it [00:08, 9.22it/s] 75it [00:08, 9.27it/s] 76it [00:08, 9.22it/s] 77it [00:08, 8.82it/s] 78it [00:08, 9.00it/s] 79it [00:09, 9.16it/s] 80it [00:09, 9.28it/s] 81it [00:09, 8.85it/s] 82it [00:09, 9.04it/s] 83it [00:09, 9.16it/s] 84it [00:09, 9.29it/s] 85it [00:09, 8.86it/s] 86it [00:09, 9.00it/s] 87it [00:09, 9.15it/s] 88it [00:09, 9.23it/s] 89it [00:10, 8.83it/s] 90it [00:10, 9.03it/s] 91it [00:10, 9.16it/s] 92it [00:10, 9.26it/s] 93it [00:10, 8.83it/s] 94it [00:10, 9.01it/s] 95it [00:10, 9.14it/s] 96it [00:10, 9.27it/s] 97it [00:11, 8.87it/s] 98it [00:11, 9.04it/s] 99it [00:11, 9.20it/s] 100it [00:11, 9.32it/s]2025-05-26 04:14:58,332 - INFO - [Epoch 066 | Batch 0100] IWAE-loss 4414.3447 | mean log_px -0.0179 | KL -3239.95 + 101it [00:11, 8.91it/s] 102it [00:11, 9.11it/s] 103it [00:11, 9.25it/s] 104it [00:11, 9.34it/s] 105it [00:11, 8.89it/s] 106it [00:11, 9.08it/s] 107it [00:12, 9.26it/s] 108it [00:12, 9.37it/s] 109it [00:12, 8.91it/s] 110it [00:12, 9.08it/s] 111it [00:12, 9.20it/s] 112it [00:12, 9.30it/s] 113it [00:12, 8.86it/s] 114it [00:12, 9.06it/s] 115it [00:12, 9.22it/s] 116it [00:13, 9.30it/s] 117it [00:13, 8.89it/s] 118it [00:13, 9.07it/s] 119it [00:13, 9.11it/s] 120it [00:13, 8.68it/s] 121it [00:13, 8.91it/s] 122it [00:13, 9.09it/s] 123it [00:13, 9.22it/s] 124it [00:13, 8.78it/s] 125it [00:14, 8.99it/s] 126it [00:14, 9.18it/s] 127it [00:14, 9.19it/s] 128it [00:14, 8.77it/s] 129it [00:14, 8.99it/s] 130it [00:14, 8.97it/s] 131it [00:14, 8.96it/s] 132it [00:14, 8.49it/s] 133it [00:14, 8.75it/s] 134it [00:15, 8.95it/s] 135it [00:15, 9.06it/s] 136it [00:15, 8.69it/s] 137it [00:15, 8.92it/s] 138it [00:15, 9.07it/s] 139it [00:15, 9.02it/s] 140it [00:15, 8.96it/s] 141it [00:15, 8.63it/s] 142it [00:15, 8.81it/s] 143it [00:16, 9.02it/s] 144it [00:16, 9.17it/s] 145it [00:16, 8.91it/s] 146it [00:16, 9.10it/s] 147it [00:16, 9.22it/s] 148it [00:16, 8.83it/s] 149it [00:16, 8.98it/s] 150it [00:16, 9.01it/s]2025-05-26 04:15:03,892 - INFO - [Epoch 066 | Batch 0150] IWAE-loss 4754.2173 | mean log_px -0.0265 | KL -3233.78 + 151it [00:16, 9.21it/s] 152it [00:17, 8.87it/s] 153it [00:17, 9.12it/s] 154it [00:17, 9.30it/s] 155it [00:17, 9.43it/s] 156it [00:17, 9.02it/s] 157it [00:17, 9.23it/s] 158it [00:17, 9.40it/s] 159it [00:17, 9.51it/s] 160it [00:17, 9.05it/s] 161it [00:18, 9.26it/s] 162it [00:18, 9.40it/s] 163it [00:18, 9.44it/s] 164it [00:18, 9.02it/s] 165it [00:18, 9.22it/s] 166it [00:18, 9.36it/s] 167it [00:18, 9.49it/s] 168it [00:18, 9.03it/s] 169it [00:18, 9.24it/s] 170it [00:19, 9.38it/s] 171it [00:19, 9.49it/s] 172it [00:19, 9.03it/s] 173it [00:19, 9.24it/s] 174it [00:19, 9.39it/s] 175it [00:19, 9.52it/s] 176it [00:19, 9.06it/s] 177it [00:19, 9.26it/s] 178it [00:19, 9.40it/s] 179it [00:19, 9.52it/s] 180it [00:20, 9.05it/s] 181it [00:20, 9.25it/s] 182it [00:20, 9.38it/s] 183it [00:20, 9.48it/s] 184it [00:20, 9.02it/s] 185it [00:20, 9.23it/s] 186it [00:20, 9.36it/s] 187it [00:20, 9.40it/s] 188it [00:20, 8.96it/s] 189it [00:21, 9.15it/s] 190it [00:21, 9.33it/s] 191it [00:21, 8.95it/s] 192it [00:21, 9.17it/s] 193it [00:21, 9.34it/s] 194it [00:21, 8.94it/s] 195it [00:21, 8.62it/s] 196it [00:21, 8.99it/s] 196it [00:21, 8.94it/s] +2025-05-26 04:15:08,886 - INFO - Epoch: 66, Objective: tensor([4165.6123], device='cuda:0', grad_fn=), Loss: 0.015236176550388336, KL/n: 65.961181640625 + 0it [00:00, ?it/s]2025-05-26 04:15:09,138 - INFO - [Epoch 067 | Batch 0000] IWAE-loss 4508.1504 | mean log_px -0.0203 | KL -3233.36 + 1it [00:00, 5.39it/s] 2it [00:00, 7.29it/s] 3it [00:00, 8.27it/s] 4it [00:00, 8.21it/s] 5it [00:00, 8.68it/s] 6it [00:00, 8.83it/s] 7it [00:00, 9.13it/s] 8it [00:00, 8.86it/s] 9it [00:01, 9.02it/s] 10it [00:01, 9.09it/s] 11it [00:01, 8.74it/s] 12it [00:01, 9.03it/s] 13it [00:01, 9.23it/s] 14it [00:01, 9.38it/s] 15it [00:01, 8.93it/s] 16it [00:01, 9.16it/s] 17it [00:01, 9.38it/s] 18it [00:02, 9.51it/s] 19it [00:02, 9.05it/s] 20it [00:02, 9.27it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.57it/s] 23it [00:02, 9.19it/s] 24it [00:02, 9.39it/s] 25it [00:02, 9.55it/s] 26it [00:02, 9.64it/s] 27it [00:02, 9.72it/s] 28it [00:03, 9.77it/s] 29it [00:03, 9.32it/s] 30it [00:03, 9.48it/s] 31it [00:03, 9.61it/s] 32it [00:03, 9.68it/s] 33it [00:03, 9.73it/s] 34it [00:03, 9.28it/s] 35it [00:03, 9.44it/s] 36it [00:03, 9.57it/s] 37it [00:04, 9.68it/s] 38it [00:04, 9.61it/s] 39it [00:04, 9.70it/s] 40it [00:04, 9.75it/s] 41it [00:04, 9.79it/s] 42it [00:04, 9.82it/s] 43it [00:04, 9.35it/s] 44it [00:04, 9.50it/s] 45it [00:04, 9.62it/s] 46it [00:04, 9.70it/s] 47it [00:05, 9.77it/s] 48it [00:05, 9.80it/s] 49it [00:05, 9.34it/s] 50it [00:05, 9.49it/s]2025-05-26 04:15:14,459 - INFO - [Epoch 067 | Batch 0050] IWAE-loss 4197.2188 | mean log_px -0.0214 | KL -3226.38 + 51it [00:05, 9.59it/s] 52it [00:05, 9.68it/s] 53it [00:05, 9.14it/s] 54it [00:05, 9.33it/s] 55it [00:05, 9.50it/s] 56it [00:06, 9.60it/s] 57it [00:06, 9.58it/s] 58it [00:06, 9.68it/s] 59it [00:06, 9.76it/s] 60it [00:06, 9.78it/s] 61it [00:06, 9.81it/s] 62it [00:06, 9.18it/s] 63it [00:06, 9.39it/s] 64it [00:06, 9.55it/s] 65it [00:06, 9.66it/s] 66it [00:07, 9.72it/s] 67it [00:07, 9.16it/s] 68it [00:07, 9.37it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.62it/s] 71it [00:07, 9.71it/s] 72it [00:07, 9.28it/s] 73it [00:07, 9.44it/s] 74it [00:07, 9.57it/s] 75it [00:07, 9.66it/s] 76it [00:08, 9.72it/s] 77it [00:08, 9.21it/s] 78it [00:08, 9.40it/s] 79it [00:08, 9.54it/s] 80it [00:08, 9.64it/s] 81it [00:08, 9.72it/s] 82it [00:08, 9.77it/s] 83it [00:08, 9.81it/s] 84it [00:08, 9.84it/s] 85it [00:09, 9.87it/s] 86it [00:09, 9.88it/s] 87it [00:09, 9.90it/s] 88it [00:09, 9.88it/s] 89it [00:09, 9.90it/s] 90it [00:09, 9.90it/s] 91it [00:09, 9.91it/s] 92it [00:09, 9.90it/s] 93it [00:09, 9.92it/s] 94it [00:09, 9.42it/s] 95it [00:10, 9.56it/s] 96it [00:10, 9.66it/s] 97it [00:10, 9.25it/s] 98it [00:10, 9.44it/s] 99it [00:10, 9.59it/s] 100it [00:10, 9.68it/s]2025-05-26 04:15:19,658 - INFO - [Epoch 067 | Batch 0100] IWAE-loss 4479.0835 | mean log_px -0.0211 | KL -3224.74 + 101it [00:10, 9.75it/s] 102it [00:10, 9.80it/s] 103it [00:10, 9.83it/s] 104it [00:10, 9.35it/s] 105it [00:11, 9.52it/s] 106it [00:11, 9.62it/s] 107it [00:11, 9.70it/s] 108it [00:11, 9.75it/s] 109it [00:11, 9.79it/s] 110it [00:11, 9.26it/s] 111it [00:11, 9.45it/s] 112it [00:11, 9.56it/s] 113it [00:11, 9.66it/s] 114it [00:12, 9.72it/s] 115it [00:12, 9.75it/s] 116it [00:12, 9.05it/s] 117it [00:12, 9.29it/s] 118it [00:12, 9.44it/s] 119it [00:12, 9.46it/s] 120it [00:12, 9.57it/s] 121it [00:12, 9.61it/s] 122it [00:12, 9.64it/s] 123it [00:12, 9.71it/s] 124it [00:13, 9.70it/s] 125it [00:13, 9.73it/s] 126it [00:13, 9.76it/s] 127it [00:13, 9.77it/s] 128it [00:13, 9.81it/s] 129it [00:13, 9.81it/s] 130it [00:13, 9.78it/s] 131it [00:13, 9.72it/s] 132it [00:13, 9.77it/s] 133it [00:14, 9.77it/s] 134it [00:14, 9.78it/s] 135it [00:14, 9.81it/s] 136it [00:14, 9.33it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.60it/s] 139it [00:14, 9.70it/s] 140it [00:14, 9.75it/s] 141it [00:14, 9.78it/s] 142it [00:14, 9.28it/s] 143it [00:15, 9.44it/s] 144it [00:15, 9.55it/s] 145it [00:15, 9.64it/s] 146it [00:15, 9.72it/s] 147it [00:15, 9.59it/s] 148it [00:15, 9.68it/s] 149it [00:15, 9.14it/s] 150it [00:15, 9.33it/s]2025-05-26 04:15:24,872 - INFO - [Epoch 067 | Batch 0150] IWAE-loss 4168.6562 | mean log_px -0.0179 | KL -3215.23 + 151it [00:15, 9.47it/s] 152it [00:15, 9.53it/s] 153it [00:16, 9.62it/s] 154it [00:16, 9.22it/s] 155it [00:16, 9.24it/s] 156it [00:16, 8.76it/s] 157it [00:16, 8.88it/s] 158it [00:16, 9.06it/s] 159it [00:16, 9.24it/s] 160it [00:16, 8.79it/s] 161it [00:17, 9.03it/s] 162it [00:17, 9.20it/s] 163it [00:17, 9.34it/s] 164it [00:17, 9.43it/s] 165it [00:17, 9.50it/s] 166it [00:17, 9.50it/s] 167it [00:17, 9.56it/s] 168it [00:17, 9.60it/s] 169it [00:17, 9.09it/s] 170it [00:17, 9.30it/s] 171it [00:18, 9.48it/s] 172it [00:18, 9.59it/s] 173it [00:18, 9.20it/s] 174it [00:18, 9.40it/s] 175it [00:18, 9.52it/s] 176it [00:18, 9.61it/s] 177it [00:18, 9.70it/s] 178it [00:18, 9.26it/s] 179it [00:18, 9.43it/s] 180it [00:19, 9.56it/s] 181it [00:19, 9.66it/s] 182it [00:19, 9.72it/s] 183it [00:19, 9.78it/s] 184it [00:19, 9.29it/s] 185it [00:19, 9.47it/s] 186it [00:19, 9.57it/s] 187it [00:19, 9.67it/s] 188it [00:19, 9.72it/s] 189it [00:19, 9.77it/s] 190it [00:20, 9.81it/s] 191it [00:20, 9.34it/s] 192it [00:20, 9.48it/s] 193it [00:20, 9.60it/s] 194it [00:20, 9.68it/s] 195it [00:20, 9.16it/s] 196it [00:20, 9.45it/s] +2025-05-26 04:15:29,755 - INFO - Epoch: 67, Objective: tensor([4425.1938], device='cuda:0', grad_fn=), Loss: 0.020734276622533798, KL/n: 65.69780731201172 + 0it [00:00, ?it/s]2025-05-26 04:15:30,247 - INFO - [Epoch 068 | Batch 0000] IWAE-loss 4215.6938 | mean log_px -0.0170 | KL -3219.93 + 1it [00:00, 2.35it/s] 2it [00:00, 4.23it/s] 3it [00:00, 5.69it/s] 4it [00:00, 6.79it/s] 5it [00:00, 7.59it/s] 6it [00:00, 7.83it/s] 7it [00:01, 8.35it/s] 8it [00:01, 8.72it/s] 9it [00:01, 9.01it/s] 10it [00:01, 8.60it/s] 11it [00:01, 8.91it/s] 12it [00:01, 9.15it/s] 13it [00:01, 9.35it/s] 14it [00:01, 8.92it/s] 15it [00:01, 9.18it/s] 16it [00:02, 9.37it/s] 17it [00:02, 9.50it/s] 18it [00:02, 9.02it/s] 19it [00:02, 9.26it/s] 20it [00:02, 9.41it/s] 21it [00:02, 9.51it/s] 22it [00:02, 9.03it/s] 23it [00:02, 9.24it/s] 24it [00:02, 9.39it/s] 25it [00:02, 9.52it/s] 26it [00:03, 9.01it/s] 27it [00:03, 9.27it/s] 28it [00:03, 9.44it/s] 29it [00:03, 9.57it/s] 30it [00:03, 9.17it/s] 31it [00:03, 9.38it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.64it/s] 34it [00:03, 9.23it/s] 35it [00:04, 9.43it/s] 36it [00:04, 9.56it/s] 37it [00:04, 9.18it/s] 38it [00:04, 9.37it/s] 39it [00:04, 9.52it/s] 40it [00:04, 9.62it/s] 41it [00:04, 9.70it/s] 42it [00:04, 9.13it/s] 43it [00:04, 9.28it/s] 44it [00:05, 9.44it/s] 45it [00:05, 9.57it/s] 46it [00:05, 9.66it/s] 47it [00:05, 9.73it/s] 48it [00:05, 9.78it/s] 49it [00:05, 9.19it/s] 50it [00:05, 9.35it/s]2025-05-26 04:15:35,600 - INFO - [Epoch 068 | Batch 0050] IWAE-loss 4135.7124 | mean log_px -0.0192 | KL -3214.93 + 51it [00:05, 9.49it/s] 52it [00:05, 9.61it/s] 53it [00:05, 9.67it/s] 54it [00:06, 9.60it/s] 55it [00:06, 9.63it/s] 56it [00:06, 9.70it/s] 57it [00:06, 9.78it/s] 58it [00:06, 9.80it/s] 59it [00:06, 9.82it/s] 60it [00:06, 9.83it/s] 61it [00:06, 9.85it/s] 62it [00:06, 9.86it/s] 63it [00:06, 9.87it/s] 64it [00:07, 9.85it/s] 65it [00:07, 9.85it/s] 66it [00:07, 9.82it/s] 67it [00:07, 9.85it/s] 68it [00:07, 9.34it/s] 69it [00:07, 9.49it/s] 70it [00:07, 9.51it/s] 71it [00:07, 9.43it/s] 72it [00:07, 9.45it/s] 73it [00:08, 9.44it/s] 74it [00:08, 8.78it/s] 75it [00:08, 8.93it/s] 76it [00:08, 8.66it/s] 77it [00:08, 8.99it/s] 78it [00:08, 9.23it/s] 79it [00:08, 9.40it/s] 80it [00:08, 8.95it/s] 81it [00:08, 9.21it/s] 82it [00:09, 9.36it/s] 83it [00:09, 9.52it/s] 84it [00:09, 9.04it/s] 85it [00:09, 9.30it/s] 86it [00:09, 9.37it/s] 87it [00:09, 9.38it/s] 88it [00:09, 9.03it/s] 89it [00:09, 9.24it/s] 90it [00:09, 9.42it/s] 91it [00:09, 9.55it/s] 92it [00:10, 9.58it/s] 93it [00:10, 9.62it/s] 94it [00:10, 9.50it/s] 95it [00:10, 9.13it/s] 96it [00:10, 9.33it/s] 97it [00:10, 9.49it/s] 98it [00:10, 9.28it/s] 99it [00:10, 9.39it/s] 100it [00:10, 9.47it/s]2025-05-26 04:15:40,894 - INFO - [Epoch 068 | Batch 0100] IWAE-loss 4981.6865 | mean log_px -0.0295 | KL -3210.19 + 101it [00:11, 9.50it/s] 102it [00:11, 9.40it/s] 103it [00:11, 9.43it/s] 104it [00:11, 9.46it/s] 105it [00:11, 9.47it/s] 106it [00:11, 9.49it/s] 107it [00:11, 9.51it/s] 108it [00:11, 9.50it/s] 109it [00:11, 9.51it/s] 110it [00:11, 9.54it/s] 111it [00:12, 9.54it/s] 112it [00:12, 9.52it/s] 113it [00:12, 9.56it/s] 114it [00:12, 9.56it/s] 115it [00:12, 9.20it/s] 116it [00:12, 9.30it/s] 117it [00:12, 9.36it/s] 118it [00:12, 9.43it/s] 119it [00:12, 9.46it/s] 120it [00:13, 9.46it/s] 121it [00:13, 9.48it/s] 122it [00:13, 9.52it/s] 123it [00:13, 9.56it/s] 124it [00:13, 9.54it/s] 125it [00:13, 9.51it/s] 126it [00:13, 9.48it/s] 127it [00:13, 9.50it/s] 128it [00:13, 9.50it/s] 129it [00:14, 9.50it/s] 130it [00:14, 9.46it/s] 131it [00:14, 9.44it/s] 132it [00:14, 9.43it/s] 133it [00:14, 9.40it/s] 134it [00:14, 9.39it/s] 135it [00:14, 9.43it/s] 136it [00:14, 9.40it/s] 137it [00:14, 8.69it/s] 138it [00:14, 8.97it/s] 139it [00:15, 9.22it/s] 140it [00:15, 9.41it/s] 142it [00:15, 9.67it/s] 143it [00:15, 9.75it/s] 144it [00:15, 9.74it/s] 145it [00:15, 9.80it/s] 146it [00:15, 9.79it/s] 147it [00:15, 9.73it/s] 148it [00:16, 9.32it/s] 149it [00:16, 9.50it/s] 150it [00:16, 9.61it/s]2025-05-26 04:15:46,169 - INFO - [Epoch 068 | Batch 0150] IWAE-loss 3965.0554 | mean log_px -0.0127 | KL -3208.22 + 151it [00:16, 9.07it/s] 152it [00:16, 9.29it/s] 153it [00:16, 9.40it/s] 154it [00:16, 9.54it/s] 156it [00:16, 9.73it/s] 157it [00:16, 9.77it/s] 158it [00:17, 9.80it/s] 159it [00:17, 9.79it/s] 160it [00:17, 9.76it/s] 161it [00:17, 9.71it/s] 162it [00:17, 9.78it/s] 163it [00:17, 9.80it/s] 164it [00:17, 9.78it/s] 165it [00:17, 9.80it/s] 166it [00:17, 9.85it/s] 167it [00:17, 9.85it/s] 168it [00:18, 9.88it/s] 169it [00:18, 9.88it/s] 170it [00:18, 9.34it/s] 172it [00:18, 9.62it/s] 173it [00:18, 9.69it/s] 174it [00:18, 9.76it/s] 175it [00:18, 9.77it/s] 176it [00:18, 9.81it/s] 177it [00:19, 9.81it/s] 178it [00:19, 9.86it/s] 179it [00:19, 9.90it/s] 180it [00:19, 9.92it/s] 181it [00:19, 9.91it/s] 182it [00:19, 9.93it/s] 183it [00:19, 9.44it/s] 184it [00:19, 9.57it/s] 185it [00:19, 9.68it/s] 186it [00:19, 9.76it/s] 187it [00:20, 9.83it/s] 188it [00:20, 9.86it/s] 189it [00:20, 9.86it/s] 190it [00:20, 9.88it/s] 191it [00:20, 9.90it/s] 192it [00:20, 9.91it/s] 193it [00:20, 9.29it/s] 194it [00:20, 9.42it/s] 195it [00:20, 9.07it/s] 196it [00:20, 8.95it/s] 196it [00:21, 9.31it/s] +2025-05-26 04:15:50,941 - INFO - Epoch: 68, Objective: tensor([4401.1167], device='cuda:0', grad_fn=), Loss: 0.016813162714242935, KL/n: 65.4537582397461 + 0it [00:00, ?it/s]2025-05-26 04:15:51,227 - INFO - [Epoch 069 | Batch 0000] IWAE-loss 3877.0161 | mean log_px -0.0104 | KL -3203.73 + 1it [00:00, 5.40it/s] 2it [00:00, 6.84it/s] 4it [00:00, 8.47it/s] 6it [00:00, 9.18it/s] 8it [00:00, 9.50it/s] 10it [00:01, 9.40it/s] 11it [00:01, 9.50it/s] 12it [00:01, 9.61it/s] 14it [00:01, 9.79it/s] 16it [00:01, 9.87it/s] 18it [00:01, 9.89it/s] 19it [00:02, 9.38it/s] 20it [00:02, 9.13it/s] 21it [00:02, 9.09it/s] 22it [00:02, 9.18it/s] 23it [00:02, 9.33it/s] 24it [00:02, 9.41it/s] 25it [00:02, 9.48it/s] 26it [00:02, 9.45it/s] 27it [00:02, 9.49it/s] 28it [00:03, 9.62it/s] 29it [00:03, 9.13it/s] 31it [00:03, 9.55it/s] 33it [00:03, 9.76it/s] 35it [00:03, 9.88it/s] 37it [00:03, 9.93it/s] 38it [00:04, 9.93it/s] 39it [00:04, 9.94it/s] 41it [00:04, 9.88it/s] 42it [00:04, 9.54it/s] 43it [00:04, 9.63it/s] 44it [00:04, 9.71it/s] 46it [00:04, 9.42it/s] 47it [00:04, 9.53it/s] 48it [00:05, 9.64it/s] 50it [00:05, 9.82it/s]2025-05-26 04:15:56,414 - INFO - [Epoch 069 | Batch 0050] IWAE-loss 3863.5151 | mean log_px -0.0112 | KL -3199.91 + 51it [00:05, 9.85it/s] 52it [00:05, 9.14it/s] 53it [00:05, 9.19it/s] 54it [00:05, 9.21it/s] 55it [00:05, 9.22it/s] 56it [00:05, 9.42it/s] 58it [00:06, 9.69it/s] 60it [00:06, 9.83it/s] 62it [00:06, 9.91it/s] 64it [00:06, 9.97it/s] 65it [00:06, 9.93it/s] 67it [00:07, 9.97it/s] 68it [00:07, 9.97it/s] 70it [00:07, 10.01it/s] 71it [00:07, 9.92it/s] 72it [00:07, 9.90it/s] 73it [00:07, 9.85it/s] 75it [00:07, 9.94it/s] 77it [00:08, 9.99it/s] 79it [00:08, 10.02it/s] 81it [00:08, 9.98it/s] 82it [00:08, 9.90it/s] 84it [00:08, 9.94it/s] 86it [00:08, 9.99it/s] 88it [00:09, 10.01it/s] 89it [00:09, 10.01it/s] 90it [00:09, 10.00it/s] 92it [00:09, 10.02it/s] 94it [00:09, 10.03it/s] 96it [00:09, 10.04it/s] 98it [00:10, 10.05it/s] 100it [00:10, 10.07it/s]2025-05-26 04:16:01,468 - INFO - [Epoch 069 | Batch 0100] IWAE-loss 3742.5066 | mean log_px -0.0079 | KL -3197.15 + 102it [00:10, 9.71it/s] 104it [00:10, 9.82it/s] 105it [00:10, 9.84it/s] 106it [00:10, 9.86it/s] 107it [00:11, 9.82it/s] 108it [00:11, 9.86it/s] 110it [00:11, 9.95it/s] 112it [00:11, 9.99it/s] 114it [00:11, 10.01it/s] 116it [00:11, 10.04it/s] 118it [00:12, 10.06it/s] 120it [00:12, 10.06it/s] 122it [00:12, 10.07it/s] 124it [00:12, 10.08it/s] 126it [00:12, 10.09it/s] 128it [00:13, 10.08it/s] 130it [00:13, 10.07it/s] 132it [00:13, 9.69it/s] 134it [00:13, 9.80it/s] 136it [00:13, 9.87it/s] 138it [00:14, 9.95it/s] 140it [00:14, 9.97it/s] 142it [00:14, 10.00it/s] 144it [00:14, 9.75it/s] 145it [00:14, 9.77it/s] 146it [00:14, 9.80it/s] 148it [00:15, 9.89it/s] 150it [00:15, 9.95it/s]2025-05-26 04:16:06,513 - INFO - [Epoch 069 | Batch 0150] IWAE-loss 4124.4932 | mean log_px -0.0141 | KL -3199.10 + 151it [00:15, 9.51it/s] 152it [00:15, 9.56it/s] 153it [00:15, 9.58it/s] 154it [00:15, 9.61it/s] 155it [00:15, 9.63it/s] 156it [00:16, 9.53it/s] 157it [00:16, 9.44it/s] 158it [00:16, 9.00it/s] 159it [00:16, 9.10it/s] 160it [00:16, 8.80it/s] 161it [00:16, 9.01it/s] 162it [00:16, 9.22it/s] 163it [00:16, 9.39it/s] 164it [00:16, 9.50it/s] 165it [00:16, 9.60it/s] 166it [00:17, 9.64it/s] 167it [00:17, 9.30it/s] 168it [00:17, 9.44it/s] 169it [00:17, 9.53it/s] 170it [00:17, 9.58it/s] 171it [00:17, 9.63it/s] 172it [00:17, 9.27it/s] 173it [00:17, 9.37it/s] 174it [00:17, 9.34it/s] 175it [00:18, 9.44it/s] 176it [00:18, 9.52it/s] 177it [00:18, 9.07it/s] 178it [00:18, 9.27it/s] 179it [00:18, 9.43it/s] 180it [00:18, 8.99it/s] 181it [00:18, 9.19it/s] 182it [00:18, 9.21it/s] 183it [00:18, 9.36it/s] 184it [00:19, 8.94it/s] 185it [00:19, 9.15it/s] 186it [00:19, 9.31it/s] 187it [00:19, 8.92it/s] 188it [00:19, 9.15it/s] 189it [00:19, 9.32it/s] 190it [00:19, 8.94it/s] 191it [00:19, 9.16it/s] 192it [00:19, 9.34it/s] 193it [00:20, 8.95it/s] 194it [00:20, 9.17it/s] 195it [00:20, 8.84it/s] 196it [00:20, 9.60it/s] +2025-05-26 04:16:11,492 - INFO - Epoch: 69, Objective: tensor([5429.6377], device='cuda:0', grad_fn=), Loss: 0.039554789662361145, KL/n: 65.18160247802734 + 0it [00:00, ?it/s]2025-05-26 04:16:11,945 - INFO - [Epoch 070 | Batch 0000] IWAE-loss 3927.8982 | mean log_px -0.0122 | KL -3190.02 + 1it [00:00, 5.58it/s] 2it [00:00, 7.51it/s] 3it [00:00, 8.45it/s] 4it [00:00, 8.96it/s] 5it [00:00, 9.29it/s] 6it [00:00, 9.48it/s] 7it [00:00, 9.62it/s] 8it [00:00, 9.69it/s] 9it [00:00, 9.77it/s] 10it [00:01, 9.81it/s] 11it [00:01, 9.81it/s] 12it [00:01, 9.83it/s] 13it [00:01, 9.85it/s] 14it [00:01, 9.86it/s] 15it [00:01, 9.89it/s] 16it [00:01, 9.88it/s] 17it [00:01, 9.89it/s] 18it [00:01, 9.88it/s] 19it [00:01, 9.89it/s] 20it [00:02, 9.89it/s] 21it [00:02, 9.91it/s] 22it [00:02, 9.75it/s] 23it [00:02, 9.67it/s] 24it [00:02, 9.62it/s] 25it [00:02, 9.56it/s] 26it [00:02, 9.56it/s] 27it [00:02, 9.55it/s] 28it [00:02, 9.53it/s] 29it [00:03, 9.49it/s] 30it [00:03, 9.53it/s] 31it [00:03, 9.57it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.52it/s] 34it [00:03, 9.57it/s] 35it [00:03, 9.57it/s] 36it [00:03, 9.52it/s] 37it [00:03, 9.47it/s] 38it [00:03, 9.47it/s] 39it [00:04, 9.45it/s] 40it [00:04, 9.30it/s] 41it [00:04, 9.48it/s] 42it [00:04, 9.60it/s] 43it [00:04, 9.70it/s] 44it [00:04, 9.77it/s] 45it [00:04, 9.84it/s] 46it [00:04, 9.86it/s] 47it [00:04, 9.87it/s] 48it [00:05, 9.61it/s] 49it [00:05, 9.70it/s] 50it [00:05, 9.70it/s]2025-05-26 04:16:17,094 - INFO - [Epoch 070 | Batch 0050] IWAE-loss 4088.9717 | mean log_px -0.0128 | KL -3193.53 + 51it [00:05, 9.75it/s] 52it [00:05, 9.80it/s] 53it [00:05, 9.84it/s] 54it [00:05, 9.85it/s] 55it [00:05, 9.86it/s] 56it [00:05, 9.87it/s] 57it [00:05, 9.89it/s] 58it [00:06, 9.89it/s] 59it [00:06, 9.90it/s] 60it [00:06, 9.90it/s] 61it [00:06, 9.91it/s] 62it [00:06, 9.91it/s] 63it [00:06, 9.92it/s] 64it [00:06, 9.91it/s] 65it [00:06, 9.92it/s] 66it [00:06, 9.91it/s] 67it [00:06, 9.90it/s] 68it [00:07, 9.90it/s] 69it [00:07, 9.90it/s] 70it [00:07, 9.89it/s] 71it [00:07, 9.87it/s] 72it [00:07, 9.89it/s] 73it [00:07, 9.90it/s] 74it [00:07, 9.88it/s] 75it [00:07, 9.90it/s] 76it [00:07, 9.89it/s] 77it [00:07, 9.89it/s] 78it [00:08, 9.89it/s] 79it [00:08, 9.90it/s] 80it [00:08, 9.90it/s] 81it [00:08, 9.92it/s] 82it [00:08, 9.89it/s] 83it [00:08, 9.87it/s] 84it [00:08, 9.87it/s] 85it [00:08, 9.89it/s] 86it [00:08, 9.88it/s] 87it [00:08, 9.89it/s] 88it [00:09, 9.89it/s] 89it [00:09, 9.90it/s] 90it [00:09, 9.89it/s] 91it [00:09, 9.90it/s] 92it [00:09, 9.86it/s] 93it [00:09, 9.72it/s] 94it [00:09, 9.71it/s] 95it [00:09, 9.77it/s] 96it [00:09, 9.80it/s] 97it [00:09, 9.84it/s] 98it [00:10, 9.85it/s] 99it [00:10, 9.87it/s] 100it [00:10, 9.85it/s]2025-05-26 04:16:22,155 - INFO - [Epoch 070 | Batch 0100] IWAE-loss 4525.4941 | mean log_px -0.0213 | KL -3186.68 + 101it [00:10, 9.86it/s] 102it [00:10, 9.86it/s] 103it [00:10, 9.86it/s] 104it [00:10, 9.87it/s] 105it [00:10, 9.88it/s] 106it [00:10, 9.88it/s] 107it [00:10, 9.89it/s] 108it [00:11, 9.89it/s] 109it [00:11, 9.90it/s] 110it [00:11, 9.89it/s] 111it [00:11, 9.75it/s] 112it [00:11, 9.73it/s] 113it [00:11, 9.76it/s] 114it [00:11, 9.79it/s] 115it [00:11, 9.82it/s] 116it [00:11, 9.84it/s] 117it [00:12, 9.86it/s] 118it [00:12, 9.85it/s] 119it [00:12, 9.86it/s] 120it [00:12, 9.87it/s] 121it [00:12, 9.87it/s] 122it [00:12, 9.86it/s] 123it [00:12, 9.88it/s] 124it [00:12, 9.86it/s] 125it [00:12, 9.63it/s] 126it [00:12, 9.59it/s] 127it [00:13, 9.68it/s] 128it [00:13, 9.73it/s] 129it [00:13, 9.68it/s] 130it [00:13, 9.73it/s] 131it [00:13, 9.77it/s] 132it [00:13, 9.81it/s] 133it [00:13, 9.84it/s] 134it [00:13, 9.85it/s] 135it [00:13, 9.84it/s] 136it [00:13, 9.85it/s] 137it [00:14, 9.86it/s] 138it [00:14, 9.86it/s] 139it [00:14, 9.85it/s] 140it [00:14, 9.85it/s] 141it [00:14, 9.87it/s] 142it [00:14, 9.86it/s] 143it [00:14, 9.86it/s] 144it [00:14, 9.87it/s] 145it [00:14, 9.88it/s] 146it [00:14, 9.89it/s] 147it [00:15, 9.90it/s] 148it [00:15, 9.90it/s] 149it [00:15, 9.90it/s] 150it [00:15, 9.90it/s]2025-05-26 04:16:27,240 - INFO - [Epoch 070 | Batch 0150] IWAE-loss 3830.5117 | mean log_px -0.0118 | KL -3191.07 + 151it [00:15, 9.86it/s] 152it [00:15, 9.86it/s] 153it [00:15, 9.86it/s] 154it [00:15, 9.87it/s] 155it [00:15, 9.88it/s] 156it [00:15, 9.86it/s] 157it [00:16, 9.86it/s] 158it [00:16, 9.86it/s] 159it [00:16, 9.73it/s] 160it [00:16, 9.52it/s] 161it [00:16, 9.46it/s] 162it [00:16, 9.56it/s] 163it [00:16, 9.67it/s] 164it [00:16, 9.73it/s] 165it [00:16, 9.78it/s] 166it [00:17, 9.80it/s] 167it [00:17, 9.59it/s] 168it [00:17, 9.67it/s] 169it [00:17, 9.74it/s] 170it [00:17, 9.78it/s] 171it [00:17, 9.80it/s] 172it [00:17, 9.82it/s] 173it [00:17, 9.85it/s] 174it [00:17, 9.85it/s] 175it [00:17, 9.89it/s] 176it [00:18, 9.88it/s] 177it [00:18, 9.89it/s] 178it [00:18, 9.89it/s] 179it [00:18, 9.90it/s] 180it [00:18, 9.88it/s] 181it [00:18, 9.88it/s] 182it [00:18, 9.87it/s] 183it [00:18, 9.88it/s] 184it [00:18, 9.88it/s] 185it [00:18, 9.88it/s] 186it [00:19, 9.87it/s] 187it [00:19, 9.89it/s] 188it [00:19, 9.88it/s] 189it [00:19, 9.90it/s] 190it [00:19, 9.89it/s] 191it [00:19, 9.90it/s] 192it [00:19, 9.90it/s] 193it [00:19, 9.90it/s] 194it [00:19, 9.90it/s] 195it [00:19, 9.26it/s] 196it [00:20, 9.73it/s] +2025-05-26 04:16:31,950 - INFO - Epoch: 70, Objective: tensor([4718.2910], device='cuda:0', grad_fn=), Loss: 0.02613232657313347, KL/n: 64.95722961425781 + 0it [00:00, ?it/s]2025-05-26 04:16:32,218 - INFO - [Epoch 071 | Batch 0000] IWAE-loss 4098.5879 | mean log_px -0.0153 | KL -3181.93 + 1it [00:00, 4.85it/s] 2it [00:00, 6.91it/s] 3it [00:00, 8.01it/s] 4it [00:00, 8.66it/s] 5it [00:00, 8.41it/s] 6it [00:00, 8.84it/s] 7it [00:00, 9.07it/s] 8it [00:00, 9.25it/s] 9it [00:01, 9.43it/s] 10it [00:01, 9.56it/s] 11it [00:01, 9.07it/s] 12it [00:01, 9.27it/s] 13it [00:01, 9.41it/s] 14it [00:01, 9.54it/s] 15it [00:01, 9.64it/s] 16it [00:01, 9.70it/s] 17it [00:01, 9.76it/s] 18it [00:01, 9.80it/s] 19it [00:02, 9.83it/s] 20it [00:02, 9.84it/s] 21it [00:02, 9.86it/s] 22it [00:02, 9.85it/s] 23it [00:02, 9.85it/s] 24it [00:02, 9.83it/s] 25it [00:02, 9.84it/s] 26it [00:02, 9.85it/s] 27it [00:02, 9.86it/s] 28it [00:02, 9.86it/s] 29it [00:03, 9.88it/s] 30it [00:03, 9.87it/s] 31it [00:03, 9.87it/s] 32it [00:03, 9.87it/s] 33it [00:03, 9.88it/s] 34it [00:03, 9.87it/s] 35it [00:03, 9.87it/s] 36it [00:03, 9.87it/s] 37it [00:03, 9.89it/s] 38it [00:04, 9.88it/s] 39it [00:04, 9.88it/s] 40it [00:04, 9.87it/s] 41it [00:04, 9.88it/s] 42it [00:04, 9.87it/s] 43it [00:04, 9.88it/s] 44it [00:04, 9.87it/s] 45it [00:04, 9.89it/s] 46it [00:04, 9.88it/s] 47it [00:04, 9.89it/s] 48it [00:05, 9.87it/s] 49it [00:05, 9.88it/s] 50it [00:05, 9.86it/s]2025-05-26 04:16:37,365 - INFO - [Epoch 071 | Batch 0050] IWAE-loss 3795.4751 | mean log_px -0.0104 | KL -3178.03 + 51it [00:05, 9.85it/s] 52it [00:05, 9.64it/s] 53it [00:05, 9.60it/s] 54it [00:05, 9.56it/s] 55it [00:05, 9.53it/s] 56it [00:05, 9.54it/s] 57it [00:05, 9.50it/s] 58it [00:06, 9.48it/s] 59it [00:06, 9.45it/s] 60it [00:06, 9.47it/s] 61it [00:06, 9.54it/s] 62it [00:06, 9.56it/s] 63it [00:06, 9.58it/s] 64it [00:06, 9.55it/s] 65it [00:06, 9.48it/s] 66it [00:06, 9.49it/s] 67it [00:07, 9.51it/s] 68it [00:07, 9.52it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.51it/s] 71it [00:07, 9.50it/s] 72it [00:07, 9.34it/s] 73it [00:07, 9.31it/s] 74it [00:07, 9.35it/s] 75it [00:07, 9.36it/s] 76it [00:07, 9.38it/s] 77it [00:08, 9.38it/s] 78it [00:08, 9.06it/s] 79it [00:08, 9.15it/s] 80it [00:08, 9.06it/s] 81it [00:08, 9.13it/s] 82it [00:08, 9.20it/s] 83it [00:08, 9.27it/s] 84it [00:08, 9.30it/s] 85it [00:08, 9.34it/s] 86it [00:09, 9.39it/s] 87it [00:09, 9.40it/s] 88it [00:09, 9.41it/s] 89it [00:09, 9.45it/s] 90it [00:09, 9.39it/s] 91it [00:09, 9.38it/s] 92it [00:09, 9.36it/s] 93it [00:09, 9.39it/s] 94it [00:09, 9.40it/s] 95it [00:10, 9.42it/s] 96it [00:10, 9.54it/s] 97it [00:10, 9.65it/s] 98it [00:10, 9.72it/s] 99it [00:10, 9.76it/s] 100it [00:10, 9.78it/s]2025-05-26 04:16:42,660 - INFO - [Epoch 071 | Batch 0100] IWAE-loss 3703.3640 | mean log_px -0.0093 | KL -3174.69 + 101it [00:10, 9.80it/s] 102it [00:10, 9.81it/s] 103it [00:10, 9.82it/s] 104it [00:10, 9.84it/s] 105it [00:11, 9.86it/s] 106it [00:11, 9.87it/s] 107it [00:11, 9.86it/s] 108it [00:11, 9.86it/s] 109it [00:11, 9.87it/s] 110it [00:11, 9.86it/s] 111it [00:11, 9.87it/s] 112it [00:11, 9.87it/s] 113it [00:11, 9.86it/s] 114it [00:11, 9.86it/s] 115it [00:12, 9.70it/s] 116it [00:12, 9.76it/s] 117it [00:12, 9.80it/s] 118it [00:12, 9.81it/s] 119it [00:12, 9.84it/s] 120it [00:12, 9.82it/s] 121it [00:12, 9.84it/s] 122it [00:12, 9.81it/s] 123it [00:12, 9.83it/s] 124it [00:12, 9.82it/s] 125it [00:13, 9.85it/s] 126it [00:13, 9.84it/s] 127it [00:13, 9.80it/s] 128it [00:13, 9.82it/s] 129it [00:13, 9.84it/s] 130it [00:13, 9.85it/s] 131it [00:13, 9.87it/s] 132it [00:13, 9.84it/s] 133it [00:13, 9.86it/s] 134it [00:13, 9.86it/s] 135it [00:14, 9.79it/s] 136it [00:14, 9.81it/s] 137it [00:14, 9.83it/s] 138it [00:14, 9.82it/s] 139it [00:14, 9.84it/s] 140it [00:14, 9.83it/s] 141it [00:14, 9.83it/s] 142it [00:14, 9.83it/s] 143it [00:14, 9.84it/s] 144it [00:14, 9.85it/s] 145it [00:15, 9.86it/s] 146it [00:15, 9.85it/s] 147it [00:15, 9.87it/s] 148it [00:15, 9.87it/s] 149it [00:15, 9.67it/s] 150it [00:15, 9.72it/s]2025-05-26 04:16:47,748 - INFO - [Epoch 071 | Batch 0150] IWAE-loss 3954.1804 | mean log_px -0.0154 | KL -3167.20 + 151it [00:15, 9.75it/s] 152it [00:15, 9.79it/s] 153it [00:15, 9.81it/s] 154it [00:16, 9.82it/s] 155it [00:16, 9.85it/s] 156it [00:16, 9.83it/s] 157it [00:16, 9.85it/s] 158it [00:16, 9.85it/s] 159it [00:16, 9.86it/s] 160it [00:16, 9.86it/s] 161it [00:16, 9.29it/s] 162it [00:16, 9.45it/s] 163it [00:16, 9.56it/s] 164it [00:17, 9.65it/s] 165it [00:17, 9.72it/s] 166it [00:17, 9.77it/s] 167it [00:17, 9.80it/s] 168it [00:17, 9.70it/s] 169it [00:17, 9.73it/s] 170it [00:17, 9.76it/s] 171it [00:17, 9.79it/s] 172it [00:17, 9.80it/s] 173it [00:17, 9.81it/s] 174it [00:18, 9.81it/s] 175it [00:18, 9.80it/s] 176it [00:18, 9.80it/s] 177it [00:18, 9.83it/s] 178it [00:18, 9.83it/s] 179it [00:18, 9.83it/s] 180it [00:18, 9.84it/s] 181it [00:18, 9.84it/s] 182it [00:18, 9.83it/s] 183it [00:18, 9.86it/s] 184it [00:19, 9.87it/s] 185it [00:19, 9.89it/s] 186it [00:19, 9.89it/s] 187it [00:19, 9.90it/s] 188it [00:19, 9.90it/s] 189it [00:19, 9.90it/s] 190it [00:19, 9.89it/s] 191it [00:19, 9.85it/s] 192it [00:19, 9.84it/s] 193it [00:19, 9.87it/s] 194it [00:20, 9.85it/s] 195it [00:20, 9.22it/s] 196it [00:20, 8.91it/s] 196it [00:20, 9.61it/s] +2025-05-26 04:16:52,480 - INFO - Epoch: 71, Objective: tensor([4948.8066], device='cuda:0', grad_fn=), Loss: 0.03435065969824791, KL/n: 64.70899200439453 + 0it [00:00, ?it/s]2025-05-26 04:16:52,945 - INFO - [Epoch 072 | Batch 0000] IWAE-loss 4508.8237 | mean log_px -0.0191 | KL -3173.76 + 1it [00:00, 5.51it/s] 2it [00:00, 7.44it/s] 3it [00:00, 8.38it/s] 4it [00:00, 8.84it/s] 5it [00:00, 9.17it/s] 6it [00:00, 9.36it/s] 7it [00:00, 9.43it/s] 8it [00:00, 9.50it/s] 9it [00:01, 9.60it/s] 10it [00:01, 9.65it/s] 11it [00:01, 9.72it/s] 12it [00:01, 9.69it/s] 13it [00:01, 9.68it/s] 14it [00:01, 9.15it/s] 15it [00:01, 9.31it/s] 16it [00:01, 9.43it/s] 17it [00:01, 9.53it/s] 18it [00:01, 9.08it/s] 19it [00:02, 9.28it/s] 20it [00:02, 9.42it/s] 21it [00:02, 8.91it/s] 22it [00:02, 9.12it/s] 23it [00:02, 9.32it/s] 24it [00:02, 8.90it/s] 25it [00:02, 9.02it/s] 26it [00:02, 9.19it/s] 27it [00:02, 9.32it/s] 28it [00:03, 8.93it/s] 29it [00:03, 9.14it/s] 30it [00:03, 9.31it/s] 31it [00:03, 8.92it/s] 32it [00:03, 9.12it/s] 33it [00:03, 9.28it/s] 34it [00:03, 8.91it/s] 35it [00:03, 9.15it/s] 36it [00:03, 9.28it/s] 37it [00:04, 8.93it/s] 38it [00:04, 9.01it/s] 39it [00:04, 9.15it/s] 40it [00:04, 8.77it/s] 41it [00:04, 8.94it/s] 42it [00:04, 9.08it/s] 43it [00:04, 9.17it/s] 44it [00:04, 8.80it/s] 45it [00:04, 8.96it/s] 46it [00:05, 9.09it/s] 47it [00:05, 9.15it/s] 48it [00:05, 8.77it/s] 49it [00:05, 8.94it/s] 50it [00:05, 9.11it/s]2025-05-26 04:16:58,361 - INFO - [Epoch 072 | Batch 0050] IWAE-loss 4654.4067 | mean log_px -0.0212 | KL -3164.67 + 51it [00:05, 9.24it/s] 52it [00:05, 8.84it/s] 53it [00:05, 8.99it/s] 54it [00:05, 9.15it/s] 55it [00:06, 8.78it/s] 56it [00:06, 8.97it/s] 57it [00:06, 9.09it/s] 58it [00:06, 9.21it/s] 59it [00:06, 8.80it/s] 60it [00:06, 8.90it/s] 61it [00:06, 8.78it/s] 62it [00:06, 8.82it/s] 63it [00:06, 8.59it/s] 64it [00:07, 8.85it/s] 65it [00:07, 9.02it/s] 66it [00:07, 9.16it/s] 67it [00:07, 8.81it/s] 68it [00:07, 8.95it/s] 69it [00:07, 8.88it/s] 70it [00:07, 8.58it/s] 71it [00:07, 8.79it/s] 72it [00:07, 8.95it/s] 73it [00:08, 9.13it/s] 74it [00:08, 8.73it/s] 75it [00:08, 8.88it/s] 76it [00:08, 8.93it/s] 77it [00:08, 9.00it/s] 78it [00:08, 8.68it/s] 79it [00:08, 8.91it/s] 80it [00:08, 9.03it/s] 81it [00:08, 9.17it/s] 82it [00:09, 8.80it/s] 83it [00:09, 8.93it/s] 84it [00:09, 9.04it/s] 85it [00:09, 9.21it/s] 86it [00:09, 8.83it/s] 87it [00:09, 9.00it/s] 88it [00:09, 9.11it/s] 89it [00:09, 9.22it/s] 90it [00:09, 8.82it/s] 91it [00:10, 8.98it/s] 92it [00:10, 9.08it/s] 93it [00:10, 9.19it/s] 94it [00:10, 8.81it/s] 95it [00:10, 9.00it/s] 96it [00:10, 9.11it/s] 97it [00:10, 9.20it/s] 98it [00:10, 8.81it/s] 99it [00:10, 8.96it/s] 100it [00:11, 9.09it/s]2025-05-26 04:17:03,948 - INFO - [Epoch 072 | Batch 0100] IWAE-loss 5721.9814 | mean log_px -0.0405 | KL -3163.68 + 101it [00:11, 9.19it/s] 102it [00:11, 8.79it/s] 103it [00:11, 9.00it/s] 104it [00:11, 9.09it/s] 105it [00:11, 9.24it/s] 106it [00:11, 8.86it/s] 107it [00:11, 9.02it/s] 108it [00:11, 9.16it/s] 109it [00:12, 9.20it/s] 110it [00:12, 8.79it/s] 111it [00:12, 8.96it/s] 112it [00:12, 9.12it/s] 113it [00:12, 9.21it/s] 114it [00:12, 8.80it/s] 115it [00:12, 8.97it/s] 116it [00:12, 9.07it/s] 117it [00:12, 9.15it/s] 118it [00:13, 8.79it/s] 119it [00:13, 8.97it/s] 120it [00:13, 9.10it/s] 121it [00:13, 9.18it/s] 122it [00:13, 8.76it/s] 123it [00:13, 8.90it/s] 124it [00:13, 9.05it/s] 125it [00:13, 9.16it/s] 126it [00:13, 8.79it/s] 127it [00:14, 8.82it/s] 128it [00:14, 9.05it/s] 129it [00:14, 9.03it/s] 130it [00:14, 8.66it/s] 131it [00:14, 8.82it/s] 132it [00:14, 8.94it/s] 133it [00:14, 8.93it/s] 134it [00:14, 8.21it/s] 135it [00:15, 8.39it/s] 136it [00:15, 8.60it/s] 137it [00:15, 8.72it/s] 138it [00:15, 8.39it/s] 139it [00:15, 8.57it/s] 140it [00:15, 8.25it/s] 141it [00:15, 8.53it/s] 142it [00:15, 8.70it/s] 143it [00:15, 8.81it/s] 144it [00:16, 8.45it/s] 145it [00:16, 8.66it/s] 146it [00:16, 8.81it/s] 147it [00:16, 8.58it/s] 148it [00:16, 8.91it/s] 149it [00:16, 9.17it/s] 150it [00:16, 9.34it/s]2025-05-26 04:17:09,580 - INFO - [Epoch 072 | Batch 0150] IWAE-loss 4235.5010 | mean log_px -0.0156 | KL -3162.35 + 151it [00:16, 8.93it/s] 152it [00:16, 9.18it/s] 153it [00:17, 9.38it/s] 154it [00:17, 9.53it/s] 155it [00:17, 9.04it/s] 156it [00:17, 9.24it/s] 157it [00:17, 8.98it/s] 158it [00:17, 9.19it/s] 159it [00:17, 9.36it/s] 160it [00:17, 8.93it/s] 161it [00:17, 9.17it/s] 162it [00:18, 9.35it/s] 163it [00:18, 8.98it/s] 164it [00:18, 9.21it/s] 165it [00:18, 9.38it/s] 166it [00:18, 8.96it/s] 167it [00:18, 9.23it/s] 168it [00:18, 9.39it/s] 169it [00:18, 9.46it/s] 170it [00:18, 9.00it/s] 171it [00:18, 9.23it/s] 172it [00:19, 9.39it/s] 173it [00:19, 9.53it/s] 174it [00:19, 9.06it/s] 175it [00:19, 9.26it/s] 176it [00:19, 9.39it/s] 177it [00:19, 9.51it/s] 178it [00:19, 9.04it/s] 179it [00:19, 9.25it/s] 180it [00:19, 9.42it/s] 181it [00:20, 9.52it/s] 182it [00:20, 8.98it/s] 183it [00:20, 9.21it/s] 184it [00:20, 9.36it/s] 185it [00:20, 9.46it/s] 186it [00:20, 9.01it/s] 187it [00:20, 9.24it/s] 188it [00:20, 9.41it/s] 189it [00:20, 9.53it/s] 190it [00:21, 9.03it/s] 191it [00:21, 9.23it/s] 192it [00:21, 9.41it/s] 193it [00:21, 9.55it/s] 194it [00:21, 9.08it/s] 195it [00:21, 8.82it/s] 196it [00:21, 9.01it/s] +2025-05-26 04:17:14,567 - INFO - Epoch: 72, Objective: tensor([3779.6716], device='cuda:0', grad_fn=), Loss: 0.01213796902447939, KL/n: 64.47173309326172 + 0it [00:00, ?it/s]2025-05-26 04:17:14,839 - INFO - [Epoch 073 | Batch 0000] IWAE-loss 4182.9614 | mean log_px -0.0191 | KL -3160.06 + 1it [00:00, 4.82it/s] 3it [00:00, 7.86it/s] 5it [00:00, 8.85it/s] 6it [00:00, 9.12it/s] 8it [00:00, 9.51it/s] 9it [00:01, 9.13it/s] 11it [00:01, 9.48it/s] 12it [00:01, 9.59it/s] 14it [00:01, 9.77it/s] 16it [00:01, 9.88it/s] 18it [00:01, 9.96it/s] 20it [00:02, 10.00it/s] 22it [00:02, 10.02it/s] 24it [00:02, 10.00it/s] 26it [00:02, 10.01it/s] 28it [00:02, 9.69it/s] 29it [00:03, 9.74it/s] 30it [00:03, 9.78it/s] 32it [00:03, 9.87it/s] 34it [00:03, 9.90it/s] 35it [00:03, 9.77it/s] 36it [00:03, 9.44it/s] 38it [00:03, 9.68it/s] 40it [00:04, 9.81it/s] 41it [00:04, 9.84it/s] 42it [00:04, 9.87it/s] 43it [00:04, 9.90it/s] 45it [00:04, 9.96it/s] 46it [00:04, 9.96it/s] 47it [00:04, 9.96it/s] 48it [00:04, 9.46it/s] 50it [00:05, 9.70it/s]2025-05-26 04:17:19,946 - INFO - [Epoch 073 | Batch 0050] IWAE-loss 4043.1121 | mean log_px -0.0134 | KL -3153.70 + 51it [00:05, 9.26it/s] 53it [00:05, 9.57it/s] 54it [00:05, 9.64it/s] 56it [00:05, 9.81it/s] 58it [00:06, 9.90it/s] 59it [00:06, 9.90it/s] 61it [00:06, 9.98it/s] 62it [00:06, 9.51it/s] 64it [00:06, 9.70it/s] 65it [00:06, 9.75it/s] 66it [00:06, 9.78it/s] 67it [00:06, 9.30it/s] 68it [00:07, 9.46it/s] 70it [00:07, 9.70it/s] 72it [00:07, 9.80it/s] 74it [00:07, 9.90it/s] 76it [00:07, 9.93it/s] 78it [00:08, 9.96it/s] 79it [00:08, 9.95it/s] 80it [00:08, 9.95it/s] 82it [00:08, 9.64it/s] 83it [00:08, 9.66it/s] 84it [00:08, 9.68it/s] 85it [00:08, 9.71it/s] 86it [00:08, 9.73it/s] 87it [00:09, 9.23it/s] 88it [00:09, 9.41it/s] 89it [00:09, 9.44it/s] 90it [00:09, 9.52it/s] 91it [00:09, 9.59it/s] 92it [00:09, 9.62it/s] 93it [00:09, 9.67it/s] 94it [00:09, 9.24it/s] 95it [00:09, 9.41it/s] 96it [00:09, 9.52it/s] 98it [00:10, 9.74it/s] 100it [00:10, 9.83it/s]2025-05-26 04:17:25,104 - INFO - [Epoch 073 | Batch 0100] IWAE-loss 4164.0747 | mean log_px -0.0208 | KL -3156.93 + 101it [00:10, 9.39it/s] 103it [00:10, 9.33it/s] 105it [00:10, 9.58it/s] 107it [00:11, 9.74it/s] 108it [00:11, 9.78it/s] 110it [00:11, 9.89it/s] 112it [00:11, 9.96it/s] 114it [00:11, 9.99it/s] 116it [00:11, 10.03it/s] 118it [00:12, 10.04it/s] 120it [00:12, 10.03it/s] 122it [00:12, 10.05it/s] 124it [00:12, 10.06it/s] 126it [00:12, 10.08it/s] 128it [00:13, 10.09it/s] 130it [00:13, 10.07it/s] 132it [00:13, 10.07it/s] 134it [00:13, 10.06it/s] 136it [00:13, 9.72it/s] 137it [00:14, 9.75it/s] 138it [00:14, 9.79it/s] 140it [00:14, 9.79it/s] 141it [00:14, 9.82it/s] 143it [00:14, 9.91it/s] 145it [00:14, 9.96it/s] 146it [00:14, 9.96it/s] 147it [00:15, 9.81it/s] 148it [00:15, 9.41it/s] 149it [00:15, 9.55it/s] 150it [00:15, 9.65it/s]2025-05-26 04:17:30,176 - INFO - [Epoch 073 | Batch 0150] IWAE-loss 4541.8203 | mean log_px -0.0273 | KL -3146.10 + 151it [00:15, 9.19it/s] 153it [00:15, 9.58it/s] 155it [00:15, 9.75it/s] 156it [00:16, 9.41it/s] 157it [00:16, 9.38it/s] 158it [00:16, 9.32it/s] 159it [00:16, 9.41it/s] 160it [00:16, 9.56it/s] 162it [00:16, 9.77it/s] 163it [00:16, 9.80it/s] 164it [00:16, 9.83it/s] 165it [00:16, 9.87it/s] 167it [00:17, 9.97it/s] 169it [00:17, 9.63it/s] 170it [00:17, 9.70it/s] 172it [00:17, 9.84it/s] 174it [00:17, 9.93it/s] 175it [00:17, 9.93it/s] 176it [00:18, 9.94it/s] 178it [00:18, 9.99it/s] 179it [00:18, 9.99it/s] 181it [00:18, 9.97it/s] 183it [00:18, 9.68it/s] 184it [00:18, 9.73it/s] 185it [00:19, 9.77it/s] 186it [00:19, 9.30it/s] 188it [00:19, 9.60it/s] 189it [00:19, 9.67it/s] 191it [00:19, 9.83it/s] 193it [00:19, 9.89it/s] 194it [00:19, 9.47it/s] 195it [00:20, 9.22it/s] 196it [00:20, 9.69it/s] +2025-05-26 04:17:34,928 - INFO - Epoch: 73, Objective: tensor([3657.3047], device='cuda:0', grad_fn=), Loss: 0.007871869951486588, KL/n: 64.23025512695312 + 0it [00:00, ?it/s]2025-05-26 04:17:35,396 - INFO - [Epoch 074 | Batch 0000] IWAE-loss 4381.4062 | mean log_px -0.0209 | KL -3141.13 + 1it [00:00, 2.47it/s] 3it [00:00, 5.62it/s] 5it [00:00, 7.27it/s] 6it [00:00, 7.84it/s] 8it [00:01, 8.69it/s] 10it [00:01, 9.16it/s] 12it [00:01, 9.47it/s] 14it [00:01, 9.66it/s] 16it [00:01, 9.79it/s] 18it [00:02, 9.88it/s] 20it [00:02, 9.95it/s] 22it [00:02, 10.00it/s] 24it [00:02, 9.75it/s] 26it [00:02, 9.84it/s] 28it [00:03, 9.91it/s] 30it [00:03, 9.96it/s] 31it [00:03, 9.92it/s] 33it [00:03, 9.97it/s] 35it [00:03, 10.01it/s] 37it [00:03, 10.03it/s] 39it [00:04, 10.05it/s] 41it [00:04, 10.06it/s] 43it [00:04, 9.72it/s] 44it [00:04, 9.71it/s] 45it [00:04, 9.76it/s] 47it [00:05, 9.84it/s] 48it [00:05, 9.86it/s] 49it [00:05, 9.89it/s] 50it [00:05, 9.88it/s]2025-05-26 04:17:40,446 - INFO - [Epoch 074 | Batch 0050] IWAE-loss 4331.8213 | mean log_px -0.0203 | KL -3145.59 + 51it [00:05, 9.83it/s] 52it [00:05, 9.77it/s] 53it [00:05, 9.77it/s] 54it [00:05, 9.78it/s] 55it [00:05, 9.77it/s] 56it [00:05, 9.79it/s] 57it [00:06, 9.69it/s] 58it [00:06, 9.63it/s] 59it [00:06, 9.58it/s] 60it [00:06, 9.64it/s] 61it [00:06, 9.65it/s] 62it [00:06, 9.68it/s] 63it [00:06, 9.72it/s] 64it [00:06, 9.74it/s] 65it [00:06, 9.78it/s] 66it [00:06, 9.80it/s] 67it [00:07, 9.82it/s] 68it [00:07, 9.82it/s] 69it [00:07, 9.83it/s] 70it [00:07, 9.83it/s] 71it [00:07, 9.83it/s] 72it [00:07, 9.83it/s] 73it [00:07, 9.84it/s] 74it [00:07, 9.84it/s] 75it [00:07, 9.85it/s] 76it [00:07, 9.85it/s] 77it [00:08, 9.85it/s] 78it [00:08, 9.84it/s] 79it [00:08, 9.84it/s] 80it [00:08, 9.83it/s] 81it [00:08, 9.85it/s] 82it [00:08, 9.84it/s] 83it [00:08, 9.84it/s] 84it [00:08, 9.84it/s] 85it [00:08, 9.85it/s] 86it [00:09, 9.84it/s] 87it [00:09, 9.83it/s] 88it [00:09, 9.83it/s] 89it [00:09, 9.84it/s] 90it [00:09, 9.82it/s] 91it [00:09, 9.84it/s] 92it [00:09, 9.83it/s] 93it [00:09, 9.84it/s] 94it [00:09, 9.61it/s] 95it [00:09, 9.59it/s] 96it [00:10, 9.65it/s] 97it [00:10, 9.70it/s] 98it [00:10, 9.72it/s] 99it [00:10, 9.74it/s] 100it [00:10, 9.77it/s]2025-05-26 04:17:45,562 - INFO - [Epoch 074 | Batch 0100] IWAE-loss 3966.7395 | mean log_px -0.0130 | KL -3133.57 + 101it [00:10, 9.77it/s] 102it [00:10, 9.78it/s] 103it [00:10, 9.80it/s] 104it [00:10, 9.80it/s] 105it [00:10, 9.82it/s] 106it [00:11, 9.83it/s] 107it [00:11, 9.83it/s] 108it [00:11, 9.82it/s] 109it [00:11, 9.78it/s] 110it [00:11, 9.79it/s] 111it [00:11, 9.81it/s] 112it [00:11, 9.80it/s] 113it [00:11, 9.82it/s] 114it [00:11, 9.83it/s] 115it [00:11, 9.85it/s] 116it [00:12, 9.85it/s] 117it [00:12, 9.86it/s] 118it [00:12, 9.85it/s] 119it [00:12, 9.84it/s] 120it [00:12, 9.81it/s] 121it [00:12, 9.82it/s] 122it [00:12, 9.83it/s] 123it [00:12, 9.79it/s] 124it [00:12, 9.78it/s] 125it [00:12, 9.78it/s] 126it [00:13, 9.77it/s] 127it [00:13, 9.78it/s] 128it [00:13, 9.79it/s] 129it [00:13, 9.80it/s] 130it [00:13, 9.76it/s] 131it [00:13, 9.79it/s] 132it [00:13, 9.78it/s] 133it [00:13, 9.79it/s] 134it [00:13, 9.79it/s] 135it [00:14, 9.80it/s] 136it [00:14, 9.77it/s] 137it [00:14, 9.79it/s] 138it [00:14, 9.81it/s] 139it [00:14, 9.82it/s] 140it [00:14, 9.80it/s] 141it [00:14, 9.82it/s] 142it [00:14, 9.81it/s] 143it [00:14, 9.82it/s] 144it [00:14, 9.83it/s] 145it [00:15, 9.85it/s] 146it [00:15, 9.84it/s] 147it [00:15, 9.83it/s] 148it [00:15, 9.82it/s] 149it [00:15, 9.83it/s] 150it [00:15, 9.81it/s]2025-05-26 04:17:50,659 - INFO - [Epoch 074 | Batch 0150] IWAE-loss 3943.3928 | mean log_px -0.0122 | KL -3135.55 + 151it [00:15, 9.77it/s] 152it [00:15, 9.66it/s] 153it [00:15, 9.66it/s] 154it [00:15, 9.69it/s] 155it [00:16, 9.74it/s] 156it [00:16, 9.77it/s] 157it [00:16, 9.80it/s] 158it [00:16, 9.80it/s] 159it [00:16, 9.80it/s] 160it [00:16, 9.79it/s] 161it [00:16, 9.80it/s] 162it [00:16, 9.81it/s] 163it [00:16, 9.81it/s] 164it [00:16, 9.81it/s] 165it [00:17, 9.82it/s] 166it [00:17, 9.83it/s] 167it [00:17, 9.83it/s] 168it [00:17, 9.71it/s] 169it [00:17, 9.71it/s] 170it [00:17, 9.72it/s] 171it [00:17, 9.76it/s] 172it [00:17, 9.78it/s] 173it [00:17, 9.81it/s] 174it [00:17, 9.83it/s] 175it [00:18, 9.84it/s] 176it [00:18, 9.83it/s] 177it [00:18, 9.85it/s] 178it [00:18, 9.83it/s] 179it [00:18, 9.84it/s] 180it [00:18, 9.84it/s] 181it [00:18, 9.85it/s] 182it [00:18, 9.75it/s] 183it [00:18, 9.59it/s] 184it [00:19, 9.53it/s] 185it [00:19, 9.03it/s] 186it [00:19, 9.12it/s] 187it [00:19, 9.16it/s] 188it [00:19, 9.27it/s] 189it [00:19, 8.78it/s] 190it [00:19, 9.02it/s] 191it [00:19, 9.21it/s] 192it [00:19, 9.30it/s] 193it [00:20, 8.89it/s] 194it [00:20, 9.13it/s] 195it [00:20, 8.35it/s] 196it [00:20, 9.59it/s] +2025-05-26 04:17:55,503 - INFO - Epoch: 74, Objective: tensor([3946.5691], device='cuda:0', grad_fn=), Loss: 0.01754077710211277, KL/n: 63.97822570800781 + 0it [00:00, ?it/s]2025-05-26 04:17:55,797 - INFO - [Epoch 075 | Batch 0000] IWAE-loss 4051.3987 | mean log_px -0.0158 | KL -3134.45 + 1it [00:00, 5.14it/s] 2it [00:00, 6.45it/s] 3it [00:00, 7.50it/s] 4it [00:00, 8.14it/s] 5it [00:00, 8.56it/s] 6it [00:00, 8.42it/s] 7it [00:00, 8.69it/s] 8it [00:00, 8.90it/s] 9it [00:01, 9.09it/s] 10it [00:01, 9.20it/s] 11it [00:01, 8.78it/s] 12it [00:01, 8.93it/s] 13it [00:01, 9.08it/s] 14it [00:01, 9.21it/s] 15it [00:01, 9.28it/s] 16it [00:01, 8.68it/s] 17it [00:01, 8.84it/s] 18it [00:02, 9.01it/s] 19it [00:02, 9.17it/s] 20it [00:02, 9.30it/s] 21it [00:02, 9.47it/s] 22it [00:02, 9.60it/s] 23it [00:02, 9.69it/s] 24it [00:02, 9.15it/s] 25it [00:02, 9.35it/s] 26it [00:02, 9.50it/s] 27it [00:03, 9.63it/s] 28it [00:03, 9.72it/s] 29it [00:03, 9.77it/s] 30it [00:03, 9.82it/s] 31it [00:03, 9.85it/s] 32it [00:03, 9.88it/s] 33it [00:03, 9.88it/s] 34it [00:03, 9.23it/s] 35it [00:03, 9.44it/s] 36it [00:03, 9.57it/s] 37it [00:04, 9.67it/s] 38it [00:04, 9.74it/s] 39it [00:04, 9.77it/s] 40it [00:04, 9.79it/s] 41it [00:04, 9.84it/s] 42it [00:04, 9.87it/s] 43it [00:04, 9.23it/s] 44it [00:04, 9.41it/s] 45it [00:04, 9.57it/s] 46it [00:04, 9.64it/s] 47it [00:05, 9.73it/s] 48it [00:05, 9.71it/s] 49it [00:05, 9.72it/s] 50it [00:05, 9.17it/s]2025-05-26 04:18:01,130 - INFO - [Epoch 075 | Batch 0050] IWAE-loss 3742.8145 | mean log_px -0.0096 | KL -3130.84 + 51it [00:05, 9.27it/s] 52it [00:05, 9.44it/s] 53it [00:05, 9.58it/s] 54it [00:05, 9.65it/s] 55it [00:05, 9.74it/s] 56it [00:06, 9.76it/s] 57it [00:06, 9.82it/s] 58it [00:06, 9.84it/s] 59it [00:06, 9.72it/s] 60it [00:06, 9.63it/s] 61it [00:06, 9.49it/s] 62it [00:06, 8.83it/s] 63it [00:06, 9.01it/s] 64it [00:06, 9.19it/s] 65it [00:06, 9.33it/s] 66it [00:07, 9.42it/s] 67it [00:07, 9.49it/s] 68it [00:07, 8.94it/s] 69it [00:07, 9.15it/s] 70it [00:07, 9.29it/s] 71it [00:07, 9.41it/s] 72it [00:07, 8.85it/s] 73it [00:07, 9.07it/s] 74it [00:07, 9.23it/s] 75it [00:08, 9.29it/s] 76it [00:08, 8.79it/s] 77it [00:08, 9.02it/s] 78it [00:08, 9.22it/s] 79it [00:08, 9.39it/s] 80it [00:08, 9.48it/s] 81it [00:08, 9.00it/s] 82it [00:08, 9.26it/s] 83it [00:08, 9.19it/s] 84it [00:09, 9.39it/s] 85it [00:09, 8.94it/s] 86it [00:09, 9.19it/s] 87it [00:09, 9.41it/s] 88it [00:09, 9.53it/s] 89it [00:09, 9.65it/s] 90it [00:09, 9.09it/s] 91it [00:09, 9.34it/s] 92it [00:09, 9.47it/s] 93it [00:10, 9.59it/s] 94it [00:10, 9.65it/s] 95it [00:10, 9.75it/s] 96it [00:10, 9.76it/s] 97it [00:10, 9.12it/s] 98it [00:10, 9.07it/s] 99it [00:10, 9.22it/s] 100it [00:10, 9.39it/s]2025-05-26 04:18:06,475 - INFO - [Epoch 075 | Batch 0100] IWAE-loss 4642.5938 | mean log_px -0.0251 | KL -3130.53 + 101it [00:10, 9.54it/s] 102it [00:10, 9.67it/s] 103it [00:11, 9.15it/s] 104it [00:11, 9.38it/s] 105it [00:11, 9.55it/s] 106it [00:11, 9.61it/s] 107it [00:11, 9.70it/s] 108it [00:11, 9.72it/s] 110it [00:11, 9.85it/s] 111it [00:11, 9.36it/s] 112it [00:12, 9.50it/s] 113it [00:12, 9.60it/s] 114it [00:12, 9.67it/s] 115it [00:12, 9.74it/s] 116it [00:12, 9.80it/s] 117it [00:12, 9.85it/s] 118it [00:12, 9.23it/s] 120it [00:12, 9.52it/s] 121it [00:12, 9.63it/s] 122it [00:13, 9.72it/s] 123it [00:13, 9.35it/s] 124it [00:13, 9.52it/s] 125it [00:13, 9.62it/s] 126it [00:13, 9.70it/s] 127it [00:13, 9.18it/s] 128it [00:13, 9.39it/s] 129it [00:13, 9.56it/s] 130it [00:13, 9.62it/s] 131it [00:14, 9.72it/s] 132it [00:14, 9.16it/s] 134it [00:14, 9.52it/s] 135it [00:14, 9.62it/s] 136it [00:14, 9.69it/s] 137it [00:14, 9.21it/s] 138it [00:14, 9.37it/s] 139it [00:14, 8.99it/s] 140it [00:14, 9.21it/s] 141it [00:15, 9.38it/s] 142it [00:15, 9.54it/s] 143it [00:15, 9.66it/s] 144it [00:15, 9.73it/s] 146it [00:15, 9.37it/s] 147it [00:15, 9.48it/s] 148it [00:15, 9.56it/s] 149it [00:15, 9.67it/s] 150it [00:16, 9.17it/s]2025-05-26 04:18:11,737 - INFO - [Epoch 075 | Batch 0150] IWAE-loss 4248.3130 | mean log_px -0.0234 | KL -3122.70 + 151it [00:16, 9.38it/s] 152it [00:16, 9.49it/s] 153it [00:16, 9.60it/s] 154it [00:16, 9.65it/s] 155it [00:16, 8.99it/s] 156it [00:16, 8.90it/s] 157it [00:16, 8.99it/s] 158it [00:16, 9.22it/s] 159it [00:17, 8.86it/s] 160it [00:17, 9.15it/s] 161it [00:17, 9.38it/s] 162it [00:17, 9.44it/s] 163it [00:17, 8.98it/s] 164it [00:17, 9.20it/s] 165it [00:17, 9.41it/s] 166it [00:17, 9.55it/s] 167it [00:17, 9.07it/s] 168it [00:17, 9.22it/s] 169it [00:18, 9.38it/s] 170it [00:18, 9.52it/s] 171it [00:18, 9.08it/s] 172it [00:18, 9.31it/s] 173it [00:18, 9.50it/s] 174it [00:18, 9.61it/s] 175it [00:18, 9.10it/s] 176it [00:18, 9.33it/s] 177it [00:18, 9.50it/s] 178it [00:19, 9.60it/s] 179it [00:19, 9.09it/s] 180it [00:19, 9.31it/s] 181it [00:19, 9.48it/s] 182it [00:19, 9.43it/s] 183it [00:19, 8.90it/s] 184it [00:19, 9.16it/s] 185it [00:19, 9.35it/s] 186it [00:19, 9.51it/s] 187it [00:20, 9.04it/s] 188it [00:20, 9.24it/s] 190it [00:20, 9.13it/s] 191it [00:20, 9.33it/s] 192it [00:20, 9.45it/s] 193it [00:20, 9.57it/s] 194it [00:20, 9.12it/s] 195it [00:20, 8.92it/s] 196it [00:21, 9.32it/s] +2025-05-26 04:18:16,676 - INFO - Epoch: 75, Objective: tensor([4487.3818], device='cuda:0', grad_fn=), Loss: 0.022050147876143456, KL/n: 63.74296569824219 + 0it [00:00, ?it/s]2025-05-26 04:18:16,947 - INFO - [Epoch 076 | Batch 0000] IWAE-loss 3891.9312 | mean log_px -0.0134 | KL -3123.93 + 1it [00:00, 4.79it/s] 3it [00:00, 7.83it/s] 4it [00:00, 8.46it/s] 5it [00:00, 8.46it/s] 7it [00:00, 9.17it/s] 9it [00:01, 9.54it/s] 11it [00:01, 9.73it/s] 12it [00:01, 9.78it/s] 14it [00:01, 7.09it/s] 15it [00:01, 7.55it/s] 16it [00:01, 8.00it/s] 17it [00:02, 8.41it/s] 19it [00:02, 9.00it/s] 21it [00:02, 9.38it/s] 22it [00:02, 9.49it/s] 24it [00:02, 9.70it/s] 26it [00:02, 9.82it/s] 27it [00:03, 9.82it/s] 28it [00:03, 9.86it/s] 30it [00:03, 9.93it/s] 32it [00:03, 9.66it/s] 34it [00:03, 9.76it/s] 35it [00:03, 9.39it/s] 36it [00:03, 9.49it/s] 37it [00:04, 9.59it/s] 39it [00:04, 9.80it/s] 40it [00:04, 9.82it/s] 41it [00:04, 9.36it/s] 43it [00:04, 9.65it/s] 44it [00:04, 9.65it/s] 46it [00:05, 9.41it/s] 48it [00:05, 9.65it/s] 50it [00:05, 9.80it/s]2025-05-26 04:18:22,280 - INFO - [Epoch 076 | Batch 0050] IWAE-loss 3677.9912 | mean log_px -0.0094 | KL -3120.58 + 51it [00:05, 9.46it/s] 52it [00:05, 9.57it/s] 54it [00:05, 9.75it/s] 56it [00:06, 9.85it/s] 58it [00:06, 9.94it/s] 60it [00:06, 9.99it/s] 61it [00:06, 9.68it/s] 62it [00:06, 9.75it/s] 64it [00:06, 9.88it/s] 66it [00:07, 9.95it/s] 67it [00:07, 9.96it/s] 69it [00:07, 10.01it/s] 71it [00:07, 9.66it/s] 73it [00:07, 9.81it/s] 74it [00:07, 9.84it/s] 76it [00:08, 9.93it/s] 78it [00:08, 9.97it/s] 80it [00:08, 9.99it/s] 82it [00:08, 9.72it/s] 84it [00:08, 9.79it/s] 85it [00:08, 9.45it/s] 87it [00:09, 9.66it/s] 89it [00:09, 9.80it/s] 91it [00:09, 9.89it/s] 93it [00:09, 9.92it/s] 94it [00:09, 9.43it/s] 96it [00:10, 9.61it/s] 98it [00:10, 9.76it/s] 100it [00:10, 9.87it/s]2025-05-26 04:18:27,383 - INFO - [Epoch 076 | Batch 0100] IWAE-loss 4684.5400 | mean log_px -0.0297 | KL -3118.37 + 101it [00:10, 9.50it/s] 103it [00:10, 9.70it/s] 104it [00:10, 9.74it/s] 106it [00:11, 9.87it/s] 108it [00:11, 9.94it/s] 110it [00:11, 9.71it/s] 112it [00:11, 9.83it/s] 114it [00:11, 9.91it/s] 116it [00:12, 9.97it/s] 117it [00:12, 9.60it/s] 119it [00:12, 9.77it/s] 121it [00:12, 9.88it/s] 123it [00:12, 9.54it/s] 125it [00:13, 9.71it/s] 127it [00:13, 9.55it/s] 129it [00:13, 9.66it/s] 131it [00:13, 9.78it/s] 132it [00:13, 9.53it/s] 134it [00:14, 9.70it/s] 136it [00:14, 9.53it/s] 137it [00:14, 9.60it/s] 139it [00:14, 9.77it/s] 141it [00:14, 9.51it/s] 143it [00:14, 9.69it/s] 145it [00:15, 9.82it/s] 147it [00:15, 9.91it/s] 149it [00:15, 9.97it/s]2025-05-26 04:18:32,512 - INFO - [Epoch 076 | Batch 0150] IWAE-loss 4113.5596 | mean log_px -0.0186 | KL -3107.95 + 151it [00:15, 9.99it/s] 153it [00:15, 9.99it/s] 155it [00:16, 10.02it/s] 157it [00:16, 9.70it/s] 159it [00:16, 9.81it/s] 161it [00:16, 9.80it/s] 162it [00:16, 9.71it/s] 163it [00:17, 9.33it/s] 164it [00:17, 9.40it/s] 165it [00:17, 9.46it/s] 166it [00:17, 9.52it/s] 167it [00:17, 9.55it/s] 168it [00:17, 9.60it/s] 169it [00:17, 9.63it/s] 170it [00:17, 9.65it/s] 171it [00:17, 9.66it/s] 172it [00:17, 9.17it/s] 173it [00:18, 9.24it/s] 174it [00:18, 9.30it/s] 175it [00:18, 9.34it/s] 176it [00:18, 9.21it/s] 177it [00:18, 9.26it/s] 178it [00:18, 9.36it/s] 179it [00:18, 9.39it/s] 180it [00:18, 9.43it/s] 181it [00:18, 9.47it/s] 182it [00:19, 9.51it/s] 183it [00:19, 9.56it/s] 184it [00:19, 9.54it/s] 185it [00:19, 9.52it/s] 186it [00:19, 9.53it/s] 187it [00:19, 9.50it/s] 188it [00:19, 9.44it/s] 189it [00:19, 9.48it/s] 190it [00:19, 9.49it/s] 191it [00:19, 9.48it/s] 192it [00:20, 9.50it/s] 193it [00:20, 9.07it/s] 194it [00:20, 9.10it/s] 195it [00:20, 8.71it/s] 196it [00:20, 8.99it/s] 196it [00:20, 9.53it/s] +2025-05-26 04:18:37,375 - INFO - Epoch: 76, Objective: tensor([3478.5898], device='cuda:0', grad_fn=), Loss: 0.005448373034596443, KL/n: 63.492427825927734 + 0it [00:00, ?it/s]2025-05-26 04:18:37,660 - INFO - [Epoch 077 | Batch 0000] IWAE-loss 3869.8042 | mean log_px -0.0148 | KL -3113.27 + 1it [00:00, 4.58it/s] 2it [00:00, 6.54it/s] 3it [00:00, 7.65it/s] 4it [00:00, 8.14it/s] 5it [00:00, 8.63it/s] 6it [00:00, 8.35it/s] 7it [00:00, 8.69it/s] 8it [00:00, 8.90it/s] 9it [00:01, 9.12it/s] 10it [00:01, 9.23it/s] 11it [00:01, 9.33it/s] 12it [00:01, 9.39it/s] 13it [00:01, 9.48it/s] 14it [00:01, 9.53it/s] 15it [00:01, 9.50it/s] 16it [00:01, 9.53it/s] 17it [00:01, 9.56it/s] 18it [00:02, 9.55it/s] 19it [00:02, 9.58it/s] 20it [00:02, 9.56it/s] 21it [00:02, 9.65it/s] 22it [00:02, 9.67it/s] 23it [00:02, 9.71it/s] 24it [00:02, 9.68it/s] 25it [00:02, 9.27it/s] 26it [00:02, 9.33it/s] 27it [00:02, 9.44it/s] 28it [00:03, 9.49it/s] 29it [00:03, 9.53it/s] 30it [00:03, 9.58it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.59it/s] 33it [00:03, 9.56it/s] 34it [00:03, 9.56it/s] 35it [00:03, 9.53it/s] 36it [00:03, 9.52it/s] 37it [00:04, 9.53it/s] 38it [00:04, 9.55it/s] 39it [00:04, 9.48it/s] 40it [00:04, 9.47it/s] 41it [00:04, 9.51it/s] 42it [00:04, 8.99it/s] 43it [00:04, 9.17it/s] 44it [00:04, 9.27it/s] 45it [00:04, 9.38it/s] 46it [00:04, 9.42it/s] 47it [00:05, 9.45it/s] 48it [00:05, 9.50it/s] 49it [00:05, 9.56it/s] 50it [00:05, 9.60it/s]2025-05-26 04:18:42,971 - INFO - [Epoch 077 | Batch 0050] IWAE-loss 4025.5740 | mean log_px -0.0166 | KL -3104.95 + 51it [00:05, 9.57it/s] 52it [00:05, 9.53it/s] 53it [00:05, 9.54it/s] 54it [00:05, 9.57it/s] 55it [00:05, 9.62it/s] 56it [00:06, 9.57it/s] 57it [00:06, 9.52it/s] 58it [00:06, 9.50it/s] 59it [00:06, 9.54it/s] 60it [00:06, 9.58it/s] 61it [00:06, 9.34it/s] 62it [00:06, 8.99it/s] 63it [00:06, 9.12it/s] 64it [00:06, 9.23it/s] 65it [00:06, 9.34it/s] 66it [00:07, 9.39it/s] 67it [00:07, 9.45it/s] 68it [00:07, 9.48it/s] 69it [00:07, 9.51it/s] 70it [00:07, 9.51it/s] 71it [00:07, 9.57it/s] 72it [00:07, 9.62it/s] 73it [00:07, 9.59it/s] 74it [00:07, 9.63it/s] 75it [00:08, 9.60it/s] 76it [00:08, 9.59it/s] 77it [00:08, 9.55it/s] 78it [00:08, 9.55it/s] 79it [00:08, 9.52it/s] 80it [00:08, 9.52it/s] 81it [00:08, 9.52it/s] 82it [00:08, 9.57it/s] 83it [00:08, 9.54it/s] 84it [00:08, 9.53it/s] 85it [00:09, 9.57it/s] 86it [00:09, 9.60it/s] 87it [00:09, 9.63it/s] 88it [00:09, 9.59it/s] 89it [00:09, 9.55it/s] 90it [00:09, 9.57it/s] 91it [00:09, 9.58it/s] 92it [00:09, 9.57it/s] 93it [00:09, 9.61it/s] 94it [00:10, 9.59it/s] 95it [00:10, 9.62it/s] 96it [00:10, 9.15it/s] 97it [00:10, 9.29it/s] 98it [00:10, 9.37it/s] 99it [00:10, 9.42it/s] 100it [00:10, 9.47it/s]2025-05-26 04:18:48,239 - INFO - [Epoch 077 | Batch 0100] IWAE-loss 3877.6897 | mean log_px -0.0162 | KL -3102.57 + 101it [00:10, 9.51it/s] 102it [00:10, 9.51it/s] 103it [00:10, 9.52it/s] 104it [00:11, 9.53it/s] 105it [00:11, 8.96it/s] 106it [00:11, 9.13it/s] 107it [00:11, 9.30it/s] 108it [00:11, 9.37it/s] 109it [00:11, 9.42it/s] 110it [00:11, 9.53it/s] 111it [00:11, 9.53it/s] 112it [00:11, 9.53it/s] 113it [00:12, 9.41it/s] 114it [00:12, 9.43it/s] 115it [00:12, 9.48it/s] 116it [00:12, 9.48it/s] 117it [00:12, 9.49it/s] 118it [00:12, 9.48it/s] 119it [00:12, 9.54it/s] 120it [00:12, 9.48it/s] 121it [00:12, 9.51it/s] 122it [00:12, 9.54it/s] 123it [00:13, 9.60it/s] 124it [00:13, 9.03it/s] 125it [00:13, 9.16it/s] 126it [00:13, 8.89it/s] 127it [00:13, 9.13it/s] 128it [00:13, 9.26it/s] 129it [00:13, 9.33it/s] 130it [00:13, 9.41it/s] 131it [00:13, 9.51it/s] 132it [00:14, 9.53it/s] 133it [00:14, 9.50it/s] 134it [00:14, 9.51it/s] 135it [00:14, 9.53it/s] 136it [00:14, 9.55it/s] 137it [00:14, 9.54it/s] 138it [00:14, 9.52it/s] 139it [00:14, 9.58it/s] 140it [00:14, 9.57it/s] 141it [00:15, 9.60it/s] 142it [00:15, 9.63it/s] 143it [00:15, 9.69it/s] 144it [00:15, 9.70it/s] 145it [00:15, 9.73it/s] 146it [00:15, 9.66it/s] 147it [00:15, 9.64it/s] 148it [00:15, 9.62it/s] 149it [00:15, 9.61it/s] 150it [00:15, 9.60it/s]2025-05-26 04:18:53,519 - INFO - [Epoch 077 | Batch 0150] IWAE-loss 3844.5071 | mean log_px -0.0126 | KL -3099.34 + 151it [00:16, 9.59it/s] 152it [00:16, 9.59it/s] 153it [00:16, 9.61it/s] 154it [00:16, 9.66it/s] 155it [00:16, 9.63it/s] 156it [00:16, 9.60it/s] 157it [00:16, 9.56it/s] 158it [00:16, 9.61it/s] 159it [00:16, 9.61it/s] 160it [00:16, 9.56it/s] 161it [00:17, 9.53it/s] 162it [00:17, 9.58it/s] 163it [00:17, 9.56it/s] 164it [00:17, 9.52it/s] 165it [00:17, 9.04it/s] 166it [00:17, 9.15it/s] 167it [00:17, 9.33it/s] 168it [00:17, 9.46it/s] 169it [00:17, 9.48it/s] 170it [00:18, 9.44it/s] 171it [00:18, 9.47it/s] 172it [00:18, 8.98it/s] 173it [00:18, 9.15it/s] 174it [00:18, 9.26it/s] 175it [00:18, 9.39it/s] 176it [00:18, 9.44it/s] 177it [00:18, 9.50it/s] 178it [00:18, 9.52it/s] 179it [00:19, 9.56it/s] 180it [00:19, 9.52it/s] 181it [00:19, 9.52it/s] 182it [00:19, 9.54it/s] 183it [00:19, 9.58it/s] 184it [00:19, 9.58it/s] 185it [00:19, 9.09it/s] 186it [00:19, 9.21it/s] 187it [00:19, 9.31it/s] 188it [00:19, 9.38it/s] 189it [00:20, 9.43it/s] 190it [00:20, 9.51it/s] 191it [00:20, 9.54it/s] 192it [00:20, 9.52it/s] 193it [00:20, 9.54it/s] 194it [00:20, 9.55it/s] 195it [00:20, 8.94it/s] 196it [00:20, 9.20it/s] 196it [00:20, 9.38it/s] +2025-05-26 04:18:58,399 - INFO - Epoch: 77, Objective: tensor([3908.6809], device='cuda:0', grad_fn=), Loss: 0.015703242272138596, KL/n: 63.27415466308594 + 0it [00:00, ?it/s]2025-05-26 04:18:58,678 - INFO - [Epoch 078 | Batch 0000] IWAE-loss 3679.0872 | mean log_px -0.0106 | KL -3098.49 + 1it [00:00, 4.70it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.76it/s] 4it [00:00, 8.37it/s] 5it [00:00, 8.76it/s] 6it [00:00, 9.03it/s] 7it [00:00, 9.15it/s] 8it [00:00, 9.34it/s] 9it [00:01, 9.47it/s] 10it [00:01, 9.48it/s] 11it [00:01, 9.53it/s] 12it [00:01, 9.50it/s] 13it [00:01, 9.49it/s] 14it [00:01, 9.48it/s] 15it [00:01, 9.48it/s] 16it [00:01, 9.48it/s] 17it [00:01, 9.03it/s] 18it [00:02, 9.19it/s] 19it [00:02, 9.28it/s] 20it [00:02, 9.32it/s] 21it [00:02, 9.34it/s] 22it [00:02, 9.35it/s] 23it [00:02, 9.41it/s] 24it [00:02, 9.50it/s] 25it [00:02, 9.01it/s] 26it [00:02, 9.13it/s] 27it [00:02, 9.21it/s] 28it [00:03, 9.29it/s] 29it [00:03, 9.39it/s] 30it [00:03, 9.39it/s] 31it [00:03, 9.45it/s] 32it [00:03, 9.45it/s] 33it [00:03, 9.47it/s] 34it [00:03, 9.45it/s] 35it [00:03, 9.43it/s] 36it [00:03, 9.41it/s] 37it [00:04, 9.02it/s] 38it [00:04, 9.12it/s] 39it [00:04, 9.20it/s] 40it [00:04, 9.29it/s] 41it [00:04, 9.31it/s] 42it [00:04, 9.34it/s] 43it [00:04, 9.38it/s] 44it [00:04, 8.85it/s] 45it [00:04, 9.03it/s] 46it [00:05, 9.14it/s] 47it [00:05, 6.07it/s] 48it [00:05, 6.80it/s] 49it [00:05, 7.44it/s] 50it [00:05, 7.97it/s]2025-05-26 04:19:04,235 - INFO - [Epoch 078 | Batch 0050] IWAE-loss 4400.3760 | mean log_px -0.0214 | KL -3091.28 + 51it [00:05, 8.09it/s] 52it [00:05, 8.45it/s] 53it [00:05, 8.80it/s] 54it [00:06, 8.46it/s] 55it [00:06, 8.71it/s] 56it [00:06, 8.91it/s] 57it [00:06, 9.06it/s] 58it [00:06, 8.60it/s] 59it [00:06, 8.67it/s] 60it [00:06, 8.80it/s] 61it [00:06, 9.06it/s] 62it [00:06, 9.20it/s] 63it [00:07, 9.28it/s] 64it [00:07, 9.35it/s] 65it [00:07, 9.46it/s] 66it [00:07, 9.52it/s] 67it [00:07, 9.57it/s] 68it [00:07, 9.48it/s] 69it [00:07, 9.46it/s] 70it [00:07, 9.01it/s] 71it [00:07, 9.19it/s] 72it [00:08, 9.29it/s] 73it [00:08, 9.32it/s] 74it [00:08, 9.39it/s] 75it [00:08, 9.44it/s] 76it [00:08, 9.49it/s] 77it [00:08, 9.45it/s] 78it [00:08, 9.46it/s] 79it [00:08, 9.50it/s] 80it [00:08, 9.47it/s] 81it [00:08, 9.52it/s] 82it [00:09, 9.58it/s] 83it [00:09, 9.62it/s] 84it [00:09, 9.62it/s] 85it [00:09, 9.53it/s] 86it [00:09, 9.54it/s] 87it [00:09, 9.53it/s] 88it [00:09, 9.50it/s] 89it [00:09, 9.49it/s] 90it [00:09, 9.48it/s] 91it [00:10, 9.51it/s] 92it [00:10, 9.49it/s] 93it [00:10, 9.47it/s] 94it [00:10, 9.46it/s] 95it [00:10, 9.47it/s] 96it [00:10, 9.50it/s] 97it [00:10, 9.48it/s] 98it [00:10, 9.52it/s] 99it [00:10, 9.58it/s] 100it [00:10, 9.60it/s]2025-05-26 04:19:09,577 - INFO - [Epoch 078 | Batch 0100] IWAE-loss 4047.0798 | mean log_px -0.0176 | KL -3091.62 + 101it [00:11, 9.04it/s] 102it [00:11, 9.16it/s] 103it [00:11, 9.19it/s] 104it [00:11, 9.28it/s] 105it [00:11, 9.40it/s] 106it [00:11, 9.44it/s] 107it [00:11, 8.98it/s] 108it [00:11, 9.12it/s] 109it [00:11, 8.70it/s] 110it [00:12, 8.91it/s] 111it [00:12, 9.09it/s] 112it [00:12, 9.24it/s] 113it [00:12, 9.35it/s] 114it [00:12, 9.38it/s] 115it [00:12, 9.39it/s] 116it [00:12, 9.39it/s] 117it [00:12, 9.43it/s] 118it [00:12, 9.47it/s] 119it [00:13, 9.49it/s] 120it [00:13, 8.91it/s] 121it [00:13, 9.07it/s] 122it [00:13, 9.19it/s] 123it [00:13, 9.29it/s] 124it [00:13, 9.35it/s] 125it [00:13, 9.40it/s] 126it [00:13, 8.80it/s] 127it [00:13, 9.01it/s] 128it [00:14, 9.18it/s] 129it [00:14, 9.33it/s] 130it [00:14, 9.42it/s] 131it [00:14, 9.42it/s] 132it [00:14, 9.42it/s] 133it [00:14, 9.46it/s] 134it [00:14, 9.46it/s] 135it [00:14, 9.50it/s] 136it [00:14, 9.10it/s] 137it [00:14, 9.19it/s] 138it [00:15, 9.28it/s] 139it [00:15, 9.37it/s] 140it [00:15, 9.40it/s] 141it [00:15, 9.48it/s] 142it [00:15, 9.54it/s] 143it [00:15, 9.60it/s] 144it [00:15, 9.63it/s] 145it [00:15, 9.65it/s] 146it [00:15, 9.61it/s] 147it [00:16, 9.59it/s] 148it [00:16, 9.56it/s] 149it [00:16, 9.53it/s] 150it [00:16, 9.53it/s]2025-05-26 04:19:14,950 - INFO - [Epoch 078 | Batch 0150] IWAE-loss 4209.9824 | mean log_px -0.0231 | KL -3090.24 + 151it [00:16, 8.91it/s] 152it [00:16, 9.10it/s] 153it [00:16, 9.28it/s] 154it [00:16, 9.40it/s] 155it [00:16, 9.46it/s] 156it [00:17, 9.46it/s] 157it [00:17, 9.46it/s] 158it [00:17, 8.94it/s] 159it [00:17, 9.08it/s] 160it [00:17, 9.19it/s] 161it [00:17, 9.28it/s] 162it [00:17, 9.34it/s] 163it [00:17, 8.85it/s] 164it [00:17, 9.07it/s] 165it [00:17, 9.20it/s] 166it [00:18, 9.30it/s] 167it [00:18, 9.37it/s] 168it [00:18, 9.41it/s] 169it [00:18, 9.44it/s] 170it [00:18, 9.46it/s] 171it [00:18, 9.48it/s] 172it [00:18, 9.46it/s] 173it [00:18, 9.50it/s] 174it [00:18, 9.50it/s] 175it [00:19, 9.50it/s] 176it [00:19, 8.98it/s] 177it [00:19, 9.15it/s] 178it [00:19, 9.30it/s] 179it [00:19, 9.42it/s] 180it [00:19, 9.42it/s] 181it [00:19, 9.49it/s] 182it [00:19, 9.50it/s] 183it [00:19, 9.49it/s] 184it [00:20, 9.52it/s] 185it [00:20, 9.60it/s] 186it [00:20, 9.63it/s] 187it [00:20, 9.58it/s] 188it [00:20, 8.94it/s] 189it [00:20, 9.15it/s] 190it [00:20, 9.27it/s] 191it [00:20, 9.33it/s] 192it [00:20, 9.36it/s] 193it [00:20, 9.40it/s] 194it [00:21, 8.72it/s] 195it [00:21, 8.47it/s] 196it [00:21, 8.83it/s] 196it [00:21, 9.16it/s] +2025-05-26 04:19:19,932 - INFO - Epoch: 78, Objective: tensor([4202.6504], device='cuda:0', grad_fn=), Loss: 0.022261351346969604, KL/n: 63.005916595458984 + 0it [00:00, ?it/s]2025-05-26 04:19:20,206 - INFO - [Epoch 079 | Batch 0000] IWAE-loss 3951.9302 | mean log_px -0.0140 | KL -3084.01 + 1it [00:00, 5.43it/s] 2it [00:00, 7.32it/s] 3it [00:00, 8.22it/s] 4it [00:00, 8.68it/s] 5it [00:00, 8.54it/s] 6it [00:00, 8.78it/s] 7it [00:00, 9.04it/s] 8it [00:00, 9.23it/s] 9it [00:01, 9.40it/s] 10it [00:01, 9.40it/s] 11it [00:01, 9.52it/s] 12it [00:01, 9.54it/s] 13it [00:01, 9.51it/s] 14it [00:01, 9.51it/s] 15it [00:01, 9.54it/s] 16it [00:01, 9.57it/s] 17it [00:01, 9.57it/s] 18it [00:01, 9.56it/s] 19it [00:02, 9.51it/s] 20it [00:02, 9.53it/s] 21it [00:02, 9.59it/s] 22it [00:02, 9.57it/s] 23it [00:02, 9.57it/s] 24it [00:02, 9.56it/s] 25it [00:02, 8.99it/s] 26it [00:02, 9.12it/s] 27it [00:02, 9.30it/s] 28it [00:03, 9.37it/s] 29it [00:03, 9.44it/s] 30it [00:03, 9.53it/s] 31it [00:03, 9.52it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.41it/s] 34it [00:03, 9.45it/s] 35it [00:03, 9.55it/s] 36it [00:03, 9.55it/s] 37it [00:03, 9.59it/s] 38it [00:04, 9.56it/s] 39it [00:04, 9.56it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.55it/s] 42it [00:04, 9.57it/s] 43it [00:04, 9.61it/s] 44it [00:04, 9.18it/s] 45it [00:04, 9.29it/s] 46it [00:04, 9.37it/s] 47it [00:05, 9.41it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.53it/s] 50it [00:05, 9.50it/s]2025-05-26 04:19:25,487 - INFO - [Epoch 079 | Batch 0050] IWAE-loss 4607.3691 | mean log_px -0.0238 | KL -3084.28 + 51it [00:05, 9.58it/s] 52it [00:05, 9.54it/s] 53it [00:05, 9.55it/s] 54it [00:05, 9.53it/s] 55it [00:05, 9.51it/s] 56it [00:05, 9.54it/s] 57it [00:06, 9.59it/s] 58it [00:06, 9.63it/s] 59it [00:06, 9.67it/s] 60it [00:06, 9.69it/s] 61it [00:06, 9.72it/s] 62it [00:06, 9.73it/s] 63it [00:06, 9.71it/s] 64it [00:06, 9.63it/s] 65it [00:06, 9.64it/s] 66it [00:07, 9.63it/s] 67it [00:07, 9.63it/s] 68it [00:07, 9.59it/s] 69it [00:07, 9.63it/s] 70it [00:07, 9.62it/s] 71it [00:07, 9.63it/s] 72it [00:07, 9.60it/s] 73it [00:07, 9.60it/s] 74it [00:07, 9.59it/s] 75it [00:07, 9.60it/s] 76it [00:08, 9.62it/s] 77it [00:08, 9.62it/s] 78it [00:08, 9.67it/s] 79it [00:08, 9.70it/s] 80it [00:08, 9.70it/s] 81it [00:08, 9.72it/s] 82it [00:08, 9.73it/s] 83it [00:08, 9.25it/s] 84it [00:08, 9.29it/s] 85it [00:09, 9.42it/s] 86it [00:09, 8.95it/s] 87it [00:09, 9.08it/s] 88it [00:09, 9.22it/s] 89it [00:09, 9.35it/s] 90it [00:09, 9.34it/s] 91it [00:09, 9.44it/s] 92it [00:09, 9.46it/s] 93it [00:09, 9.52it/s] 94it [00:09, 9.58it/s] 95it [00:10, 9.15it/s] 96it [00:10, 8.76it/s] 97it [00:10, 8.76it/s] 98it [00:10, 8.98it/s] 99it [00:10, 8.68it/s] 100it [00:10, 8.96it/s]2025-05-26 04:19:30,787 - INFO - [Epoch 079 | Batch 0100] IWAE-loss 4182.2646 | mean log_px -0.0189 | KL -3085.25 + 101it [00:10, 9.13it/s] 102it [00:10, 9.31it/s] 103it [00:10, 9.44it/s] 104it [00:11, 9.54it/s] 105it [00:11, 9.61it/s] 106it [00:11, 9.65it/s] 107it [00:11, 9.69it/s] 108it [00:11, 9.71it/s] 109it [00:11, 9.71it/s] 110it [00:11, 9.71it/s] 111it [00:11, 9.73it/s] 112it [00:11, 9.74it/s] 113it [00:11, 9.74it/s] 114it [00:12, 9.73it/s] 115it [00:12, 9.51it/s] 116it [00:12, 9.19it/s] 117it [00:12, 9.36it/s] 118it [00:12, 9.47it/s] 119it [00:12, 9.56it/s] 120it [00:12, 9.63it/s] 121it [00:12, 9.66it/s] 122it [00:12, 9.69it/s] 123it [00:13, 9.71it/s] 124it [00:13, 9.72it/s] 125it [00:13, 9.73it/s] 126it [00:13, 9.73it/s] 127it [00:13, 9.43it/s] 128it [00:13, 9.52it/s] 129it [00:13, 9.61it/s] 130it [00:13, 9.67it/s] 131it [00:13, 9.69it/s] 132it [00:13, 9.71it/s] 133it [00:14, 9.74it/s] 134it [00:14, 9.74it/s] 135it [00:14, 9.74it/s] 136it [00:14, 9.16it/s] 137it [00:14, 9.33it/s] 138it [00:14, 9.45it/s] 139it [00:14, 9.56it/s] 140it [00:14, 9.61it/s] 141it [00:14, 9.66it/s] 142it [00:15, 9.46it/s] 143it [00:15, 9.53it/s] 144it [00:15, 9.05it/s] 145it [00:15, 9.26it/s] 146it [00:15, 9.40it/s] 147it [00:15, 9.50it/s] 148it [00:15, 9.57it/s] 149it [00:15, 9.65it/s] 150it [00:15, 9.68it/s]2025-05-26 04:19:35,999 - INFO - [Epoch 079 | Batch 0150] IWAE-loss 3905.8240 | mean log_px -0.0154 | KL -3072.65 + 151it [00:15, 9.69it/s] 152it [00:16, 9.71it/s] 153it [00:16, 9.74it/s] 154it [00:16, 9.74it/s] 155it [00:16, 9.72it/s] 156it [00:16, 9.56it/s] 157it [00:16, 8.90it/s] 158it [00:16, 8.95it/s] 159it [00:16, 9.10it/s] 160it [00:16, 9.16it/s] 161it [00:17, 9.24it/s] 162it [00:17, 9.32it/s] 163it [00:17, 9.40it/s] 164it [00:17, 9.38it/s] 165it [00:17, 9.40it/s] 166it [00:17, 9.41it/s] 167it [00:17, 9.39it/s] 168it [00:17, 9.36it/s] 169it [00:17, 9.30it/s] 170it [00:18, 9.44it/s] 171it [00:18, 9.45it/s] 172it [00:18, 9.18it/s] 173it [00:18, 9.37it/s] 174it [00:18, 9.49it/s] 175it [00:18, 9.19it/s] 176it [00:18, 9.36it/s] 177it [00:18, 9.50it/s] 178it [00:18, 9.56it/s] 179it [00:18, 9.63it/s] 180it [00:19, 9.67it/s] 181it [00:19, 9.70it/s] 182it [00:19, 9.70it/s] 183it [00:19, 9.73it/s] 184it [00:19, 9.73it/s] 185it [00:19, 9.75it/s] 186it [00:19, 9.74it/s] 187it [00:19, 9.75it/s] 188it [00:19, 9.74it/s] 189it [00:19, 9.75it/s] 190it [00:20, 9.74it/s] 191it [00:20, 9.59it/s] 192it [00:20, 9.26it/s] 193it [00:20, 9.40it/s] 194it [00:20, 9.50it/s] 195it [00:20, 8.61it/s] 196it [00:20, 8.96it/s] 196it [00:20, 9.42it/s] +2025-05-26 04:19:40,883 - INFO - Epoch: 79, Objective: tensor([3949.7637], device='cuda:0', grad_fn=), Loss: 0.015167269855737686, KL/n: 62.748844146728516 + 0it [00:00, ?it/s]2025-05-26 04:19:41,160 - INFO - [Epoch 080 | Batch 0000] IWAE-loss 4421.7627 | mean log_px -0.0238 | KL -3073.79 + 1it [00:00, 5.43it/s] 2it [00:00, 7.32it/s] 3it [00:00, 8.11it/s] 4it [00:00, 8.27it/s] 5it [00:00, 8.54it/s] 6it [00:00, 8.90it/s] 7it [00:00, 9.14it/s] 8it [00:00, 9.28it/s] 9it [00:01, 9.42it/s] 10it [00:01, 9.50it/s] 11it [00:01, 9.57it/s] 12it [00:01, 9.61it/s] 13it [00:01, 9.64it/s] 14it [00:01, 9.66it/s] 15it [00:01, 9.63it/s] 16it [00:01, 9.64it/s] 17it [00:01, 9.67it/s] 18it [00:01, 9.68it/s] 19it [00:02, 9.70it/s] 20it [00:02, 9.70it/s] 21it [00:02, 9.69it/s] 22it [00:02, 9.70it/s] 23it [00:02, 9.71it/s] 24it [00:02, 9.71it/s] 25it [00:02, 9.72it/s] 26it [00:02, 9.71it/s] 27it [00:02, 9.68it/s] 28it [00:02, 9.68it/s] 29it [00:03, 9.69it/s] 30it [00:03, 9.66it/s] 31it [00:03, 9.70it/s] 32it [00:03, 9.70it/s] 33it [00:03, 9.72it/s] 34it [00:03, 9.58it/s] 35it [00:03, 9.49it/s] 36it [00:03, 9.47it/s] 37it [00:03, 9.52it/s] 38it [00:04, 9.56it/s] 39it [00:04, 9.61it/s] 40it [00:04, 9.63it/s] 41it [00:04, 9.66it/s] 42it [00:04, 9.66it/s] 43it [00:04, 9.69it/s] 44it [00:04, 9.68it/s] 45it [00:04, 9.71it/s] 46it [00:04, 9.71it/s] 47it [00:04, 9.73it/s] 48it [00:05, 9.71it/s] 49it [00:05, 6.27it/s] 50it [00:05, 6.94it/s]2025-05-26 04:19:46,550 - INFO - [Epoch 080 | Batch 0050] IWAE-loss 4183.6655 | mean log_px -0.0173 | KL -3067.25 + 51it [00:05, 7.55it/s] 52it [00:05, 8.10it/s] 53it [00:05, 8.52it/s] 54it [00:05, 8.85it/s] 55it [00:05, 9.10it/s] 56it [00:06, 9.27it/s] 57it [00:06, 9.40it/s] 58it [00:06, 9.50it/s] 59it [00:06, 9.57it/s] 60it [00:06, 9.63it/s] 61it [00:06, 9.63it/s] 62it [00:06, 9.63it/s] 63it [00:06, 9.65it/s] 64it [00:06, 9.68it/s] 65it [00:07, 9.69it/s] 66it [00:07, 9.71it/s] 67it [00:07, 9.70it/s] 68it [00:07, 9.71it/s] 69it [00:07, 9.71it/s] 70it [00:07, 9.71it/s] 71it [00:07, 9.71it/s] 72it [00:07, 9.71it/s] 73it [00:07, 9.72it/s] 74it [00:07, 9.72it/s] 75it [00:08, 9.74it/s] 76it [00:08, 9.73it/s] 77it [00:08, 9.72it/s] 78it [00:08, 9.71it/s] 79it [00:08, 9.72it/s] 80it [00:08, 9.73it/s] 81it [00:08, 9.71it/s] 82it [00:08, 9.71it/s] 83it [00:08, 9.73it/s] 84it [00:08, 9.72it/s] 85it [00:09, 9.73it/s] 86it [00:09, 9.73it/s] 87it [00:09, 9.70it/s] 88it [00:09, 9.71it/s] 89it [00:09, 9.71it/s] 90it [00:09, 9.70it/s] 91it [00:09, 9.70it/s] 92it [00:09, 9.66it/s] 93it [00:09, 9.69it/s] 94it [00:10, 9.70it/s] 95it [00:10, 9.71it/s] 96it [00:10, 9.72it/s] 97it [00:10, 9.73it/s] 98it [00:10, 9.71it/s] 99it [00:10, 9.72it/s] 100it [00:10, 9.69it/s]2025-05-26 04:19:51,698 - INFO - [Epoch 080 | Batch 0100] IWAE-loss 3951.3103 | mean log_px -0.0163 | KL -3071.85 + 101it [00:10, 9.69it/s] 102it [00:10, 9.70it/s] 103it [00:10, 9.71it/s] 104it [00:11, 9.69it/s] 105it [00:11, 9.70it/s] 106it [00:11, 9.69it/s] 107it [00:11, 9.68it/s] 108it [00:11, 9.70it/s] 109it [00:11, 9.67it/s] 110it [00:11, 9.68it/s] 111it [00:11, 9.69it/s] 112it [00:11, 9.68it/s] 113it [00:11, 9.70it/s] 114it [00:12, 9.70it/s] 115it [00:12, 9.72it/s] 116it [00:12, 9.71it/s] 117it [00:12, 9.72it/s] 118it [00:12, 9.71it/s] 119it [00:12, 9.72it/s] 120it [00:12, 9.71it/s] 121it [00:12, 9.70it/s] 122it [00:12, 9.70it/s] 123it [00:12, 9.71it/s] 124it [00:13, 9.68it/s] 125it [00:13, 9.63it/s] 126it [00:13, 9.62it/s] 127it [00:13, 9.61it/s] 128it [00:13, 9.62it/s] 129it [00:13, 9.66it/s] 130it [00:13, 9.66it/s] 131it [00:13, 9.68it/s] 132it [00:13, 9.44it/s] 133it [00:14, 9.52it/s] 134it [00:14, 9.57it/s] 135it [00:14, 9.61it/s] 136it [00:14, 9.64it/s] 137it [00:14, 9.64it/s] 138it [00:14, 9.62it/s] 139it [00:14, 9.60it/s] 140it [00:14, 9.60it/s] 141it [00:14, 9.56it/s] 142it [00:14, 9.57it/s] 143it [00:15, 9.53it/s] 144it [00:15, 9.47it/s] 145it [00:15, 9.50it/s] 146it [00:15, 9.50it/s] 147it [00:15, 9.50it/s] 148it [00:15, 9.54it/s] 149it [00:15, 9.54it/s] 150it [00:15, 9.54it/s]2025-05-26 04:19:56,897 - INFO - [Epoch 080 | Batch 0150] IWAE-loss 3631.5173 | mean log_px -0.0095 | KL -3060.06 + 151it [00:15, 9.46it/s] 152it [00:16, 9.50it/s] 153it [00:16, 9.46it/s] 154it [00:16, 9.48it/s] 155it [00:16, 9.47it/s] 156it [00:16, 9.51it/s] 157it [00:16, 9.51it/s] 158it [00:16, 9.50it/s] 159it [00:16, 9.54it/s] 160it [00:16, 9.55it/s] 161it [00:16, 9.48it/s] 162it [00:17, 9.52it/s] 163it [00:17, 9.54it/s] 164it [00:17, 9.53it/s] 165it [00:17, 9.53it/s] 166it [00:17, 9.51it/s] 167it [00:17, 9.51it/s] 168it [00:17, 9.50it/s] 169it [00:17, 9.46it/s] 170it [00:17, 9.32it/s] 171it [00:18, 9.33it/s] 172it [00:18, 9.37it/s] 173it [00:18, 9.38it/s] 174it [00:18, 9.44it/s] 175it [00:18, 9.47it/s] 176it [00:18, 9.46it/s] 177it [00:18, 9.51it/s] 178it [00:18, 9.57it/s] 179it [00:18, 9.63it/s] 180it [00:18, 9.63it/s] 181it [00:19, 9.65it/s] 182it [00:19, 9.67it/s] 183it [00:19, 9.68it/s] 184it [00:19, 9.69it/s] 185it [00:19, 9.70it/s] 186it [00:19, 9.70it/s] 187it [00:19, 9.49it/s] 188it [00:19, 9.53it/s] 189it [00:19, 9.54it/s] 190it [00:20, 9.20it/s] 191it [00:20, 9.08it/s] 192it [00:20, 9.14it/s] 193it [00:20, 9.22it/s] 194it [00:20, 9.07it/s] 195it [00:20, 8.63it/s] 196it [00:20, 9.00it/s] 196it [00:20, 9.44it/s] +2025-05-26 04:20:01,780 - INFO - Epoch: 80, Objective: tensor([3925.0637], device='cuda:0', grad_fn=), Loss: 0.012692895717918873, KL/n: 62.49341583251953 + 0it [00:00, ?it/s]2025-05-26 04:20:02,031 - INFO - [Epoch 081 | Batch 0000] IWAE-loss 4076.6638 | mean log_px -0.0189 | KL -3062.57 + 1it [00:00, 5.96it/s] 2it [00:00, 7.37it/s] 3it [00:00, 7.85it/s] 4it [00:00, 8.22it/s] 5it [00:00, 8.66it/s] 6it [00:00, 8.99it/s] 7it [00:00, 9.24it/s] 8it [00:00, 8.98it/s] 9it [00:01, 9.07it/s] 10it [00:01, 9.18it/s] 11it [00:01, 9.26it/s] 12it [00:01, 9.10it/s] 13it [00:01, 9.23it/s] 14it [00:01, 9.31it/s] 15it [00:01, 9.38it/s] 16it [00:01, 9.43it/s] 17it [00:01, 9.45it/s] 18it [00:02, 9.49it/s] 19it [00:02, 9.45it/s] 20it [00:02, 9.46it/s] 21it [00:02, 9.48it/s] 22it [00:02, 9.51it/s] 23it [00:02, 9.51it/s] 24it [00:02, 9.45it/s] 25it [00:02, 9.45it/s] 26it [00:02, 9.50it/s] 27it [00:02, 9.45it/s] 28it [00:03, 9.50it/s] 29it [00:03, 9.53it/s] 30it [00:03, 9.30it/s] 31it [00:03, 9.29it/s] 32it [00:03, 9.37it/s] 33it [00:03, 9.40it/s] 34it [00:03, 9.36it/s] 35it [00:03, 9.46it/s] 36it [00:03, 9.46it/s] 37it [00:04, 9.12it/s] 38it [00:04, 9.28it/s] 39it [00:04, 9.42it/s] 40it [00:04, 9.51it/s] 41it [00:04, 9.56it/s] 42it [00:04, 9.62it/s] 43it [00:04, 9.65it/s] 44it [00:04, 9.67it/s] 45it [00:04, 9.70it/s] 46it [00:04, 9.72it/s] 47it [00:05, 9.73it/s] 48it [00:05, 9.74it/s] 49it [00:05, 9.76it/s] 50it [00:05, 9.75it/s]2025-05-26 04:20:07,339 - INFO - [Epoch 081 | Batch 0050] IWAE-loss 3596.1819 | mean log_px -0.0087 | KL -3056.84 + 51it [00:05, 9.39it/s] 52it [00:05, 9.44it/s] 53it [00:05, 9.52it/s] 54it [00:05, 9.57it/s] 55it [00:05, 9.53it/s] 56it [00:06, 9.39it/s] 57it [00:06, 9.27it/s] 58it [00:06, 9.18it/s] 59it [00:06, 8.88it/s] 60it [00:06, 9.03it/s] 61it [00:06, 9.15it/s] 62it [00:06, 9.23it/s] 63it [00:06, 9.30it/s] 64it [00:06, 9.27it/s] 65it [00:06, 9.31it/s] 66it [00:07, 9.34it/s] 67it [00:07, 9.34it/s] 68it [00:07, 9.34it/s] 69it [00:07, 9.39it/s] 70it [00:07, 9.49it/s] 71it [00:07, 9.40it/s] 72it [00:07, 9.44it/s] 73it [00:07, 9.44it/s] 74it [00:07, 9.17it/s] 75it [00:08, 9.33it/s] 76it [00:08, 9.45it/s] 77it [00:08, 9.45it/s] 78it [00:08, 9.22it/s] 79it [00:08, 9.37it/s] 80it [00:08, 9.43it/s] 81it [00:08, 9.47it/s] 82it [00:08, 9.54it/s] 83it [00:08, 9.59it/s] 84it [00:09, 9.60it/s] 85it [00:09, 9.64it/s] 86it [00:09, 9.65it/s] 87it [00:09, 9.68it/s] 88it [00:09, 9.40it/s] 89it [00:09, 9.50it/s] 90it [00:09, 9.56it/s] 91it [00:09, 9.33it/s] 92it [00:09, 9.44it/s] 93it [00:09, 9.51it/s] 94it [00:10, 9.57it/s] 95it [00:10, 9.63it/s] 96it [00:10, 9.64it/s] 97it [00:10, 9.68it/s] 98it [00:10, 9.69it/s] 99it [00:10, 9.72it/s] 100it [00:10, 9.73it/s]2025-05-26 04:20:12,641 - INFO - [Epoch 081 | Batch 0100] IWAE-loss 4514.4556 | mean log_px -0.0243 | KL -3053.01 + 101it [00:10, 9.42it/s] 102it [00:10, 9.42it/s] 103it [00:10, 9.51it/s] 104it [00:11, 9.58it/s] 105it [00:11, 9.63it/s] 106it [00:11, 9.64it/s] 107it [00:11, 9.66it/s] 108it [00:11, 9.66it/s] 109it [00:11, 9.69it/s] 110it [00:11, 9.69it/s] 111it [00:11, 9.65it/s] 112it [00:11, 9.65it/s] 113it [00:12, 9.68it/s] 114it [00:12, 9.69it/s] 115it [00:12, 9.70it/s] 116it [00:12, 9.71it/s] 117it [00:12, 9.70it/s] 118it [00:12, 9.70it/s] 119it [00:12, 9.69it/s] 120it [00:12, 9.69it/s] 121it [00:12, 9.71it/s] 122it [00:12, 9.70it/s] 123it [00:13, 9.70it/s] 124it [00:13, 9.67it/s] 125it [00:13, 9.67it/s] 126it [00:13, 9.67it/s] 127it [00:13, 9.69it/s] 128it [00:13, 9.69it/s] 129it [00:13, 9.70it/s] 130it [00:13, 9.70it/s] 131it [00:13, 9.71it/s] 132it [00:13, 9.70it/s] 133it [00:14, 9.72it/s] 134it [00:14, 9.71it/s] 135it [00:14, 9.73it/s] 136it [00:14, 9.72it/s] 137it [00:14, 9.72it/s] 138it [00:14, 9.72it/s] 139it [00:14, 9.73it/s] 140it [00:14, 9.71it/s] 141it [00:14, 9.68it/s] 142it [00:15, 9.70it/s] 143it [00:15, 9.67it/s] 144it [00:15, 9.67it/s] 145it [00:15, 9.70it/s] 146it [00:15, 9.68it/s] 147it [00:15, 9.68it/s] 148it [00:15, 9.67it/s] 149it [00:15, 9.68it/s] 150it [00:15, 9.67it/s]2025-05-26 04:20:17,813 - INFO - [Epoch 081 | Batch 0150] IWAE-loss 3807.7285 | mean log_px -0.0127 | KL -3054.70 + 151it [00:15, 9.37it/s] 152it [00:16, 9.23it/s] 153it [00:16, 9.39it/s] 154it [00:16, 9.49it/s] 155it [00:16, 9.51it/s] 156it [00:16, 9.56it/s] 157it [00:16, 9.35it/s] 158it [00:16, 9.46it/s] 159it [00:16, 9.55it/s] 160it [00:16, 9.59it/s] 161it [00:17, 9.63it/s] 162it [00:17, 9.63it/s] 163it [00:17, 9.66it/s] 164it [00:17, 9.64it/s] 165it [00:17, 9.66it/s] 166it [00:17, 9.68it/s] 167it [00:17, 9.69it/s] 168it [00:17, 9.69it/s] 169it [00:17, 9.72it/s] 170it [00:17, 9.68it/s] 171it [00:18, 9.69it/s] 172it [00:18, 9.68it/s] 173it [00:18, 9.67it/s] 174it [00:18, 9.66it/s] 175it [00:18, 9.69it/s] 176it [00:18, 9.68it/s] 177it [00:18, 9.70it/s] 178it [00:18, 9.69it/s] 179it [00:18, 9.72it/s] 180it [00:18, 9.72it/s] 181it [00:19, 9.74it/s] 182it [00:19, 9.69it/s] 183it [00:19, 9.70it/s] 184it [00:19, 9.56it/s] 185it [00:19, 9.62it/s] 186it [00:19, 9.63it/s] 187it [00:19, 9.66it/s] 188it [00:19, 9.66it/s] 189it [00:19, 9.69it/s] 190it [00:19, 9.66it/s] 191it [00:20, 9.68it/s] 192it [00:20, 9.64it/s] 193it [00:20, 9.67it/s] 194it [00:20, 9.68it/s] 195it [00:20, 9.23it/s] 196it [00:20, 9.47it/s] +2025-05-26 04:20:22,598 - INFO - Epoch: 81, Objective: tensor([4405.5898], device='cuda:0', grad_fn=), Loss: 0.024367935955524445, KL/n: 62.24941635131836 + 0it [00:00, ?it/s]2025-05-26 04:20:22,864 - INFO - [Epoch 082 | Batch 0000] IWAE-loss 4408.0596 | mean log_px -0.0199 | KL -3051.39 + 1it [00:00, 4.85it/s] 2it [00:00, 6.95it/s] 4it [00:00, 8.61it/s] 5it [00:00, 8.99it/s] 6it [00:00, 9.27it/s] 7it [00:00, 9.47it/s] 8it [00:00, 9.01it/s] 10it [00:01, 9.45it/s] 11it [00:01, 9.58it/s] 12it [00:01, 9.67it/s] 13it [00:01, 9.75it/s] 14it [00:01, 9.79it/s] 15it [00:01, 9.85it/s] 16it [00:01, 9.29it/s] 17it [00:01, 9.48it/s] 18it [00:01, 9.61it/s] 19it [00:02, 9.70it/s] 20it [00:02, 9.77it/s] 21it [00:02, 9.83it/s] 22it [00:02, 9.85it/s] 23it [00:02, 9.87it/s] 24it [00:02, 9.90it/s] 25it [00:02, 9.59it/s] 26it [00:02, 9.69it/s] 27it [00:02, 9.77it/s] 28it [00:02, 9.17it/s] 29it [00:03, 9.40it/s] 30it [00:03, 9.56it/s] 32it [00:03, 9.77it/s] 33it [00:03, 9.82it/s] 34it [00:03, 9.76it/s] 35it [00:03, 9.26it/s] 36it [00:03, 9.39it/s] 37it [00:03, 9.55it/s] 38it [00:04, 9.67it/s] 40it [00:04, 9.81it/s] 41it [00:04, 9.44it/s] 42it [00:04, 9.55it/s] 43it [00:04, 9.66it/s] 44it [00:04, 9.73it/s] 46it [00:04, 9.85it/s] 47it [00:04, 9.88it/s] 48it [00:05, 9.87it/s] 49it [00:05, 9.80it/s] 50it [00:05, 9.80it/s]2025-05-26 04:20:28,045 - INFO - [Epoch 082 | Batch 0050] IWAE-loss 4216.4087 | mean log_px -0.0181 | KL -3045.86 + 51it [00:05, 9.19it/s] 52it [00:05, 9.39it/s] 53it [00:05, 9.55it/s] 54it [00:05, 9.66it/s] 55it [00:05, 9.75it/s] 56it [00:05, 9.81it/s] 57it [00:05, 9.86it/s] 58it [00:06, 9.89it/s] 59it [00:06, 9.91it/s] 60it [00:06, 9.91it/s] 61it [00:06, 9.93it/s] 62it [00:06, 9.94it/s] 63it [00:06, 9.95it/s] 64it [00:06, 9.44it/s] 66it [00:06, 9.69it/s] 68it [00:07, 9.82it/s] 69it [00:07, 6.97it/s] 70it [00:07, 7.27it/s] 71it [00:07, 7.80it/s] 72it [00:07, 8.27it/s] 73it [00:07, 8.68it/s] 74it [00:07, 9.01it/s] 75it [00:08, 9.27it/s] 76it [00:08, 9.46it/s] 78it [00:08, 9.70it/s] 79it [00:08, 9.77it/s] 81it [00:08, 9.87it/s] 82it [00:08, 9.41it/s] 83it [00:08, 9.54it/s] 84it [00:08, 9.65it/s] 85it [00:09, 9.74it/s] 86it [00:09, 9.78it/s] 88it [00:09, 9.88it/s] 89it [00:09, 9.47it/s] 90it [00:09, 9.58it/s] 91it [00:09, 9.68it/s] 92it [00:09, 9.75it/s] 93it [00:09, 9.81it/s] 94it [00:09, 9.76it/s] 95it [00:10, 9.10it/s] 96it [00:10, 9.32it/s] 97it [00:10, 9.50it/s] 98it [00:10, 9.63it/s] 99it [00:10, 9.73it/s] 100it [00:10, 9.79it/s]2025-05-26 04:20:33,385 - INFO - [Epoch 082 | Batch 0100] IWAE-loss 4081.9727 | mean log_px -0.0158 | KL -3040.89 + 101it [00:10, 9.22it/s] 102it [00:10, 9.42it/s] 103it [00:10, 9.58it/s] 105it [00:11, 9.31it/s] 106it [00:11, 9.46it/s] 107it [00:11, 9.59it/s] 108it [00:11, 9.69it/s] 109it [00:11, 9.76it/s] 110it [00:11, 9.81it/s] 111it [00:11, 9.85it/s] 112it [00:11, 9.72it/s] 113it [00:11, 9.17it/s] 114it [00:12, 9.38it/s] 115it [00:12, 9.55it/s] 116it [00:12, 9.66it/s] 117it [00:12, 9.74it/s] 118it [00:12, 9.80it/s] 119it [00:12, 9.84it/s] 120it [00:12, 9.88it/s] 121it [00:12, 9.90it/s] 122it [00:12, 9.92it/s] 123it [00:12, 9.93it/s] 124it [00:13, 9.94it/s] 125it [00:13, 9.31it/s] 126it [00:13, 9.49it/s] 127it [00:13, 9.63it/s] 128it [00:13, 9.66it/s] 129it [00:13, 9.74it/s] 130it [00:13, 9.80it/s] 131it [00:13, 9.85it/s] 132it [00:13, 9.88it/s] 133it [00:14, 9.91it/s] 134it [00:14, 9.92it/s] 135it [00:14, 9.31it/s] 136it [00:14, 9.50it/s] 137it [00:14, 9.64it/s] 138it [00:14, 9.72it/s] 140it [00:14, 9.87it/s] 142it [00:14, 9.50it/s] 143it [00:15, 9.61it/s] 144it [00:15, 9.70it/s] 145it [00:15, 9.74it/s] 147it [00:15, 9.87it/s] 148it [00:15, 9.89it/s] 149it [00:15, 9.90it/s] 150it [00:15, 9.91it/s]2025-05-26 04:20:38,547 - INFO - [Epoch 082 | Batch 0150] IWAE-loss 3857.5825 | mean log_px -0.0146 | KL -3036.50 + 151it [00:15, 9.35it/s] 152it [00:15, 9.51it/s] 153it [00:16, 9.64it/s] 154it [00:16, 9.74it/s] 155it [00:16, 9.21it/s] 156it [00:16, 9.41it/s] 157it [00:16, 9.46it/s] 158it [00:16, 9.39it/s] 159it [00:16, 8.88it/s] 160it [00:16, 9.16it/s] 161it [00:16, 9.38it/s] 162it [00:17, 9.54it/s] 163it [00:17, 9.65it/s] 164it [00:17, 9.75it/s] 165it [00:17, 9.80it/s] 166it [00:17, 9.84it/s] 167it [00:17, 9.27it/s] 168it [00:17, 9.46it/s] 169it [00:17, 9.50it/s] 170it [00:17, 9.62it/s] 171it [00:17, 9.73it/s] 172it [00:18, 9.79it/s] 173it [00:18, 9.84it/s] 174it [00:18, 9.88it/s] 175it [00:18, 9.92it/s] 177it [00:18, 9.97it/s] 178it [00:18, 9.94it/s] 179it [00:18, 9.50it/s] 180it [00:18, 9.61it/s] 182it [00:19, 9.79it/s] 184it [00:19, 9.89it/s] 186it [00:19, 9.93it/s] 187it [00:19, 9.92it/s] 188it [00:19, 9.93it/s] 190it [00:19, 9.96it/s] 192it [00:20, 9.98it/s] 194it [00:20, 10.00it/s] 195it [00:20, 9.25it/s] 196it [00:20, 9.51it/s] +2025-05-26 04:20:43,331 - INFO - Epoch: 82, Objective: tensor([3370.0046], device='cuda:0', grad_fn=), Loss: 0.005570830777287483, KL/n: 62.00031280517578 + 0it [00:00, ?it/s]2025-05-26 04:20:43,609 - INFO - [Epoch 083 | Batch 0000] IWAE-loss 4002.6240 | mean log_px -0.0153 | KL -3036.43 + 1it [00:00, 5.19it/s] 2it [00:00, 6.68it/s] 3it [00:00, 7.87it/s] 4it [00:00, 8.56it/s] 5it [00:00, 8.96it/s] 6it [00:00, 9.12it/s] 7it [00:00, 9.34it/s] 8it [00:00, 9.51it/s] 9it [00:01, 9.64it/s] 10it [00:01, 9.69it/s] 11it [00:01, 9.13it/s] 12it [00:01, 9.33it/s] 13it [00:01, 9.51it/s] 14it [00:01, 9.65it/s] 16it [00:01, 9.82it/s] 18it [00:01, 9.89it/s] 20it [00:02, 9.92it/s] 21it [00:02, 9.93it/s] 22it [00:02, 9.93it/s] 23it [00:02, 9.94it/s] 24it [00:02, 9.95it/s] 26it [00:02, 9.98it/s] 28it [00:02, 9.96it/s] 29it [00:03, 9.91it/s] 30it [00:03, 9.84it/s] 31it [00:03, 9.88it/s] 32it [00:03, 9.91it/s] 34it [00:03, 9.95it/s] 36it [00:03, 9.98it/s] 38it [00:03, 10.00it/s] 39it [00:04, 9.98it/s] 40it [00:04, 9.95it/s] 41it [00:04, 9.94it/s] 42it [00:04, 9.94it/s] 44it [00:04, 9.96it/s] 46it [00:04, 9.98it/s] 48it [00:04, 9.98it/s] 49it [00:05, 9.98it/s] 50it [00:05, 9.98it/s]2025-05-26 04:20:48,686 - INFO - [Epoch 083 | Batch 0050] IWAE-loss 3834.6262 | mean log_px -0.0148 | KL -3028.71 + 51it [00:05, 9.94it/s] 52it [00:05, 9.96it/s] 54it [00:05, 9.98it/s] 56it [00:05, 9.57it/s] 57it [00:05, 9.65it/s] 58it [00:05, 9.69it/s] 59it [00:06, 9.73it/s] 60it [00:06, 9.77it/s] 61it [00:06, 9.80it/s] 62it [00:06, 9.83it/s] 63it [00:06, 9.85it/s] 64it [00:06, 9.85it/s] 65it [00:06, 9.88it/s] 66it [00:06, 9.21it/s] 67it [00:06, 9.41it/s] 68it [00:07, 9.52it/s] 69it [00:07, 9.65it/s] 70it [00:07, 9.74it/s] 71it [00:07, 9.80it/s] 72it [00:07, 9.84it/s] 73it [00:07, 9.86it/s] 74it [00:07, 9.89it/s] 75it [00:07, 9.89it/s] 76it [00:07, 9.27it/s] 77it [00:07, 9.47it/s] 78it [00:08, 9.60it/s] 79it [00:08, 9.70it/s] 80it [00:08, 9.77it/s] 81it [00:08, 9.82it/s] 82it [00:08, 9.85it/s] 83it [00:08, 9.86it/s] 84it [00:08, 9.86it/s] 86it [00:08, 9.42it/s] 87it [00:08, 9.54it/s] 88it [00:09, 9.63it/s] 89it [00:09, 9.71it/s] 90it [00:09, 9.76it/s] 91it [00:09, 9.81it/s] 92it [00:09, 9.85it/s] 93it [00:09, 9.89it/s] 94it [00:09, 9.26it/s] 95it [00:09, 9.47it/s] 96it [00:09, 9.61it/s] 97it [00:10, 9.71it/s] 98it [00:10, 9.77it/s] 99it [00:10, 9.19it/s] 100it [00:10, 9.39it/s]2025-05-26 04:20:53,864 - INFO - [Epoch 083 | Batch 0100] IWAE-loss 4239.6172 | mean log_px -0.0240 | KL -3028.14 + 101it [00:10, 9.52it/s] 102it [00:10, 9.62it/s] 103it [00:10, 9.70it/s] 104it [00:10, 9.76it/s] 105it [00:10, 9.80it/s] 106it [00:10, 9.82it/s] 107it [00:11, 9.85it/s] 108it [00:11, 9.86it/s] 109it [00:11, 9.89it/s] 110it [00:11, 9.89it/s] 111it [00:11, 9.92it/s] 112it [00:11, 9.91it/s] 113it [00:11, 9.91it/s] 114it [00:11, 9.38it/s] 115it [00:11, 9.53it/s] 116it [00:11, 9.63it/s] 117it [00:12, 9.69it/s] 118it [00:12, 9.04it/s] 119it [00:12, 9.25it/s] 120it [00:12, 9.43it/s] 121it [00:12, 9.57it/s] 122it [00:12, 9.66it/s] 123it [00:12, 9.74it/s] 124it [00:12, 9.80it/s] 125it [00:12, 9.24it/s] 126it [00:13, 9.45it/s] 127it [00:13, 9.57it/s] 128it [00:13, 9.67it/s] 129it [00:13, 9.75it/s] 130it [00:13, 9.76it/s] 131it [00:13, 9.81it/s] 132it [00:13, 9.20it/s] 133it [00:13, 9.41it/s] 134it [00:13, 9.54it/s] 135it [00:13, 9.64it/s] 136it [00:14, 9.71it/s] 137it [00:14, 9.77it/s] 138it [00:14, 9.18it/s] 139it [00:14, 9.36it/s] 140it [00:14, 9.52it/s] 141it [00:14, 9.63it/s] 142it [00:14, 9.70it/s] 143it [00:14, 9.68it/s] 144it [00:14, 9.73it/s] 145it [00:15, 9.31it/s] 146it [00:15, 9.48it/s] 147it [00:15, 9.61it/s] 148it [00:15, 9.68it/s] 149it [00:15, 9.77it/s] 150it [00:15, 9.81it/s]2025-05-26 04:20:59,053 - INFO - [Epoch 083 | Batch 0150] IWAE-loss 3907.8083 | mean log_px -0.0154 | KL -3022.59 + 151it [00:15, 9.21it/s] 152it [00:15, 9.41it/s] 153it [00:15, 9.54it/s] 154it [00:15, 9.65it/s] 155it [00:16, 9.72it/s] 156it [00:16, 9.69it/s] 157it [00:16, 9.60it/s] 158it [00:16, 9.66it/s] 159it [00:16, 9.72it/s] 160it [00:16, 9.75it/s] 161it [00:16, 9.79it/s] 162it [00:16, 9.82it/s] 163it [00:16, 9.80it/s] 164it [00:16, 9.81it/s] 165it [00:17, 9.84it/s] 166it [00:17, 9.86it/s] 167it [00:17, 9.85it/s] 168it [00:17, 9.85it/s] 169it [00:17, 9.85it/s] 170it [00:17, 9.86it/s] 171it [00:17, 9.86it/s] 172it [00:17, 9.25it/s] 173it [00:17, 9.42it/s] 174it [00:18, 9.53it/s] 175it [00:18, 9.61it/s] 176it [00:18, 9.67it/s] 177it [00:18, 9.72it/s] 178it [00:18, 9.76it/s] 179it [00:18, 9.78it/s] 180it [00:18, 9.81it/s] 181it [00:18, 9.84it/s] 182it [00:18, 9.84it/s] 183it [00:18, 9.85it/s] 184it [00:19, 9.85it/s] 185it [00:19, 9.87it/s] 186it [00:19, 9.85it/s] 187it [00:19, 9.86it/s] 188it [00:19, 9.35it/s] 189it [00:19, 9.49it/s] 190it [00:19, 9.58it/s] 191it [00:19, 9.67it/s] 192it [00:19, 9.12it/s] 193it [00:19, 9.34it/s] 194it [00:20, 9.47it/s] 195it [00:20, 9.16it/s] 196it [00:20, 8.88it/s] 196it [00:20, 9.61it/s] +2025-05-26 04:21:03,847 - INFO - Epoch: 83, Objective: tensor([3918.3167], device='cuda:0', grad_fn=), Loss: 0.013034864328801632, KL/n: 61.751060485839844 + 0it [00:00, ?it/s]2025-05-26 04:21:04,142 - INFO - [Epoch 084 | Batch 0000] IWAE-loss 3879.0281 | mean log_px -0.0132 | KL -3020.57 + 1it [00:00, 4.93it/s] 2it [00:00, 7.01it/s] 4it [00:00, 8.64it/s] 5it [00:00, 8.50it/s] 6it [00:00, 8.89it/s] 8it [00:00, 9.39it/s] 9it [00:01, 9.16it/s] 10it [00:01, 9.35it/s] 11it [00:01, 9.51it/s] 12it [00:01, 9.64it/s] 13it [00:01, 9.13it/s] 14it [00:01, 9.35it/s] 15it [00:01, 9.53it/s] 16it [00:01, 9.63it/s] 17it [00:01, 9.13it/s] 18it [00:01, 9.35it/s] 20it [00:02, 9.65it/s] 21it [00:02, 9.73it/s] 22it [00:02, 9.80it/s] 23it [00:02, 9.84it/s] 25it [00:02, 9.92it/s] 27it [00:02, 9.89it/s] 28it [00:02, 9.84it/s] 29it [00:03, 9.84it/s] 30it [00:03, 9.85it/s] 31it [00:03, 9.89it/s] 32it [00:03, 9.91it/s] 33it [00:03, 9.93it/s] 34it [00:03, 9.94it/s] 35it [00:03, 9.34it/s] 36it [00:03, 9.50it/s] 37it [00:03, 9.64it/s] 38it [00:04, 9.71it/s] 39it [00:04, 9.80it/s] 40it [00:04, 9.82it/s] 41it [00:04, 9.86it/s] 42it [00:04, 6.03it/s] 43it [00:04, 6.84it/s] 44it [00:04, 7.54it/s] 45it [00:04, 8.14it/s] 46it [00:05, 8.61it/s] 47it [00:05, 8.97it/s] 48it [00:05, 9.24it/s] 49it [00:05, 9.45it/s] 50it [00:05, 9.60it/s]2025-05-26 04:21:09,491 - INFO - [Epoch 084 | Batch 0050] IWAE-loss 3803.3413 | mean log_px -0.0113 | KL -3022.37 + 51it [00:05, 9.10it/s] 52it [00:05, 9.33it/s] 53it [00:05, 9.52it/s] 54it [00:05, 9.63it/s] 55it [00:05, 9.74it/s] 56it [00:06, 9.79it/s] 58it [00:06, 9.86it/s] 59it [00:06, 9.88it/s] 60it [00:06, 9.90it/s] 61it [00:06, 9.82it/s] 62it [00:06, 9.59it/s] 63it [00:06, 8.95it/s] 64it [00:06, 9.16it/s] 65it [00:07, 9.35it/s] 66it [00:07, 9.46it/s] 67it [00:07, 9.57it/s] 68it [00:07, 9.64it/s] 69it [00:07, 9.69it/s] 70it [00:07, 9.69it/s] 71it [00:07, 9.74it/s] 72it [00:07, 9.74it/s] 73it [00:07, 9.17it/s] 74it [00:07, 9.37it/s] 75it [00:08, 9.55it/s] 76it [00:08, 9.67it/s] 77it [00:08, 9.76it/s] 78it [00:08, 9.82it/s] 79it [00:08, 9.87it/s] 80it [00:08, 9.89it/s] 82it [00:08, 9.94it/s] 83it [00:08, 9.94it/s] 84it [00:08, 9.94it/s] 85it [00:09, 9.95it/s] 86it [00:09, 9.95it/s] 87it [00:09, 9.95it/s] 88it [00:09, 9.94it/s] 89it [00:09, 9.95it/s] 90it [00:09, 9.93it/s] 91it [00:09, 9.94it/s] 92it [00:09, 9.94it/s] 94it [00:09, 9.96it/s] 95it [00:10, 9.97it/s] 96it [00:10, 9.94it/s] 97it [00:10, 9.91it/s] 98it [00:10, 9.44it/s] 100it [00:10, 9.68it/s]2025-05-26 04:21:14,640 - INFO - [Epoch 084 | Batch 0100] IWAE-loss 6303.6221 | mean log_px -0.0504 | KL -3017.94 + 101it [00:10, 9.75it/s] 102it [00:10, 9.80it/s] 103it [00:10, 9.85it/s] 104it [00:10, 9.87it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.65it/s] 108it [00:11, 9.72it/s] 109it [00:11, 9.79it/s] 110it [00:11, 9.82it/s] 111it [00:11, 9.27it/s] 112it [00:11, 9.46it/s] 114it [00:12, 9.70it/s] 115it [00:12, 9.76it/s] 116it [00:12, 9.81it/s] 117it [00:12, 9.84it/s] 118it [00:12, 9.84it/s] 119it [00:12, 9.86it/s] 120it [00:12, 9.86it/s] 121it [00:12, 9.89it/s] 122it [00:12, 9.25it/s] 123it [00:12, 9.41it/s] 124it [00:13, 9.54it/s] 125it [00:13, 9.65it/s] 126it [00:13, 9.73it/s] 127it [00:13, 9.80it/s] 128it [00:13, 9.83it/s] 129it [00:13, 9.85it/s] 130it [00:13, 9.86it/s] 131it [00:13, 9.88it/s] 132it [00:13, 9.89it/s] 133it [00:13, 9.89it/s] 134it [00:14, 9.90it/s] 135it [00:14, 9.26it/s] 136it [00:14, 9.35it/s] 137it [00:14, 9.52it/s] 138it [00:14, 9.63it/s] 139it [00:14, 9.73it/s] 140it [00:14, 9.79it/s] 141it [00:14, 9.84it/s] 142it [00:14, 9.87it/s] 143it [00:15, 9.90it/s] 144it [00:15, 9.91it/s] 145it [00:15, 9.92it/s] 146it [00:15, 9.91it/s] 147it [00:15, 9.92it/s] 148it [00:15, 9.92it/s] 149it [00:15, 9.92it/s] 150it [00:15, 9.92it/s]2025-05-26 04:21:19,765 - INFO - [Epoch 084 | Batch 0150] IWAE-loss 3802.7544 | mean log_px -0.0130 | KL -3015.59 + 151it [00:15, 9.91it/s] 152it [00:15, 9.92it/s] 153it [00:16, 9.93it/s] 154it [00:16, 9.95it/s] 155it [00:16, 9.95it/s] 156it [00:16, 9.92it/s] 157it [00:16, 9.92it/s] 158it [00:16, 9.94it/s] 159it [00:16, 9.94it/s] 160it [00:16, 9.92it/s] 161it [00:16, 9.92it/s] 162it [00:16, 9.92it/s] 163it [00:17, 9.94it/s] 164it [00:17, 9.94it/s] 165it [00:17, 9.93it/s] 166it [00:17, 9.93it/s] 167it [00:17, 9.94it/s] 168it [00:17, 9.94it/s] 169it [00:17, 9.94it/s] 170it [00:17, 9.93it/s] 171it [00:17, 9.94it/s] 172it [00:17, 9.88it/s] 173it [00:18, 9.91it/s] 174it [00:18, 9.91it/s] 175it [00:18, 9.91it/s] 176it [00:18, 9.91it/s] 177it [00:18, 9.93it/s] 178it [00:18, 9.93it/s] 179it [00:18, 9.93it/s] 180it [00:18, 9.93it/s] 181it [00:18, 9.93it/s] 182it [00:18, 9.93it/s] 183it [00:19, 9.93it/s] 184it [00:19, 9.93it/s] 185it [00:19, 9.94it/s] 186it [00:19, 9.93it/s] 187it [00:19, 9.94it/s] 188it [00:19, 9.93it/s] 189it [00:19, 9.94it/s] 190it [00:19, 9.94it/s] 191it [00:19, 9.93it/s] 192it [00:19, 9.92it/s] 193it [00:20, 9.94it/s] 194it [00:20, 9.94it/s] 195it [00:20, 9.47it/s] 196it [00:20, 9.59it/s] +2025-05-26 04:21:24,416 - INFO - Epoch: 84, Objective: tensor([4500.4517], device='cuda:0', grad_fn=), Loss: 0.03310453146696091, KL/n: 61.500885009765625 + 0it [00:00, ?it/s]2025-05-26 04:21:24,694 - INFO - [Epoch 085 | Batch 0000] IWAE-loss 3595.1533 | mean log_px -0.0110 | KL -3013.15 + 1it [00:00, 4.74it/s] 2it [00:00, 6.80it/s] 3it [00:00, 7.90it/s] 4it [00:00, 8.54it/s] 5it [00:00, 8.99it/s] 6it [00:00, 9.25it/s] 7it [00:00, 9.46it/s] 8it [00:00, 9.57it/s] 9it [00:01, 9.66it/s] 10it [00:01, 9.72it/s] 11it [00:01, 9.78it/s] 12it [00:01, 9.17it/s] 13it [00:01, 9.36it/s] 14it [00:01, 9.51it/s] 15it [00:01, 9.61it/s] 16it [00:01, 9.69it/s] 17it [00:01, 9.73it/s] 18it [00:01, 9.77it/s] 19it [00:02, 9.79it/s] 20it [00:02, 9.80it/s] 21it [00:02, 9.82it/s] 22it [00:02, 9.83it/s] 23it [00:02, 9.84it/s] 24it [00:02, 9.80it/s] 25it [00:02, 9.84it/s] 26it [00:02, 9.83it/s] 27it [00:02, 9.41it/s] 28it [00:02, 9.51it/s] 29it [00:03, 9.61it/s] 30it [00:03, 9.07it/s] 31it [00:03, 9.30it/s] 32it [00:03, 9.46it/s] 33it [00:03, 9.58it/s] 34it [00:03, 9.66it/s] 35it [00:03, 9.73it/s] 36it [00:03, 9.77it/s] 37it [00:03, 9.80it/s] 38it [00:04, 9.82it/s] 39it [00:04, 9.84it/s] 40it [00:04, 9.82it/s] 41it [00:04, 9.83it/s] 42it [00:04, 9.82it/s] 43it [00:04, 9.82it/s] 44it [00:04, 9.82it/s] 45it [00:04, 9.85it/s] 46it [00:04, 9.82it/s] 47it [00:04, 9.84it/s] 48it [00:05, 9.11it/s] 49it [00:05, 9.28it/s] 50it [00:05, 9.43it/s]2025-05-26 04:21:29,891 - INFO - [Epoch 085 | Batch 0050] IWAE-loss 3756.6094 | mean log_px -0.0141 | KL -3010.08 + 51it [00:05, 9.53it/s] 52it [00:05, 9.61it/s] 53it [00:05, 9.70it/s] 54it [00:05, 9.69it/s] 55it [00:05, 9.72it/s] 56it [00:05, 9.62it/s] 57it [00:05, 9.65it/s] 58it [00:06, 9.73it/s] 59it [00:06, 9.79it/s] 60it [00:06, 9.82it/s] 61it [00:06, 9.85it/s] 62it [00:06, 9.83it/s] 63it [00:06, 9.85it/s] 64it [00:06, 9.86it/s] 65it [00:06, 9.86it/s] 66it [00:06, 9.86it/s] 67it [00:07, 9.87it/s] 68it [00:07, 9.86it/s] 69it [00:07, 9.86it/s] 70it [00:07, 9.87it/s] 71it [00:07, 9.87it/s] 72it [00:07, 9.85it/s] 73it [00:07, 9.86it/s] 74it [00:07, 9.34it/s] 75it [00:07, 9.50it/s] 76it [00:07, 9.60it/s] 77it [00:08, 9.70it/s] 78it [00:08, 9.75it/s] 79it [00:08, 9.18it/s] 80it [00:08, 9.39it/s] 81it [00:08, 9.54it/s] 82it [00:08, 9.63it/s] 83it [00:08, 9.71it/s] 84it [00:08, 9.76it/s] 85it [00:08, 9.79it/s] 86it [00:08, 9.81it/s] 87it [00:09, 9.84it/s] 88it [00:09, 9.87it/s] 89it [00:09, 9.90it/s] 90it [00:09, 9.90it/s] 91it [00:09, 9.88it/s] 92it [00:09, 9.87it/s] 93it [00:09, 9.87it/s] 94it [00:09, 9.84it/s] 95it [00:09, 9.86it/s] 96it [00:09, 9.85it/s] 97it [00:10, 9.85it/s] 98it [00:10, 9.80it/s] 99it [00:10, 9.81it/s] 100it [00:10, 9.80it/s]2025-05-26 04:21:35,009 - INFO - [Epoch 085 | Batch 0100] IWAE-loss 3645.5867 | mean log_px -0.0103 | KL -3006.17 + 101it [00:10, 9.82it/s] 102it [00:10, 9.85it/s] 103it [00:10, 9.86it/s] 104it [00:10, 9.87it/s] 105it [00:10, 9.87it/s] 106it [00:11, 9.84it/s] 107it [00:11, 9.84it/s] 108it [00:11, 9.32it/s] 109it [00:11, 9.47it/s] 110it [00:11, 9.59it/s] 111it [00:11, 9.66it/s] 112it [00:11, 9.72it/s] 113it [00:11, 9.77it/s] 114it [00:11, 9.81it/s] 115it [00:11, 9.84it/s] 116it [00:12, 9.84it/s] 117it [00:12, 9.83it/s] 118it [00:12, 9.84it/s] 119it [00:12, 9.86it/s] 120it [00:12, 9.85it/s] 121it [00:12, 9.85it/s] 122it [00:12, 9.83it/s] 123it [00:12, 9.85it/s] 124it [00:12, 9.86it/s] 125it [00:12, 9.86it/s] 126it [00:13, 9.87it/s] 127it [00:13, 9.88it/s] 128it [00:13, 9.87it/s] 129it [00:13, 9.88it/s] 130it [00:13, 9.87it/s] 131it [00:13, 9.88it/s] 132it [00:13, 9.88it/s] 133it [00:13, 9.87it/s] 134it [00:13, 9.85it/s] 135it [00:13, 9.87it/s] 136it [00:14, 9.87it/s] 137it [00:14, 9.88it/s] 138it [00:14, 9.88it/s] 139it [00:14, 9.88it/s] 140it [00:14, 9.87it/s] 141it [00:14, 9.37it/s] 142it [00:14, 9.51it/s] 143it [00:14, 9.62it/s] 144it [00:14, 9.69it/s] 145it [00:14, 9.74it/s] 146it [00:15, 9.77it/s] 147it [00:15, 9.81it/s] 148it [00:15, 9.81it/s] 149it [00:15, 9.83it/s] 150it [00:15, 9.83it/s]2025-05-26 04:21:40,115 - INFO - [Epoch 085 | Batch 0150] IWAE-loss 4150.4175 | mean log_px -0.0174 | KL -3003.18 + 151it [00:15, 9.83it/s] 152it [00:15, 9.82it/s] 153it [00:15, 9.85it/s] 154it [00:15, 9.84it/s] 155it [00:16, 9.87it/s] 156it [00:16, 9.85it/s] 157it [00:16, 9.85it/s] 158it [00:16, 9.85it/s] 159it [00:16, 9.80it/s] 160it [00:16, 9.71it/s] 161it [00:16, 9.75it/s] 162it [00:16, 9.79it/s] 163it [00:16, 9.83it/s] 164it [00:16, 9.82it/s] 165it [00:17, 9.83it/s] 166it [00:17, 9.83it/s] 167it [00:17, 9.83it/s] 168it [00:17, 9.82it/s] 169it [00:17, 9.79it/s] 170it [00:17, 9.64it/s] 171it [00:17, 9.49it/s] 172it [00:17, 8.86it/s] 173it [00:17, 9.12it/s] 174it [00:17, 9.29it/s] 175it [00:18, 9.44it/s] 176it [00:18, 9.55it/s] 177it [00:18, 9.63it/s] 178it [00:18, 9.69it/s] 179it [00:18, 9.75it/s] 180it [00:18, 9.77it/s] 181it [00:18, 9.80it/s] 182it [00:18, 9.16it/s] 183it [00:18, 9.36it/s] 184it [00:19, 9.50it/s] 185it [00:19, 9.62it/s] 186it [00:19, 9.68it/s] 187it [00:19, 9.74it/s] 188it [00:19, 9.78it/s] 189it [00:19, 9.78it/s] 190it [00:19, 9.80it/s] 191it [00:19, 9.82it/s] 192it [00:19, 9.83it/s] 193it [00:19, 9.84it/s] 194it [00:20, 9.82it/s] 195it [00:20, 8.79it/s] 196it [00:20, 9.06it/s] 196it [00:20, 9.63it/s] +2025-05-26 04:21:44,899 - INFO - Epoch: 85, Objective: tensor([3568.9839], device='cuda:0', grad_fn=), Loss: 0.01087101548910141, KL/n: 61.26937484741211 + 0it [00:00, ?it/s]2025-05-26 04:21:45,197 - INFO - [Epoch 086 | Batch 0000] IWAE-loss 3738.7234 | mean log_px -0.0156 | KL -3002.08 + 1it [00:00, 4.80it/s] 2it [00:00, 6.87it/s] 3it [00:00, 8.00it/s] 4it [00:00, 8.65it/s] 5it [00:00, 8.56it/s] 6it [00:00, 8.96it/s] 7it [00:00, 9.25it/s] 8it [00:00, 9.45it/s] 9it [00:01, 9.59it/s] 10it [00:01, 8.98it/s] 11it [00:01, 9.24it/s] 12it [00:01, 9.40it/s] 13it [00:01, 9.54it/s] 14it [00:01, 9.62it/s] 15it [00:01, 9.68it/s] 16it [00:01, 9.73it/s] 17it [00:01, 9.76it/s] 18it [00:01, 9.77it/s] 19it [00:02, 9.78it/s] 20it [00:02, 9.79it/s] 21it [00:02, 9.81it/s] 22it [00:02, 9.82it/s] 23it [00:02, 9.84it/s] 24it [00:02, 9.81it/s] 25it [00:02, 9.77it/s] 26it [00:02, 9.79it/s] 27it [00:02, 9.81it/s] 28it [00:02, 9.82it/s] 29it [00:03, 9.84it/s] 30it [00:03, 9.84it/s] 31it [00:03, 9.84it/s] 32it [00:03, 9.84it/s] 33it [00:03, 9.85it/s] 34it [00:03, 9.84it/s] 35it [00:03, 9.85it/s] 36it [00:03, 9.82it/s] 37it [00:03, 9.21it/s] 38it [00:04, 9.39it/s] 39it [00:04, 9.51it/s] 40it [00:04, 9.60it/s] 41it [00:04, 9.68it/s] 42it [00:04, 9.74it/s] 43it [00:04, 9.62it/s] 44it [00:04, 9.56it/s] 45it [00:04, 9.60it/s] 46it [00:04, 9.67it/s] 47it [00:04, 9.75it/s] 48it [00:05, 9.79it/s] 49it [00:05, 9.32it/s] 50it [00:05, 9.43it/s]2025-05-26 04:21:50,374 - INFO - [Epoch 086 | Batch 0050] IWAE-loss 3615.4333 | mean log_px -0.0113 | KL -2999.07 + 51it [00:05, 9.52it/s] 52it [00:05, 9.61it/s] 53it [00:05, 9.69it/s] 54it [00:05, 9.74it/s] 55it [00:05, 9.79it/s] 56it [00:05, 9.79it/s] 57it [00:05, 9.81it/s] 58it [00:06, 9.81it/s] 59it [00:06, 9.81it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.49it/s] 62it [00:06, 9.60it/s] 63it [00:06, 9.68it/s] 64it [00:06, 9.72it/s] 65it [00:07, 6.30it/s] 66it [00:07, 6.81it/s] 67it [00:07, 7.49it/s] 68it [00:07, 8.05it/s] 69it [00:07, 8.41it/s] 70it [00:07, 8.77it/s] 71it [00:07, 9.08it/s] 72it [00:07, 9.28it/s] 73it [00:07, 8.99it/s] 74it [00:07, 9.24it/s] 75it [00:08, 9.42it/s] 76it [00:08, 9.52it/s] 77it [00:08, 9.64it/s] 78it [00:08, 9.69it/s] 79it [00:08, 9.73it/s] 80it [00:08, 9.75it/s] 81it [00:08, 9.78it/s] 82it [00:08, 9.78it/s] 83it [00:08, 9.82it/s] 84it [00:08, 9.81it/s] 85it [00:09, 9.83it/s] 86it [00:09, 9.82it/s] 87it [00:09, 9.82it/s] 88it [00:09, 9.83it/s] 89it [00:09, 9.84it/s] 90it [00:09, 9.80it/s] 91it [00:09, 9.83it/s] 92it [00:09, 9.83it/s] 93it [00:09, 9.84it/s] 94it [00:10, 9.83it/s] 95it [00:10, 9.23it/s] 96it [00:10, 9.38it/s] 97it [00:10, 9.52it/s] 98it [00:10, 9.61it/s] 99it [00:10, 9.66it/s] 100it [00:10, 9.68it/s]2025-05-26 04:21:55,730 - INFO - [Epoch 086 | Batch 0100] IWAE-loss 4592.9512 | mean log_px -0.0254 | KL -2993.21 + 101it [00:10, 9.10it/s] 102it [00:10, 9.32it/s] 103it [00:10, 9.48it/s] 104it [00:11, 9.58it/s] 105it [00:11, 9.65it/s] 106it [00:11, 9.70it/s] 107it [00:11, 9.76it/s] 108it [00:11, 9.78it/s] 109it [00:11, 9.78it/s] 110it [00:11, 9.81it/s] 111it [00:11, 9.82it/s] 112it [00:11, 9.84it/s] 113it [00:11, 9.83it/s] 114it [00:12, 9.22it/s] 115it [00:12, 9.41it/s] 116it [00:12, 9.54it/s] 117it [00:12, 9.64it/s] 118it [00:12, 9.69it/s] 119it [00:12, 9.74it/s] 120it [00:12, 9.76it/s] 121it [00:12, 9.80it/s] 122it [00:12, 9.80it/s] 123it [00:13, 9.81it/s] 124it [00:13, 9.83it/s] 125it [00:13, 9.83it/s] 126it [00:13, 9.83it/s] 127it [00:13, 9.84it/s] 128it [00:13, 9.82it/s] 129it [00:13, 9.83it/s] 130it [00:13, 9.83it/s] 131it [00:13, 9.84it/s] 132it [00:13, 9.84it/s] 133it [00:14, 9.85it/s] 134it [00:14, 9.22it/s] 135it [00:14, 9.40it/s] 136it [00:14, 9.52it/s] 137it [00:14, 9.62it/s] 138it [00:14, 9.68it/s] 139it [00:14, 9.71it/s] 140it [00:14, 9.75it/s] 141it [00:14, 9.79it/s] 142it [00:14, 9.78it/s] 143it [00:15, 9.82it/s] 144it [00:15, 9.83it/s] 145it [00:15, 9.84it/s] 146it [00:15, 9.83it/s] 147it [00:15, 9.21it/s] 148it [00:15, 9.35it/s] 149it [00:15, 9.49it/s] 150it [00:15, 9.59it/s]2025-05-26 04:22:00,903 - INFO - [Epoch 086 | Batch 0150] IWAE-loss 3799.1528 | mean log_px -0.0115 | KL -2990.14 + 151it [00:15, 9.06it/s] 152it [00:16, 9.29it/s] 153it [00:16, 9.47it/s] 154it [00:16, 9.58it/s] 155it [00:16, 9.65it/s] 156it [00:16, 9.68it/s] 157it [00:16, 9.70it/s] 158it [00:16, 9.74it/s] 159it [00:16, 9.78it/s] 160it [00:16, 9.78it/s] 161it [00:16, 9.81it/s] 162it [00:17, 9.79it/s] 163it [00:17, 9.82it/s] 164it [00:17, 9.81it/s] 165it [00:17, 9.84it/s] 166it [00:17, 9.83it/s] 167it [00:17, 9.82it/s] 168it [00:17, 9.83it/s] 169it [00:17, 9.82it/s] 170it [00:17, 9.82it/s] 171it [00:17, 9.83it/s] 172it [00:18, 9.82it/s] 173it [00:18, 9.83it/s] 174it [00:18, 9.83it/s] 175it [00:18, 9.84it/s] 176it [00:18, 9.86it/s] 177it [00:18, 9.25it/s] 178it [00:18, 9.43it/s] 179it [00:18, 9.56it/s] 180it [00:18, 9.53it/s] 181it [00:19, 9.61it/s] 182it [00:19, 9.67it/s] 183it [00:19, 9.71it/s] 184it [00:19, 9.73it/s] 185it [00:19, 9.76it/s] 186it [00:19, 9.80it/s] 187it [00:19, 9.83it/s] 188it [00:19, 9.84it/s] 189it [00:19, 9.82it/s] 190it [00:19, 9.82it/s] 191it [00:20, 9.21it/s] 192it [00:20, 9.37it/s] 193it [00:20, 9.51it/s] 194it [00:20, 9.59it/s] 195it [00:20, 8.66it/s] 196it [00:20, 9.49it/s] +2025-05-26 04:22:05,695 - INFO - Epoch: 86, Objective: tensor([3665.3276], device='cuda:0', grad_fn=), Loss: 0.01617186702787876, KL/n: 61.00396728515625 + 0it [00:00, ?it/s]2025-05-26 04:22:05,969 - INFO - [Epoch 087 | Batch 0000] IWAE-loss 3902.4707 | mean log_px -0.0153 | KL -2986.10 + 1it [00:00, 5.28it/s] 2it [00:00, 7.23it/s] 3it [00:00, 8.07it/s] 4it [00:00, 8.69it/s] 5it [00:00, 9.11it/s] 6it [00:00, 9.35it/s] 7it [00:00, 9.53it/s] 8it [00:00, 9.65it/s] 9it [00:01, 9.72it/s] 10it [00:01, 9.78it/s] 11it [00:01, 9.82it/s] 12it [00:01, 9.68it/s] 13it [00:01, 9.75it/s] 14it [00:01, 9.78it/s] 15it [00:01, 9.82it/s] 16it [00:01, 9.83it/s] 17it [00:01, 9.79it/s] 18it [00:01, 9.16it/s] 19it [00:02, 9.36it/s] 20it [00:02, 9.52it/s] 21it [00:02, 9.64it/s] 22it [00:02, 9.71it/s] 23it [00:02, 9.25it/s] 24it [00:02, 9.41it/s] 25it [00:02, 9.54it/s] 26it [00:02, 9.06it/s] 27it [00:02, 9.28it/s] 28it [00:03, 9.43it/s] 29it [00:03, 9.56it/s] 30it [00:03, 9.65it/s] 31it [00:03, 9.74it/s] 32it [00:03, 9.77it/s] 33it [00:03, 9.81it/s] 34it [00:03, 9.83it/s] 35it [00:03, 9.86it/s] 36it [00:03, 9.87it/s] 37it [00:03, 9.88it/s] 38it [00:04, 9.89it/s] 39it [00:04, 9.28it/s] 40it [00:04, 9.43it/s] 41it [00:04, 9.56it/s] 42it [00:04, 9.22it/s] 43it [00:04, 9.43it/s] 44it [00:04, 9.52it/s] 45it [00:04, 9.62it/s] 46it [00:04, 9.69it/s] 47it [00:04, 9.75it/s] 48it [00:05, 9.16it/s] 49it [00:05, 9.36it/s] 50it [00:05, 9.49it/s]2025-05-26 04:22:11,174 - INFO - [Epoch 087 | Batch 0050] IWAE-loss 4207.4248 | mean log_px -0.0193 | KL -2987.37 + 51it [00:05, 9.61it/s] 52it [00:05, 9.68it/s] 53it [00:05, 9.75it/s] 54it [00:05, 9.79it/s] 55it [00:05, 9.84it/s] 56it [00:05, 9.85it/s] 57it [00:05, 9.87it/s] 58it [00:06, 9.38it/s] 59it [00:06, 9.54it/s] 60it [00:06, 9.63it/s] 61it [00:06, 9.70it/s] 62it [00:06, 9.74it/s] 63it [00:06, 9.79it/s] 64it [00:06, 9.20it/s] 65it [00:06, 9.40it/s] 66it [00:06, 9.55it/s] 67it [00:07, 9.65it/s] 68it [00:07, 9.72it/s] 69it [00:07, 9.78it/s] 70it [00:07, 9.81it/s] 71it [00:07, 9.85it/s] 72it [00:07, 9.85it/s] 73it [00:07, 9.84it/s] 74it [00:07, 9.70it/s] 75it [00:07, 8.86it/s] 76it [00:08, 9.06it/s] 77it [00:08, 9.29it/s] 78it [00:08, 9.43it/s] 79it [00:08, 9.56it/s] 80it [00:08, 9.66it/s] 81it [00:08, 9.72it/s] 82it [00:08, 9.75it/s] 83it [00:08, 9.78it/s] 84it [00:08, 9.78it/s] 85it [00:08, 9.14it/s] 86it [00:09, 9.34it/s] 87it [00:09, 9.45it/s] 88it [00:09, 9.49it/s] 89it [00:09, 9.10it/s] 90it [00:09, 9.18it/s] 91it [00:09, 9.38it/s] 92it [00:09, 8.85it/s] 93it [00:09, 9.12it/s] 94it [00:09, 9.19it/s] 95it [00:10, 9.38it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.63it/s] 98it [00:10, 9.70it/s] 99it [00:10, 9.74it/s] 100it [00:10, 9.77it/s]2025-05-26 04:22:16,409 - INFO - [Epoch 087 | Batch 0100] IWAE-loss 3976.6338 | mean log_px -0.0192 | KL -2984.05 + 101it [00:10, 9.16it/s] 102it [00:10, 9.37it/s] 103it [00:10, 9.52it/s] 104it [00:10, 9.63it/s] 105it [00:11, 9.71it/s] 106it [00:11, 9.74it/s] 107it [00:11, 9.17it/s] 108it [00:11, 9.37it/s] 109it [00:11, 9.52it/s] 110it [00:11, 9.64it/s] 111it [00:11, 9.72it/s] 112it [00:11, 9.77it/s] 113it [00:11, 9.81it/s] 114it [00:11, 9.82it/s] 115it [00:12, 9.84it/s] 116it [00:12, 9.86it/s] 117it [00:12, 9.23it/s] 118it [00:12, 9.40it/s] 119it [00:12, 9.50it/s] 120it [00:12, 9.61it/s] 121it [00:12, 9.69it/s] 122it [00:12, 9.75it/s] 123it [00:12, 9.79it/s] 124it [00:13, 9.82it/s] 125it [00:13, 9.86it/s] 126it [00:13, 9.86it/s] 127it [00:13, 9.87it/s] 128it [00:13, 9.87it/s] 129it [00:13, 9.87it/s] 130it [00:13, 9.87it/s] 131it [00:13, 9.88it/s] 132it [00:13, 9.87it/s] 133it [00:13, 9.88it/s] 134it [00:14, 9.88it/s] 135it [00:14, 9.89it/s] 136it [00:14, 9.88it/s] 137it [00:14, 9.25it/s] 138it [00:14, 9.39it/s] 139it [00:14, 9.53it/s] 140it [00:14, 9.62it/s] 141it [00:14, 9.71it/s] 142it [00:14, 9.76it/s] 143it [00:14, 9.19it/s] 144it [00:15, 9.39it/s] 145it [00:15, 9.55it/s] 146it [00:15, 9.64it/s] 147it [00:15, 9.12it/s] 148it [00:15, 9.33it/s] 149it [00:15, 9.50it/s] 150it [00:15, 9.60it/s]2025-05-26 04:22:21,608 - INFO - [Epoch 087 | Batch 0150] IWAE-loss 3641.0764 | mean log_px -0.0103 | KL -2975.16 + 151it [00:15, 9.68it/s] 152it [00:15, 9.75it/s] 153it [00:16, 9.80it/s] 154it [00:16, 9.83it/s] 155it [00:16, 9.86it/s] 156it [00:16, 9.86it/s] 157it [00:16, 9.35it/s] 158it [00:16, 9.49it/s] 159it [00:16, 9.61it/s] 160it [00:16, 9.69it/s] 161it [00:16, 9.75it/s] 162it [00:16, 9.78it/s] 163it [00:17, 9.81it/s] 164it [00:17, 9.83it/s] 165it [00:17, 9.86it/s] 166it [00:17, 9.23it/s] 167it [00:17, 9.43it/s] 168it [00:17, 9.56it/s] 169it [00:17, 9.67it/s] 170it [00:17, 9.74it/s] 171it [00:17, 9.79it/s] 172it [00:17, 9.81it/s] 173it [00:18, 9.84it/s] 174it [00:18, 9.84it/s] 175it [00:18, 9.87it/s] 176it [00:18, 9.87it/s] 177it [00:18, 9.89it/s] 178it [00:18, 9.88it/s] 179it [00:18, 9.88it/s] 180it [00:18, 9.89it/s] 181it [00:18, 9.88it/s] 182it [00:19, 9.34it/s] 183it [00:19, 9.52it/s] 184it [00:19, 9.62it/s] 186it [00:19, 9.79it/s] 188it [00:19, 9.87it/s] 189it [00:19, 9.89it/s] 190it [00:19, 9.49it/s] 191it [00:19, 9.54it/s] 192it [00:20, 9.62it/s] 193it [00:20, 9.71it/s] 194it [00:20, 9.78it/s] 195it [00:20, 9.40it/s] 196it [00:20, 9.55it/s] +2025-05-26 04:22:26,341 - INFO - Epoch: 87, Objective: tensor([3995.7356], device='cuda:0', grad_fn=), Loss: 0.013150476850569248, KL/n: 60.77505874633789 + 0it [00:00, ?it/s]2025-05-26 04:22:26,616 - INFO - [Epoch 088 | Batch 0000] IWAE-loss 3533.7141 | mean log_px -0.0108 | KL -2978.48 + 1it [00:00, 4.65it/s] 2it [00:00, 6.76it/s] 4it [00:00, 8.36it/s] 5it [00:00, 8.75it/s] 6it [00:00, 9.05it/s] 7it [00:00, 9.30it/s] 8it [00:00, 9.48it/s] 9it [00:01, 9.62it/s] 10it [00:01, 9.71it/s] 11it [00:01, 9.79it/s] 12it [00:01, 9.84it/s] 14it [00:01, 9.91it/s] 15it [00:01, 9.92it/s] 16it [00:01, 9.92it/s] 17it [00:01, 9.93it/s] 18it [00:01, 9.45it/s] 19it [00:02, 9.58it/s] 20it [00:02, 9.67it/s] 21it [00:02, 9.76it/s] 22it [00:02, 9.80it/s] 23it [00:02, 9.86it/s] 24it [00:02, 9.89it/s] 25it [00:02, 9.92it/s] 26it [00:02, 9.90it/s] 27it [00:02, 9.93it/s] 28it [00:02, 9.44it/s] 29it [00:03, 9.59it/s] 30it [00:03, 9.68it/s] 31it [00:03, 9.74it/s] 32it [00:03, 9.78it/s] 33it [00:03, 9.35it/s] 34it [00:03, 9.51it/s] 36it [00:03, 9.48it/s] 37it [00:03, 9.21it/s] 38it [00:04, 9.38it/s] 39it [00:04, 9.52it/s] 40it [00:04, 9.64it/s] 42it [00:04, 9.80it/s] 43it [00:04, 9.84it/s] 44it [00:04, 9.85it/s] 45it [00:04, 9.86it/s] 46it [00:04, 9.87it/s] 47it [00:04, 9.90it/s] 48it [00:05, 9.91it/s] 49it [00:05, 9.93it/s] 50it [00:05, 9.93it/s]2025-05-26 04:22:31,764 - INFO - [Epoch 088 | Batch 0050] IWAE-loss 4089.7800 | mean log_px -0.0202 | KL -2976.60 + 51it [00:05, 9.92it/s] 52it [00:05, 9.93it/s] 53it [00:05, 9.93it/s] 54it [00:05, 9.93it/s] 55it [00:05, 9.94it/s] 56it [00:05, 9.93it/s] 57it [00:05, 9.94it/s] 58it [00:06, 6.12it/s] 59it [00:06, 6.90it/s] 60it [00:06, 7.60it/s] 61it [00:06, 8.18it/s] 62it [00:06, 8.63it/s] 64it [00:06, 9.21it/s] 65it [00:06, 9.38it/s] 66it [00:07, 9.11it/s] 67it [00:07, 9.32it/s] 68it [00:07, 9.46it/s] 69it [00:07, 9.56it/s] 70it [00:07, 9.65it/s] 71it [00:07, 9.72it/s] 72it [00:07, 9.75it/s] 73it [00:07, 9.73it/s] 74it [00:07, 9.74it/s] 75it [00:07, 9.80it/s] 76it [00:08, 9.82it/s] 78it [00:08, 9.41it/s] 79it [00:08, 9.55it/s] 80it [00:08, 9.65it/s] 82it [00:08, 9.78it/s] 83it [00:08, 9.46it/s] 84it [00:08, 9.53it/s] 85it [00:09, 9.61it/s] 86it [00:09, 9.69it/s] 87it [00:09, 9.74it/s] 88it [00:09, 9.76it/s] 89it [00:09, 9.80it/s] 90it [00:09, 9.81it/s] 91it [00:09, 9.83it/s] 92it [00:09, 9.85it/s] 93it [00:09, 9.87it/s] 94it [00:09, 9.88it/s] 95it [00:10, 9.88it/s] 96it [00:10, 9.87it/s] 97it [00:10, 9.86it/s] 98it [00:10, 9.85it/s] 99it [00:10, 9.88it/s] 100it [00:10, 9.87it/s]2025-05-26 04:22:37,083 - INFO - [Epoch 088 | Batch 0100] IWAE-loss 3568.9946 | mean log_px -0.0101 | KL -2965.73 + 101it [00:10, 9.86it/s] 102it [00:10, 9.86it/s] 103it [00:10, 9.89it/s] 104it [00:10, 9.89it/s] 105it [00:11, 9.89it/s] 106it [00:11, 9.89it/s] 107it [00:11, 9.90it/s] 108it [00:11, 9.89it/s] 109it [00:11, 9.88it/s] 110it [00:11, 9.87it/s] 111it [00:11, 9.89it/s] 112it [00:11, 9.87it/s] 113it [00:11, 9.88it/s] 114it [00:11, 9.68it/s] 115it [00:12, 9.66it/s] 116it [00:12, 9.67it/s] 117it [00:12, 9.74it/s] 118it [00:12, 9.78it/s] 119it [00:12, 9.82it/s] 120it [00:12, 9.84it/s] 121it [00:12, 9.86it/s] 122it [00:12, 9.87it/s] 123it [00:12, 9.87it/s] 124it [00:12, 9.87it/s] 125it [00:13, 9.88it/s] 126it [00:13, 9.25it/s] 127it [00:13, 9.41it/s] 128it [00:13, 9.52it/s] 129it [00:13, 9.63it/s] 130it [00:13, 9.66it/s] 131it [00:13, 9.72it/s] 132it [00:13, 9.13it/s] 133it [00:13, 9.35it/s] 134it [00:14, 9.50it/s] 135it [00:14, 8.99it/s] 136it [00:14, 9.22it/s] 137it [00:14, 9.40it/s] 138it [00:14, 9.53it/s] 139it [00:14, 9.64it/s] 140it [00:14, 9.71it/s] 141it [00:14, 9.77it/s] 142it [00:14, 9.79it/s] 143it [00:14, 9.82it/s] 144it [00:15, 9.82it/s] 145it [00:15, 9.21it/s] 146it [00:15, 9.38it/s] 147it [00:15, 9.51it/s] 148it [00:15, 9.61it/s] 149it [00:15, 9.70it/s] 150it [00:15, 9.76it/s]2025-05-26 04:22:42,253 - INFO - [Epoch 088 | Batch 0150] IWAE-loss 3878.7766 | mean log_px -0.0216 | KL -2965.69 + 151it [00:15, 9.80it/s] 152it [00:15, 9.81it/s] 153it [00:16, 9.83it/s] 154it [00:16, 9.82it/s] 155it [00:16, 9.22it/s] 156it [00:16, 9.42it/s] 157it [00:16, 9.54it/s] 158it [00:16, 9.64it/s] 159it [00:16, 9.70it/s] 160it [00:16, 9.15it/s] 161it [00:16, 9.36it/s] 162it [00:16, 9.51it/s] 163it [00:17, 9.62it/s] 164it [00:17, 9.69it/s] 165it [00:17, 9.74it/s] 166it [00:17, 9.79it/s] 167it [00:17, 9.80it/s] 168it [00:17, 9.82it/s] 169it [00:17, 9.86it/s] 170it [00:17, 9.87it/s] 171it [00:17, 9.88it/s] 172it [00:17, 9.88it/s] 173it [00:18, 9.85it/s] 174it [00:18, 9.71it/s] 175it [00:18, 9.15it/s] 176it [00:18, 9.17it/s] 177it [00:18, 9.10it/s] 178it [00:18, 8.99it/s] 179it [00:18, 9.20it/s] 180it [00:18, 9.39it/s] 181it [00:18, 9.53it/s] 182it [00:19, 9.62it/s] 183it [00:19, 9.69it/s] 184it [00:19, 9.73it/s] 185it [00:19, 9.78it/s] 186it [00:19, 9.81it/s] 187it [00:19, 9.84it/s] 188it [00:19, 9.16it/s] 189it [00:19, 9.35it/s] 190it [00:19, 9.42it/s] 191it [00:20, 9.51it/s] 192it [00:20, 9.54it/s] 193it [00:20, 9.64it/s] 194it [00:20, 9.08it/s] 195it [00:20, 8.84it/s] 196it [00:20, 9.50it/s] +2025-05-26 04:22:47,095 - INFO - Epoch: 88, Objective: tensor([3712.7053], device='cuda:0', grad_fn=), Loss: 0.014657406136393547, KL/n: 60.55072784423828 + 0it [00:00, ?it/s]2025-05-26 04:22:47,367 - INFO - [Epoch 089 | Batch 0000] IWAE-loss 3791.1438 | mean log_px -0.0117 | KL -2966.70 + 1it [00:00, 4.76it/s] 2it [00:00, 6.82it/s] 3it [00:00, 7.92it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.40it/s] 6it [00:00, 8.84it/s] 7it [00:00, 9.15it/s] 8it [00:00, 9.38it/s] 9it [00:01, 9.53it/s] 10it [00:01, 9.62it/s] 11it [00:01, 9.70it/s] 12it [00:01, 9.68it/s] 13it [00:01, 9.75it/s] 14it [00:01, 9.16it/s] 15it [00:01, 9.36it/s] 16it [00:01, 9.51it/s] 17it [00:01, 9.62it/s] 18it [00:01, 9.69it/s] 19it [00:02, 9.75it/s] 20it [00:02, 9.78it/s] 21it [00:02, 9.30it/s] 22it [00:02, 9.45it/s] 23it [00:02, 9.46it/s] 24it [00:02, 8.86it/s] 25it [00:02, 9.15it/s] 26it [00:02, 9.35it/s] 27it [00:02, 9.46it/s] 28it [00:03, 9.05it/s] 29it [00:03, 9.27it/s] 30it [00:03, 9.44it/s] 31it [00:03, 9.55it/s] 32it [00:03, 9.64it/s] 33it [00:03, 9.70it/s] 34it [00:03, 9.13it/s] 35it [00:03, 9.31it/s] 36it [00:03, 9.48it/s] 37it [00:04, 9.09it/s] 38it [00:04, 9.32it/s] 39it [00:04, 9.48it/s] 40it [00:04, 8.97it/s] 41it [00:04, 9.22it/s] 42it [00:04, 9.39it/s] 43it [00:04, 9.53it/s] 44it [00:04, 9.60it/s] 45it [00:04, 9.67it/s] 46it [00:04, 9.68it/s] 47it [00:05, 9.75it/s] 48it [00:05, 9.79it/s] 49it [00:05, 9.85it/s] 50it [00:05, 9.86it/s]2025-05-26 04:22:52,653 - INFO - [Epoch 089 | Batch 0050] IWAE-loss 3452.4019 | mean log_px -0.0074 | KL -2963.17 + 51it [00:05, 9.86it/s] 52it [00:05, 9.81it/s] 53it [00:05, 9.84it/s] 54it [00:05, 9.79it/s] 55it [00:05, 9.83it/s] 56it [00:06, 9.23it/s] 57it [00:06, 9.43it/s] 58it [00:06, 9.56it/s] 59it [00:06, 9.69it/s] 60it [00:06, 9.75it/s] 61it [00:06, 9.82it/s] 62it [00:06, 9.84it/s] 63it [00:06, 9.86it/s] 64it [00:06, 9.88it/s] 65it [00:06, 9.90it/s] 66it [00:07, 9.90it/s] 67it [00:07, 9.91it/s] 68it [00:07, 9.70it/s] 69it [00:07, 8.80it/s] 70it [00:07, 8.77it/s] 71it [00:07, 8.96it/s] 72it [00:07, 9.13it/s] 73it [00:07, 9.28it/s] 74it [00:07, 9.37it/s] 75it [00:07, 9.45it/s] 76it [00:08, 9.52it/s] 77it [00:08, 9.58it/s] 78it [00:08, 9.60it/s] 79it [00:08, 9.59it/s] 80it [00:08, 9.58it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.65it/s] 83it [00:08, 9.24it/s] 84it [00:08, 9.42it/s] 85it [00:09, 9.56it/s] 86it [00:09, 9.60it/s] 87it [00:09, 9.69it/s] 88it [00:09, 9.68it/s] 89it [00:09, 9.75it/s] 90it [00:09, 9.78it/s] 91it [00:09, 9.81it/s] 92it [00:09, 9.83it/s] 93it [00:09, 9.86it/s] 94it [00:09, 9.87it/s] 95it [00:10, 9.89it/s] 96it [00:10, 9.87it/s] 97it [00:10, 9.90it/s] 98it [00:10, 9.89it/s] 99it [00:10, 9.89it/s] 100it [00:10, 9.89it/s]2025-05-26 04:22:57,846 - INFO - [Epoch 089 | Batch 0100] IWAE-loss 3771.1143 | mean log_px -0.0146 | KL -2961.73 + 101it [00:10, 9.87it/s] 102it [00:10, 9.88it/s] 103it [00:10, 9.39it/s] 104it [00:10, 9.52it/s] 105it [00:11, 9.64it/s] 106it [00:11, 9.71it/s] 107it [00:11, 9.78it/s] 108it [00:11, 9.27it/s] 109it [00:11, 9.45it/s] 110it [00:11, 9.57it/s] 111it [00:11, 9.67it/s] 112it [00:11, 9.73it/s] 113it [00:11, 9.78it/s] 114it [00:12, 9.81it/s] 115it [00:12, 9.84it/s] 116it [00:12, 9.85it/s] 117it [00:12, 9.20it/s] 118it [00:12, 9.33it/s] 119it [00:12, 9.46it/s] 120it [00:12, 9.59it/s] 121it [00:12, 9.70it/s] 122it [00:12, 9.75it/s] 123it [00:12, 9.80it/s] 124it [00:13, 9.36it/s] 125it [00:13, 9.51it/s] 126it [00:13, 9.62it/s] 127it [00:13, 9.70it/s] 128it [00:13, 9.76it/s] 129it [00:13, 9.78it/s] 130it [00:13, 9.80it/s] 131it [00:13, 9.84it/s] 132it [00:13, 9.23it/s] 133it [00:14, 9.25it/s] 134it [00:14, 9.35it/s] 135it [00:14, 9.48it/s] 136it [00:14, 8.98it/s] 137it [00:14, 9.24it/s] 138it [00:14, 9.42it/s] 139it [00:14, 9.56it/s] 140it [00:14, 9.67it/s] 141it [00:14, 9.74it/s] 142it [00:14, 9.19it/s] 143it [00:15, 9.39it/s] 144it [00:15, 9.48it/s] 145it [00:15, 9.58it/s] 146it [00:15, 9.67it/s] 147it [00:15, 9.74it/s] 148it [00:15, 9.77it/s] 149it [00:15, 9.82it/s] 150it [00:15, 9.84it/s]2025-05-26 04:23:03,065 - INFO - [Epoch 089 | Batch 0150] IWAE-loss 3447.8906 | mean log_px -0.0127 | KL -2953.03 + 151it [00:15, 9.21it/s] 152it [00:16, 9.39it/s] 153it [00:16, 9.53it/s] 154it [00:16, 9.63it/s] 155it [00:16, 9.24it/s] 156it [00:16, 9.42it/s] 157it [00:16, 9.56it/s] 158it [00:16, 9.66it/s] 159it [00:16, 9.12it/s] 160it [00:16, 9.34it/s] 161it [00:16, 9.48it/s] 162it [00:17, 9.60it/s] 163it [00:17, 9.69it/s] 164it [00:17, 9.76it/s] 165it [00:17, 9.75it/s] 166it [00:17, 9.05it/s] 167it [00:17, 9.26it/s] 168it [00:17, 9.43it/s] 169it [00:17, 9.56it/s] 170it [00:17, 9.04it/s] 171it [00:18, 9.27it/s] 172it [00:18, 9.44it/s] 173it [00:18, 9.57it/s] 174it [00:18, 9.66it/s] 175it [00:18, 9.73it/s] 176it [00:18, 9.15it/s] 177it [00:18, 9.36it/s] 178it [00:18, 9.49it/s] 179it [00:18, 9.63it/s] 180it [00:18, 9.12it/s] 181it [00:19, 9.29it/s] 182it [00:19, 9.45it/s] 183it [00:19, 9.57it/s] 184it [00:19, 9.66it/s] 185it [00:19, 9.13it/s] 186it [00:19, 9.34it/s] 187it [00:19, 9.47it/s] 188it [00:19, 9.56it/s] 189it [00:19, 9.67it/s] 190it [00:20, 9.24it/s] 191it [00:20, 9.21it/s] 192it [00:20, 8.91it/s] 193it [00:20, 8.86it/s] 194it [00:20, 9.06it/s] 195it [00:20, 8.82it/s] 196it [00:20, 9.13it/s] 196it [00:20, 9.44it/s] +2025-05-26 04:23:07,986 - INFO - Epoch: 89, Objective: tensor([3744.3455], device='cuda:0', grad_fn=), Loss: 0.016745569184422493, KL/n: 60.30201721191406 + 0it [00:00, ?it/s]2025-05-26 04:23:08,263 - INFO - [Epoch 090 | Batch 0000] IWAE-loss 4105.8560 | mean log_px -0.0164 | KL -2952.96 + 1it [00:00, 4.75it/s] 2it [00:00, 6.79it/s] 3it [00:00, 7.90it/s] 4it [00:00, 8.51it/s] 5it [00:00, 8.90it/s] 6it [00:00, 8.66it/s] 7it [00:00, 9.00it/s] 8it [00:00, 9.23it/s] 9it [00:01, 9.40it/s] 10it [00:01, 9.50it/s] 11it [00:01, 9.57it/s] 12it [00:01, 9.14it/s] 13it [00:01, 9.33it/s] 14it [00:01, 9.43it/s] 15it [00:01, 9.53it/s] 16it [00:01, 9.59it/s] 17it [00:01, 9.63it/s] 18it [00:02, 9.17it/s] 19it [00:02, 9.32it/s] 20it [00:02, 9.43it/s] 21it [00:02, 9.52it/s] 22it [00:02, 9.56it/s] 23it [00:02, 9.10it/s] 24it [00:02, 9.27it/s] 25it [00:02, 9.40it/s] 26it [00:02, 9.51it/s] 27it [00:02, 9.57it/s] 28it [00:03, 9.60it/s] 29it [00:03, 9.66it/s] 30it [00:03, 9.70it/s] 31it [00:03, 9.48it/s] 32it [00:03, 9.50it/s] 33it [00:03, 9.59it/s] 34it [00:03, 9.66it/s] 35it [00:03, 9.09it/s] 36it [00:03, 9.28it/s] 37it [00:04, 9.45it/s] 38it [00:04, 9.55it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.68it/s] 41it [00:04, 9.14it/s] 42it [00:04, 9.23it/s] 43it [00:04, 9.30it/s] 44it [00:04, 9.39it/s] 45it [00:04, 9.51it/s] 46it [00:04, 8.97it/s] 47it [00:05, 9.21it/s] 48it [00:05, 9.36it/s] 49it [00:05, 9.49it/s] 50it [00:05, 9.57it/s]2025-05-26 04:23:13,578 - INFO - [Epoch 090 | Batch 0050] IWAE-loss 3642.5940 | mean log_px -0.0134 | KL -2952.94 + 51it [00:05, 9.00it/s] 52it [00:05, 9.22it/s] 53it [00:05, 9.36it/s] 54it [00:05, 9.49it/s] 55it [00:05, 9.56it/s] 56it [00:06, 9.62it/s] 57it [00:06, 9.67it/s] 58it [00:06, 9.70it/s] 59it [00:06, 9.72it/s] 60it [00:06, 9.75it/s] 61it [00:06, 9.75it/s] 62it [00:06, 9.75it/s] 63it [00:06, 9.75it/s] 64it [00:07, 6.29it/s] 65it [00:07, 7.04it/s] 66it [00:07, 7.66it/s] 67it [00:07, 8.19it/s] 68it [00:07, 8.60it/s] 69it [00:07, 8.39it/s] 70it [00:07, 8.75it/s] 71it [00:07, 9.05it/s] 72it [00:07, 9.24it/s] 73it [00:07, 9.41it/s] 74it [00:08, 9.44it/s] 75it [00:08, 9.00it/s] 76it [00:08, 9.04it/s] 77it [00:08, 9.25it/s] 78it [00:08, 9.39it/s] 79it [00:08, 9.48it/s] 80it [00:08, 9.55it/s] 81it [00:08, 9.61it/s] 82it [00:08, 9.64it/s] 83it [00:09, 9.68it/s] 84it [00:09, 9.67it/s] 85it [00:09, 9.69it/s] 86it [00:09, 9.63it/s] 87it [00:09, 9.65it/s] 88it [00:09, 9.66it/s] 89it [00:09, 9.68it/s] 90it [00:09, 9.05it/s] 91it [00:09, 9.25it/s] 92it [00:09, 9.40it/s] 93it [00:10, 9.50it/s] 94it [00:10, 9.56it/s] 95it [00:10, 9.62it/s] 96it [00:10, 9.06it/s] 97it [00:10, 9.25it/s] 98it [00:10, 9.40it/s] 99it [00:10, 9.51it/s] 100it [00:10, 9.57it/s]2025-05-26 04:23:19,026 - INFO - [Epoch 090 | Batch 0100] IWAE-loss 4252.8389 | mean log_px -0.0252 | KL -2944.33 + 101it [00:10, 9.60it/s] 102it [00:11, 9.63it/s] 103it [00:11, 9.64it/s] 104it [00:11, 9.68it/s] 105it [00:11, 9.72it/s] 106it [00:11, 9.73it/s] 107it [00:11, 9.75it/s] 108it [00:11, 9.75it/s] 109it [00:11, 9.76it/s] 110it [00:11, 9.77it/s] 111it [00:11, 9.77it/s] 112it [00:12, 9.76it/s] 113it [00:12, 9.75it/s] 114it [00:12, 9.75it/s] 115it [00:12, 9.60it/s] 116it [00:12, 9.57it/s] 117it [00:12, 9.56it/s] 118it [00:12, 9.57it/s] 119it [00:12, 9.56it/s] 120it [00:12, 9.56it/s] 121it [00:13, 9.51it/s] 122it [00:13, 9.50it/s] 123it [00:13, 9.52it/s] 124it [00:13, 9.47it/s] 125it [00:13, 9.49it/s] 126it [00:13, 9.52it/s] 127it [00:13, 9.50it/s] 128it [00:13, 8.96it/s] 129it [00:13, 9.09it/s] 130it [00:13, 9.17it/s] 131it [00:14, 9.28it/s] 132it [00:14, 8.75it/s] 133it [00:14, 8.98it/s] 134it [00:14, 9.08it/s] 135it [00:14, 9.18it/s] 136it [00:14, 9.26it/s] 137it [00:14, 9.31it/s] 138it [00:14, 9.38it/s] 139it [00:14, 9.47it/s] 140it [00:15, 9.53it/s] 141it [00:15, 9.60it/s] 142it [00:15, 9.64it/s] 143it [00:15, 9.68it/s] 144it [00:15, 9.70it/s] 145it [00:15, 9.71it/s] 146it [00:15, 9.72it/s] 147it [00:15, 9.73it/s] 148it [00:15, 9.74it/s] 149it [00:15, 9.66it/s] 150it [00:16, 9.61it/s]2025-05-26 04:23:24,280 - INFO - [Epoch 090 | Batch 0150] IWAE-loss 3503.3472 | mean log_px -0.0103 | KL -2943.74 + 151it [00:16, 9.53it/s] 152it [00:16, 9.05it/s] 153it [00:16, 9.21it/s] 154it [00:16, 9.30it/s] 155it [00:16, 9.36it/s] 156it [00:16, 9.43it/s] 157it [00:16, 9.48it/s] 158it [00:16, 9.43it/s] 159it [00:17, 9.52it/s] 160it [00:17, 9.19it/s] 161it [00:17, 9.36it/s] 162it [00:17, 8.90it/s] 163it [00:17, 9.13it/s] 164it [00:17, 9.30it/s] 165it [00:17, 9.45it/s] 166it [00:17, 9.54it/s] 167it [00:17, 9.62it/s] 168it [00:18, 9.66it/s] 169it [00:18, 9.70it/s] 170it [00:18, 9.11it/s] 171it [00:18, 9.29it/s] 172it [00:18, 9.43it/s] 173it [00:18, 9.53it/s] 174it [00:18, 9.12it/s] 175it [00:18, 9.30it/s] 176it [00:18, 9.44it/s] 177it [00:18, 9.55it/s] 178it [00:19, 9.62it/s] 179it [00:19, 9.67it/s] 180it [00:19, 9.21it/s] 181it [00:19, 9.38it/s] 182it [00:19, 9.50it/s] 183it [00:19, 9.58it/s] 184it [00:19, 9.63it/s] 185it [00:19, 9.69it/s] 186it [00:19, 9.71it/s] 187it [00:20, 9.74it/s] 188it [00:20, 9.73it/s] 189it [00:20, 9.14it/s] 190it [00:20, 9.31it/s] 191it [00:20, 9.47it/s] 192it [00:20, 9.55it/s] 193it [00:20, 9.02it/s] 194it [00:20, 9.22it/s] 195it [00:20, 8.80it/s] 196it [00:21, 9.13it/s] 196it [00:21, 9.30it/s] +2025-05-26 04:23:29,188 - INFO - Epoch: 90, Objective: tensor([3948.3491], device='cuda:0', grad_fn=), Loss: 0.02164594642817974, KL/n: 60.072139739990234 + 0it [00:00, ?it/s]2025-05-26 04:23:29,447 - INFO - [Epoch 091 | Batch 0000] IWAE-loss 3966.0691 | mean log_px -0.0175 | KL -2943.96 + 1it [00:00, 6.03it/s] 2it [00:00, 7.60it/s] 3it [00:00, 8.46it/s] 4it [00:00, 8.94it/s] 5it [00:00, 9.25it/s] 6it [00:00, 9.42it/s] 7it [00:00, 9.55it/s] 8it [00:00, 9.63it/s] 9it [00:00, 9.64it/s] 10it [00:01, 9.69it/s] 11it [00:01, 9.73it/s] 12it [00:01, 9.75it/s] 13it [00:01, 9.77it/s] 14it [00:01, 9.77it/s] 15it [00:01, 9.79it/s] 16it [00:01, 9.77it/s] 17it [00:01, 9.78it/s] 18it [00:01, 9.78it/s] 19it [00:02, 9.77it/s] 20it [00:02, 9.77it/s] 21it [00:02, 9.78it/s] 22it [00:02, 9.79it/s] 23it [00:02, 9.81it/s] 24it [00:02, 9.81it/s] 25it [00:02, 9.79it/s] 26it [00:02, 9.79it/s] 27it [00:02, 9.79it/s] 28it [00:02, 9.80it/s] 29it [00:03, 9.80it/s] 30it [00:03, 9.80it/s] 31it [00:03, 9.80it/s] 32it [00:03, 9.79it/s] 33it [00:03, 9.78it/s] 34it [00:03, 9.78it/s] 35it [00:03, 9.80it/s] 36it [00:03, 9.80it/s] 37it [00:03, 9.82it/s] 38it [00:03, 9.82it/s] 39it [00:04, 9.80it/s] 40it [00:04, 9.80it/s] 41it [00:04, 9.80it/s] 42it [00:04, 9.80it/s] 43it [00:04, 9.79it/s] 44it [00:04, 9.79it/s] 45it [00:04, 9.78it/s] 46it [00:04, 9.79it/s] 47it [00:04, 9.79it/s] 48it [00:04, 9.78it/s] 49it [00:05, 9.80it/s] 50it [00:05, 9.79it/s]2025-05-26 04:23:34,560 - INFO - [Epoch 091 | Batch 0050] IWAE-loss 3997.3748 | mean log_px -0.0152 | KL -2940.93 + 51it [00:05, 9.78it/s] 52it [00:05, 9.78it/s] 53it [00:05, 9.77it/s] 54it [00:05, 9.77it/s] 55it [00:05, 9.78it/s] 56it [00:05, 9.78it/s] 57it [00:05, 9.79it/s] 58it [00:05, 9.79it/s] 59it [00:06, 9.80it/s] 60it [00:06, 9.79it/s] 61it [00:06, 9.61it/s] 62it [00:06, 9.58it/s] 63it [00:06, 9.59it/s] 64it [00:06, 9.06it/s] 65it [00:06, 9.26it/s] 66it [00:06, 9.39it/s] 67it [00:06, 9.47it/s] 68it [00:07, 9.53it/s] 69it [00:07, 9.59it/s] 70it [00:07, 9.63it/s] 71it [00:07, 9.09it/s] 72it [00:07, 9.25it/s] 73it [00:07, 9.39it/s] 74it [00:07, 9.49it/s] 75it [00:07, 9.55it/s] 76it [00:07, 9.55it/s] 77it [00:08, 9.57it/s] 78it [00:08, 9.53it/s] 79it [00:08, 9.53it/s] 80it [00:08, 9.60it/s] 81it [00:08, 9.65it/s] 82it [00:08, 9.68it/s] 83it [00:08, 9.69it/s] 84it [00:08, 9.58it/s] 85it [00:08, 9.63it/s] 86it [00:08, 8.94it/s] 87it [00:09, 9.15it/s] 88it [00:09, 9.32it/s] 89it [00:09, 9.46it/s] 90it [00:09, 9.54it/s] 91it [00:09, 9.60it/s] 92it [00:09, 9.64it/s] 93it [00:09, 9.07it/s] 94it [00:09, 9.22it/s] 95it [00:09, 9.33it/s] 96it [00:10, 9.44it/s] 97it [00:10, 9.50it/s] 98it [00:10, 9.53it/s] 99it [00:10, 9.51it/s] 100it [00:10, 9.45it/s]2025-05-26 04:23:39,826 - INFO - [Epoch 091 | Batch 0100] IWAE-loss 3747.8899 | mean log_px -0.0144 | KL -2939.49 + 101it [00:10, 9.46it/s] 102it [00:10, 9.53it/s] 103it [00:10, 9.57it/s] 104it [00:10, 9.61it/s] 105it [00:10, 9.61it/s] 106it [00:11, 9.39it/s] 107it [00:11, 9.34it/s] 108it [00:11, 9.31it/s] 109it [00:11, 8.87it/s] 110it [00:11, 8.98it/s] 111it [00:11, 9.17it/s] 112it [00:11, 9.21it/s] 113it [00:11, 9.34it/s] 114it [00:11, 9.45it/s] 115it [00:12, 9.54it/s] 116it [00:12, 9.51it/s] 117it [00:12, 9.57it/s] 118it [00:12, 9.63it/s] 119it [00:12, 9.68it/s] 120it [00:12, 9.70it/s] 121it [00:12, 9.61it/s] 122it [00:12, 9.61it/s] 123it [00:12, 9.66it/s] 124it [00:12, 9.64it/s] 125it [00:13, 9.63it/s] 126it [00:13, 9.56it/s] 127it [00:13, 9.56it/s] 128it [00:13, 9.54it/s] 129it [00:13, 9.54it/s] 130it [00:13, 9.53it/s] 131it [00:13, 9.59it/s] 132it [00:13, 9.60it/s] 133it [00:13, 9.48it/s] 134it [00:14, 9.34it/s] 135it [00:14, 9.41it/s] 136it [00:14, 9.43it/s] 137it [00:14, 9.48it/s] 138it [00:14, 9.51it/s] 139it [00:14, 9.56it/s] 140it [00:14, 9.58it/s] 141it [00:14, 9.06it/s] 142it [00:14, 9.24it/s] 143it [00:14, 9.35it/s] 144it [00:15, 9.43it/s] 145it [00:15, 9.45it/s] 146it [00:15, 9.46it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.51it/s] 149it [00:15, 9.54it/s] 150it [00:15, 9.59it/s]2025-05-26 04:23:45,102 - INFO - [Epoch 091 | Batch 0150] IWAE-loss 4462.9419 | mean log_px -0.0253 | KL -2929.27 + 151it [00:15, 9.03it/s] 152it [00:15, 9.20it/s] 153it [00:16, 9.29it/s] 154it [00:16, 9.38it/s] 155it [00:16, 9.43it/s] 156it [00:16, 9.48it/s] 157it [00:16, 9.55it/s] 158it [00:16, 9.56it/s] 159it [00:16, 9.61it/s] 160it [00:16, 9.56it/s] 161it [00:16, 9.56it/s] 162it [00:16, 9.59it/s] 163it [00:17, 9.55it/s] 164it [00:17, 9.49it/s] 165it [00:17, 9.52it/s] 166it [00:17, 9.50it/s] 167it [00:17, 9.53it/s] 168it [00:17, 9.42it/s] 169it [00:17, 9.50it/s] 170it [00:17, 9.51it/s] 171it [00:17, 9.00it/s] 172it [00:18, 9.10it/s] 173it [00:18, 9.26it/s] 174it [00:18, 9.26it/s] 175it [00:18, 9.22it/s] 176it [00:18, 9.24it/s] 177it [00:18, 9.36it/s] 178it [00:18, 9.47it/s] 179it [00:18, 9.54it/s] 180it [00:18, 9.58it/s] 181it [00:19, 9.61it/s] 182it [00:19, 9.61it/s] 183it [00:19, 9.60it/s] 184it [00:19, 9.14it/s] 185it [00:19, 9.25it/s] 186it [00:19, 9.33it/s] 187it [00:19, 9.41it/s] 188it [00:19, 9.45it/s] 189it [00:19, 9.45it/s] 190it [00:19, 9.05it/s] 191it [00:20, 9.21it/s] 192it [00:20, 9.33it/s] 193it [00:20, 9.41it/s] 194it [00:20, 9.45it/s] 195it [00:20, 8.90it/s] 196it [00:20, 9.18it/s] 196it [00:20, 9.47it/s] +2025-05-26 04:23:50,013 - INFO - Epoch: 91, Objective: tensor([3768.4514], device='cuda:0', grad_fn=), Loss: 0.01296775322407484, KL/n: 59.81892013549805 + 0it [00:00, ?it/s]2025-05-26 04:23:50,293 - INFO - [Epoch 092 | Batch 0000] IWAE-loss 3812.1208 | mean log_px -0.0154 | KL -2928.92 + 1it [00:00, 5.32it/s] 2it [00:00, 7.20it/s] 3it [00:00, 8.14it/s] 4it [00:00, 8.63it/s] 5it [00:00, 8.93it/s] 6it [00:00, 8.63it/s] 7it [00:00, 8.91it/s] 8it [00:00, 9.09it/s] 9it [00:01, 9.18it/s] 10it [00:01, 9.32it/s] 11it [00:01, 9.37it/s] 12it [00:01, 9.41it/s] 13it [00:01, 9.42it/s] 14it [00:01, 9.43it/s] 15it [00:01, 9.44it/s] 16it [00:01, 9.49it/s] 17it [00:01, 9.51it/s] 18it [00:02, 8.99it/s] 19it [00:02, 9.17it/s] 20it [00:02, 9.27it/s] 21it [00:02, 9.38it/s] 22it [00:02, 9.44it/s] 23it [00:02, 9.45it/s] 24it [00:02, 9.40it/s] 25it [00:02, 9.35it/s] 26it [00:02, 9.25it/s] 27it [00:02, 9.33it/s] 28it [00:03, 9.46it/s] 29it [00:03, 9.51it/s] 30it [00:03, 9.56it/s] 31it [00:03, 9.53it/s] 32it [00:03, 9.55it/s] 33it [00:03, 9.55it/s] 34it [00:03, 9.55it/s] 35it [00:03, 9.58it/s] 36it [00:03, 9.56it/s] 37it [00:04, 9.55it/s] 38it [00:04, 9.55it/s] 39it [00:04, 9.04it/s] 40it [00:04, 9.14it/s] 41it [00:04, 9.25it/s] 42it [00:04, 9.25it/s] 43it [00:04, 9.29it/s] 44it [00:04, 9.39it/s] 45it [00:04, 9.45it/s] 46it [00:04, 9.48it/s] 47it [00:05, 9.53it/s] 48it [00:05, 9.53it/s] 49it [00:05, 9.01it/s] 50it [00:05, 9.12it/s]2025-05-26 04:23:55,628 - INFO - [Epoch 092 | Batch 0050] IWAE-loss 3494.9722 | mean log_px -0.0081 | KL -2923.38 + 51it [00:05, 9.24it/s] 52it [00:05, 9.38it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.41it/s] 55it [00:05, 9.45it/s] 56it [00:06, 9.46it/s] 57it [00:06, 9.51it/s] 58it [00:06, 9.49it/s] 59it [00:06, 9.51it/s] 60it [00:06, 9.51it/s] 61it [00:06, 9.56it/s] 62it [00:06, 9.58it/s] 63it [00:06, 9.54it/s] 64it [00:06, 9.23it/s] 65it [00:07, 9.32it/s] 66it [00:07, 9.36it/s] 67it [00:07, 9.42it/s] 68it [00:07, 6.13it/s] 69it [00:07, 6.86it/s] 70it [00:07, 7.50it/s] 71it [00:07, 8.03it/s] 72it [00:07, 8.45it/s] 73it [00:08, 8.74it/s] 74it [00:08, 9.01it/s] 75it [00:08, 8.92it/s] 76it [00:08, 9.12it/s] 77it [00:08, 9.25it/s] 78it [00:08, 9.35it/s] 79it [00:08, 9.42it/s] 80it [00:08, 9.43it/s] 81it [00:08, 9.35it/s] 82it [00:08, 9.40it/s] 83it [00:09, 9.39it/s] 84it [00:09, 8.88it/s] 85it [00:09, 9.14it/s] 86it [00:09, 9.35it/s] 87it [00:09, 9.49it/s] 88it [00:09, 9.55it/s] 89it [00:09, 9.24it/s] 90it [00:09, 9.40it/s] 91it [00:09, 9.14it/s] 92it [00:10, 9.27it/s] 93it [00:10, 9.40it/s] 94it [00:10, 9.52it/s] 95it [00:10, 9.05it/s] 96it [00:10, 9.22it/s] 97it [00:10, 9.41it/s] 98it [00:10, 9.49it/s] 99it [00:10, 9.59it/s] 100it [00:10, 9.65it/s]2025-05-26 04:24:01,114 - INFO - [Epoch 092 | Batch 0100] IWAE-loss 3449.9321 | mean log_px -0.0083 | KL -2921.72 + 101it [00:11, 9.12it/s] 102it [00:11, 9.31it/s] 103it [00:11, 9.47it/s] 104it [00:11, 9.60it/s] 105it [00:11, 9.56it/s] 106it [00:11, 9.64it/s] 107it [00:11, 9.74it/s] 108it [00:11, 9.77it/s] 109it [00:11, 9.79it/s] 110it [00:11, 9.82it/s] 111it [00:12, 9.84it/s] 112it [00:12, 9.83it/s] 113it [00:12, 9.85it/s] 114it [00:12, 9.85it/s] 115it [00:12, 9.87it/s] 116it [00:12, 9.89it/s] 117it [00:12, 9.88it/s] 118it [00:12, 9.85it/s] 119it [00:12, 9.82it/s] 120it [00:12, 9.80it/s] 121it [00:13, 9.81it/s] 122it [00:13, 9.33it/s] 123it [00:13, 9.47it/s] 124it [00:13, 9.54it/s] 125it [00:13, 9.06it/s] 126it [00:13, 9.20it/s] 127it [00:13, 9.35it/s] 128it [00:13, 9.46it/s] 129it [00:13, 8.94it/s] 130it [00:14, 9.19it/s] 131it [00:14, 9.38it/s] 132it [00:14, 9.51it/s] 133it [00:14, 9.59it/s] 134it [00:14, 9.05it/s] 135it [00:14, 9.24it/s] 136it [00:14, 9.40it/s] 137it [00:14, 9.51it/s] 138it [00:14, 9.60it/s] 139it [00:14, 9.67it/s] 140it [00:15, 9.70it/s] 141it [00:15, 9.07it/s] 142it [00:15, 9.29it/s] 143it [00:15, 9.43it/s] 144it [00:15, 9.52it/s] 145it [00:15, 9.60it/s] 146it [00:15, 9.58it/s] 147it [00:15, 9.65it/s] 148it [00:15, 9.56it/s] 149it [00:16, 9.57it/s] 150it [00:16, 9.55it/s]2025-05-26 04:24:06,361 - INFO - [Epoch 092 | Batch 0150] IWAE-loss 3478.1560 | mean log_px -0.0111 | KL -2921.63 + 151it [00:16, 9.57it/s] 152it [00:16, 9.57it/s] 153it [00:16, 9.58it/s] 154it [00:16, 9.52it/s] 155it [00:16, 9.54it/s] 156it [00:16, 9.51it/s] 157it [00:16, 9.56it/s] 158it [00:16, 9.56it/s] 159it [00:17, 9.52it/s] 160it [00:17, 9.50it/s] 161it [00:17, 9.48it/s] 162it [00:17, 9.48it/s] 163it [00:17, 9.48it/s] 164it [00:17, 9.08it/s] 165it [00:17, 9.14it/s] 166it [00:17, 9.23it/s] 167it [00:17, 9.31it/s] 168it [00:18, 9.35it/s] 169it [00:18, 9.37it/s] 170it [00:18, 9.34it/s] 171it [00:18, 9.39it/s] 172it [00:18, 9.39it/s] 173it [00:18, 8.91it/s] 174it [00:18, 9.08it/s] 175it [00:18, 9.19it/s] 176it [00:18, 9.19it/s] 177it [00:19, 9.21it/s] 178it [00:19, 8.87it/s] 179it [00:19, 9.02it/s] 180it [00:19, 9.16it/s] 181it [00:19, 9.24it/s] 182it [00:19, 8.81it/s] 183it [00:19, 8.84it/s] 184it [00:19, 9.02it/s] 185it [00:19, 9.14it/s] 186it [00:20, 9.22it/s] 187it [00:20, 9.31it/s] 188it [00:20, 9.31it/s] 189it [00:20, 9.37it/s] 190it [00:20, 9.44it/s] 191it [00:20, 9.44it/s] 192it [00:20, 9.44it/s] 193it [00:20, 9.02it/s] 194it [00:20, 9.15it/s] 195it [00:21, 8.69it/s] 196it [00:21, 8.94it/s] 196it [00:21, 9.25it/s] +2025-05-26 04:24:11,329 - INFO - Epoch: 92, Objective: tensor([3705.5750], device='cuda:0', grad_fn=), Loss: 0.016982443630695343, KL/n: 59.582088470458984 + 0it [00:00, ?it/s]2025-05-26 04:24:11,608 - INFO - [Epoch 093 | Batch 0000] IWAE-loss 4068.8088 | mean log_px -0.0203 | KL -2920.25 + 1it [00:00, 4.70it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.79it/s] 4it [00:00, 8.44it/s] 5it [00:00, 8.79it/s] 6it [00:00, 9.03it/s] 7it [00:00, 9.22it/s] 8it [00:00, 9.32it/s] 9it [00:01, 9.43it/s] 10it [00:01, 8.98it/s] 11it [00:01, 9.11it/s] 12it [00:01, 9.27it/s] 13it [00:01, 9.34it/s] 14it [00:01, 9.42it/s] 15it [00:01, 9.46it/s] 16it [00:01, 9.43it/s] 17it [00:01, 9.47it/s] 18it [00:02, 9.49it/s] 19it [00:02, 9.50it/s] 20it [00:02, 9.48it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.50it/s] 23it [00:02, 9.51it/s] 24it [00:02, 9.53it/s] 25it [00:02, 9.53it/s] 26it [00:02, 9.54it/s] 27it [00:02, 9.48it/s] 28it [00:03, 9.46it/s] 29it [00:03, 9.46it/s] 30it [00:03, 9.48it/s] 31it [00:03, 9.50it/s] 32it [00:03, 9.55it/s] 33it [00:03, 9.63it/s] 34it [00:03, 9.51it/s] 35it [00:03, 9.54it/s] 36it [00:03, 9.10it/s] 37it [00:04, 9.26it/s] 38it [00:04, 9.14it/s] 39it [00:04, 9.22it/s] 40it [00:04, 9.29it/s] 41it [00:04, 9.35it/s] 42it [00:04, 9.37it/s] 43it [00:04, 8.89it/s] 44it [00:04, 9.07it/s] 45it [00:04, 9.10it/s] 46it [00:05, 9.20it/s] 47it [00:05, 9.29it/s] 48it [00:05, 9.34it/s] 49it [00:05, 9.42it/s] 50it [00:05, 8.90it/s]2025-05-26 04:24:16,971 - INFO - [Epoch 093 | Batch 0050] IWAE-loss 4193.2715 | mean log_px -0.0235 | KL -2915.12 + 51it [00:05, 9.08it/s] 52it [00:05, 9.22it/s] 53it [00:05, 9.30it/s] 54it [00:05, 9.35it/s] 55it [00:05, 9.49it/s] 56it [00:06, 9.50it/s] 57it [00:06, 9.51it/s] 58it [00:06, 9.53it/s] 59it [00:06, 9.60it/s] 60it [00:06, 9.63it/s] 61it [00:06, 9.64it/s] 62it [00:06, 9.64it/s] 63it [00:06, 9.60it/s] 64it [00:06, 9.59it/s] 65it [00:07, 9.56it/s] 66it [00:07, 9.57it/s] 67it [00:07, 9.56it/s] 68it [00:07, 9.53it/s] 69it [00:07, 9.12it/s] 70it [00:07, 9.07it/s] 71it [00:07, 8.56it/s] 72it [00:07, 8.85it/s] 73it [00:07, 9.08it/s] 74it [00:07, 9.25it/s] 75it [00:08, 9.35it/s] 76it [00:08, 9.46it/s] 77it [00:08, 9.53it/s] 78it [00:08, 9.55it/s] 79it [00:08, 9.03it/s] 80it [00:08, 9.13it/s] 81it [00:08, 9.32it/s] 82it [00:08, 9.33it/s] 83it [00:08, 9.39it/s] 84it [00:09, 9.29it/s] 85it [00:09, 9.42it/s] 86it [00:09, 9.48it/s] 87it [00:09, 9.10it/s] 88it [00:09, 9.22it/s] 89it [00:09, 9.32it/s] 90it [00:09, 9.25it/s] 91it [00:09, 9.29it/s] 92it [00:09, 9.36it/s] 93it [00:10, 9.45it/s] 94it [00:10, 9.48it/s] 95it [00:10, 9.51it/s] 96it [00:10, 9.50it/s] 97it [00:10, 9.52it/s] 98it [00:10, 9.56it/s] 99it [00:10, 9.53it/s] 100it [00:10, 9.53it/s]2025-05-26 04:24:22,291 - INFO - [Epoch 093 | Batch 0100] IWAE-loss 3753.0735 | mean log_px -0.0142 | KL -2914.49 + 101it [00:10, 9.49it/s] 102it [00:10, 9.51it/s] 103it [00:11, 9.09it/s] 104it [00:11, 9.16it/s] 105it [00:11, 9.32it/s] 106it [00:11, 9.35it/s] 107it [00:11, 9.39it/s] 108it [00:11, 9.10it/s] 109it [00:11, 9.26it/s] 110it [00:11, 9.22it/s] 111it [00:11, 9.29it/s] 112it [00:12, 9.36it/s] 113it [00:12, 9.39it/s] 114it [00:12, 9.39it/s] 115it [00:12, 9.44it/s] 116it [00:12, 9.44it/s] 117it [00:12, 9.52it/s] 118it [00:12, 9.57it/s] 119it [00:12, 9.13it/s] 120it [00:12, 9.30it/s] 121it [00:13, 9.39it/s] 122it [00:13, 9.38it/s] 123it [00:13, 9.36it/s] 124it [00:13, 9.35it/s] 125it [00:13, 8.85it/s] 126it [00:13, 9.01it/s] 127it [00:13, 9.22it/s] 128it [00:13, 9.30it/s] 129it [00:13, 9.35it/s] 130it [00:13, 9.40it/s] 131it [00:14, 8.93it/s] 132it [00:14, 9.11it/s] 133it [00:14, 9.28it/s] 134it [00:14, 9.34it/s] 135it [00:14, 9.37it/s] 136it [00:14, 9.46it/s] 137it [00:14, 9.48it/s] 138it [00:14, 9.51it/s] 139it [00:14, 9.47it/s] 140it [00:15, 9.49it/s] 141it [00:15, 9.49it/s] 142it [00:15, 9.49it/s] 143it [00:15, 9.52it/s] 144it [00:15, 9.55it/s] 145it [00:15, 9.46it/s] 146it [00:15, 9.48it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.51it/s] 149it [00:16, 8.98it/s] 150it [00:16, 9.06it/s]2025-05-26 04:24:27,666 - INFO - [Epoch 093 | Batch 0150] IWAE-loss 3694.4592 | mean log_px -0.0135 | KL -2910.63 + 151it [00:16, 9.10it/s] 152it [00:16, 9.25it/s] 153it [00:16, 9.26it/s] 154it [00:16, 9.19it/s] 155it [00:16, 9.24it/s] 156it [00:16, 9.33it/s] 157it [00:16, 9.37it/s] 158it [00:16, 9.46it/s] 159it [00:17, 9.47it/s] 160it [00:17, 9.51it/s] 161it [00:17, 9.52it/s] 162it [00:17, 9.57it/s] 163it [00:17, 9.54it/s] 164it [00:17, 9.53it/s] 165it [00:17, 9.45it/s] 166it [00:17, 9.04it/s] 167it [00:17, 9.18it/s] 168it [00:18, 9.26it/s] 169it [00:18, 9.36it/s] 170it [00:18, 9.39it/s] 171it [00:18, 9.39it/s] 172it [00:18, 9.40it/s] 173it [00:18, 9.45it/s] 174it [00:18, 8.98it/s] 175it [00:18, 8.79it/s] 176it [00:18, 8.92it/s] 177it [00:19, 9.03it/s] 178it [00:19, 9.11it/s] 179it [00:19, 9.09it/s] 180it [00:19, 9.23it/s] 181it [00:19, 9.19it/s] 182it [00:19, 8.77it/s] 183it [00:19, 8.89it/s] 184it [00:19, 9.08it/s] 185it [00:19, 9.22it/s] 186it [00:20, 9.33it/s] 187it [00:20, 9.41it/s] 188it [00:20, 9.42it/s] 189it [00:20, 9.51it/s] 190it [00:20, 9.57it/s] 191it [00:20, 9.63it/s] 192it [00:20, 9.58it/s] 193it [00:20, 9.58it/s] 194it [00:20, 9.56it/s] 195it [00:20, 8.95it/s] 196it [00:21, 9.13it/s] 196it [00:21, 9.27it/s] +2025-05-26 04:24:32,610 - INFO - Epoch: 93, Objective: tensor([3518.6760], device='cuda:0', grad_fn=), Loss: 0.009369171224534512, KL/n: 59.381324768066406 + 0it [00:00, ?it/s]2025-05-26 04:24:33,071 - INFO - [Epoch 094 | Batch 0000] IWAE-loss 3675.7261 | mean log_px -0.0113 | KL -2903.85 + 1it [00:00, 5.26it/s] 2it [00:00, 7.14it/s] 3it [00:00, 8.06it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.96it/s] 6it [00:00, 9.14it/s] 7it [00:00, 9.32it/s] 8it [00:00, 9.43it/s] 9it [00:01, 9.42it/s] 10it [00:01, 9.51it/s] 11it [00:01, 9.55it/s] 12it [00:01, 9.53it/s] 13it [00:01, 9.55it/s] 14it [00:01, 9.58it/s] 15it [00:01, 9.55it/s] 16it [00:01, 9.57it/s] 17it [00:01, 9.57it/s] 18it [00:01, 9.46it/s] 19it [00:02, 9.56it/s] 20it [00:02, 9.47it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.48it/s] 23it [00:02, 9.51it/s] 24it [00:02, 9.48it/s] 25it [00:02, 9.55it/s] 26it [00:02, 9.00it/s] 27it [00:02, 9.15it/s] 28it [00:03, 9.27it/s] 29it [00:03, 9.36it/s] 30it [00:03, 9.38it/s] 31it [00:03, 9.42it/s] 32it [00:03, 9.41it/s] 33it [00:03, 9.46it/s] 34it [00:03, 9.45it/s] 35it [00:03, 9.54it/s] 36it [00:03, 9.56it/s] 37it [00:03, 9.53it/s] 38it [00:04, 9.52it/s] 39it [00:04, 9.51it/s] 40it [00:04, 9.51it/s] 41it [00:04, 9.53it/s] 42it [00:04, 9.48it/s] 43it [00:04, 8.98it/s] 44it [00:04, 9.11it/s] 45it [00:04, 9.11it/s] 46it [00:04, 9.19it/s] 47it [00:05, 8.94it/s] 48it [00:05, 9.13it/s] 49it [00:05, 9.16it/s] 50it [00:05, 9.23it/s]2025-05-26 04:24:38,382 - INFO - [Epoch 094 | Batch 0050] IWAE-loss 4268.3975 | mean log_px -0.0242 | KL -2905.98 + 51it [00:05, 8.86it/s] 52it [00:05, 9.07it/s] 53it [00:05, 9.16it/s] 54it [00:05, 9.18it/s] 55it [00:05, 9.28it/s] 56it [00:06, 9.30it/s] 57it [00:06, 9.35it/s] 58it [00:06, 9.36it/s] 59it [00:06, 9.39it/s] 60it [00:06, 9.45it/s] 61it [00:06, 9.46it/s] 62it [00:06, 9.07it/s] 63it [00:06, 9.20it/s] 64it [00:06, 9.31it/s] 65it [00:07, 9.33it/s] 66it [00:07, 9.36it/s] 67it [00:07, 9.38it/s] 68it [00:07, 9.42it/s] 69it [00:07, 9.44it/s] 70it [00:07, 8.91it/s] 71it [00:07, 9.13it/s] 72it [00:07, 9.17it/s] 73it [00:07, 9.25it/s] 74it [00:07, 9.31it/s] 75it [00:08, 9.39it/s] 76it [00:08, 9.43it/s] 77it [00:08, 8.91it/s] 78it [00:08, 9.06it/s] 79it [00:08, 9.19it/s] 80it [00:08, 9.29it/s] 81it [00:08, 9.37it/s] 82it [00:08, 9.47it/s] 83it [00:08, 9.49it/s] 84it [00:09, 9.49it/s] 85it [00:09, 9.51it/s] 86it [00:09, 9.51it/s] 87it [00:09, 9.52it/s] 88it [00:09, 9.48it/s] 89it [00:09, 9.47it/s] 90it [00:09, 9.47it/s] 91it [00:09, 9.53it/s] 92it [00:09, 9.56it/s] 93it [00:09, 9.60it/s] 94it [00:10, 9.57it/s] 95it [00:10, 9.57it/s] 96it [00:10, 9.53it/s] 97it [00:10, 9.48it/s] 98it [00:10, 9.49it/s] 99it [00:10, 9.45it/s] 100it [00:10, 8.92it/s]2025-05-26 04:24:43,748 - INFO - [Epoch 094 | Batch 0100] IWAE-loss 3504.3542 | mean log_px -0.0100 | KL -2904.47 + 101it [00:10, 9.11it/s] 102it [00:10, 9.17it/s] 103it [00:11, 9.08it/s] 104it [00:11, 9.10it/s] 105it [00:11, 9.22it/s] 106it [00:11, 9.29it/s] 107it [00:11, 9.32it/s] 108it [00:11, 9.24it/s] 109it [00:11, 8.57it/s] 110it [00:11, 8.78it/s] 111it [00:11, 8.94it/s] 112it [00:12, 9.03it/s] 113it [00:12, 8.77it/s] 114it [00:12, 8.96it/s] 115it [00:12, 9.07it/s] 116it [00:12, 9.07it/s] 117it [00:12, 9.18it/s] 118it [00:12, 9.24it/s] 119it [00:12, 9.32it/s] 120it [00:12, 9.43it/s] 121it [00:13, 9.43it/s] 122it [00:13, 9.46it/s] 123it [00:13, 9.52it/s] 124it [00:13, 9.47it/s] 125it [00:13, 9.49it/s] 126it [00:13, 9.51it/s] 127it [00:13, 9.53it/s] 128it [00:13, 9.48it/s] 129it [00:13, 9.50it/s] 130it [00:13, 9.51it/s] 131it [00:14, 9.50it/s] 132it [00:14, 9.50it/s] 133it [00:14, 9.52it/s] 134it [00:14, 9.50it/s] 135it [00:14, 9.47it/s] 136it [00:14, 9.50it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.48it/s] 139it [00:14, 9.48it/s] 140it [00:15, 9.43it/s] 141it [00:15, 9.47it/s] 142it [00:15, 9.46it/s] 143it [00:15, 9.48it/s] 144it [00:15, 9.48it/s] 145it [00:15, 9.50it/s] 146it [00:15, 9.47it/s] 147it [00:15, 9.49it/s] 148it [00:15, 9.50it/s] 149it [00:16, 9.54it/s] 150it [00:16, 9.54it/s]2025-05-26 04:24:49,091 - INFO - [Epoch 094 | Batch 0150] IWAE-loss 3472.2581 | mean log_px -0.0113 | KL -2900.82 + 151it [00:16, 9.56it/s] 152it [00:16, 9.51it/s] 153it [00:16, 9.58it/s] 154it [00:16, 9.59it/s] 155it [00:16, 9.59it/s] 156it [00:16, 9.56it/s] 157it [00:16, 9.53it/s] 158it [00:16, 9.53it/s] 159it [00:17, 9.48it/s] 160it [00:17, 9.50it/s] 161it [00:17, 9.51it/s] 162it [00:17, 9.37it/s] 163it [00:17, 9.23it/s] 164it [00:17, 8.71it/s] 165it [00:17, 8.93it/s] 166it [00:17, 9.08it/s] 167it [00:17, 9.20it/s] 168it [00:18, 8.76it/s] 169it [00:18, 8.99it/s] 170it [00:18, 9.08it/s] 171it [00:18, 9.18it/s] 172it [00:18, 8.75it/s] 173it [00:18, 8.95it/s] 174it [00:18, 9.12it/s] 175it [00:18, 9.21it/s] 176it [00:18, 9.29it/s] 177it [00:19, 9.35it/s] 178it [00:19, 9.41it/s] 179it [00:19, 9.42it/s] 180it [00:19, 9.39it/s] 181it [00:19, 9.44it/s] 182it [00:19, 9.42it/s] 183it [00:19, 9.47it/s] 184it [00:19, 9.47it/s] 185it [00:19, 9.49it/s] 186it [00:19, 9.48it/s] 187it [00:20, 9.50it/s] 188it [00:20, 9.53it/s] 189it [00:20, 9.53it/s] 190it [00:20, 9.50it/s] 191it [00:20, 9.48it/s] 192it [00:20, 9.47it/s] 193it [00:20, 9.46it/s] 194it [00:20, 9.45it/s] 195it [00:20, 8.87it/s] 196it [00:21, 9.06it/s] 196it [00:21, 9.28it/s] +2025-05-26 04:24:54,044 - INFO - Epoch: 94, Objective: tensor([3317.0979], device='cuda:0', grad_fn=), Loss: 0.006679388228803873, KL/n: 59.15084457397461 + 0it [00:00, ?it/s]2025-05-26 04:24:54,318 - INFO - [Epoch 095 | Batch 0000] IWAE-loss 3526.1443 | mean log_px -0.0090 | KL -2896.83 + 1it [00:00, 4.83it/s] 2it [00:00, 6.78it/s] 3it [00:00, 7.31it/s] 4it [00:00, 8.02it/s] 5it [00:00, 8.47it/s] 6it [00:00, 8.69it/s] 7it [00:00, 8.45it/s] 8it [00:00, 8.70it/s] 9it [00:01, 8.89it/s] 10it [00:01, 9.01it/s] 11it [00:01, 8.65it/s] 12it [00:01, 8.84it/s] 13it [00:01, 9.07it/s] 14it [00:01, 8.73it/s] 15it [00:01, 8.94it/s] 16it [00:01, 9.06it/s] 17it [00:01, 9.21it/s] 18it [00:02, 8.84it/s] 19it [00:02, 9.02it/s] 20it [00:02, 9.14it/s] 21it [00:02, 9.27it/s] 22it [00:02, 8.87it/s] 23it [00:02, 9.07it/s] 24it [00:02, 9.17it/s] 25it [00:02, 9.26it/s] 26it [00:02, 8.84it/s] 27it [00:03, 9.04it/s] 28it [00:03, 9.18it/s] 29it [00:03, 9.27it/s] 30it [00:03, 8.86it/s] 31it [00:03, 9.06it/s] 32it [00:03, 9.17it/s] 33it [00:03, 9.26it/s] 34it [00:03, 8.88it/s] 35it [00:03, 9.04it/s] 36it [00:04, 9.11it/s] 37it [00:04, 9.17it/s] 38it [00:04, 8.75it/s] 39it [00:04, 8.94it/s] 40it [00:04, 9.15it/s] 41it [00:04, 9.24it/s] 42it [00:04, 8.83it/s] 43it [00:04, 9.02it/s] 44it [00:04, 9.15it/s] 45it [00:05, 9.24it/s] 46it [00:05, 8.86it/s] 47it [00:05, 9.05it/s] 48it [00:05, 9.16it/s] 49it [00:05, 9.24it/s] 50it [00:05, 8.74it/s]2025-05-26 04:24:59,881 - INFO - [Epoch 095 | Batch 0050] IWAE-loss 3349.6074 | mean log_px -0.0067 | KL -2888.48 + 51it [00:05, 8.92it/s] 52it [00:05, 9.10it/s] 53it [00:05, 9.17it/s] 54it [00:06, 8.71it/s] 55it [00:06, 8.91it/s] 56it [00:06, 9.09it/s] 57it [00:06, 9.24it/s] 58it [00:06, 8.82it/s] 59it [00:06, 8.94it/s] 60it [00:06, 9.09it/s] 61it [00:06, 9.23it/s] 62it [00:06, 8.83it/s] 63it [00:07, 9.02it/s] 64it [00:07, 9.16it/s] 65it [00:07, 9.24it/s] 66it [00:07, 8.75it/s] 67it [00:07, 8.84it/s] 68it [00:07, 8.96it/s] 69it [00:07, 8.81it/s] 70it [00:07, 8.92it/s] 71it [00:07, 8.62it/s] 72it [00:08, 8.89it/s] 73it [00:08, 8.95it/s] 74it [00:08, 9.07it/s] 75it [00:08, 8.58it/s] 76it [00:08, 8.61it/s] 77it [00:08, 8.67it/s] 78it [00:08, 8.87it/s] 79it [00:08, 8.95it/s] 80it [00:09, 8.71it/s] 81it [00:09, 8.91it/s] 82it [00:09, 9.07it/s] 83it [00:09, 8.79it/s] 84it [00:09, 8.98it/s] 85it [00:09, 9.09it/s] 86it [00:09, 8.87it/s] 87it [00:09, 9.03it/s] 88it [00:09, 9.10it/s] 89it [00:09, 9.21it/s] 90it [00:10, 9.31it/s] 91it [00:10, 9.37it/s] 92it [00:10, 9.38it/s] 93it [00:10, 9.37it/s] 94it [00:10, 9.01it/s] 95it [00:10, 9.11it/s] 96it [00:10, 9.15it/s] 97it [00:10, 9.25it/s] 98it [00:10, 9.31it/s] 99it [00:11, 9.42it/s] 100it [00:11, 9.44it/s]2025-05-26 04:25:05,408 - INFO - [Epoch 095 | Batch 0100] IWAE-loss 3535.2415 | mean log_px -0.0105 | KL -2890.72 + 101it [00:11, 9.43it/s] 102it [00:11, 9.41it/s] 103it [00:11, 8.88it/s] 104it [00:11, 9.05it/s] 105it [00:11, 9.18it/s] 106it [00:11, 9.27it/s] 107it [00:11, 9.35it/s] 108it [00:12, 9.28it/s] 109it [00:12, 9.35it/s] 110it [00:12, 9.41it/s] 111it [00:12, 9.43it/s] 112it [00:12, 9.40it/s] 113it [00:12, 9.40it/s] 114it [00:12, 9.48it/s] 115it [00:12, 9.43it/s] 116it [00:12, 9.48it/s] 117it [00:12, 9.42it/s] 118it [00:13, 9.42it/s] 119it [00:13, 8.90it/s] 120it [00:13, 8.99it/s] 121it [00:13, 9.13it/s] 122it [00:13, 9.21it/s] 123it [00:13, 9.28it/s] 124it [00:13, 9.28it/s] 125it [00:13, 9.34it/s] 126it [00:13, 8.93it/s] 127it [00:14, 9.08it/s] 128it [00:14, 9.13it/s] 129it [00:14, 8.73it/s] 130it [00:14, 8.92it/s] 131it [00:14, 9.05it/s] 132it [00:14, 9.08it/s] 133it [00:14, 9.20it/s] 134it [00:14, 9.25it/s] 135it [00:14, 9.23it/s] 136it [00:15, 9.28it/s] 137it [00:15, 9.36it/s] 138it [00:15, 9.40it/s] 139it [00:15, 9.33it/s] 140it [00:15, 9.35it/s] 141it [00:15, 9.40it/s] 142it [00:15, 9.44it/s] 143it [00:15, 9.42it/s] 144it [00:15, 9.43it/s] 145it [00:16, 9.07it/s] 146it [00:16, 9.16it/s] 147it [00:16, 9.24it/s] 148it [00:16, 8.85it/s] 149it [00:16, 9.04it/s] 150it [00:16, 9.12it/s]2025-05-26 04:25:10,834 - INFO - [Epoch 095 | Batch 0150] IWAE-loss 4350.0732 | mean log_px -0.0231 | KL -2887.25 + 151it [00:16, 9.24it/s] 152it [00:16, 9.32it/s] 153it [00:16, 9.35it/s] 154it [00:17, 8.92it/s] 155it [00:17, 9.11it/s] 156it [00:17, 9.23it/s] 157it [00:17, 9.30it/s] 158it [00:17, 9.32it/s] 159it [00:17, 9.39it/s] 160it [00:17, 9.42it/s] 161it [00:17, 9.45it/s] 162it [00:17, 9.47it/s] 163it [00:17, 9.49it/s] 164it [00:18, 9.50it/s] 165it [00:18, 9.40it/s] 166it [00:18, 9.46it/s] 167it [00:18, 9.51it/s] 168it [00:18, 9.52it/s] 169it [00:18, 9.53it/s] 170it [00:18, 9.50it/s] 171it [00:18, 9.48it/s] 172it [00:18, 9.49it/s] 173it [00:19, 8.96it/s] 174it [00:19, 9.13it/s] 175it [00:19, 9.28it/s] 176it [00:19, 9.35it/s] 177it [00:19, 9.37it/s] 178it [00:19, 9.46it/s] 179it [00:19, 9.11it/s] 180it [00:19, 9.21it/s] 181it [00:19, 9.32it/s] 182it [00:20, 8.76it/s] 183it [00:20, 8.98it/s] 184it [00:20, 9.10it/s] 185it [00:20, 9.27it/s] 186it [00:20, 9.26it/s] 187it [00:20, 9.35it/s] 188it [00:20, 9.38it/s] 189it [00:20, 9.37it/s] 190it [00:20, 9.39it/s] 191it [00:21, 8.92it/s] 192it [00:21, 9.12it/s] 193it [00:21, 9.16it/s] 194it [00:21, 9.26it/s] 195it [00:21, 8.73it/s] 196it [00:21, 8.91it/s] 196it [00:21, 9.06it/s] +2025-05-26 04:25:15,798 - INFO - Epoch: 95, Objective: tensor([3332.1047], device='cuda:0', grad_fn=), Loss: 0.008258700370788574, KL/n: 58.8862190246582 + 0it [00:00, ?it/s]2025-05-26 04:25:16,263 - INFO - [Epoch 096 | Batch 0000] IWAE-loss 4336.8301 | mean log_px -0.0305 | KL -2885.20 + 1it [00:00, 4.72it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.75it/s] 4it [00:00, 8.36it/s] 5it [00:00, 8.78it/s] 6it [00:00, 9.04it/s] 7it [00:00, 8.68it/s] 8it [00:00, 8.88it/s] 9it [00:01, 9.06it/s] 10it [00:01, 9.14it/s] 11it [00:01, 9.28it/s] 12it [00:01, 9.36it/s] 13it [00:01, 9.37it/s] 14it [00:01, 9.41it/s] 15it [00:01, 9.36it/s] 16it [00:01, 9.36it/s] 17it [00:01, 9.39it/s] 18it [00:02, 9.34it/s] 19it [00:02, 9.39it/s] 20it [00:02, 9.43it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.53it/s] 23it [00:02, 9.52it/s] 24it [00:02, 9.49it/s] 25it [00:02, 9.49it/s] 26it [00:02, 9.45it/s] 27it [00:02, 9.42it/s] 28it [00:03, 9.51it/s] 29it [00:03, 9.45it/s] 30it [00:03, 9.44it/s] 31it [00:03, 9.43it/s] 32it [00:03, 9.45it/s] 33it [00:03, 9.47it/s] 34it [00:03, 9.42it/s] 35it [00:03, 9.45it/s] 36it [00:03, 9.40it/s] 37it [00:04, 9.36it/s] 38it [00:04, 9.39it/s] 39it [00:04, 9.40it/s] 40it [00:04, 9.44it/s] 41it [00:04, 9.32it/s] 42it [00:04, 9.15it/s] 43it [00:04, 9.28it/s] 44it [00:04, 9.40it/s] 45it [00:04, 9.49it/s] 46it [00:04, 9.50it/s] 47it [00:05, 9.48it/s] 48it [00:05, 9.05it/s] 49it [00:05, 9.20it/s] 50it [00:05, 9.31it/s]2025-05-26 04:25:21,615 - INFO - [Epoch 096 | Batch 0050] IWAE-loss 3660.0618 | mean log_px -0.0111 | KL -2883.02 + 51it [00:05, 9.34it/s] 52it [00:05, 9.26it/s] 53it [00:05, 8.50it/s] 54it [00:05, 8.69it/s] 55it [00:06, 8.95it/s] 56it [00:06, 9.12it/s] 57it [00:06, 8.75it/s] 58it [00:06, 8.98it/s] 59it [00:06, 9.14it/s] 60it [00:06, 9.21it/s] 61it [00:06, 9.33it/s] 62it [00:06, 9.42it/s] 63it [00:06, 8.80it/s] 64it [00:06, 9.02it/s] 65it [00:07, 9.17it/s] 66it [00:07, 9.15it/s] 67it [00:07, 8.74it/s] 68it [00:07, 8.97it/s] 69it [00:07, 9.12it/s] 70it [00:07, 9.24it/s] 71it [00:07, 9.36it/s] 72it [00:07, 9.42it/s] 73it [00:07, 9.41it/s] 74it [00:08, 9.43it/s] 75it [00:08, 9.43it/s] 76it [00:08, 9.44it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.45it/s] 79it [00:08, 9.44it/s] 80it [00:08, 9.40it/s] 81it [00:08, 9.48it/s] 82it [00:08, 9.41it/s] 83it [00:09, 9.45it/s] 84it [00:09, 9.44it/s] 85it [00:09, 9.52it/s] 86it [00:09, 9.49it/s] 87it [00:09, 9.43it/s] 88it [00:09, 9.11it/s] 89it [00:09, 9.24it/s] 90it [00:09, 9.26it/s] 91it [00:09, 9.36it/s] 92it [00:09, 9.40it/s] 93it [00:10, 9.46it/s] 94it [00:10, 9.42it/s] 95it [00:10, 9.45it/s] 96it [00:10, 9.40it/s] 97it [00:10, 9.49it/s] 98it [00:10, 9.49it/s] 99it [00:10, 9.47it/s] 100it [00:10, 9.51it/s]2025-05-26 04:25:27,010 - INFO - [Epoch 096 | Batch 0100] IWAE-loss 3525.8738 | mean log_px -0.0101 | KL -2880.33 + 101it [00:10, 9.46it/s] 102it [00:11, 9.49it/s] 103it [00:11, 9.48it/s] 104it [00:11, 9.53it/s] 105it [00:11, 9.50it/s] 106it [00:11, 9.48it/s] 107it [00:11, 9.44it/s] 108it [00:11, 9.06it/s] 109it [00:11, 9.00it/s] 110it [00:11, 9.22it/s] 111it [00:12, 9.41it/s] 112it [00:12, 9.53it/s] 113it [00:12, 9.63it/s] 114it [00:12, 9.69it/s] 115it [00:12, 9.75it/s] 116it [00:12, 9.77it/s] 117it [00:12, 9.80it/s] 118it [00:12, 9.82it/s] 119it [00:12, 9.83it/s] 120it [00:12, 9.83it/s] 121it [00:13, 9.82it/s] 122it [00:13, 9.82it/s] 123it [00:13, 9.75it/s] 124it [00:13, 9.64it/s] 125it [00:13, 9.67it/s] 127it [00:13, 9.80it/s] 128it [00:13, 9.82it/s] 129it [00:13, 9.83it/s] 130it [00:13, 9.84it/s] 131it [00:14, 9.83it/s] 132it [00:14, 9.69it/s] 133it [00:14, 9.73it/s] 134it [00:14, 9.76it/s] 135it [00:14, 9.78it/s] 136it [00:14, 9.78it/s] 137it [00:14, 9.81it/s] 138it [00:14, 9.82it/s] 139it [00:14, 9.84it/s] 140it [00:14, 9.84it/s] 141it [00:15, 9.84it/s] 142it [00:15, 9.81it/s] 143it [00:15, 9.84it/s] 144it [00:15, 9.84it/s] 145it [00:15, 9.84it/s] 146it [00:15, 9.83it/s] 147it [00:15, 9.71it/s] 148it [00:15, 9.71it/s] 149it [00:15, 9.75it/s] 150it [00:15, 9.76it/s]2025-05-26 04:25:32,162 - INFO - [Epoch 096 | Batch 0150] IWAE-loss 3406.4150 | mean log_px -0.0099 | KL -2879.07 + 151it [00:16, 9.77it/s] 152it [00:16, 9.77it/s] 153it [00:16, 9.80it/s] 154it [00:16, 9.81it/s] 155it [00:16, 9.84it/s] 156it [00:16, 9.82it/s] 157it [00:16, 9.72it/s] 158it [00:16, 9.75it/s] 159it [00:16, 9.75it/s] 160it [00:17, 9.76it/s] 161it [00:17, 9.79it/s] 162it [00:17, 9.78it/s] 163it [00:17, 9.81it/s] 164it [00:17, 9.83it/s] 165it [00:17, 9.84it/s] 166it [00:17, 9.84it/s] 167it [00:17, 9.84it/s] 168it [00:17, 9.84it/s] 169it [00:17, 9.84it/s] 170it [00:18, 9.85it/s] 171it [00:18, 9.85it/s] 172it [00:18, 9.86it/s] 173it [00:18, 9.86it/s] 174it [00:18, 9.86it/s] 175it [00:18, 9.74it/s] 176it [00:18, 9.73it/s] 177it [00:18, 9.74it/s] 178it [00:18, 9.78it/s] 179it [00:18, 9.81it/s] 180it [00:19, 9.82it/s] 181it [00:19, 9.83it/s] 182it [00:19, 9.83it/s] 183it [00:19, 9.86it/s] 184it [00:19, 9.86it/s] 185it [00:19, 9.87it/s] 186it [00:19, 9.86it/s] 187it [00:19, 9.86it/s] 188it [00:19, 9.85it/s] 189it [00:19, 9.87it/s] 190it [00:20, 9.87it/s] 191it [00:20, 9.64it/s] 192it [00:20, 9.69it/s] 193it [00:20, 9.75it/s] 194it [00:20, 9.78it/s] 195it [00:20, 9.25it/s] 196it [00:20, 9.44it/s] +2025-05-26 04:25:36,874 - INFO - Epoch: 96, Objective: tensor([3542.8840], device='cuda:0', grad_fn=), Loss: 0.012501702643930912, KL/n: 58.68415069580078 + 0it [00:00, ?it/s]2025-05-26 04:25:37,156 - INFO - [Epoch 097 | Batch 0000] IWAE-loss 4043.2427 | mean log_px -0.0168 | KL -2875.78 + 1it [00:00, 5.36it/s] 2it [00:00, 7.34it/s] 3it [00:00, 8.35it/s] 4it [00:00, 8.90it/s] 5it [00:00, 9.25it/s] 6it [00:00, 9.45it/s] 7it [00:00, 9.61it/s] 8it [00:00, 9.70it/s] 9it [00:00, 9.78it/s] 10it [00:01, 9.80it/s] 11it [00:01, 9.85it/s] 12it [00:01, 9.86it/s] 13it [00:01, 9.88it/s] 14it [00:01, 9.88it/s] 15it [00:01, 9.89it/s] 16it [00:01, 9.89it/s] 17it [00:01, 9.90it/s] 18it [00:01, 9.90it/s] 19it [00:02, 9.92it/s] 20it [00:02, 9.92it/s] 21it [00:02, 9.92it/s] 22it [00:02, 9.91it/s] 23it [00:02, 9.91it/s] 24it [00:02, 9.91it/s] 25it [00:02, 9.91it/s] 26it [00:02, 9.90it/s] 27it [00:02, 9.91it/s] 28it [00:02, 9.90it/s] 29it [00:03, 9.89it/s] 30it [00:03, 9.88it/s] 31it [00:03, 9.85it/s] 32it [00:03, 9.84it/s] 33it [00:03, 9.85it/s] 34it [00:03, 9.75it/s] 35it [00:03, 9.76it/s] 36it [00:03, 9.65it/s] 37it [00:03, 9.63it/s] 38it [00:03, 9.65it/s] 39it [00:04, 9.73it/s] 40it [00:04, 9.77it/s] 41it [00:04, 9.82it/s] 42it [00:04, 9.84it/s] 43it [00:04, 9.86it/s] 44it [00:04, 9.86it/s] 45it [00:04, 9.88it/s] 46it [00:04, 9.87it/s] 47it [00:04, 9.87it/s] 48it [00:04, 9.87it/s] 49it [00:05, 9.88it/s] 50it [00:05, 9.88it/s]2025-05-26 04:25:42,226 - INFO - [Epoch 097 | Batch 0050] IWAE-loss 3348.9727 | mean log_px -0.0105 | KL -2877.25 + 51it [00:05, 9.86it/s] 52it [00:05, 9.87it/s] 53it [00:05, 9.88it/s] 54it [00:05, 9.86it/s] 55it [00:05, 9.86it/s] 56it [00:05, 9.86it/s] 57it [00:05, 9.88it/s] 58it [00:05, 9.88it/s] 59it [00:06, 9.88it/s] 60it [00:06, 9.87it/s] 61it [00:06, 9.88it/s] 62it [00:06, 9.88it/s] 63it [00:06, 9.88it/s] 64it [00:06, 9.89it/s] 65it [00:06, 9.90it/s] 66it [00:06, 9.89it/s] 67it [00:06, 9.90it/s] 68it [00:06, 9.88it/s] 69it [00:07, 9.89it/s] 70it [00:07, 9.90it/s] 71it [00:07, 9.89it/s] 72it [00:07, 9.88it/s] 73it [00:07, 9.89it/s] 74it [00:07, 9.81it/s] 75it [00:07, 9.83it/s] 76it [00:07, 9.84it/s] 77it [00:07, 9.83it/s] 78it [00:07, 9.83it/s] 79it [00:08, 9.85it/s] 80it [00:08, 9.84it/s] 81it [00:08, 9.86it/s] 82it [00:08, 9.86it/s] 83it [00:08, 9.86it/s] 84it [00:08, 9.82it/s] 85it [00:08, 9.81it/s] 86it [00:08, 9.81it/s] 87it [00:08, 9.84it/s] 88it [00:09, 9.84it/s] 89it [00:09, 9.86it/s] 90it [00:09, 9.75it/s] 91it [00:09, 9.75it/s] 92it [00:09, 9.73it/s] 93it [00:09, 9.72it/s] 94it [00:09, 9.69it/s] 95it [00:09, 9.70it/s] 96it [00:09, 9.72it/s] 97it [00:09, 9.72it/s] 98it [00:10, 9.72it/s] 99it [00:10, 9.74it/s] 100it [00:10, 9.75it/s]2025-05-26 04:25:47,316 - INFO - [Epoch 097 | Batch 0100] IWAE-loss 3721.4724 | mean log_px -0.0175 | KL -2865.73 + 101it [00:10, 9.74it/s] 102it [00:10, 9.73it/s] 103it [00:10, 9.74it/s] 104it [00:10, 9.74it/s] 105it [00:10, 9.72it/s] 106it [00:10, 9.56it/s] 107it [00:10, 9.37it/s] 108it [00:11, 9.34it/s] 109it [00:11, 9.38it/s] 110it [00:11, 9.40it/s] 111it [00:11, 9.44it/s] 112it [00:11, 9.45it/s] 113it [00:11, 9.48it/s] 114it [00:11, 9.50it/s] 115it [00:11, 9.49it/s] 116it [00:11, 9.49it/s] 117it [00:12, 9.48it/s] 118it [00:12, 9.50it/s] 119it [00:12, 9.54it/s] 120it [00:12, 9.60it/s] 121it [00:12, 9.64it/s] 122it [00:12, 9.68it/s] 123it [00:12, 9.70it/s] 124it [00:12, 9.71it/s] 125it [00:12, 9.72it/s] 126it [00:12, 9.73it/s] 127it [00:13, 9.74it/s] 128it [00:13, 9.75it/s] 129it [00:13, 9.75it/s] 130it [00:13, 9.73it/s] 131it [00:13, 9.74it/s] 132it [00:13, 9.75it/s] 133it [00:13, 9.75it/s] 134it [00:13, 9.75it/s] 135it [00:13, 9.76it/s] 136it [00:13, 9.75it/s] 137it [00:14, 9.75it/s] 138it [00:14, 9.75it/s] 139it [00:14, 9.68it/s] 140it [00:14, 9.69it/s] 141it [00:14, 9.71it/s] 142it [00:14, 9.72it/s] 143it [00:14, 9.73it/s] 144it [00:14, 9.73it/s] 145it [00:14, 9.66it/s] 146it [00:15, 9.61it/s] 147it [00:15, 9.57it/s] 148it [00:15, 9.60it/s] 149it [00:15, 9.66it/s] 150it [00:15, 9.68it/s]2025-05-26 04:25:52,506 - INFO - [Epoch 097 | Batch 0150] IWAE-loss 3712.6641 | mean log_px -0.0218 | KL -2866.04 + 151it [00:15, 9.68it/s] 152it [00:15, 9.69it/s] 153it [00:15, 9.71it/s] 154it [00:15, 9.72it/s] 155it [00:15, 9.73it/s] 156it [00:16, 9.69it/s] 157it [00:16, 9.50it/s] 158it [00:16, 9.27it/s] 159it [00:16, 9.28it/s] 160it [00:16, 9.32it/s] 161it [00:16, 9.39it/s] 162it [00:16, 9.45it/s] 163it [00:16, 9.52it/s] 164it [00:16, 9.55it/s] 165it [00:17, 9.57it/s] 166it [00:17, 9.58it/s] 167it [00:17, 9.61it/s] 168it [00:17, 9.58it/s] 169it [00:17, 9.63it/s] 170it [00:17, 9.65it/s] 171it [00:17, 9.69it/s] 172it [00:17, 9.53it/s] 173it [00:17, 9.60it/s] 174it [00:17, 9.63it/s] 175it [00:18, 9.62it/s] 176it [00:18, 9.66it/s] 177it [00:18, 9.67it/s] 178it [00:18, 9.12it/s] 179it [00:18, 9.35it/s] 180it [00:18, 9.48it/s] 181it [00:18, 9.60it/s] 182it [00:18, 9.69it/s] 183it [00:18, 9.76it/s] 184it [00:18, 9.81it/s] 185it [00:19, 9.85it/s] 186it [00:19, 9.87it/s] 187it [00:19, 9.87it/s] 188it [00:19, 9.88it/s] 189it [00:19, 9.89it/s] 190it [00:19, 9.89it/s] 191it [00:19, 9.91it/s] 192it [00:19, 9.91it/s] 193it [00:19, 9.92it/s] 194it [00:19, 9.93it/s] 195it [00:20, 9.00it/s] 196it [00:20, 9.66it/s] +2025-05-26 04:25:57,295 - INFO - Epoch: 97, Objective: tensor([3453.2244], device='cuda:0', grad_fn=), Loss: 0.01020082551985979, KL/n: 58.48168182373047 + 0it [00:00, ?it/s]2025-05-26 04:25:57,755 - INFO - [Epoch 098 | Batch 0000] IWAE-loss 3513.9075 | mean log_px -0.0093 | KL -2864.63 + 1it [00:00, 5.48it/s] 3it [00:00, 8.28it/s] 5it [00:00, 9.12it/s] 6it [00:00, 9.33it/s] 8it [00:00, 9.64it/s] 10it [00:01, 9.79it/s] 11it [00:01, 9.48it/s] 12it [00:01, 9.59it/s] 13it [00:01, 9.63it/s] 14it [00:01, 9.72it/s] 16it [00:01, 9.85it/s] 17it [00:01, 9.88it/s] 18it [00:01, 9.88it/s] 19it [00:02, 9.74it/s] 20it [00:02, 9.79it/s] 21it [00:02, 9.84it/s] 22it [00:02, 9.37it/s] 23it [00:02, 9.50it/s] 25it [00:02, 9.74it/s] 26it [00:02, 9.76it/s] 27it [00:02, 9.37it/s] 28it [00:02, 9.51it/s] 30it [00:03, 9.71it/s] 32it [00:03, 9.82it/s] 33it [00:03, 9.85it/s] 34it [00:03, 9.88it/s] 36it [00:03, 9.94it/s] 38it [00:03, 9.98it/s] 40it [00:04, 9.96it/s] 41it [00:04, 9.95it/s] 42it [00:04, 9.95it/s] 43it [00:04, 9.82it/s] 44it [00:04, 9.75it/s] 45it [00:04, 9.28it/s] 46it [00:04, 9.45it/s] 48it [00:04, 9.70it/s] 49it [00:05, 9.76it/s]2025-05-26 04:26:02,857 - INFO - [Epoch 098 | Batch 0050] IWAE-loss 4490.0361 | mean log_px -0.0283 | KL -2859.88 + 51it [00:05, 9.86it/s] 53it [00:05, 9.93it/s] 55it [00:05, 9.97it/s] 56it [00:05, 9.89it/s] 57it [00:05, 9.40it/s] 58it [00:06, 9.53it/s] 60it [00:06, 9.72it/s] 62it [00:06, 9.84it/s] 64it [00:06, 9.91it/s] 66it [00:06, 9.95it/s] 68it [00:07, 9.96it/s] 70it [00:07, 9.96it/s] 71it [00:07, 9.94it/s] 72it [00:07, 9.91it/s] 73it [00:07, 9.89it/s] 74it [00:07, 9.40it/s] 75it [00:07, 9.54it/s] 77it [00:07, 9.75it/s] 78it [00:08, 9.80it/s] 80it [00:08, 9.91it/s] 82it [00:08, 9.96it/s] 83it [00:08, 9.94it/s] 84it [00:08, 9.54it/s] 86it [00:08, 9.67it/s] 87it [00:08, 9.74it/s] 88it [00:09, 9.79it/s] 89it [00:09, 9.84it/s] 90it [00:09, 9.87it/s] 91it [00:09, 9.33it/s] 92it [00:09, 9.45it/s] 93it [00:09, 9.56it/s] 94it [00:09, 9.66it/s] 95it [00:09, 9.15it/s] 97it [00:10, 9.53it/s] 98it [00:10, 9.63it/s] 99it [00:10, 9.71it/s]2025-05-26 04:26:07,984 - INFO - [Epoch 098 | Batch 0100] IWAE-loss 3895.4548 | mean log_px -0.0165 | KL -2864.15 + 101it [00:10, 9.84it/s] 103it [00:10, 9.92it/s] 104it [00:10, 9.92it/s] 106it [00:10, 9.98it/s] 108it [00:11, 10.02it/s] 109it [00:11, 10.01it/s] 111it [00:11, 10.03it/s] 113it [00:11, 10.04it/s] 115it [00:11, 10.05it/s] 117it [00:12, 10.05it/s] 119it [00:12, 10.05it/s] 121it [00:12, 10.04it/s] 123it [00:12, 10.03it/s] 125it [00:12, 10.01it/s] 127it [00:13, 9.68it/s] 128it [00:13, 9.73it/s] 129it [00:13, 9.78it/s] 130it [00:13, 9.82it/s] 132it [00:13, 9.91it/s] 134it [00:13, 9.96it/s] 136it [00:13, 9.99it/s] 137it [00:14, 9.99it/s] 139it [00:14, 10.02it/s] 141it [00:14, 9.73it/s] 142it [00:14, 9.78it/s] 144it [00:14, 9.86it/s] 145it [00:14, 9.86it/s] 147it [00:15, 9.61it/s] 148it [00:15, 9.64it/s] 149it [00:15, 9.71it/s] 150it [00:15, 9.77it/s]2025-05-26 04:26:13,033 - INFO - [Epoch 098 | Batch 0150] IWAE-loss 3752.1211 | mean log_px -0.0133 | KL -2858.67 + 151it [00:15, 9.80it/s] 152it [00:15, 9.83it/s] 153it [00:15, 9.87it/s] 155it [00:15, 9.90it/s] 156it [00:15, 9.92it/s] 157it [00:16, 9.94it/s] 158it [00:16, 9.94it/s] 159it [00:16, 9.95it/s] 160it [00:16, 9.94it/s] 161it [00:16, 9.90it/s] 162it [00:16, 9.88it/s] 163it [00:16, 9.86it/s] 164it [00:16, 9.83it/s] 165it [00:16, 9.84it/s] 166it [00:16, 9.82it/s] 167it [00:17, 9.81it/s] 168it [00:17, 9.81it/s] 169it [00:17, 9.65it/s] 170it [00:17, 9.68it/s] 171it [00:17, 9.72it/s] 172it [00:17, 9.75it/s] 173it [00:17, 9.79it/s] 174it [00:17, 9.79it/s] 175it [00:17, 9.81it/s] 176it [00:18, 9.81it/s] 177it [00:18, 9.82it/s] 178it [00:18, 9.82it/s] 179it [00:18, 9.84it/s] 180it [00:18, 9.82it/s] 181it [00:18, 9.85it/s] 182it [00:18, 9.84it/s] 183it [00:18, 9.82it/s] 184it [00:18, 9.81it/s] 185it [00:18, 9.83it/s] 186it [00:19, 9.80it/s] 187it [00:19, 9.82it/s] 188it [00:19, 9.82it/s] 189it [00:19, 9.82it/s] 190it [00:19, 9.83it/s] 191it [00:19, 9.82it/s] 192it [00:19, 9.83it/s] 193it [00:19, 9.83it/s] 194it [00:19, 9.83it/s] 195it [00:19, 9.37it/s] 196it [00:20, 9.74it/s] +2025-05-26 04:26:17,729 - INFO - Epoch: 98, Objective: tensor([3792.0647], device='cuda:0', grad_fn=), Loss: 0.014100815169513226, KL/n: 58.269466400146484 + 0it [00:00, ?it/s]2025-05-26 04:26:18,007 - INFO - [Epoch 099 | Batch 0000] IWAE-loss 3312.5208 | mean log_px -0.0071 | KL -2853.84 + 1it [00:00, 5.19it/s] 2it [00:00, 6.98it/s] 3it [00:00, 8.08it/s] 4it [00:00, 8.71it/s] 5it [00:00, 9.11it/s] 6it [00:00, 9.35it/s] 7it [00:00, 9.52it/s] 8it [00:00, 9.59it/s] 9it [00:01, 9.69it/s] 10it [00:01, 9.76it/s] 11it [00:01, 9.79it/s] 12it [00:01, 9.75it/s] 13it [00:01, 9.80it/s] 14it [00:01, 9.82it/s] 15it [00:01, 9.86it/s] 16it [00:01, 9.85it/s] 17it [00:01, 9.67it/s] 18it [00:01, 9.65it/s] 19it [00:02, 9.72it/s] 20it [00:02, 9.77it/s] 21it [00:02, 9.80it/s] 22it [00:02, 9.81it/s] 23it [00:02, 9.80it/s] 24it [00:02, 9.83it/s] 25it [00:02, 9.86it/s] 26it [00:02, 9.82it/s] 27it [00:02, 9.66it/s] 28it [00:02, 9.69it/s] 29it [00:03, 9.70it/s] 30it [00:03, 9.77it/s] 31it [00:03, 9.82it/s] 32it [00:03, 9.84it/s] 33it [00:03, 9.87it/s] 34it [00:03, 9.88it/s] 35it [00:03, 9.91it/s] 36it [00:03, 9.89it/s] 37it [00:03, 9.91it/s] 38it [00:03, 9.91it/s] 39it [00:04, 9.92it/s] 40it [00:04, 9.92it/s] 41it [00:04, 9.92it/s] 42it [00:04, 9.91it/s] 43it [00:04, 9.91it/s] 44it [00:04, 9.93it/s] 45it [00:04, 9.94it/s] 46it [00:04, 9.93it/s] 47it [00:04, 9.95it/s] 48it [00:04, 9.95it/s] 49it [00:05, 9.95it/s] 50it [00:05, 9.95it/s]2025-05-26 04:26:23,090 - INFO - [Epoch 099 | Batch 0050] IWAE-loss 3289.7585 | mean log_px -0.0074 | KL -2854.63 + 51it [00:05, 9.92it/s] 52it [00:05, 9.93it/s] 53it [00:05, 9.93it/s] 54it [00:05, 9.93it/s] 55it [00:05, 9.94it/s] 56it [00:05, 9.95it/s] 57it [00:05, 9.97it/s] 58it [00:05, 9.94it/s] 59it [00:06, 9.94it/s] 60it [00:06, 9.94it/s] 61it [00:06, 9.95it/s] 62it [00:06, 9.95it/s] 63it [00:06, 9.95it/s] 64it [00:06, 9.94it/s] 65it [00:06, 9.79it/s] 66it [00:06, 9.80it/s] 67it [00:06, 9.77it/s] 68it [00:06, 9.63it/s] 69it [00:07, 9.42it/s] 70it [00:07, 9.40it/s] 71it [00:07, 9.50it/s] 72it [00:07, 9.57it/s] 73it [00:07, 9.63it/s] 74it [00:07, 9.66it/s] 75it [00:07, 9.66it/s] 76it [00:07, 9.65it/s] 77it [00:07, 9.69it/s] 78it [00:08, 9.69it/s] 79it [00:08, 9.72it/s] 80it [00:08, 9.69it/s] 81it [00:08, 9.69it/s] 82it [00:08, 9.70it/s] 83it [00:08, 9.63it/s] 84it [00:08, 9.59it/s] 85it [00:08, 9.60it/s] 86it [00:08, 9.59it/s] 87it [00:08, 9.66it/s] 88it [00:09, 9.74it/s] 89it [00:09, 9.80it/s] 90it [00:09, 9.81it/s] 91it [00:09, 9.85it/s] 92it [00:09, 9.86it/s] 93it [00:09, 9.88it/s] 94it [00:09, 9.89it/s] 95it [00:09, 9.91it/s] 96it [00:09, 9.91it/s] 97it [00:09, 9.92it/s] 98it [00:10, 9.93it/s] 99it [00:10, 9.93it/s] 100it [00:10, 9.92it/s]2025-05-26 04:26:28,201 - INFO - [Epoch 099 | Batch 0100] IWAE-loss 3397.9956 | mean log_px -0.0134 | KL -2848.25 + 101it [00:10, 9.91it/s] 102it [00:10, 9.91it/s] 103it [00:10, 9.92it/s] 104it [00:10, 9.91it/s] 105it [00:10, 9.91it/s] 106it [00:10, 9.92it/s] 107it [00:10, 9.92it/s] 108it [00:11, 9.91it/s] 109it [00:11, 9.92it/s] 110it [00:11, 9.92it/s] 111it [00:11, 9.92it/s] 112it [00:11, 9.92it/s] 113it [00:11, 9.92it/s] 114it [00:11, 9.92it/s] 115it [00:11, 9.92it/s] 116it [00:11, 9.91it/s] 117it [00:11, 9.91it/s] 118it [00:12, 9.92it/s] 119it [00:12, 9.93it/s] 120it [00:12, 9.92it/s] 121it [00:12, 9.92it/s] 122it [00:12, 9.91it/s] 123it [00:12, 9.90it/s] 124it [00:12, 9.91it/s] 125it [00:12, 9.91it/s] 126it [00:12, 9.89it/s] 127it [00:13, 9.91it/s] 128it [00:13, 9.91it/s] 129it [00:13, 9.92it/s] 130it [00:13, 9.91it/s] 131it [00:13, 9.93it/s] 132it [00:13, 9.92it/s] 133it [00:13, 9.94it/s] 134it [00:13, 9.94it/s] 135it [00:13, 9.94it/s] 136it [00:13, 9.94it/s] 137it [00:14, 9.95it/s] 138it [00:14, 9.95it/s] 139it [00:14, 9.95it/s] 140it [00:14, 9.95it/s] 141it [00:14, 9.96it/s] 142it [00:14, 9.95it/s] 143it [00:14, 9.96it/s] 144it [00:14, 9.95it/s] 145it [00:14, 9.95it/s] 146it [00:14, 9.96it/s] 147it [00:15, 9.95it/s] 148it [00:15, 9.95it/s] 149it [00:15, 9.94it/s] 150it [00:15, 9.94it/s]2025-05-26 04:26:33,238 - INFO - [Epoch 099 | Batch 0150] IWAE-loss 3503.2078 | mean log_px -0.0094 | KL -2843.22 + 151it [00:15, 9.93it/s] 152it [00:15, 9.93it/s] 153it [00:15, 9.94it/s] 154it [00:15, 9.93it/s] 155it [00:15, 9.94it/s] 156it [00:15, 9.93it/s] 157it [00:16, 9.92it/s] 158it [00:16, 9.93it/s] 159it [00:16, 9.85it/s] 160it [00:16, 9.81it/s] 161it [00:16, 9.85it/s] 162it [00:16, 9.86it/s] 163it [00:16, 9.86it/s] 164it [00:16, 9.86it/s] 165it [00:16, 9.87it/s] 166it [00:16, 9.89it/s] 167it [00:17, 9.90it/s] 168it [00:17, 9.86it/s] 169it [00:17, 9.87it/s] 170it [00:17, 9.87it/s] 171it [00:17, 9.89it/s] 172it [00:17, 9.89it/s] 173it [00:17, 9.90it/s] 174it [00:17, 9.89it/s] 176it [00:17, 9.49it/s] 178it [00:18, 9.75it/s] 180it [00:18, 9.89it/s] 182it [00:18, 9.94it/s] 183it [00:18, 9.88it/s] 184it [00:18, 9.86it/s] 185it [00:18, 9.87it/s] 186it [00:18, 9.88it/s] 187it [00:19, 9.90it/s] 188it [00:19, 9.91it/s] 189it [00:19, 9.92it/s] 190it [00:19, 9.92it/s] 191it [00:19, 9.92it/s] 192it [00:19, 9.92it/s] 193it [00:19, 9.94it/s] 194it [00:19, 9.82it/s] 195it [00:19, 9.39it/s] 196it [00:19, 9.50it/s] 196it [00:20, 9.77it/s] +2025-05-26 04:26:37,915 - INFO - Epoch: 99, Objective: tensor([3379.9856], device='cuda:0', grad_fn=), Loss: 0.00989951379597187, KL/n: 58.04240417480469 +2025-05-26 04:26:37,918 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 2it [00:00, 17.04it/s] 5it [00:00, 22.98it/s] 8it [00:00, 24.95it/s] 11it [00:00, 26.32it/s] 14it [00:00, 27.09it/s] 17it [00:00, 27.73it/s] 20it [00:00, 28.09it/s] 23it [00:00, 28.23it/s] 26it [00:00, 28.40it/s] 29it [00:01, 28.62it/s] 32it [00:01, 28.70it/s] 35it [00:01, 28.62it/s] 38it [00:01, 28.86it/s] 41it [00:01, 28.90it/s] 44it [00:01, 28.73it/s] 47it [00:01, 28.80it/s] 50it [00:01, 28.44it/s] 53it [00:01, 28.55it/s] 56it [00:02, 28.61it/s] 59it [00:02, 28.55it/s] 62it [00:02, 28.72it/s] 65it [00:02, 28.70it/s] 68it [00:02, 29.00it/s] 71it [00:02, 28.81it/s] 74it [00:02, 28.56it/s] 77it [00:02, 28.88it/s] 80it [00:02, 28.68it/s] 83it [00:02, 28.70it/s] 86it [00:03, 28.55it/s] 89it [00:03, 28.54it/s] 92it [00:03, 28.61it/s] 95it [00:03, 28.68it/s] 98it [00:03, 28.97it/s] 101it [00:03, 28.99it/s] 104it [00:03, 28.92it/s] 107it [00:03, 28.74it/s] 110it [00:03, 28.83it/s] 113it [00:03, 28.85it/s] 116it [00:04, 28.87it/s] 119it [00:04, 28.95it/s] 122it [00:04, 29.12it/s] 125it [00:04, 29.03it/s] 128it [00:04, 28.99it/s] 131it [00:04, 29.09it/s] 134it [00:04, 28.94it/s] 137it [00:04, 28.93it/s] 140it [00:04, 29.01it/s] 143it [00:05, 28.91it/s] 146it [00:05, 28.84it/s] 149it [00:05, 28.91it/s] 152it [00:05, 29.02it/s] 155it [00:05, 29.02it/s] 158it [00:05, 29.13it/s] 161it [00:05, 29.12it/s] 164it [00:05, 29.15it/s] 167it [00:05, 29.23it/s] 170it [00:05, 29.28it/s] 173it [00:06, 29.45it/s] 176it [00:06, 28.77it/s] 179it [00:06, 28.37it/s] 182it [00:06, 27.07it/s] 185it [00:06, 27.59it/s] 188it [00:06, 28.06it/s] 191it [00:06, 28.49it/s] 194it [00:06, 28.85it/s] 197it [00:06, 28.85it/s] 200it [00:07, 28.84it/s] 203it [00:07, 28.93it/s] 206it [00:07, 29.12it/s] 209it [00:07, 29.22it/s] 212it [00:07, 29.30it/s] 215it [00:07, 29.43it/s] 218it [00:07, 29.25it/s] 221it [00:07, 29.29it/s] 224it [00:07, 29.33it/s] 227it [00:07, 29.13it/s] 230it [00:08, 28.94it/s] 233it [00:08, 28.83it/s] 236it [00:08, 28.82it/s] 239it [00:08, 28.84it/s] 242it [00:08, 28.75it/s] 245it [00:08, 28.74it/s] 248it [00:08, 28.75it/s] 251it [00:08, 28.77it/s] 254it [00:08, 28.68it/s] 257it [00:08, 28.75it/s] 260it [00:09, 28.76it/s] 263it [00:09, 28.80it/s] 266it [00:09, 28.78it/s] 269it [00:09, 28.79it/s] 272it [00:09, 28.79it/s] 275it [00:09, 28.74it/s] 278it [00:09, 28.73it/s] 280it [00:09, 28.42it/s] +2025-05-26 04:26:48,110 - INFO - Epoch: 0, Objective: 0.030164141207933426, Loss: 0.02757582627236843, KL/n: 0.002588314935564995 + 0%| | 0/84 [00:00), Loss: 0.43466299772262573, KL/n: 68.75403594970703 + 0it [00:00, ?it/s]2025-05-26 04:43:18,403 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 28074.5488 | mean log_px -0.3577 | KL -3369.96 + 1it [00:00, 5.62it/s] 2it [00:00, 7.50it/s] 3it [00:00, 8.42it/s] 4it [00:00, 8.93it/s] 5it [00:00, 9.25it/s] 6it [00:00, 9.44it/s] 7it [00:00, 9.57it/s] 8it [00:00, 9.64it/s] 9it [00:00, 9.67it/s] 10it [00:01, 9.71it/s] 11it [00:01, 9.74it/s] 12it [00:01, 9.74it/s] 13it [00:01, 9.77it/s] 14it [00:01, 9.78it/s] 15it [00:01, 9.78it/s] 16it [00:01, 9.76it/s] 17it [00:01, 9.78it/s] 18it [00:01, 9.78it/s] 19it [00:02, 9.79it/s] 20it [00:02, 9.81it/s] 21it [00:02, 9.83it/s] 22it [00:02, 9.81it/s] 23it [00:02, 9.79it/s] 24it [00:02, 9.79it/s] 25it [00:02, 9.80it/s] 26it [00:02, 9.79it/s] 27it [00:02, 9.81it/s] 28it [00:02, 9.81it/s] 29it [00:03, 9.80it/s] 30it [00:03, 9.80it/s] 31it [00:03, 9.78it/s] 32it [00:03, 9.78it/s] 33it [00:03, 9.79it/s] 34it [00:03, 9.82it/s] 35it [00:03, 9.82it/s] 36it [00:03, 9.78it/s] 37it [00:03, 9.76it/s] 38it [00:03, 9.73it/s] 39it [00:04, 9.76it/s] 40it [00:04, 9.77it/s] 41it [00:04, 9.77it/s] 42it [00:04, 9.78it/s] 43it [00:04, 9.76it/s] 44it [00:04, 9.74it/s] 45it [00:04, 9.69it/s] 46it [00:04, 9.66it/s] 47it [00:04, 9.69it/s] 48it [00:04, 9.68it/s] 49it [00:05, 9.06it/s] 50it [00:05, 9.26it/s]2025-05-26 04:43:23,543 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 26761.6230 | mean log_px -0.3389 | KL -3393.95 + 51it [00:05, 9.39it/s] 52it [00:05, 9.49it/s] 53it [00:05, 9.56it/s] 54it [00:05, 9.55it/s] 55it [00:05, 9.59it/s] 56it [00:05, 9.65it/s] 57it [00:05, 9.61it/s] 58it [00:06, 9.62it/s] 59it [00:06, 9.66it/s] 60it [00:06, 9.69it/s] 61it [00:06, 9.73it/s] 62it [00:06, 9.71it/s] 63it [00:06, 9.72it/s] 64it [00:06, 9.75it/s] 65it [00:06, 9.73it/s] 66it [00:06, 9.72it/s] 67it [00:06, 9.74it/s] 68it [00:07, 9.75it/s] 69it [00:07, 9.77it/s] 70it [00:07, 9.76it/s] 71it [00:07, 9.79it/s] 72it [00:07, 9.80it/s] 73it [00:07, 9.81it/s] 74it [00:07, 9.71it/s] 75it [00:07, 9.74it/s] 76it [00:07, 9.74it/s] 77it [00:07, 9.78it/s] 78it [00:08, 9.79it/s] 79it [00:08, 9.81it/s] 80it [00:08, 9.80it/s] 81it [00:08, 9.77it/s] 82it [00:08, 9.78it/s] 83it [00:08, 9.81it/s] 84it [00:08, 9.75it/s] 85it [00:08, 9.76it/s] 86it [00:08, 9.75it/s] 87it [00:09, 9.75it/s] 88it [00:09, 9.72it/s] 89it [00:09, 9.61it/s] 90it [00:09, 9.67it/s] 91it [00:09, 9.72it/s] 92it [00:09, 9.72it/s] 93it [00:09, 9.72it/s] 94it [00:09, 9.74it/s] 95it [00:09, 9.77it/s] 96it [00:09, 9.78it/s] 97it [00:10, 9.78it/s] 98it [00:10, 9.73it/s] 99it [00:10, 9.76it/s] 100it [00:10, 9.75it/s]2025-05-26 04:43:28,676 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 28285.6133 | mean log_px -0.3769 | KL -3410.21 + 101it [00:10, 9.76it/s] 102it [00:10, 9.74it/s] 103it [00:10, 9.76it/s] 104it [00:10, 9.74it/s] 105it [00:10, 9.76it/s] 106it [00:10, 9.77it/s] 107it [00:11, 9.06it/s] 108it [00:11, 9.22it/s] 109it [00:11, 9.38it/s] 110it [00:11, 9.49it/s] 111it [00:11, 9.48it/s] 112it [00:11, 9.58it/s] 113it [00:11, 9.65it/s] 114it [00:11, 9.68it/s] 115it [00:11, 9.72it/s] 116it [00:12, 9.73it/s] 117it [00:12, 9.73it/s] 118it [00:12, 9.75it/s] 119it [00:12, 9.78it/s] 120it [00:12, 9.78it/s] 121it [00:12, 9.79it/s] 122it [00:12, 9.80it/s] 123it [00:12, 9.78it/s] 124it [00:12, 9.78it/s] 125it [00:12, 9.79it/s] 126it [00:13, 9.71it/s] 127it [00:13, 9.72it/s] 128it [00:13, 9.75it/s] 129it [00:13, 9.75it/s] 130it [00:13, 9.78it/s] 131it [00:13, 9.79it/s] 132it [00:13, 9.75it/s] 133it [00:13, 9.75it/s] 134it [00:13, 9.78it/s] 135it [00:13, 9.79it/s] 136it [00:14, 9.72it/s] 137it [00:14, 9.75it/s] 138it [00:14, 9.74it/s] 139it [00:14, 9.73it/s] 140it [00:14, 9.31it/s] 141it [00:14, 9.46it/s] 142it [00:14, 9.55it/s] 143it [00:14, 9.61it/s] 144it [00:14, 9.67it/s] 145it [00:15, 9.73it/s] 146it [00:15, 9.74it/s] 147it [00:15, 9.77it/s] 148it [00:15, 9.79it/s] 149it [00:15, 9.78it/s] 150it [00:15, 9.77it/s]2025-05-26 04:43:33,840 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 24188.4082 | mean log_px -0.3034 | KL -3424.15 + 151it [00:15, 9.77it/s] 152it [00:15, 9.64it/s] 153it [00:15, 9.60it/s] 154it [00:15, 9.59it/s] 155it [00:16, 9.61it/s] 156it [00:16, 9.44it/s] 157it [00:16, 9.47it/s] 158it [00:16, 9.50it/s] 159it [00:16, 9.49it/s] 160it [00:16, 9.49it/s] 161it [00:16, 9.55it/s] 162it [00:16, 9.27it/s] 163it [00:16, 9.41it/s] 164it [00:16, 9.52it/s] 165it [00:17, 9.62it/s] 166it [00:17, 9.64it/s] 167it [00:17, 9.72it/s] 168it [00:17, 9.74it/s] 169it [00:17, 9.73it/s] 170it [00:17, 9.76it/s] 171it [00:17, 9.76it/s] 172it [00:17, 9.79it/s] 173it [00:17, 9.83it/s] 174it [00:18, 9.84it/s] 175it [00:18, 9.81it/s] 176it [00:18, 9.82it/s] 177it [00:18, 9.81it/s] 178it [00:18, 9.83it/s] 179it [00:18, 9.82it/s] 180it [00:18, 9.83it/s] 181it [00:18, 9.82it/s] 182it [00:18, 9.22it/s] 183it [00:18, 9.39it/s] 184it [00:19, 9.52it/s] 185it [00:19, 9.60it/s] 186it [00:19, 9.68it/s] 187it [00:19, 9.71it/s] 188it [00:19, 9.74it/s] 189it [00:19, 9.78it/s] 190it [00:19, 9.80it/s] 191it [00:19, 9.83it/s] 192it [00:19, 9.83it/s] 193it [00:19, 9.85it/s] 194it [00:20, 9.84it/s] 195it [00:20, 9.34it/s] 196it [00:20, 9.63it/s] +2025-05-26 04:43:38,612 - INFO - Epoch: 1, Objective: tensor([25134.6309], device='cuda:0', grad_fn=), Loss: 0.3120049238204956, KL/n: 70.07382202148438 + 0it [00:00, ?it/s]2025-05-26 04:43:38,880 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 26034.8926 | mean log_px -0.3319 | KL -3429.36 + 1it [00:00, 5.34it/s] 2it [00:00, 7.32it/s] 3it [00:00, 8.34it/s] 4it [00:00, 8.90it/s] 5it [00:00, 9.25it/s] 6it [00:00, 9.38it/s] 7it [00:00, 9.54it/s] 8it [00:00, 9.63it/s] 9it [00:00, 9.70it/s] 10it [00:01, 9.71it/s] 11it [00:01, 9.74it/s] 12it [00:01, 9.76it/s] 13it [00:01, 9.80it/s] 14it [00:01, 9.78it/s] 15it [00:01, 9.81it/s] 16it [00:01, 9.79it/s] 17it [00:01, 9.82it/s] 18it [00:01, 9.80it/s] 19it [00:02, 9.72it/s] 20it [00:02, 9.77it/s] 21it [00:02, 9.56it/s] 22it [00:02, 9.61it/s] 23it [00:02, 9.68it/s] 24it [00:02, 9.56it/s] 25it [00:02, 9.48it/s] 26it [00:02, 9.33it/s] 27it [00:02, 9.43it/s] 28it [00:02, 9.49it/s] 29it [00:03, 9.53it/s] 30it [00:03, 9.56it/s] 31it [00:03, 9.59it/s] 32it [00:03, 9.60it/s] 33it [00:03, 9.64it/s] 34it [00:03, 9.64it/s] 35it [00:03, 9.65it/s] 36it [00:03, 9.61it/s] 37it [00:03, 9.68it/s] 38it [00:04, 9.72it/s] 39it [00:04, 9.68it/s] 40it [00:04, 9.70it/s] 41it [00:04, 9.75it/s] 42it [00:04, 9.77it/s] 43it [00:04, 9.80it/s] 44it [00:04, 9.81it/s] 45it [00:04, 9.83it/s] 46it [00:04, 9.82it/s] 47it [00:04, 9.82it/s] 48it [00:05, 9.82it/s] 49it [00:05, 9.83it/s] 50it [00:05, 9.83it/s]2025-05-26 04:43:44,022 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 24607.2324 | mean log_px -0.3063 | KL -3444.27 + 51it [00:05, 9.83it/s] 52it [00:05, 9.84it/s] 53it [00:05, 9.85it/s] 54it [00:05, 9.84it/s] 55it [00:05, 9.85it/s] 56it [00:05, 9.85it/s] 57it [00:05, 9.84it/s] 58it [00:06, 9.81it/s] 59it [00:06, 9.83it/s] 60it [00:06, 9.82it/s] 61it [00:06, 9.83it/s] 62it [00:06, 9.84it/s] 63it [00:06, 9.85it/s] 64it [00:06, 9.83it/s] 65it [00:06, 9.83it/s] 66it [00:06, 9.86it/s] 67it [00:06, 9.72it/s] 68it [00:07, 9.60it/s] 69it [00:07, 9.62it/s] 70it [00:07, 9.68it/s] 71it [00:07, 9.76it/s] 72it [00:07, 9.76it/s] 73it [00:07, 9.79it/s] 74it [00:07, 9.80it/s] 75it [00:07, 9.79it/s] 76it [00:07, 9.79it/s] 77it [00:07, 9.81it/s] 78it [00:08, 9.76it/s] 79it [00:08, 9.77it/s] 80it [00:08, 9.78it/s] 81it [00:08, 9.78it/s] 82it [00:08, 6.15it/s] 83it [00:08, 6.92it/s] 84it [00:08, 7.58it/s] 85it [00:09, 8.13it/s] 86it [00:09, 8.56it/s] 87it [00:09, 8.89it/s] 88it [00:09, 9.13it/s] 89it [00:09, 9.34it/s] 90it [00:09, 9.49it/s] 91it [00:09, 9.55it/s] 92it [00:09, 9.62it/s] 93it [00:09, 9.69it/s] 94it [00:09, 9.72it/s] 95it [00:10, 9.73it/s] 96it [00:10, 9.69it/s] 97it [00:10, 9.72it/s] 98it [00:10, 9.55it/s] 99it [00:10, 9.65it/s] 100it [00:10, 9.65it/s]2025-05-26 04:43:49,341 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 20464.7461 | mean log_px -0.2492 | KL -3452.10 + 101it [00:10, 9.72it/s] 102it [00:10, 9.72it/s] 103it [00:10, 9.74it/s] 104it [00:10, 9.76it/s] 105it [00:11, 9.80it/s] 106it [00:11, 9.79it/s] 107it [00:11, 9.81it/s] 108it [00:11, 9.83it/s] 109it [00:11, 9.84it/s] 110it [00:11, 9.84it/s] 111it [00:11, 9.87it/s] 112it [00:11, 9.84it/s] 113it [00:11, 9.85it/s] 114it [00:11, 9.82it/s] 115it [00:12, 9.81it/s] 116it [00:12, 9.76it/s] 117it [00:12, 9.78it/s] 118it [00:12, 9.79it/s] 119it [00:12, 9.77it/s] 120it [00:12, 9.79it/s] 121it [00:12, 9.81it/s] 122it [00:12, 9.81it/s] 123it [00:12, 9.80it/s] 124it [00:12, 9.82it/s] 125it [00:13, 9.84it/s] 126it [00:13, 9.83it/s] 127it [00:13, 9.86it/s] 128it [00:13, 9.84it/s] 129it [00:13, 9.85it/s] 130it [00:13, 9.84it/s] 131it [00:13, 9.84it/s] 132it [00:13, 9.83it/s] 133it [00:13, 9.83it/s] 134it [00:14, 9.84it/s] 135it [00:14, 9.84it/s] 136it [00:14, 9.83it/s] 137it [00:14, 9.83it/s] 138it [00:14, 9.85it/s] 139it [00:14, 9.84it/s] 140it [00:14, 9.82it/s] 141it [00:14, 9.82it/s] 142it [00:14, 9.82it/s] 143it [00:14, 9.83it/s] 144it [00:15, 9.81it/s] 145it [00:15, 9.82it/s] 146it [00:15, 9.81it/s] 147it [00:15, 9.83it/s] 148it [00:15, 9.82it/s] 149it [00:15, 9.81it/s] 150it [00:15, 9.81it/s]2025-05-26 04:43:54,432 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 18063.8633 | mean log_px -0.2179 | KL -3453.99 + 151it [00:15, 9.81it/s] 152it [00:15, 9.64it/s] 153it [00:15, 9.66it/s] 154it [00:16, 9.56it/s] 155it [00:16, 9.65it/s] 156it [00:16, 9.70it/s] 157it [00:16, 9.74it/s] 158it [00:16, 9.76it/s] 159it [00:16, 9.79it/s] 160it [00:16, 9.81it/s] 161it [00:16, 9.81it/s] 162it [00:16, 9.81it/s] 163it [00:16, 9.82it/s] 164it [00:17, 9.82it/s] 165it [00:17, 9.84it/s] 166it [00:17, 9.82it/s] 167it [00:17, 9.80it/s] 168it [00:17, 9.79it/s] 169it [00:17, 9.83it/s] 170it [00:17, 9.82it/s] 171it [00:17, 9.81it/s] 172it [00:17, 9.79it/s] 173it [00:17, 9.84it/s] 174it [00:18, 9.81it/s] 175it [00:18, 9.84it/s] 176it [00:18, 9.62it/s] 177it [00:18, 9.59it/s] 178it [00:18, 9.55it/s] 179it [00:18, 9.66it/s] 180it [00:18, 9.71it/s] 181it [00:18, 9.73it/s] 182it [00:18, 9.63it/s] 183it [00:19, 9.68it/s] 184it [00:19, 9.69it/s] 185it [00:19, 9.76it/s] 186it [00:19, 9.58it/s] 187it [00:19, 9.68it/s] 188it [00:19, 9.75it/s] 189it [00:19, 9.80it/s] 190it [00:19, 9.79it/s] 191it [00:19, 9.83it/s] 192it [00:19, 9.82it/s] 193it [00:20, 9.84it/s] 194it [00:20, 9.80it/s] 195it [00:20, 9.28it/s] 196it [00:20, 9.59it/s] +2025-05-26 04:43:59,169 - INFO - Epoch: 2, Objective: tensor([23773.6406], device='cuda:0', grad_fn=), Loss: 0.30370157957077026, KL/n: 70.60922241210938 + 0it [00:00, ?it/s]2025-05-26 04:43:59,435 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 22127.6270 | mean log_px -0.2715 | KL -3458.96 + 1it [00:00, 4.78it/s] 2it [00:00, 6.83it/s] 3it [00:00, 7.96it/s] 4it [00:00, 8.58it/s] 5it [00:00, 8.96it/s] 6it [00:00, 9.23it/s] 7it [00:00, 9.42it/s] 8it [00:00, 9.54it/s] 9it [00:01, 9.62it/s] 10it [00:01, 9.05it/s] 11it [00:01, 9.27it/s] 12it [00:01, 9.37it/s] 13it [00:01, 9.48it/s] 14it [00:01, 9.56it/s] 15it [00:01, 9.63it/s] 16it [00:01, 9.70it/s] 17it [00:01, 9.75it/s] 18it [00:01, 9.77it/s] 19it [00:02, 9.68it/s] 20it [00:02, 9.73it/s] 21it [00:02, 9.75it/s] 22it [00:02, 9.74it/s] 23it [00:02, 9.46it/s] 24it [00:02, 9.15it/s] 25it [00:02, 9.36it/s] 26it [00:02, 9.49it/s] 27it [00:02, 9.61it/s] 28it [00:03, 9.65it/s] 29it [00:03, 9.69it/s] 30it [00:03, 9.71it/s] 31it [00:03, 9.77it/s] 32it [00:03, 9.76it/s] 33it [00:03, 9.79it/s] 34it [00:03, 9.76it/s] 35it [00:03, 9.76it/s] 36it [00:03, 9.75it/s] 37it [00:03, 9.79it/s] 38it [00:04, 9.80it/s] 39it [00:04, 9.79it/s] 40it [00:04, 9.80it/s] 41it [00:04, 9.80it/s] 42it [00:04, 9.78it/s] 43it [00:04, 9.79it/s] 44it [00:04, 9.81it/s] 45it [00:04, 9.80it/s] 46it [00:04, 9.80it/s] 47it [00:04, 9.81it/s] 48it [00:05, 9.83it/s] 49it [00:05, 9.81it/s] 50it [00:05, 9.81it/s]2025-05-26 04:44:04,618 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 18690.7363 | mean log_px -0.2205 | KL -3462.40 + 51it [00:05, 9.18it/s] 52it [00:05, 9.33it/s] 53it [00:05, 9.45it/s] 54it [00:05, 9.53it/s] 55it [00:05, 9.60it/s] 56it [00:05, 9.62it/s] 57it [00:06, 9.68it/s] 58it [00:06, 9.73it/s] 59it [00:06, 9.76it/s] 60it [00:06, 9.72it/s] 61it [00:06, 9.13it/s] 62it [00:06, 9.31it/s] 63it [00:06, 9.47it/s] 64it [00:06, 9.53it/s] 65it [00:06, 9.59it/s] 66it [00:06, 9.64it/s] 67it [00:07, 9.70it/s] 68it [00:07, 9.68it/s] 69it [00:07, 9.73it/s] 70it [00:07, 9.75it/s] 71it [00:07, 9.75it/s] 72it [00:07, 9.77it/s] 73it [00:07, 9.78it/s] 74it [00:07, 9.80it/s] 75it [00:07, 9.81it/s] 76it [00:07, 9.79it/s] 77it [00:08, 9.79it/s] 78it [00:08, 9.14it/s] 79it [00:08, 9.34it/s] 80it [00:08, 9.47it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.60it/s] 83it [00:08, 9.65it/s] 84it [00:08, 9.68it/s] 85it [00:08, 9.76it/s] 86it [00:09, 9.75it/s] 87it [00:09, 9.18it/s] 88it [00:09, 9.16it/s] 89it [00:09, 9.31it/s] 90it [00:09, 9.45it/s] 91it [00:09, 9.55it/s] 92it [00:09, 9.62it/s] 93it [00:09, 9.68it/s] 94it [00:09, 9.72it/s] 95it [00:09, 9.73it/s] 96it [00:10, 9.75it/s] 97it [00:10, 9.76it/s] 98it [00:10, 9.79it/s] 99it [00:10, 9.77it/s] 100it [00:10, 9.76it/s]2025-05-26 04:44:09,832 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 22098.5781 | mean log_px -0.2703 | KL -3471.58 + 101it [00:10, 9.79it/s] 102it [00:10, 9.81it/s] 103it [00:10, 9.79it/s] 104it [00:10, 9.16it/s] 105it [00:11, 9.36it/s] 106it [00:11, 9.42it/s] 107it [00:11, 9.56it/s] 108it [00:11, 9.61it/s] 109it [00:11, 9.69it/s] 110it [00:11, 9.75it/s] 111it [00:11, 9.78it/s] 112it [00:11, 9.78it/s] 113it [00:11, 9.78it/s] 114it [00:11, 9.78it/s] 115it [00:12, 9.79it/s] 116it [00:12, 9.78it/s] 117it [00:12, 9.14it/s] 118it [00:12, 9.33it/s] 119it [00:12, 9.45it/s] 120it [00:12, 9.57it/s] 121it [00:12, 9.46it/s] 122it [00:12, 9.08it/s] 123it [00:12, 9.30it/s] 124it [00:12, 9.46it/s] 125it [00:13, 9.58it/s] 126it [00:13, 9.62it/s] 127it [00:13, 9.54it/s] 128it [00:13, 9.41it/s] 129it [00:13, 9.40it/s] 130it [00:13, 9.49it/s] 131it [00:13, 9.54it/s] 132it [00:13, 9.61it/s] 133it [00:13, 9.66it/s] 134it [00:14, 9.69it/s] 135it [00:14, 9.72it/s] 136it [00:14, 9.74it/s] 137it [00:14, 9.80it/s] 138it [00:14, 9.79it/s] 139it [00:14, 9.71it/s] 140it [00:14, 9.51it/s] 141it [00:14, 9.59it/s] 142it [00:14, 9.64it/s] 143it [00:14, 9.56it/s] 144it [00:15, 9.58it/s] 145it [00:15, 9.66it/s] 146it [00:15, 9.70it/s] 147it [00:15, 9.73it/s] 148it [00:15, 9.77it/s] 149it [00:15, 9.77it/s] 150it [00:15, 9.63it/s]2025-05-26 04:44:15,048 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 23228.7480 | mean log_px -0.2856 | KL -3470.63 + 151it [00:15, 9.68it/s] 152it [00:15, 9.71it/s] 153it [00:15, 9.74it/s] 154it [00:16, 9.75it/s] 155it [00:16, 9.76it/s] 156it [00:16, 9.79it/s] 157it [00:16, 9.78it/s] 158it [00:16, 9.54it/s] 159it [00:16, 9.60it/s] 160it [00:16, 9.66it/s] 161it [00:16, 9.72it/s] 162it [00:16, 9.75it/s] 163it [00:17, 9.75it/s] 164it [00:17, 9.75it/s] 165it [00:17, 9.78it/s] 166it [00:17, 9.79it/s] 167it [00:17, 9.82it/s] 168it [00:17, 9.77it/s] 169it [00:17, 9.79it/s] 170it [00:17, 9.80it/s] 171it [00:17, 9.81it/s] 172it [00:17, 9.81it/s] 173it [00:18, 9.82it/s] 174it [00:18, 9.81it/s] 175it [00:18, 9.83it/s] 176it [00:18, 9.81it/s] 177it [00:18, 9.82it/s] 178it [00:18, 9.84it/s] 179it [00:18, 9.79it/s] 180it [00:18, 9.79it/s] 181it [00:18, 9.82it/s] 182it [00:18, 9.80it/s] 183it [00:19, 9.81it/s] 184it [00:19, 9.82it/s] 185it [00:19, 9.79it/s] 186it [00:19, 9.78it/s] 187it [00:19, 9.79it/s] 188it [00:19, 9.79it/s] 189it [00:19, 9.79it/s] 190it [00:19, 9.79it/s] 191it [00:19, 9.83it/s] 192it [00:19, 9.83it/s] 193it [00:20, 9.81it/s] 194it [00:20, 9.81it/s] 195it [00:20, 9.28it/s] 196it [00:20, 8.82it/s] 196it [00:20, 9.56it/s] +2025-05-26 04:44:19,789 - INFO - Epoch: 3, Objective: tensor([23300.8750], device='cuda:0', grad_fn=), Loss: 0.2900332510471344, KL/n: 70.9906005859375 + 0it [00:00, ?it/s]2025-05-26 04:44:20,248 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 12282.2793 | mean log_px -0.1411 | KL -3474.90 + 1it [00:00, 5.30it/s] 2it [00:00, 7.24it/s] 3it [00:00, 8.24it/s] 4it [00:00, 8.83it/s] 5it [00:00, 9.15it/s] 6it [00:00, 8.83it/s] 7it [00:00, 9.08it/s] 8it [00:00, 9.29it/s] 9it [00:01, 9.47it/s] 10it [00:01, 9.60it/s] 11it [00:01, 9.68it/s] 12it [00:01, 9.72it/s] 13it [00:01, 9.75it/s] 14it [00:01, 9.27it/s] 15it [00:01, 9.43it/s] 16it [00:01, 9.50it/s] 17it [00:01, 9.02it/s] 18it [00:01, 9.24it/s] 19it [00:02, 9.43it/s] 20it [00:02, 9.55it/s] 21it [00:02, 9.65it/s] 22it [00:02, 9.23it/s] 23it [00:02, 9.40it/s] 24it [00:02, 9.51it/s] 25it [00:02, 9.62it/s] 26it [00:02, 9.68it/s] 27it [00:02, 9.72it/s] 28it [00:03, 9.75it/s] 29it [00:03, 9.79it/s] 30it [00:03, 9.79it/s] 31it [00:03, 9.77it/s] 32it [00:03, 9.81it/s] 33it [00:03, 9.82it/s] 34it [00:03, 9.81it/s] 35it [00:03, 9.80it/s] 36it [00:03, 9.19it/s] 37it [00:03, 9.38it/s] 38it [00:04, 9.49it/s] 39it [00:04, 9.58it/s] 40it [00:04, 9.17it/s] 41it [00:04, 9.39it/s] 42it [00:04, 9.51it/s] 43it [00:04, 9.16it/s] 44it [00:04, 9.36it/s] 45it [00:04, 9.49it/s] 46it [00:04, 9.56it/s] 47it [00:05, 9.61it/s] 48it [00:05, 9.17it/s] 49it [00:05, 9.34it/s] 50it [00:05, 9.44it/s]2025-05-26 04:44:25,499 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 23196.6523 | mean log_px -0.2816 | KL -3483.42 + 51it [00:05, 9.55it/s] 52it [00:05, 9.65it/s] 53it [00:05, 9.11it/s] 54it [00:05, 9.29it/s] 55it [00:05, 9.46it/s] 56it [00:05, 9.56it/s] 57it [00:06, 9.65it/s] 58it [00:06, 9.69it/s] 59it [00:06, 9.75it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.47it/s] 62it [00:06, 9.56it/s] 63it [00:06, 9.59it/s] 64it [00:06, 9.65it/s] 65it [00:06, 9.71it/s] 66it [00:07, 9.72it/s] 67it [00:07, 9.78it/s] 68it [00:07, 9.77it/s] 69it [00:07, 9.17it/s] 70it [00:07, 9.35it/s] 71it [00:07, 9.49it/s] 72it [00:07, 9.59it/s] 73it [00:07, 9.67it/s] 74it [00:07, 9.10it/s] 75it [00:07, 9.32it/s] 76it [00:08, 9.45it/s] 77it [00:08, 9.58it/s] 78it [00:08, 9.60it/s] 79it [00:08, 9.70it/s] 80it [00:08, 9.74it/s] 81it [00:08, 9.77it/s] 82it [00:08, 9.71it/s] 83it [00:08, 9.26it/s] 84it [00:08, 9.43it/s] 85it [00:09, 9.55it/s] 86it [00:09, 9.17it/s] 87it [00:09, 9.36it/s] 88it [00:09, 9.49it/s] 89it [00:09, 9.60it/s] 90it [00:09, 9.67it/s] 91it [00:09, 9.70it/s] 92it [00:09, 9.13it/s] 93it [00:09, 9.29it/s] 94it [00:09, 9.43it/s] 95it [00:10, 9.52it/s] 96it [00:10, 9.08it/s] 97it [00:10, 9.29it/s] 98it [00:10, 9.42it/s] 99it [00:10, 9.54it/s] 100it [00:10, 9.23it/s]2025-05-26 04:44:30,778 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 22043.1543 | mean log_px -0.2736 | KL -3483.78 + 101it [00:10, 9.25it/s] 102it [00:10, 8.94it/s] 103it [00:10, 9.18it/s] 104it [00:11, 9.33it/s] 105it [00:11, 9.47it/s] 106it [00:11, 9.55it/s] 107it [00:11, 8.87it/s] 108it [00:11, 9.13it/s] 109it [00:11, 9.30it/s] 110it [00:11, 9.40it/s] 111it [00:11, 8.94it/s] 112it [00:11, 9.17it/s] 113it [00:12, 9.33it/s] 114it [00:12, 9.47it/s] 115it [00:12, 9.35it/s] 116it [00:12, 9.11it/s] 117it [00:12, 9.24it/s] 118it [00:12, 9.41it/s] 119it [00:12, 9.53it/s] 120it [00:12, 9.62it/s] 121it [00:12, 9.66it/s] 122it [00:12, 9.69it/s] 123it [00:13, 9.74it/s] 124it [00:13, 9.77it/s] 125it [00:13, 9.76it/s] 126it [00:13, 9.70it/s] 127it [00:13, 9.75it/s] 128it [00:13, 9.74it/s] 129it [00:13, 9.77it/s] 130it [00:13, 9.29it/s] 131it [00:13, 9.45it/s] 132it [00:14, 9.56it/s] 133it [00:14, 9.64it/s] 134it [00:14, 9.67it/s] 135it [00:14, 9.71it/s] 136it [00:14, 9.27it/s] 137it [00:14, 9.39it/s] 138it [00:14, 9.48it/s] 139it [00:14, 9.01it/s] 140it [00:14, 9.23it/s] 141it [00:14, 9.40it/s] 142it [00:15, 9.50it/s] 143it [00:15, 9.13it/s] 144it [00:15, 9.35it/s] 145it [00:15, 9.49it/s] 146it [00:15, 9.59it/s] 147it [00:15, 9.66it/s] 148it [00:15, 9.11it/s] 149it [00:15, 9.30it/s] 150it [00:15, 9.43it/s]2025-05-26 04:44:36,081 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 22188.4727 | mean log_px -0.2672 | KL -3485.55 + 151it [00:16, 9.45it/s] 152it [00:16, 9.08it/s] 153it [00:16, 9.30it/s] 154it [00:16, 9.45it/s] 155it [00:16, 9.56it/s] 156it [00:16, 9.64it/s] 157it [00:16, 9.68it/s] 158it [00:16, 9.70it/s] 159it [00:16, 9.72it/s] 160it [00:16, 9.71it/s] 161it [00:17, 9.25it/s] 162it [00:17, 9.40it/s] 163it [00:17, 9.53it/s] 164it [00:17, 9.58it/s] 165it [00:17, 9.63it/s] 166it [00:17, 9.69it/s] 167it [00:17, 9.12it/s] 168it [00:17, 9.33it/s] 169it [00:17, 9.48it/s] 170it [00:18, 9.56it/s] 171it [00:18, 9.64it/s] 172it [00:18, 9.68it/s] 173it [00:18, 9.73it/s] 174it [00:18, 9.13it/s] 175it [00:18, 9.31it/s] 176it [00:18, 9.43it/s] 177it [00:18, 9.53it/s] 178it [00:18, 9.13it/s] 179it [00:18, 9.33it/s] 180it [00:19, 9.46it/s] 181it [00:19, 9.57it/s] 182it [00:19, 9.65it/s] 183it [00:19, 9.23it/s] 184it [00:19, 9.39it/s] 185it [00:19, 9.49it/s] 186it [00:19, 9.56it/s] 187it [00:19, 9.17it/s] 188it [00:19, 9.37it/s] 189it [00:20, 9.52it/s] 190it [00:20, 9.58it/s] 191it [00:20, 9.63it/s] 192it [00:20, 9.67it/s] 193it [00:20, 9.73it/s] 194it [00:20, 9.27it/s] 195it [00:20, 8.87it/s] 196it [00:20, 9.40it/s] +2025-05-26 04:44:40,956 - INFO - Epoch: 4, Objective: tensor([19702.6348], device='cuda:0', grad_fn=), Loss: 0.23782320320606232, KL/n: 71.2601089477539 + 0it [00:00, ?it/s]2025-05-26 04:44:41,225 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 16530.5488 | mean log_px -0.1878 | KL -3492.38 + 1it [00:00, 5.53it/s] 2it [00:00, 7.37it/s] 3it [00:00, 8.35it/s] 4it [00:00, 8.81it/s] 5it [00:00, 9.14it/s] 6it [00:00, 9.32it/s] 8it [00:00, 9.61it/s] 9it [00:00, 9.66it/s] 10it [00:01, 9.72it/s] 11it [00:01, 9.74it/s] 12it [00:01, 9.75it/s] 13it [00:01, 9.80it/s] 14it [00:01, 9.77it/s] 15it [00:01, 9.77it/s] 16it [00:01, 9.38it/s] 17it [00:01, 9.51it/s] 18it [00:01, 9.60it/s] 19it [00:02, 9.68it/s] 20it [00:02, 9.73it/s] 21it [00:02, 9.75it/s] 22it [00:02, 9.76it/s] 23it [00:02, 9.20it/s] 24it [00:02, 9.38it/s] 25it [00:02, 9.53it/s] 26it [00:02, 9.57it/s] 27it [00:02, 8.96it/s] 28it [00:03, 8.99it/s] 29it [00:03, 9.18it/s] 30it [00:03, 9.39it/s] 31it [00:03, 9.54it/s] 32it [00:03, 9.59it/s] 33it [00:03, 9.65it/s] 34it [00:03, 9.70it/s] 35it [00:03, 9.72it/s] 36it [00:03, 9.73it/s] 37it [00:03, 9.74it/s] 38it [00:04, 9.72it/s] 39it [00:04, 9.75it/s] 40it [00:04, 9.77it/s] 41it [00:04, 9.80it/s] 42it [00:04, 9.69it/s] 43it [00:04, 9.71it/s] 44it [00:04, 9.74it/s] 45it [00:04, 9.77it/s] 46it [00:04, 9.75it/s] 47it [00:04, 9.78it/s] 48it [00:05, 9.78it/s] 49it [00:05, 9.82it/s] 50it [00:05, 9.80it/s]2025-05-26 04:44:46,403 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 17774.5938 | mean log_px -0.2058 | KL -3492.53 + 51it [00:05, 9.79it/s] 52it [00:05, 9.80it/s] 53it [00:05, 9.81it/s] 54it [00:05, 9.77it/s] 55it [00:05, 9.79it/s] 56it [00:05, 9.77it/s] 57it [00:05, 9.78it/s] 58it [00:06, 9.78it/s] 59it [00:06, 9.77it/s] 60it [00:06, 9.80it/s] 61it [00:06, 9.81it/s] 62it [00:06, 9.80it/s] 63it [00:06, 9.83it/s] 64it [00:06, 9.18it/s] 65it [00:06, 9.35it/s] 66it [00:06, 9.46it/s] 67it [00:07, 9.57it/s] 68it [00:07, 9.65it/s] 69it [00:07, 9.73it/s] 70it [00:07, 9.70it/s] 71it [00:07, 9.74it/s] 72it [00:07, 9.77it/s] 73it [00:07, 9.81it/s] 74it [00:07, 9.31it/s] 75it [00:07, 9.46it/s] 76it [00:07, 9.57it/s] 77it [00:08, 9.64it/s] 78it [00:08, 9.69it/s] 79it [00:08, 9.72it/s] 80it [00:08, 9.76it/s] 81it [00:08, 9.73it/s] 82it [00:08, 9.76it/s] 83it [00:08, 9.18it/s] 84it [00:08, 9.12it/s] 85it [00:08, 9.01it/s] 86it [00:09, 9.16it/s] 87it [00:09, 9.34it/s] 88it [00:09, 9.46it/s] 89it [00:09, 9.59it/s] 90it [00:09, 9.67it/s] 91it [00:09, 9.68it/s] 92it [00:09, 9.70it/s] 93it [00:09, 9.74it/s] 94it [00:09, 9.74it/s] 95it [00:09, 9.76it/s] 96it [00:10, 9.72it/s] 97it [00:10, 9.69it/s] 98it [00:10, 9.07it/s] 99it [00:10, 8.74it/s] 100it [00:10, 8.86it/s]2025-05-26 04:44:51,651 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 13819.5430 | mean log_px -0.1567 | KL -3497.92 + 101it [00:10, 8.56it/s] 102it [00:10, 8.91it/s] 103it [00:10, 9.16it/s] 104it [00:10, 9.33it/s] 105it [00:11, 9.47it/s] 106it [00:11, 9.57it/s] 107it [00:11, 9.63it/s] 108it [00:11, 9.67it/s] 109it [00:11, 9.73it/s] 110it [00:11, 9.75it/s] 111it [00:11, 9.74it/s] 112it [00:11, 9.70it/s] 113it [00:11, 9.72it/s] 114it [00:11, 9.26it/s] 115it [00:12, 9.42it/s] 116it [00:12, 9.48it/s] 117it [00:12, 9.59it/s] 118it [00:12, 9.03it/s] 119it [00:12, 9.25it/s] 120it [00:12, 9.39it/s] 121it [00:12, 9.48it/s] 122it [00:12, 9.54it/s] 123it [00:12, 9.61it/s] 124it [00:13, 9.66it/s] 125it [00:13, 9.61it/s] 126it [00:13, 9.54it/s] 127it [00:13, 9.59it/s] 128it [00:13, 9.67it/s] 129it [00:13, 9.70it/s] 130it [00:13, 9.64it/s] 131it [00:13, 9.67it/s] 132it [00:13, 9.61it/s] 133it [00:13, 9.61it/s] 134it [00:14, 9.64it/s] 135it [00:14, 9.64it/s] 136it [00:14, 9.66it/s] 137it [00:14, 9.73it/s] 138it [00:14, 9.32it/s] 139it [00:14, 9.36it/s] 140it [00:14, 8.90it/s] 141it [00:14, 9.09it/s] 142it [00:14, 9.18it/s] 143it [00:15, 9.27it/s] 144it [00:15, 9.32it/s] 145it [00:15, 9.38it/s] 146it [00:15, 8.89it/s] 147it [00:15, 9.08it/s] 148it [00:15, 9.19it/s] 149it [00:15, 8.87it/s] 150it [00:15, 9.06it/s]2025-05-26 04:44:56,960 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 18954.9707 | mean log_px -0.2272 | KL -3503.50 + 151it [00:15, 9.17it/s] 152it [00:16, 8.78it/s] 153it [00:16, 8.92it/s] 154it [00:16, 9.08it/s] 155it [00:16, 9.13it/s] 156it [00:16, 9.24it/s] 157it [00:16, 9.31it/s] 158it [00:16, 9.39it/s] 159it [00:16, 9.46it/s] 160it [00:16, 9.49it/s] 161it [00:16, 9.39it/s] 162it [00:17, 9.43it/s] 163it [00:17, 9.48it/s] 164it [00:17, 9.45it/s] 165it [00:17, 9.47it/s] 166it [00:17, 8.95it/s] 167it [00:17, 9.06it/s] 168it [00:17, 9.12it/s] 169it [00:17, 9.33it/s] 170it [00:17, 8.90it/s] 171it [00:18, 9.17it/s] 172it [00:18, 9.36it/s] 173it [00:18, 9.51it/s] 174it [00:18, 9.61it/s] 175it [00:18, 9.07it/s] 176it [00:18, 9.31it/s] 177it [00:18, 9.48it/s] 178it [00:18, 9.61it/s] 179it [00:18, 9.72it/s] 180it [00:19, 9.78it/s] 181it [00:19, 9.83it/s] 182it [00:19, 9.84it/s] 183it [00:19, 9.25it/s] 184it [00:19, 9.42it/s] 185it [00:19, 9.58it/s] 186it [00:19, 9.66it/s] 187it [00:19, 9.70it/s] 188it [00:19, 9.75it/s] 189it [00:19, 9.32it/s] 190it [00:20, 9.47it/s] 191it [00:20, 9.59it/s] 192it [00:20, 9.62it/s] 193it [00:20, 9.61it/s] 194it [00:20, 9.39it/s] 195it [00:20, 8.92it/s] 196it [00:20, 9.43it/s] +2025-05-26 04:45:01,861 - INFO - Epoch: 5, Objective: tensor([12165.8643], device='cuda:0', grad_fn=), Loss: 0.1356792002916336, KL/n: 71.50433349609375 + 0it [00:00, ?it/s]2025-05-26 04:45:02,306 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 17046.0859 | mean log_px -0.1989 | KL -3502.32 + 1it [00:00, 4.72it/s] 2it [00:00, 6.75it/s] 3it [00:00, 7.66it/s] 4it [00:00, 8.10it/s] 5it [00:00, 8.57it/s] 6it [00:00, 8.90it/s] 7it [00:00, 8.61it/s] 8it [00:00, 8.97it/s] 9it [00:01, 9.26it/s] 10it [00:01, 9.45it/s] 11it [00:01, 9.01it/s] 12it [00:01, 9.26it/s] 13it [00:01, 9.41it/s] 14it [00:01, 8.96it/s] 16it [00:01, 9.40it/s] 17it [00:01, 9.54it/s] 18it [00:02, 9.62it/s] 19it [00:02, 9.68it/s] 20it [00:02, 9.63it/s] 21it [00:02, 9.69it/s] 22it [00:02, 9.74it/s] 23it [00:02, 9.79it/s] 24it [00:02, 9.80it/s] 25it [00:02, 9.79it/s] 26it [00:02, 9.33it/s] 27it [00:02, 9.48it/s] 28it [00:03, 9.55it/s] 29it [00:03, 9.57it/s] 30it [00:03, 9.67it/s] 31it [00:03, 9.75it/s] 32it [00:03, 9.67it/s] 33it [00:03, 9.49it/s] 34it [00:03, 9.53it/s] 35it [00:03, 9.65it/s] 36it [00:03, 9.08it/s] 37it [00:04, 9.32it/s] 38it [00:04, 8.91it/s] 39it [00:04, 9.18it/s] 40it [00:04, 9.33it/s] 41it [00:04, 9.49it/s] 42it [00:04, 9.11it/s] 43it [00:04, 9.30it/s] 44it [00:04, 9.45it/s] 45it [00:04, 9.54it/s] 46it [00:04, 9.61it/s] 47it [00:05, 9.69it/s] 48it [00:05, 9.73it/s] 49it [00:05, 9.79it/s] 50it [00:05, 9.83it/s]2025-05-26 04:45:07,600 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 15465.3457 | mean log_px -0.1867 | KL -3503.66 + 51it [00:05, 9.84it/s] 52it [00:05, 9.33it/s] 53it [00:05, 9.51it/s] 54it [00:05, 9.61it/s] 55it [00:05, 9.71it/s] 56it [00:06, 9.75it/s] 57it [00:06, 9.80it/s] 58it [00:06, 9.82it/s] 59it [00:06, 9.81it/s] 60it [00:06, 9.81it/s] 61it [00:06, 9.84it/s] 62it [00:06, 9.56it/s] 63it [00:06, 9.19it/s] 64it [00:06, 9.36it/s] 65it [00:06, 9.51it/s] 66it [00:07, 9.58it/s] 67it [00:07, 9.67it/s] 68it [00:07, 9.69it/s] 69it [00:07, 9.74it/s] 70it [00:07, 9.74it/s] 71it [00:07, 8.90it/s] 72it [00:07, 9.13it/s] 73it [00:07, 9.35it/s] 74it [00:07, 9.49it/s] 75it [00:07, 9.61it/s] 76it [00:08, 9.63it/s] 77it [00:08, 9.70it/s] 78it [00:08, 9.74it/s] 79it [00:08, 9.80it/s] 80it [00:08, 9.82it/s] 81it [00:08, 9.85it/s] 82it [00:08, 9.85it/s] 83it [00:08, 9.86it/s] 84it [00:08, 9.83it/s] 85it [00:09, 9.85it/s] 86it [00:09, 9.85it/s] 87it [00:09, 9.84it/s] 88it [00:09, 9.83it/s] 89it [00:09, 9.84it/s] 90it [00:09, 9.81it/s] 91it [00:09, 9.34it/s] 92it [00:09, 9.49it/s] 93it [00:09, 9.53it/s] 94it [00:09, 9.02it/s] 95it [00:10, 9.27it/s] 96it [00:10, 9.40it/s] 97it [00:10, 9.54it/s] 98it [00:10, 9.62it/s] 99it [00:10, 9.17it/s] 100it [00:10, 9.34it/s]2025-05-26 04:45:12,823 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 16232.7539 | mean log_px -0.1872 | KL -3505.36 + 101it [00:10, 9.49it/s] 102it [00:10, 9.57it/s] 103it [00:10, 9.65it/s] 104it [00:11, 9.71it/s] 105it [00:11, 9.76it/s] 106it [00:11, 9.79it/s] 107it [00:11, 9.83it/s] 108it [00:11, 9.86it/s] 109it [00:11, 9.88it/s] 110it [00:11, 9.89it/s] 111it [00:11, 9.90it/s] 112it [00:11, 9.89it/s] 113it [00:11, 9.87it/s] 114it [00:12, 9.83it/s] 115it [00:12, 9.87it/s] 116it [00:12, 9.79it/s] 117it [00:12, 9.74it/s] 118it [00:12, 9.70it/s] 119it [00:12, 9.71it/s] 120it [00:12, 9.68it/s] 121it [00:12, 9.68it/s] 122it [00:12, 9.69it/s] 123it [00:12, 9.20it/s] 124it [00:13, 9.27it/s] 125it [00:13, 9.19it/s] 126it [00:13, 8.65it/s] 127it [00:13, 8.73it/s] 128it [00:13, 8.87it/s] 129it [00:13, 9.04it/s] 130it [00:13, 9.12it/s] 131it [00:13, 9.24it/s] 132it [00:13, 9.32it/s] 133it [00:14, 9.38it/s] 134it [00:14, 9.39it/s] 135it [00:14, 9.42it/s] 136it [00:14, 9.43it/s] 137it [00:14, 9.37it/s] 138it [00:14, 9.34it/s] 139it [00:14, 9.34it/s] 140it [00:14, 9.38it/s] 141it [00:14, 9.26it/s] 142it [00:15, 9.28it/s] 143it [00:15, 9.31it/s] 144it [00:15, 9.38it/s] 145it [00:15, 8.90it/s] 146it [00:15, 9.08it/s] 147it [00:15, 9.15it/s] 148it [00:15, 9.21it/s] 149it [00:15, 9.28it/s] 150it [00:15, 9.36it/s]2025-05-26 04:45:18,120 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 16457.2578 | mean log_px -0.1880 | KL -3506.98 + 151it [00:16, 9.38it/s] 152it [00:16, 9.40it/s] 153it [00:16, 9.42it/s] 154it [00:16, 9.47it/s] 155it [00:16, 9.45it/s] 156it [00:16, 9.47it/s] 157it [00:16, 9.46it/s] 158it [00:16, 9.50it/s] 159it [00:16, 9.47it/s] 160it [00:16, 9.51it/s] 161it [00:17, 9.48it/s] 162it [00:17, 9.42it/s] 163it [00:17, 9.44it/s] 164it [00:17, 9.11it/s] 165it [00:17, 9.22it/s] 166it [00:17, 9.32it/s] 167it [00:17, 9.37it/s] 168it [00:17, 9.43it/s] 169it [00:17, 9.47it/s] 170it [00:18, 9.47it/s] 171it [00:18, 9.47it/s] 172it [00:18, 9.42it/s] 173it [00:18, 9.48it/s] 174it [00:18, 9.51it/s] 175it [00:18, 9.48it/s] 176it [00:18, 9.51it/s] 177it [00:18, 9.54it/s] 178it [00:18, 8.98it/s] 179it [00:18, 9.11it/s] 180it [00:19, 9.20it/s] 181it [00:19, 9.33it/s] 182it [00:19, 9.38it/s] 183it [00:19, 9.34it/s] 184it [00:19, 9.36it/s] 185it [00:19, 8.92it/s] 186it [00:19, 9.09it/s] 187it [00:19, 9.24it/s] 188it [00:19, 9.29it/s] 189it [00:20, 9.36it/s] 190it [00:20, 9.33it/s] 191it [00:20, 9.39it/s] 192it [00:20, 9.41it/s] 193it [00:20, 9.49it/s] 194it [00:20, 9.44it/s] 195it [00:20, 8.91it/s] 196it [00:20, 9.14it/s] 196it [00:20, 9.38it/s] +2025-05-26 04:45:23,047 - INFO - Epoch: 6, Objective: tensor([15376.6016], device='cuda:0', grad_fn=), Loss: 0.17358337342739105, KL/n: 71.75361633300781 + 0it [00:00, ?it/s]2025-05-26 04:45:23,326 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 17575.0977 | mean log_px -0.2084 | KL -3514.32 + 1it [00:00, 5.35it/s] 2it [00:00, 7.22it/s] 3it [00:00, 8.12it/s] 4it [00:00, 8.63it/s] 5it [00:00, 9.00it/s] 6it [00:00, 9.22it/s] 7it [00:00, 9.26it/s] 8it [00:00, 9.35it/s] 9it [00:01, 9.43it/s] 10it [00:01, 9.44it/s] 11it [00:01, 9.51it/s] 12it [00:01, 9.57it/s] 13it [00:01, 9.62it/s] 14it [00:01, 9.64it/s] 15it [00:01, 9.60it/s] 16it [00:01, 9.59it/s] 17it [00:01, 9.56it/s] 18it [00:01, 9.38it/s] 19it [00:02, 9.47it/s] 20it [00:02, 9.49it/s] 21it [00:02, 9.52it/s] 22it [00:02, 9.57it/s] 23it [00:02, 9.59it/s] 24it [00:02, 9.65it/s] 25it [00:02, 9.67it/s] 26it [00:02, 9.64it/s] 27it [00:02, 9.63it/s] 28it [00:03, 9.65it/s] 29it [00:03, 9.63it/s] 30it [00:03, 9.68it/s] 31it [00:03, 9.69it/s] 32it [00:03, 9.63it/s] 33it [00:03, 9.66it/s] 34it [00:03, 9.61it/s] 35it [00:03, 9.59it/s] 36it [00:03, 9.54it/s] 37it [00:03, 9.35it/s] 38it [00:04, 9.45it/s] 39it [00:04, 9.44it/s] 40it [00:04, 9.45it/s] 41it [00:04, 9.33it/s] 42it [00:04, 9.38it/s] 43it [00:04, 9.47it/s] 44it [00:04, 9.48it/s] 45it [00:04, 9.51it/s] 46it [00:04, 9.56it/s] 47it [00:04, 9.59it/s] 48it [00:05, 9.56it/s] 49it [00:05, 9.60it/s] 50it [00:05, 9.49it/s]2025-05-26 04:45:28,560 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 11222.3057 | mean log_px -0.1177 | KL -3518.79 + 51it [00:05, 9.55it/s] 52it [00:05, 9.60it/s] 53it [00:05, 9.61it/s] 54it [00:05, 9.61it/s] 55it [00:05, 9.64it/s] 56it [00:05, 9.62it/s] 57it [00:06, 9.64it/s] 58it [00:06, 9.64it/s] 59it [00:06, 9.66it/s] 60it [00:06, 9.65it/s] 61it [00:06, 9.68it/s] 62it [00:06, 9.69it/s] 63it [00:06, 9.65it/s] 64it [00:06, 9.63it/s] 65it [00:06, 9.66it/s] 66it [00:06, 9.65it/s] 67it [00:07, 9.66it/s] 68it [00:07, 9.66it/s] 69it [00:07, 9.66it/s] 70it [00:07, 9.65it/s] 71it [00:07, 9.62it/s] 72it [00:07, 9.58it/s] 73it [00:07, 9.51it/s] 74it [00:07, 9.53it/s] 75it [00:07, 9.51it/s] 76it [00:08, 9.60it/s] 77it [00:08, 9.62it/s] 78it [00:08, 9.61it/s] 79it [00:08, 9.59it/s] 80it [00:08, 9.58it/s] 81it [00:08, 9.58it/s] 82it [00:08, 9.52it/s] 83it [00:08, 9.53it/s] 84it [00:08, 9.51it/s] 85it [00:08, 9.51it/s] 86it [00:09, 9.52it/s] 87it [00:09, 9.54it/s] 88it [00:09, 9.54it/s] 89it [00:09, 9.57it/s] 90it [00:09, 9.56it/s] 91it [00:09, 9.55it/s] 92it [00:09, 9.60it/s] 93it [00:09, 9.56it/s] 94it [00:09, 9.57it/s] 95it [00:10, 9.61it/s] 96it [00:10, 9.58it/s] 97it [00:10, 9.60it/s] 98it [00:10, 9.58it/s] 99it [00:10, 9.54it/s] 100it [00:10, 9.57it/s]2025-05-26 04:45:33,771 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 15323.3848 | mean log_px -0.1767 | KL -3517.25 + 101it [00:10, 9.52it/s] 102it [00:10, 9.56it/s] 103it [00:10, 9.56it/s] 104it [00:10, 9.56it/s] 105it [00:11, 9.58it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.58it/s] 108it [00:11, 9.43it/s] 109it [00:11, 9.49it/s] 110it [00:11, 9.49it/s] 111it [00:11, 9.56it/s] 112it [00:11, 9.55it/s] 113it [00:11, 9.57it/s] 114it [00:11, 9.58it/s] 115it [00:12, 9.61it/s] 116it [00:12, 9.61it/s] 117it [00:12, 9.61it/s] 118it [00:12, 9.63it/s] 119it [00:12, 9.60it/s] 120it [00:12, 9.62it/s] 121it [00:12, 9.59it/s] 122it [00:12, 9.57it/s] 123it [00:12, 9.57it/s] 124it [00:13, 9.55it/s] 125it [00:13, 9.57it/s] 126it [00:13, 9.57it/s] 127it [00:13, 9.61it/s] 128it [00:13, 9.58it/s] 129it [00:13, 9.58it/s] 130it [00:13, 9.52it/s] 131it [00:13, 9.52it/s] 132it [00:13, 9.57it/s] 133it [00:13, 9.59it/s] 134it [00:14, 9.58it/s] 135it [00:14, 9.60it/s] 136it [00:14, 9.59it/s] 137it [00:14, 9.56it/s] 138it [00:14, 9.57it/s] 139it [00:14, 9.60it/s] 140it [00:14, 9.62it/s] 141it [00:14, 9.62it/s] 142it [00:14, 9.57it/s] 143it [00:15, 9.59it/s] 144it [00:15, 9.58it/s] 145it [00:15, 9.63it/s] 146it [00:15, 9.64it/s] 147it [00:15, 9.69it/s] 148it [00:15, 9.64it/s] 149it [00:15, 9.59it/s] 150it [00:15, 9.60it/s]2025-05-26 04:45:38,988 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 19223.7129 | mean log_px -0.2297 | KL -3526.62 + 151it [00:15, 9.59it/s] 152it [00:15, 9.58it/s] 153it [00:16, 9.61it/s] 154it [00:16, 9.58it/s] 155it [00:16, 9.59it/s] 156it [00:16, 9.60it/s] 157it [00:16, 9.56it/s] 158it [00:16, 9.54it/s] 159it [00:16, 9.54it/s] 160it [00:16, 9.55it/s] 161it [00:16, 9.60it/s] 162it [00:16, 9.61it/s] 163it [00:17, 9.57it/s] 164it [00:17, 9.58it/s] 165it [00:17, 9.65it/s] 166it [00:17, 9.53it/s] 167it [00:17, 9.57it/s] 168it [00:17, 9.55it/s] 169it [00:17, 9.59it/s] 170it [00:17, 9.63it/s] 171it [00:17, 9.65it/s] 172it [00:18, 9.62it/s] 173it [00:18, 9.65it/s] 174it [00:18, 9.56it/s] 175it [00:18, 9.60it/s] 176it [00:18, 9.56it/s] 177it [00:18, 9.59it/s] 178it [00:18, 9.04it/s] 179it [00:18, 9.18it/s] 180it [00:18, 9.29it/s] 181it [00:19, 9.40it/s] 182it [00:19, 9.45it/s] 183it [00:19, 9.52it/s] 184it [00:19, 9.50it/s] 185it [00:19, 9.51it/s] 186it [00:19, 9.52it/s] 187it [00:19, 9.54it/s] 188it [00:19, 9.56it/s] 189it [00:19, 9.50it/s] 190it [00:19, 9.53it/s] 191it [00:20, 9.58it/s] 192it [00:20, 9.61it/s] 193it [00:20, 9.65it/s] 194it [00:20, 9.67it/s] 195it [00:20, 8.95it/s] 196it [00:20, 9.16it/s] 196it [00:20, 9.49it/s] +2025-05-26 04:45:43,830 - INFO - Epoch: 7, Objective: tensor([11751.9316], device='cuda:0', grad_fn=), Loss: 0.11317390948534012, KL/n: 71.94717407226562 + 0it [00:00, ?it/s]2025-05-26 04:45:44,286 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 14055.2070 | mean log_px -0.1545 | KL -3523.18 + 1it [00:00, 4.70it/s] 2it [00:00, 6.70it/s] 3it [00:00, 7.80it/s] 4it [00:00, 8.40it/s] 5it [00:00, 8.83it/s] 6it [00:00, 9.10it/s] 7it [00:00, 9.30it/s] 8it [00:00, 9.39it/s] 9it [00:01, 9.47it/s] 10it [00:01, 9.43it/s] 11it [00:01, 9.48it/s] 12it [00:01, 9.05it/s] 13it [00:01, 9.22it/s] 14it [00:01, 9.31it/s] 15it [00:01, 9.39it/s] 16it [00:01, 9.50it/s] 17it [00:01, 9.57it/s] 18it [00:02, 9.03it/s] 19it [00:02, 9.13it/s] 20it [00:02, 9.30it/s] 21it [00:02, 9.32it/s] 22it [00:02, 9.39it/s] 23it [00:02, 9.40it/s] 24it [00:02, 8.94it/s] 25it [00:02, 8.89it/s] 26it [00:02, 9.07it/s] 27it [00:02, 9.27it/s] 28it [00:03, 9.37it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.54it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.61it/s] 33it [00:03, 9.60it/s] 34it [00:03, 9.63it/s] 35it [00:03, 9.61it/s] 36it [00:03, 9.66it/s] 37it [00:04, 9.64it/s] 38it [00:04, 9.59it/s] 39it [00:04, 9.60it/s] 40it [00:04, 9.52it/s] 41it [00:04, 9.54it/s] 42it [00:04, 9.45it/s] 43it [00:04, 9.55it/s] 44it [00:04, 9.51it/s] 45it [00:04, 8.98it/s] 46it [00:04, 9.16it/s] 47it [00:05, 9.30it/s] 48it [00:05, 9.39it/s] 49it [00:05, 9.48it/s] 50it [00:05, 9.50it/s]2025-05-26 04:45:49,613 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 12810.5664 | mean log_px -0.1418 | KL -3528.74 + 51it [00:05, 9.57it/s] 52it [00:05, 9.63it/s] 53it [00:05, 9.61it/s] 54it [00:05, 9.61it/s] 55it [00:05, 9.07it/s] 56it [00:06, 9.23it/s] 57it [00:06, 9.36it/s] 58it [00:06, 9.45it/s] 59it [00:06, 9.50it/s] 60it [00:06, 9.56it/s] 61it [00:06, 9.51it/s] 62it [00:06, 9.47it/s] 63it [00:06, 9.52it/s] 64it [00:06, 8.96it/s] 65it [00:07, 9.04it/s] 66it [00:07, 9.15it/s] 67it [00:07, 9.30it/s] 68it [00:07, 9.39it/s] 69it [00:07, 9.46it/s] 70it [00:07, 9.52it/s] 71it [00:07, 9.21it/s] 72it [00:07, 9.32it/s] 73it [00:07, 9.43it/s] 74it [00:07, 9.03it/s] 75it [00:08, 9.22it/s] 76it [00:08, 9.32it/s] 77it [00:08, 9.42it/s] 78it [00:08, 9.50it/s] 79it [00:08, 9.49it/s] 80it [00:08, 9.54it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.58it/s] 83it [00:08, 9.04it/s] 84it [00:09, 9.20it/s] 85it [00:09, 9.33it/s] 86it [00:09, 9.36it/s] 87it [00:09, 9.44it/s] 88it [00:09, 9.51it/s] 89it [00:09, 9.55it/s] 90it [00:09, 9.54it/s] 91it [00:09, 9.59it/s] 92it [00:09, 9.59it/s] 93it [00:10, 9.03it/s] 94it [00:10, 9.23it/s] 95it [00:10, 9.36it/s] 96it [00:10, 9.39it/s] 97it [00:10, 9.49it/s] 98it [00:10, 9.52it/s] 99it [00:10, 9.53it/s] 100it [00:10, 9.57it/s]2025-05-26 04:45:54,937 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 9847.4746 | mean log_px -0.0930 | KL -3528.36 + 101it [00:10, 9.57it/s] 102it [00:10, 9.56it/s] 103it [00:11, 9.60it/s] 104it [00:11, 9.60it/s] 105it [00:11, 9.62it/s] 106it [00:11, 9.61it/s] 107it [00:11, 9.60it/s] 108it [00:11, 9.05it/s] 109it [00:11, 9.25it/s] 110it [00:11, 9.33it/s] 111it [00:11, 9.47it/s] 112it [00:12, 9.07it/s] 113it [00:12, 9.23it/s] 114it [00:12, 9.33it/s] 115it [00:12, 8.89it/s] 116it [00:12, 9.09it/s] 117it [00:12, 9.24it/s] 118it [00:12, 9.27it/s] 119it [00:12, 9.39it/s] 120it [00:12, 9.47it/s] 121it [00:12, 9.08it/s] 122it [00:13, 9.20it/s] 123it [00:13, 9.33it/s] 124it [00:13, 8.88it/s] 125it [00:13, 9.13it/s] 126it [00:13, 9.29it/s] 127it [00:13, 9.37it/s] 128it [00:13, 9.44it/s] 129it [00:13, 9.47it/s] 130it [00:13, 8.95it/s] 131it [00:14, 9.15it/s] 132it [00:14, 9.28it/s] 133it [00:14, 9.38it/s] 134it [00:14, 9.45it/s] 135it [00:14, 9.06it/s] 136it [00:14, 9.24it/s] 137it [00:14, 9.36it/s] 138it [00:14, 9.42it/s] 139it [00:14, 8.92it/s] 140it [00:15, 9.17it/s] 141it [00:15, 9.32it/s] 142it [00:15, 9.42it/s] 143it [00:15, 9.49it/s] 144it [00:15, 9.35it/s] 145it [00:15, 9.40it/s] 146it [00:15, 9.49it/s] 147it [00:15, 9.52it/s] 148it [00:15, 9.51it/s] 149it [00:16, 8.99it/s] 150it [00:16, 9.18it/s]2025-05-26 04:46:00,320 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 11725.8896 | mean log_px -0.1225 | KL -3532.75 + 151it [00:16, 9.29it/s] 152it [00:16, 9.35it/s] 153it [00:16, 9.46it/s] 154it [00:16, 9.46it/s] 155it [00:16, 9.53it/s] 156it [00:16, 9.53it/s] 157it [00:16, 8.95it/s] 158it [00:16, 9.12it/s] 159it [00:17, 9.26it/s] 160it [00:17, 9.34it/s] 161it [00:17, 9.39it/s] 162it [00:17, 9.48it/s] 163it [00:17, 9.48it/s] 164it [00:17, 9.38it/s] 165it [00:17, 9.16it/s] 166it [00:17, 9.22it/s] 167it [00:17, 9.34it/s] 168it [00:18, 9.41it/s] 169it [00:18, 9.46it/s] 170it [00:18, 9.52it/s] 171it [00:18, 9.56it/s] 172it [00:18, 9.07it/s] 173it [00:18, 9.27it/s] 174it [00:18, 9.40it/s] 175it [00:18, 9.42it/s] 176it [00:18, 9.48it/s] 177it [00:18, 9.39it/s] 178it [00:19, 9.49it/s] 179it [00:19, 9.54it/s] 180it [00:19, 8.97it/s] 181it [00:19, 9.12it/s] 182it [00:19, 9.28it/s] 183it [00:19, 9.36it/s] 184it [00:19, 9.43it/s] 185it [00:19, 9.44it/s] 186it [00:19, 8.97it/s] 187it [00:20, 9.19it/s] 188it [00:20, 9.32it/s] 189it [00:20, 9.42it/s] 190it [00:20, 9.05it/s] 191it [00:20, 9.23it/s] 192it [00:20, 9.30it/s] 193it [00:20, 9.45it/s] 194it [00:20, 9.50it/s] 195it [00:20, 8.41it/s] 196it [00:21, 8.82it/s] 196it [00:21, 9.27it/s] +2025-05-26 04:46:05,278 - INFO - Epoch: 8, Objective: tensor([19531.0215], device='cuda:0', grad_fn=), Loss: 0.22876138985157013, KL/n: 72.13713073730469 + 0it [00:00, ?it/s]2025-05-26 04:46:05,533 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 15139.6064 | mean log_px -0.1711 | KL -3532.32 + 1it [00:00, 6.19it/s] 2it [00:00, 7.85it/s] 3it [00:00, 7.91it/s] 4it [00:00, 8.47it/s] 5it [00:00, 8.84it/s] 6it [00:00, 8.51it/s] 7it [00:00, 8.84it/s] 8it [00:00, 9.08it/s] 9it [00:01, 9.23it/s] 10it [00:01, 8.77it/s] 11it [00:01, 9.00it/s] 12it [00:01, 8.74it/s] 13it [00:01, 8.98it/s] 14it [00:01, 9.11it/s] 15it [00:01, 9.27it/s] 16it [00:01, 9.36it/s] 17it [00:01, 9.44it/s] 18it [00:02, 9.51it/s] 19it [00:02, 9.56it/s] 20it [00:02, 9.54it/s] 21it [00:02, 9.59it/s] 22it [00:02, 9.55it/s] 23it [00:02, 9.57it/s] 24it [00:02, 9.56it/s] 25it [00:02, 9.00it/s] 26it [00:02, 9.17it/s] 27it [00:02, 9.28it/s] 28it [00:03, 9.42it/s] 29it [00:03, 9.47it/s] 30it [00:03, 9.52it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.58it/s] 33it [00:03, 9.04it/s] 34it [00:03, 9.14it/s] 35it [00:03, 9.28it/s] 36it [00:03, 9.33it/s] 37it [00:04, 9.35it/s] 38it [00:04, 9.41it/s] 39it [00:04, 9.44it/s] 40it [00:04, 9.43it/s] 41it [00:04, 9.48it/s] 42it [00:04, 9.56it/s] 43it [00:04, 9.60it/s] 44it [00:04, 9.62it/s] 45it [00:04, 9.66it/s] 46it [00:04, 9.58it/s] 47it [00:05, 9.64it/s] 48it [00:05, 9.61it/s] 49it [00:05, 9.04it/s] 50it [00:05, 9.15it/s]2025-05-26 04:46:10,898 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 10535.8184 | mean log_px -0.1103 | KL -3535.26 + 51it [00:05, 9.29it/s] 52it [00:05, 9.37it/s] 53it [00:05, 9.45it/s] 54it [00:05, 9.50it/s] 55it [00:05, 9.49it/s] 56it [00:06, 9.05it/s] 57it [00:06, 9.22it/s] 58it [00:06, 9.26it/s] 59it [00:06, 9.31it/s] 60it [00:06, 9.43it/s] 61it [00:06, 9.49it/s] 62it [00:06, 8.95it/s] 63it [00:06, 9.10it/s] 64it [00:06, 9.27it/s] 65it [00:07, 9.29it/s] 66it [00:07, 9.45it/s] 67it [00:07, 9.19it/s] 68it [00:07, 9.39it/s] 69it [00:07, 9.55it/s] 70it [00:07, 9.64it/s] 71it [00:07, 9.71it/s] 72it [00:07, 9.76it/s] 73it [00:07, 9.80it/s] 74it [00:07, 9.83it/s] 75it [00:08, 9.86it/s] 76it [00:08, 9.86it/s] 77it [00:08, 9.88it/s] 78it [00:08, 9.88it/s] 79it [00:08, 9.91it/s] 80it [00:08, 9.91it/s] 81it [00:08, 9.91it/s] 82it [00:08, 9.91it/s] 83it [00:08, 9.90it/s] 84it [00:08, 9.48it/s] 85it [00:09, 9.63it/s] 86it [00:09, 9.48it/s] 87it [00:09, 9.59it/s] 88it [00:09, 9.67it/s] 89it [00:09, 9.75it/s] 90it [00:09, 9.79it/s] 91it [00:09, 9.83it/s] 92it [00:09, 9.85it/s] 93it [00:09, 9.88it/s] 94it [00:09, 9.88it/s] 95it [00:10, 9.88it/s] 96it [00:10, 9.87it/s] 97it [00:10, 9.48it/s] 98it [00:10, 9.57it/s] 99it [00:10, 9.69it/s] 100it [00:10, 9.75it/s]2025-05-26 04:46:16,094 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 12649.1650 | mean log_px -0.1434 | KL -3534.93 + 101it [00:10, 9.78it/s] 102it [00:10, 9.81it/s] 103it [00:10, 9.84it/s] 104it [00:11, 9.85it/s] 105it [00:11, 9.29it/s] 106it [00:11, 9.47it/s] 107it [00:11, 9.59it/s] 108it [00:11, 9.69it/s] 109it [00:11, 9.75it/s] 110it [00:11, 9.79it/s] 111it [00:11, 9.83it/s] 112it [00:11, 9.85it/s] 113it [00:11, 9.87it/s] 114it [00:12, 9.87it/s] 115it [00:12, 9.84it/s] 116it [00:12, 9.81it/s] 117it [00:12, 9.84it/s] 118it [00:12, 9.84it/s] 119it [00:12, 9.87it/s] 120it [00:12, 9.73it/s] 121it [00:12, 9.09it/s] 122it [00:12, 9.15it/s] 123it [00:13, 9.35it/s] 124it [00:13, 8.94it/s] 125it [00:13, 9.21it/s] 126it [00:13, 9.40it/s] 127it [00:13, 9.55it/s] 128it [00:13, 9.64it/s] 129it [00:13, 9.72it/s] 130it [00:13, 9.19it/s] 131it [00:13, 9.38it/s] 132it [00:13, 9.47it/s] 133it [00:14, 9.60it/s] 134it [00:14, 9.66it/s] 135it [00:14, 9.16it/s] 136it [00:14, 9.36it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.61it/s] 139it [00:14, 9.70it/s] 140it [00:14, 9.76it/s] 141it [00:14, 9.80it/s] 142it [00:14, 9.82it/s] 143it [00:15, 9.84it/s] 144it [00:15, 9.85it/s] 145it [00:15, 9.87it/s] 146it [00:15, 9.86it/s] 147it [00:15, 9.88it/s] 148it [00:15, 9.87it/s] 149it [00:15, 9.89it/s] 150it [00:15, 9.88it/s]2025-05-26 04:46:21,279 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 14599.3418 | mean log_px -0.1665 | KL -3540.62 + 151it [00:15, 9.89it/s] 152it [00:16, 9.88it/s] 153it [00:16, 9.90it/s] 154it [00:16, 9.90it/s] 155it [00:16, 9.90it/s] 156it [00:16, 9.88it/s] 157it [00:16, 9.88it/s] 158it [00:16, 9.88it/s] 159it [00:16, 9.88it/s] 160it [00:16, 9.89it/s] 161it [00:16, 9.32it/s] 162it [00:17, 9.48it/s] 163it [00:17, 9.58it/s] 164it [00:17, 9.66it/s] 165it [00:17, 9.67it/s] 166it [00:17, 9.73it/s] 167it [00:17, 9.78it/s] 168it [00:17, 9.80it/s] 169it [00:17, 9.85it/s] 170it [00:17, 9.86it/s] 171it [00:17, 9.88it/s] 172it [00:18, 9.88it/s] 173it [00:18, 9.89it/s] 174it [00:18, 9.89it/s] 175it [00:18, 9.90it/s] 176it [00:18, 9.89it/s] 177it [00:18, 9.90it/s] 178it [00:18, 9.90it/s] 179it [00:18, 9.90it/s] 180it [00:18, 9.90it/s] 181it [00:18, 9.91it/s] 182it [00:19, 9.88it/s] 183it [00:19, 9.55it/s] 184it [00:19, 9.55it/s] 185it [00:19, 9.53it/s] 186it [00:19, 9.52it/s] 187it [00:19, 9.59it/s] 188it [00:19, 9.54it/s] 189it [00:19, 9.59it/s] 190it [00:19, 9.56it/s] 191it [00:20, 9.54it/s] 192it [00:20, 9.42it/s] 193it [00:20, 9.41it/s] 194it [00:20, 9.49it/s] 195it [00:20, 8.91it/s] 196it [00:20, 9.13it/s] 196it [00:20, 9.50it/s] +2025-05-26 04:46:26,037 - INFO - Epoch: 9, Objective: tensor([12982.9697], device='cuda:0', grad_fn=), Loss: 0.14898112416267395, KL/n: 72.30970001220703 + 0it [00:00, ?it/s]2025-05-26 04:46:26,490 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 13698.6484 | mean log_px -0.1451 | KL -3541.10 + 1it [00:00, 4.73it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.64it/s] 4it [00:00, 7.94it/s] 5it [00:00, 8.38it/s] 6it [00:00, 8.23it/s] 7it [00:00, 8.57it/s] 8it [00:00, 8.83it/s] 9it [00:01, 8.99it/s] 10it [00:01, 9.15it/s] 11it [00:01, 9.24it/s] 12it [00:01, 9.33it/s] 13it [00:01, 8.89it/s] 14it [00:01, 9.05it/s] 15it [00:01, 9.21it/s] 16it [00:01, 9.26it/s] 17it [00:01, 9.35it/s] 18it [00:02, 9.38it/s] 19it [00:02, 9.41it/s] 20it [00:02, 9.43it/s] 21it [00:02, 9.44it/s] 22it [00:02, 9.43it/s] 23it [00:02, 9.39it/s] 24it [00:02, 9.44it/s] 25it [00:02, 9.47it/s] 26it [00:02, 9.47it/s] 27it [00:03, 9.48it/s] 28it [00:03, 9.51it/s] 29it [00:03, 9.52it/s] 30it [00:03, 9.20it/s] 31it [00:03, 9.30it/s] 32it [00:03, 9.36it/s] 33it [00:03, 9.37it/s] 34it [00:03, 9.39it/s] 35it [00:03, 9.45it/s] 36it [00:03, 9.40it/s] 37it [00:04, 9.45it/s] 38it [00:04, 9.45it/s] 39it [00:04, 9.48it/s] 40it [00:04, 9.52it/s] 41it [00:04, 9.54it/s] 42it [00:04, 9.51it/s] 43it [00:04, 9.53it/s] 44it [00:04, 9.01it/s] 45it [00:04, 9.14it/s] 46it [00:05, 9.23it/s] 47it [00:05, 8.98it/s] 48it [00:05, 9.10it/s] 49it [00:05, 8.75it/s] 50it [00:05, 8.96it/s]2025-05-26 04:46:31,909 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 15355.1699 | mean log_px -0.1796 | KL -3543.84 + 51it [00:05, 9.13it/s] 52it [00:05, 9.25it/s] 53it [00:05, 9.32it/s] 54it [00:05, 9.33it/s] 55it [00:06, 9.42it/s] 56it [00:06, 9.41it/s] 57it [00:06, 9.42it/s] 58it [00:06, 9.38it/s] 59it [00:06, 9.42it/s] 60it [00:06, 8.93it/s] 61it [00:06, 9.09it/s] 62it [00:06, 9.20it/s] 63it [00:06, 9.30it/s] 64it [00:06, 9.36it/s] 65it [00:07, 9.33it/s] 66it [00:07, 9.35it/s] 67it [00:07, 9.44it/s] 68it [00:07, 9.41it/s] 69it [00:07, 9.43it/s] 70it [00:07, 9.46it/s] 71it [00:07, 9.45it/s] 72it [00:07, 9.45it/s] 73it [00:07, 8.92it/s] 74it [00:08, 9.10it/s] 75it [00:08, 9.23it/s] 76it [00:08, 9.33it/s] 77it [00:08, 9.36it/s] 78it [00:08, 9.37it/s] 79it [00:08, 9.42it/s] 80it [00:08, 9.43it/s] 81it [00:08, 8.95it/s] 82it [00:08, 9.10it/s] 83it [00:09, 9.24it/s] 84it [00:09, 9.30it/s] 85it [00:09, 9.38it/s] 86it [00:09, 9.41it/s] 87it [00:09, 9.40it/s] 88it [00:09, 9.44it/s] 89it [00:09, 9.45it/s] 90it [00:09, 9.48it/s] 91it [00:09, 9.51it/s] 92it [00:09, 9.50it/s] 93it [00:10, 9.48it/s] 94it [00:10, 9.44it/s] 95it [00:10, 9.46it/s] 96it [00:10, 9.44it/s] 97it [00:10, 9.45it/s] 98it [00:10, 9.46it/s] 99it [00:10, 9.52it/s] 100it [00:10, 9.49it/s]2025-05-26 04:46:37,244 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 10181.3457 | mean log_px -0.1026 | KL -3547.27 + 101it [00:10, 9.48it/s] 102it [00:11, 9.42it/s] 103it [00:11, 9.37it/s] 104it [00:11, 9.41it/s] 105it [00:11, 9.44it/s] 106it [00:11, 9.42it/s] 107it [00:11, 9.47it/s] 108it [00:11, 9.47it/s] 109it [00:11, 9.51it/s] 110it [00:11, 9.52it/s] 111it [00:12, 9.02it/s] 112it [00:12, 9.20it/s] 113it [00:12, 9.32it/s] 114it [00:12, 9.29it/s] 115it [00:12, 9.41it/s] 116it [00:12, 9.49it/s] 117it [00:12, 9.56it/s] 118it [00:12, 9.51it/s] 119it [00:12, 9.50it/s] 120it [00:12, 9.54it/s] 121it [00:13, 9.52it/s] 122it [00:13, 9.51it/s] 123it [00:13, 9.52it/s] 124it [00:13, 9.51it/s] 125it [00:13, 9.51it/s] 126it [00:13, 9.48it/s] 127it [00:13, 9.50it/s] 128it [00:13, 9.49it/s] 129it [00:13, 9.52it/s] 130it [00:14, 8.96it/s] 131it [00:14, 9.07it/s] 132it [00:14, 9.24it/s] 133it [00:14, 9.30it/s] 134it [00:14, 9.39it/s] 135it [00:14, 9.47it/s] 136it [00:14, 9.52it/s] 137it [00:14, 9.46it/s] 138it [00:14, 9.42it/s] 139it [00:14, 9.44it/s] 140it [00:15, 9.46it/s] 141it [00:15, 9.47it/s] 142it [00:15, 9.40it/s] 143it [00:15, 9.40it/s] 144it [00:15, 9.38it/s] 145it [00:15, 9.36it/s] 146it [00:15, 9.32it/s] 147it [00:15, 9.33it/s] 148it [00:15, 9.22it/s] 149it [00:16, 9.18it/s] 150it [00:16, 9.27it/s]2025-05-26 04:46:42,572 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 12556.6738 | mean log_px -0.1344 | KL -3543.33 + 151it [00:16, 9.28it/s] 152it [00:16, 9.28it/s] 153it [00:16, 9.33it/s] 154it [00:16, 8.89it/s] 155it [00:16, 9.06it/s] 156it [00:16, 9.19it/s] 157it [00:16, 9.26it/s] 158it [00:17, 9.31it/s] 159it [00:17, 9.36it/s] 160it [00:17, 9.29it/s] 161it [00:17, 9.32it/s] 162it [00:17, 9.35it/s] 163it [00:17, 9.26it/s] 164it [00:17, 9.19it/s] 165it [00:17, 9.24it/s] 166it [00:17, 9.27it/s] 167it [00:18, 9.28it/s] 168it [00:18, 9.33it/s] 169it [00:18, 9.37it/s] 170it [00:18, 8.90it/s] 171it [00:18, 9.09it/s] 172it [00:18, 9.19it/s] 173it [00:18, 9.16it/s] 174it [00:18, 9.21it/s] 175it [00:18, 9.32it/s] 176it [00:18, 9.26it/s] 177it [00:19, 9.39it/s] 178it [00:19, 9.46it/s] 179it [00:19, 9.44it/s] 180it [00:19, 8.89it/s] 181it [00:19, 9.03it/s] 182it [00:19, 9.10it/s] 183it [00:19, 9.16it/s] 184it [00:19, 9.25it/s] 185it [00:19, 9.38it/s] 186it [00:20, 9.34it/s] 187it [00:20, 9.43it/s] 188it [00:20, 9.34it/s] 189it [00:20, 9.25it/s] 190it [00:20, 9.33it/s] 191it [00:20, 9.42it/s] 192it [00:20, 9.45it/s] 193it [00:20, 9.44it/s] 194it [00:20, 9.43it/s] 195it [00:21, 8.85it/s] 196it [00:21, 9.00it/s] 196it [00:21, 9.24it/s] +2025-05-26 04:46:47,556 - INFO - Epoch: 10, Objective: tensor([15107.3916], device='cuda:0', grad_fn=), Loss: 0.16303861141204834, KL/n: 72.43524169921875 + 0it [00:00, ?it/s]2025-05-26 04:46:47,815 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 10246.0049 | mean log_px -0.1013 | KL -3548.55 + 1it [00:00, 5.93it/s] 2it [00:00, 7.65it/s] 3it [00:00, 8.40it/s] 4it [00:00, 8.76it/s] 5it [00:00, 9.04it/s] 6it [00:00, 9.17it/s] 7it [00:00, 9.27it/s] 8it [00:00, 9.35it/s] 9it [00:01, 9.45it/s] 10it [00:01, 9.32it/s] 11it [00:01, 9.05it/s] 12it [00:01, 9.02it/s] 13it [00:01, 9.23it/s] 14it [00:01, 9.37it/s] 15it [00:01, 9.45it/s] 16it [00:01, 9.41it/s] 17it [00:01, 9.26it/s] 18it [00:01, 9.07it/s] 19it [00:02, 9.09it/s] 20it [00:02, 9.24it/s] 21it [00:02, 9.24it/s] 22it [00:02, 9.29it/s] 23it [00:02, 9.38it/s] 24it [00:02, 9.43it/s] 25it [00:02, 9.46it/s] 26it [00:02, 9.46it/s] 27it [00:02, 9.38it/s] 28it [00:03, 9.29it/s] 29it [00:03, 9.40it/s] 30it [00:03, 9.49it/s] 31it [00:03, 9.33it/s] 32it [00:03, 9.35it/s] 33it [00:03, 9.30it/s] 34it [00:03, 9.33it/s] 35it [00:03, 9.40it/s] 36it [00:03, 9.36it/s] 37it [00:04, 9.46it/s] 38it [00:04, 9.43it/s] 39it [00:04, 9.46it/s] 40it [00:04, 9.50it/s] 41it [00:04, 9.46it/s] 42it [00:04, 9.49it/s] 43it [00:04, 9.52it/s] 44it [00:04, 9.45it/s] 45it [00:04, 9.42it/s] 46it [00:04, 9.34it/s] 47it [00:05, 9.30it/s] 48it [00:05, 9.40it/s] 49it [00:05, 9.51it/s] 50it [00:05, 9.46it/s]2025-05-26 04:46:53,145 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 13919.8701 | mean log_px -0.1529 | KL -3551.17 + 51it [00:05, 9.45it/s] 52it [00:05, 9.48it/s] 53it [00:05, 9.33it/s] 54it [00:05, 9.34it/s] 55it [00:05, 9.36it/s] 56it [00:06, 9.32it/s] 57it [00:06, 9.31it/s] 58it [00:06, 9.36it/s] 59it [00:06, 9.41it/s] 60it [00:06, 9.46it/s] 61it [00:06, 9.35it/s] 62it [00:06, 9.19it/s] 63it [00:06, 9.23it/s] 64it [00:06, 8.81it/s] 65it [00:07, 8.98it/s] 66it [00:07, 9.06it/s] 67it [00:07, 9.19it/s] 68it [00:07, 9.31it/s] 69it [00:07, 9.40it/s] 70it [00:07, 9.45it/s] 71it [00:07, 9.46it/s] 72it [00:07, 9.21it/s] 73it [00:07, 9.38it/s] 74it [00:07, 9.45it/s] 75it [00:08, 9.56it/s] 76it [00:08, 9.65it/s] 77it [00:08, 9.70it/s] 78it [00:08, 9.73it/s] 79it [00:08, 9.76it/s] 80it [00:08, 9.75it/s] 81it [00:08, 9.75it/s] 82it [00:08, 9.76it/s] 83it [00:08, 9.77it/s] 84it [00:08, 9.74it/s] 85it [00:09, 9.53it/s] 86it [00:09, 9.62it/s] 87it [00:09, 9.62it/s] 88it [00:09, 9.67it/s] 89it [00:09, 9.73it/s] 90it [00:09, 9.69it/s] 91it [00:09, 9.44it/s] 92it [00:09, 9.55it/s] 93it [00:09, 9.63it/s] 94it [00:10, 9.67it/s] 95it [00:10, 9.72it/s] 96it [00:10, 9.77it/s] 97it [00:10, 9.79it/s] 98it [00:10, 9.74it/s] 99it [00:10, 9.75it/s] 100it [00:10, 9.76it/s]2025-05-26 04:46:58,403 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 11395.6230 | mean log_px -0.1321 | KL -3551.43 + 101it [00:10, 9.47it/s] 102it [00:10, 9.36it/s] 103it [00:10, 9.52it/s] 104it [00:11, 9.61it/s] 105it [00:11, 9.65it/s] 106it [00:11, 9.71it/s] 107it [00:11, 9.73it/s] 108it [00:11, 9.77it/s] 109it [00:11, 9.81it/s] 110it [00:11, 9.82it/s] 111it [00:11, 9.86it/s] 112it [00:11, 9.88it/s] 113it [00:11, 9.88it/s] 114it [00:12, 9.85it/s] 115it [00:12, 9.78it/s] 116it [00:12, 9.79it/s] 117it [00:12, 9.78it/s] 118it [00:12, 9.76it/s] 119it [00:12, 9.69it/s] 120it [00:12, 9.64it/s] 121it [00:12, 9.67it/s] 122it [00:12, 9.72it/s] 123it [00:13, 9.71it/s] 124it [00:13, 9.76it/s] 125it [00:13, 9.78it/s] 126it [00:13, 9.81it/s] 127it [00:13, 9.78it/s] 128it [00:13, 9.78it/s] 129it [00:13, 9.82it/s] 130it [00:13, 9.83it/s] 131it [00:13, 9.86it/s] 132it [00:13, 9.89it/s] 133it [00:14, 9.91it/s] 134it [00:14, 9.92it/s] 135it [00:14, 9.80it/s] 136it [00:14, 9.79it/s] 137it [00:14, 9.80it/s] 138it [00:14, 9.82it/s] 139it [00:14, 9.86it/s] 140it [00:14, 9.81it/s] 141it [00:14, 9.82it/s] 142it [00:14, 9.76it/s] 143it [00:15, 9.58it/s] 144it [00:15, 9.52it/s] 145it [00:15, 9.56it/s] 146it [00:15, 9.58it/s] 147it [00:15, 9.55it/s] 148it [00:15, 9.51it/s] 149it [00:15, 9.45it/s] 150it [00:15, 9.44it/s]2025-05-26 04:47:03,553 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 14350.5879 | mean log_px -0.1595 | KL -3548.78 + 151it [00:15, 9.45it/s] 152it [00:16, 9.44it/s] 153it [00:16, 9.39it/s] 154it [00:16, 9.37it/s] 155it [00:16, 9.39it/s] 156it [00:16, 9.39it/s] 157it [00:16, 9.41it/s] 158it [00:16, 9.37it/s] 159it [00:16, 9.43it/s] 160it [00:16, 9.50it/s] 161it [00:16, 9.58it/s] 162it [00:17, 9.64it/s] 163it [00:17, 9.67it/s] 164it [00:17, 9.71it/s] 165it [00:17, 9.72it/s] 166it [00:17, 9.77it/s] 167it [00:17, 9.80it/s] 168it [00:17, 9.78it/s] 169it [00:17, 9.80it/s] 170it [00:17, 9.69it/s] 171it [00:17, 9.56it/s] 172it [00:18, 9.47it/s] 173it [00:18, 9.44it/s] 174it [00:18, 9.40it/s] 175it [00:18, 9.47it/s] 176it [00:18, 9.45it/s] 177it [00:18, 8.90it/s] 178it [00:18, 9.11it/s] 179it [00:18, 9.31it/s] 180it [00:18, 9.47it/s] 181it [00:19, 9.58it/s] 182it [00:19, 9.64it/s] 183it [00:19, 9.72it/s] 184it [00:19, 9.76it/s] 185it [00:19, 9.79it/s] 186it [00:19, 9.79it/s] 187it [00:19, 9.79it/s] 188it [00:19, 9.80it/s] 189it [00:19, 9.81it/s] 190it [00:19, 9.82it/s] 191it [00:20, 9.83it/s] 192it [00:20, 9.81it/s] 193it [00:20, 9.82it/s] 194it [00:20, 9.80it/s] 195it [00:20, 9.32it/s] 196it [00:20, 9.02it/s] 196it [00:20, 9.48it/s] +2025-05-26 04:47:08,357 - INFO - Epoch: 11, Objective: tensor([10451.8135], device='cuda:0', grad_fn=), Loss: 0.1001165509223938, KL/n: 72.5517807006836 + 0it [00:00, ?it/s]2025-05-26 04:47:08,812 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 8402.5049 | mean log_px -0.0712 | KL -3554.51 + 1it [00:00, 5.23it/s] 2it [00:00, 6.74it/s] 4it [00:00, 8.47it/s] 5it [00:00, 8.89it/s] 6it [00:00, 9.06it/s] 7it [00:00, 9.26it/s] 8it [00:00, 8.92it/s] 9it [00:01, 9.10it/s] 10it [00:01, 9.28it/s] 12it [00:01, 9.61it/s] 13it [00:01, 9.65it/s] 14it [00:01, 9.71it/s] 15it [00:01, 9.72it/s] 16it [00:01, 9.71it/s] 17it [00:01, 9.26it/s] 18it [00:01, 9.31it/s] 19it [00:02, 9.49it/s] 20it [00:02, 9.57it/s] 21it [00:02, 9.69it/s] 22it [00:02, 9.62it/s] 23it [00:02, 9.67it/s] 24it [00:02, 9.73it/s] 25it [00:02, 9.76it/s] 26it [00:02, 9.79it/s] 27it [00:02, 9.73it/s] 28it [00:03, 9.08it/s] 29it [00:03, 9.21it/s] 30it [00:03, 9.43it/s] 31it [00:03, 9.59it/s] 32it [00:03, 9.10it/s] 33it [00:03, 9.24it/s] 34it [00:03, 9.31it/s] 35it [00:03, 9.50it/s] 36it [00:03, 9.61it/s] 37it [00:03, 9.71it/s] 38it [00:04, 9.77it/s] 40it [00:04, 9.91it/s] 42it [00:04, 9.97it/s] 43it [00:04, 9.96it/s] 44it [00:04, 9.96it/s] 46it [00:04, 10.01it/s] 48it [00:05, 10.03it/s] 50it [00:05, 10.00it/s]2025-05-26 04:47:13,994 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 10922.4316 | mean log_px -0.1087 | KL -3553.06 + 51it [00:05, 9.52it/s] 52it [00:05, 9.61it/s] 53it [00:05, 9.66it/s] 54it [00:05, 9.74it/s] 56it [00:05, 9.42it/s] 57it [00:06, 9.34it/s] 58it [00:06, 9.42it/s] 60it [00:06, 9.67it/s] 61it [00:06, 9.27it/s] 63it [00:06, 9.57it/s] 64it [00:06, 9.66it/s] 66it [00:06, 9.81it/s] 67it [00:07, 9.32it/s] 68it [00:07, 9.37it/s] 69it [00:07, 9.50it/s] 70it [00:07, 9.61it/s] 71it [00:07, 9.17it/s] 72it [00:07, 9.35it/s] 74it [00:07, 9.18it/s] 76it [00:08, 9.49it/s] 77it [00:08, 9.59it/s] 78it [00:08, 9.21it/s] 79it [00:08, 9.40it/s] 80it [00:08, 9.54it/s] 82it [00:08, 9.38it/s] 83it [00:08, 9.51it/s] 84it [00:08, 9.62it/s] 86it [00:09, 9.46it/s] 87it [00:09, 9.57it/s] 89it [00:09, 9.76it/s] 91it [00:09, 9.56it/s] 92it [00:09, 9.59it/s] 94it [00:09, 9.75it/s] 95it [00:10, 9.43it/s] 96it [00:10, 9.51it/s] 97it [00:10, 9.62it/s] 98it [00:10, 9.65it/s] 100it [00:10, 9.81it/s]2025-05-26 04:47:19,255 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 11670.1055 | mean log_px -0.1183 | KL -3560.71 + 101it [00:10, 9.84it/s] 102it [00:10, 9.44it/s] 103it [00:10, 9.57it/s] 104it [00:10, 9.68it/s] 105it [00:11, 9.30it/s] 107it [00:11, 9.62it/s] 108it [00:11, 9.70it/s] 109it [00:11, 9.25it/s] 110it [00:11, 9.43it/s] 111it [00:11, 9.57it/s] 112it [00:11, 9.66it/s] 113it [00:11, 9.28it/s] 115it [00:12, 9.62it/s] 116it [00:12, 9.57it/s] 117it [00:12, 9.39it/s] 118it [00:12, 9.26it/s] 119it [00:12, 9.36it/s] 120it [00:12, 9.03it/s] 121it [00:12, 9.25it/s] 122it [00:12, 9.40it/s] 123it [00:12, 8.97it/s] 124it [00:13, 9.21it/s] 125it [00:13, 9.37it/s] 126it [00:13, 8.94it/s] 127it [00:13, 9.22it/s] 128it [00:13, 9.37it/s] 129it [00:13, 9.53it/s] 130it [00:13, 9.06it/s] 132it [00:13, 9.47it/s] 133it [00:14, 9.54it/s] 134it [00:14, 9.12it/s] 135it [00:14, 9.19it/s] 136it [00:14, 9.38it/s] 137it [00:14, 9.09it/s] 138it [00:14, 9.34it/s] 139it [00:14, 9.52it/s] 140it [00:14, 9.65it/s] 141it [00:14, 9.18it/s] 142it [00:15, 9.39it/s] 143it [00:15, 9.54it/s] 144it [00:15, 9.66it/s] 146it [00:15, 9.84it/s] 147it [00:15, 9.37it/s] 148it [00:15, 9.52it/s] 150it [00:15, 9.75it/s]2025-05-26 04:47:24,567 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 9823.7705 | mean log_px -0.0984 | KL -3558.63 + 151it [00:15, 9.79it/s] 153it [00:16, 9.54it/s] 154it [00:16, 9.62it/s] 156it [00:16, 9.80it/s] 157it [00:16, 9.48it/s] 158it [00:16, 9.58it/s] 160it [00:16, 9.76it/s] 161it [00:16, 9.81it/s] 162it [00:17, 9.46it/s] 164it [00:17, 9.68it/s] 166it [00:17, 9.50it/s] 167it [00:17, 9.59it/s] 169it [00:17, 9.76it/s] 170it [00:17, 9.29it/s] 171it [00:18, 9.35it/s] 172it [00:18, 9.48it/s] 173it [00:18, 9.61it/s] 174it [00:18, 9.64it/s] 175it [00:18, 9.73it/s] 176it [00:18, 9.79it/s] 177it [00:18, 9.80it/s] 178it [00:18, 9.33it/s] 180it [00:18, 9.65it/s] 181it [00:19, 9.72it/s] 182it [00:19, 9.20it/s] 183it [00:19, 9.40it/s] 184it [00:19, 9.56it/s] 186it [00:19, 9.77it/s] 187it [00:19, 9.73it/s] 188it [00:19, 9.79it/s] 189it [00:19, 9.29it/s] 191it [00:20, 9.59it/s] 192it [00:20, 9.68it/s] 193it [00:20, 9.74it/s] 194it [00:20, 9.80it/s] 195it [00:20, 9.43it/s] 196it [00:20, 9.47it/s] +2025-05-26 04:47:29,365 - INFO - Epoch: 12, Objective: tensor([11959.2480], device='cuda:0', grad_fn=), Loss: 0.12528853118419647, KL/n: 72.63204193115234 + 0it [00:00, ?it/s]2025-05-26 04:47:29,647 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 10673.3086 | mean log_px -0.1125 | KL -3559.28 + 1it [00:00, 4.54it/s] 2it [00:00, 6.66it/s] 4it [00:00, 8.49it/s] 6it [00:00, 8.86it/s] 8it [00:00, 9.33it/s] 9it [00:01, 9.14it/s] 11it [00:01, 9.50it/s] 12it [00:01, 9.26it/s] 14it [00:01, 9.59it/s] 15it [00:01, 9.35it/s] 17it [00:01, 9.64it/s] 19it [00:02, 9.50it/s] 21it [00:02, 9.69it/s] 23it [00:02, 9.55it/s] 25it [00:02, 9.73it/s] 26it [00:02, 9.48it/s] 28it [00:03, 9.71it/s] 29it [00:03, 9.36it/s] 31it [00:03, 9.64it/s] 33it [00:03, 9.51it/s] 35it [00:03, 9.71it/s] 37it [00:03, 9.50it/s] 39it [00:04, 9.68it/s] 41it [00:04, 9.81it/s] 42it [00:04, 9.55it/s] 44it [00:04, 9.75it/s] 45it [00:04, 9.51it/s] 46it [00:04, 9.58it/s] 47it [00:04, 9.60it/s] 49it [00:05, 9.36it/s] 50it [00:05, 9.44it/s]2025-05-26 04:47:34,878 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 14811.1055 | mean log_px -0.1740 | KL -3564.73 + 51it [00:05, 9.51it/s] 53it [00:05, 9.38it/s] 55it [00:05, 9.62it/s] 56it [00:05, 9.67it/s] 57it [00:06, 9.73it/s] 58it [00:06, 9.77it/s] 59it [00:06, 9.26it/s] 61it [00:06, 9.63it/s] 63it [00:06, 9.83it/s] 65it [00:06, 9.63it/s] 67it [00:07, 9.80it/s] 69it [00:07, 9.62it/s] 71it [00:07, 9.78it/s] 72it [00:07, 9.45it/s] 74it [00:07, 9.68it/s] 76it [00:08, 9.52it/s] 78it [00:08, 9.72it/s] 79it [00:08, 9.49it/s] 81it [00:08, 9.72it/s] 83it [00:08, 9.86it/s] 85it [00:08, 9.96it/s] 87it [00:09, 10.02it/s] 89it [00:09, 10.06it/s] 91it [00:09, 10.09it/s] 93it [00:09, 9.76it/s] 95it [00:09, 9.88it/s] 97it [00:10, 9.96it/s] 98it [00:10, 9.52it/s] 100it [00:10, 9.73it/s]2025-05-26 04:47:40,007 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 11084.1914 | mean log_px -0.1101 | KL -3557.34 + 101it [00:10, 9.38it/s] 103it [00:10, 9.63it/s] 105it [00:10, 9.80it/s] 107it [00:11, 9.92it/s] 109it [00:11, 9.99it/s] 110it [00:11, 9.98it/s] 112it [00:11, 10.04it/s] 114it [00:11, 10.07it/s] 116it [00:12, 10.10it/s] 118it [00:12, 10.07it/s] 120it [00:12, 9.73it/s] 122it [00:12, 9.84it/s] 124it [00:12, 9.92it/s] 126it [00:13, 9.64it/s] 128it [00:13, 9.77it/s] 130it [00:13, 9.86it/s] 132it [00:13, 9.94it/s] 134it [00:13, 9.99it/s] 136it [00:14, 10.03it/s] 138it [00:14, 10.06it/s] 140it [00:14, 10.08it/s] 142it [00:14, 10.09it/s] 144it [00:14, 10.11it/s] 146it [00:15, 10.13it/s] 148it [00:15, 10.13it/s] 150it [00:15, 10.13it/s]2025-05-26 04:47:45,018 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 8056.9863 | mean log_px -0.0642 | KL -3562.25 + 152it [00:15, 9.78it/s] 154it [00:15, 9.88it/s] 156it [00:16, 9.96it/s] 158it [00:16, 10.01it/s] 160it [00:16, 9.95it/s] 162it [00:16, 9.99it/s] 164it [00:16, 10.03it/s] 166it [00:17, 10.06it/s] 168it [00:17, 9.97it/s] 169it [00:17, 9.62it/s] 171it [00:17, 9.79it/s] 173it [00:17, 9.89it/s] 175it [00:17, 9.97it/s] 177it [00:18, 10.02it/s] 179it [00:18, 9.76it/s] 181it [00:18, 9.87it/s] 183it [00:18, 9.95it/s] 185it [00:18, 10.00it/s] 187it [00:19, 10.05it/s] 189it [00:19, 9.81it/s] 191it [00:19, 9.90it/s] 193it [00:19, 9.96it/s] 195it [00:20, 9.76it/s] 196it [00:20, 9.54it/s] 196it [00:20, 9.71it/s] +2025-05-26 04:47:49,688 - INFO - Epoch: 13, Objective: tensor([13255.1807], device='cuda:0', grad_fn=), Loss: 0.15383651852607727, KL/n: 72.70011138916016 + 0it [00:00, ?it/s]2025-05-26 04:47:50,155 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 11022.1055 | mean log_px -0.1185 | KL -3559.76 + 1it [00:00, 2.68it/s] 2it [00:00, 4.47it/s] 4it [00:00, 6.86it/s] 6it [00:00, 8.07it/s] 7it [00:00, 8.48it/s] 9it [00:01, 9.08it/s] 10it [00:01, 9.27it/s] 12it [00:01, 9.55it/s] 14it [00:01, 9.71it/s] 16it [00:01, 9.82it/s] 17it [00:01, 9.85it/s] 18it [00:02, 9.86it/s] 20it [00:02, 9.93it/s] 21it [00:02, 9.95it/s] 22it [00:02, 9.73it/s] 23it [00:02, 9.45it/s] 24it [00:02, 9.33it/s] 25it [00:02, 9.41it/s] 26it [00:02, 9.44it/s] 27it [00:03, 9.49it/s] 28it [00:03, 9.50it/s] 29it [00:03, 9.54it/s] 30it [00:03, 9.51it/s] 31it [00:03, 9.54it/s] 32it [00:03, 9.54it/s] 33it [00:03, 9.53it/s] 34it [00:03, 9.52it/s] 35it [00:03, 9.65it/s] 36it [00:03, 9.73it/s] 37it [00:04, 9.08it/s] 38it [00:04, 9.33it/s] 40it [00:04, 9.62it/s] 41it [00:04, 9.23it/s] 42it [00:04, 9.39it/s] 43it [00:04, 9.50it/s] 44it [00:04, 9.58it/s] 45it [00:04, 9.63it/s] 46it [00:05, 9.68it/s] 47it [00:05, 9.68it/s] 48it [00:05, 9.70it/s] 49it [00:05, 9.71it/s] 50it [00:05, 9.73it/s]2025-05-26 04:47:55,327 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 8267.6357 | mean log_px -0.0700 | KL -3559.77 + 51it [00:05, 9.68it/s] 52it [00:05, 9.70it/s] 53it [00:05, 9.70it/s] 54it [00:05, 9.15it/s] 55it [00:05, 9.34it/s] 56it [00:06, 9.44it/s] 57it [00:06, 9.55it/s] 58it [00:06, 9.63it/s] 59it [00:06, 9.06it/s] 60it [00:06, 9.12it/s] 61it [00:06, 9.17it/s] 62it [00:06, 8.81it/s] 63it [00:06, 9.07it/s] 64it [00:06, 9.25it/s] 65it [00:07, 8.90it/s] 66it [00:07, 9.12it/s] 67it [00:07, 9.12it/s] 68it [00:07, 9.25it/s] 69it [00:07, 8.89it/s] 70it [00:07, 9.13it/s] 71it [00:07, 9.30it/s] 72it [00:07, 8.91it/s] 73it [00:07, 9.16it/s] 74it [00:08, 9.32it/s] 75it [00:08, 8.93it/s] 76it [00:08, 9.16it/s] 77it [00:08, 9.33it/s] 78it [00:08, 8.93it/s] 79it [00:08, 9.17it/s] 80it [00:08, 9.30it/s] 81it [00:08, 9.40it/s] 82it [00:08, 8.98it/s] 83it [00:09, 9.21it/s] 84it [00:09, 9.38it/s] 85it [00:09, 8.96it/s] 86it [00:09, 9.14it/s] 87it [00:09, 9.34it/s] 88it [00:09, 8.96it/s] 89it [00:09, 9.18it/s] 90it [00:09, 9.32it/s] 91it [00:09, 8.92it/s] 92it [00:10, 9.13it/s] 93it [00:10, 9.30it/s] 94it [00:10, 8.91it/s] 95it [00:10, 9.17it/s] 96it [00:10, 9.33it/s] 97it [00:10, 8.95it/s] 98it [00:10, 9.16it/s] 99it [00:10, 9.34it/s] 100it [00:10, 8.93it/s]2025-05-26 04:48:00,792 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 13712.4199 | mean log_px -0.1565 | KL -3561.90 + 101it [00:11, 9.15it/s] 102it [00:11, 9.32it/s] 103it [00:11, 8.94it/s] 104it [00:11, 9.15it/s] 105it [00:11, 9.32it/s] 106it [00:11, 8.92it/s] 107it [00:11, 9.17it/s] 108it [00:11, 9.32it/s] 109it [00:11, 9.43it/s] 110it [00:11, 8.97it/s] 111it [00:12, 9.02it/s] 112it [00:12, 9.19it/s] 113it [00:12, 9.37it/s] 114it [00:12, 8.96it/s] 115it [00:12, 9.18it/s] 116it [00:12, 9.35it/s] 117it [00:12, 8.95it/s] 118it [00:12, 9.15it/s] 119it [00:12, 9.32it/s] 120it [00:13, 8.93it/s] 121it [00:13, 9.17it/s] 122it [00:13, 9.33it/s] 123it [00:13, 8.94it/s] 124it [00:13, 9.15it/s] 125it [00:13, 9.33it/s] 126it [00:13, 8.94it/s] 127it [00:13, 9.19it/s] 128it [00:13, 9.35it/s] 129it [00:14, 8.96it/s] 130it [00:14, 9.17it/s] 131it [00:14, 9.33it/s] 132it [00:14, 8.93it/s] 133it [00:14, 9.17it/s] 134it [00:14, 9.31it/s] 135it [00:14, 8.91it/s] 136it [00:14, 9.02it/s] 137it [00:14, 9.18it/s] 138it [00:15, 8.75it/s] 139it [00:15, 8.99it/s] 140it [00:15, 9.13it/s] 141it [00:15, 9.24it/s] 142it [00:15, 8.87it/s] 143it [00:15, 9.10it/s] 144it [00:15, 9.28it/s] 145it [00:15, 8.85it/s] 146it [00:15, 9.10it/s] 147it [00:16, 9.29it/s] 148it [00:16, 9.38it/s] 149it [00:16, 8.95it/s] 150it [00:16, 9.15it/s]2025-05-26 04:48:06,263 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 13030.7373 | mean log_px -0.1424 | KL -3557.82 + 151it [00:16, 9.32it/s] 152it [00:16, 8.94it/s] 153it [00:16, 9.17it/s] 154it [00:16, 9.32it/s] 155it [00:16, 8.91it/s] 156it [00:17, 9.14it/s] 157it [00:17, 9.28it/s] 158it [00:17, 8.90it/s] 159it [00:17, 9.15it/s] 160it [00:17, 9.31it/s] 161it [00:17, 8.92it/s] 162it [00:17, 9.16it/s] 163it [00:17, 9.30it/s] 164it [00:17, 8.90it/s] 165it [00:18, 9.12it/s] 166it [00:18, 9.28it/s] 167it [00:18, 8.90it/s] 168it [00:18, 9.09it/s] 169it [00:18, 9.28it/s] 170it [00:18, 8.83it/s] 171it [00:18, 8.98it/s] 172it [00:18, 9.17it/s] 173it [00:18, 8.84it/s] 174it [00:19, 9.06it/s] 175it [00:19, 9.25it/s] 176it [00:19, 8.87it/s] 177it [00:19, 9.06it/s] 178it [00:19, 9.26it/s] 179it [00:19, 8.90it/s] 180it [00:19, 9.10it/s] 181it [00:19, 9.29it/s] 182it [00:19, 8.89it/s] 183it [00:20, 9.12it/s] 184it [00:20, 9.28it/s] 185it [00:20, 9.20it/s] 186it [00:20, 8.71it/s] 187it [00:20, 9.04it/s] 188it [00:20, 9.29it/s] 189it [00:20, 8.91it/s] 190it [00:20, 9.18it/s] 191it [00:20, 9.40it/s] 192it [00:20, 9.55it/s] 193it [00:21, 9.06it/s] 194it [00:21, 9.29it/s] 195it [00:21, 8.94it/s] 196it [00:21, 8.86it/s] 196it [00:21, 9.11it/s] +2025-05-26 04:48:11,331 - INFO - Epoch: 14, Objective: tensor([11565.9922], device='cuda:0', grad_fn=), Loss: 0.11370649188756943, KL/n: 72.74580383300781 + 0it [00:00, ?it/s]2025-05-26 04:48:11,613 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 10721.7217 | mean log_px -0.1022 | KL -3567.32 + 1it [00:00, 5.11it/s] 2it [00:00, 6.65it/s] 3it [00:00, 7.84it/s] 4it [00:00, 8.56it/s] 5it [00:00, 8.40it/s] 6it [00:00, 8.88it/s] 7it [00:00, 9.18it/s] 8it [00:00, 9.39it/s] 10it [00:01, 9.70it/s] 12it [00:01, 9.40it/s] 14it [00:01, 9.63it/s] 15it [00:01, 9.69it/s] 16it [00:01, 9.76it/s] 18it [00:01, 9.87it/s] 20it [00:02, 9.91it/s] 22it [00:02, 9.95it/s] 23it [00:02, 9.55it/s] 25it [00:02, 9.72it/s] 26it [00:02, 9.77it/s] 28it [00:02, 9.84it/s] 30it [00:03, 9.91it/s] 32it [00:03, 9.97it/s] 34it [00:03, 10.00it/s] 36it [00:03, 10.02it/s] 37it [00:03, 10.01it/s] 38it [00:03, 10.00it/s] 40it [00:04, 10.01it/s] 42it [00:04, 10.01it/s] 44it [00:04, 10.01it/s] 46it [00:04, 10.03it/s] 48it [00:04, 10.05it/s] 50it [00:05, 9.71it/s]2025-05-26 04:48:16,716 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 11714.7119 | mean log_px -0.1263 | KL -3566.29 + 51it [00:05, 9.72it/s] 52it [00:05, 9.76it/s] 54it [00:05, 9.84it/s] 55it [00:05, 9.87it/s] 56it [00:05, 9.89it/s] 57it [00:05, 9.91it/s] 58it [00:06, 9.91it/s] 60it [00:06, 9.95it/s] 62it [00:06, 9.56it/s] 63it [00:06, 9.64it/s] 64it [00:06, 9.72it/s] 66it [00:06, 9.87it/s] 67it [00:06, 9.88it/s] 68it [00:07, 9.89it/s] 69it [00:07, 9.92it/s] 70it [00:07, 9.94it/s] 71it [00:07, 9.56it/s] 72it [00:07, 9.68it/s] 74it [00:07, 9.84it/s] 75it [00:07, 9.87it/s] 76it [00:07, 9.90it/s] 78it [00:08, 9.94it/s] 79it [00:08, 9.95it/s] 80it [00:08, 9.96it/s] 82it [00:08, 9.92it/s] 83it [00:08, 9.87it/s] 84it [00:08, 9.84it/s] 86it [00:08, 9.91it/s] 87it [00:08, 9.92it/s] 89it [00:09, 9.99it/s] 90it [00:09, 9.98it/s] 91it [00:09, 9.46it/s] 93it [00:09, 9.72it/s] 94it [00:09, 9.77it/s] 96it [00:09, 9.88it/s] 98it [00:10, 9.95it/s] 100it [00:10, 9.98it/s]2025-05-26 04:48:21,785 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 10056.2070 | mean log_px -0.1000 | KL -3566.32 + 101it [00:10, 9.54it/s] 103it [00:10, 9.71it/s] 104it [00:10, 9.76it/s] 106it [00:10, 9.86it/s] 107it [00:10, 9.88it/s] 108it [00:11, 9.90it/s] 110it [00:11, 9.97it/s] 111it [00:11, 9.98it/s] 112it [00:11, 9.92it/s] 114it [00:11, 9.99it/s] 116it [00:11, 10.01it/s] 117it [00:11, 10.00it/s] 118it [00:12, 10.00it/s] 120it [00:12, 9.54it/s] 121it [00:12, 9.51it/s] 122it [00:12, 9.50it/s] 123it [00:12, 9.58it/s] 124it [00:12, 9.64it/s] 125it [00:12, 9.70it/s] 126it [00:12, 9.75it/s] 127it [00:13, 9.78it/s] 128it [00:13, 9.79it/s] 129it [00:13, 9.80it/s] 130it [00:13, 9.34it/s] 131it [00:13, 9.47it/s] 132it [00:13, 9.52it/s] 133it [00:13, 9.61it/s] 135it [00:13, 9.83it/s] 137it [00:14, 9.93it/s] 138it [00:14, 9.89it/s] 139it [00:14, 9.91it/s] 141it [00:14, 9.98it/s] 142it [00:14, 9.98it/s] 144it [00:14, 10.02it/s] 146it [00:14, 10.02it/s] 147it [00:15, 10.00it/s] 148it [00:15, 9.99it/s] 150it [00:15, 9.99it/s]2025-05-26 04:48:26,878 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 9198.8525 | mean log_px -0.0873 | KL -3561.38 + 151it [00:15, 9.51it/s] 152it [00:15, 9.62it/s] 154it [00:15, 9.79it/s] 155it [00:15, 9.83it/s] 156it [00:15, 9.80it/s] 157it [00:16, 9.79it/s] 158it [00:16, 9.26it/s] 160it [00:16, 9.58it/s] 162it [00:16, 9.76it/s] 164it [00:16, 9.84it/s] 165it [00:16, 9.74it/s] 166it [00:17, 9.52it/s] 167it [00:17, 9.10it/s] 168it [00:17, 8.74it/s] 169it [00:17, 8.98it/s] 170it [00:17, 9.20it/s] 171it [00:17, 9.37it/s] 172it [00:17, 9.51it/s] 173it [00:17, 9.61it/s] 174it [00:17, 9.67it/s] 175it [00:17, 9.72it/s] 176it [00:18, 9.52it/s] 177it [00:18, 9.63it/s] 178it [00:18, 9.70it/s] 179it [00:18, 9.76it/s] 180it [00:18, 9.82it/s] 181it [00:18, 9.85it/s] 182it [00:18, 9.87it/s] 183it [00:18, 9.88it/s] 184it [00:18, 9.86it/s] 185it [00:19, 9.34it/s] 186it [00:19, 9.36it/s] 187it [00:19, 9.53it/s] 188it [00:19, 9.61it/s] 189it [00:19, 9.71it/s] 190it [00:19, 9.75it/s] 191it [00:19, 9.79it/s] 192it [00:19, 9.80it/s] 193it [00:19, 9.83it/s] 194it [00:19, 9.62it/s] 195it [00:20, 9.27it/s] 196it [00:20, 9.69it/s] +2025-05-26 04:48:31,679 - INFO - Epoch: 15, Objective: tensor([12319.4551], device='cuda:0', grad_fn=), Loss: 0.13309964537620544, KL/n: 72.79181671142578 + 0it [00:00, ?it/s]2025-05-26 04:48:31,947 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 7340.2905 | mean log_px -0.0581 | KL -3566.00 + 1it [00:00, 4.84it/s] 2it [00:00, 6.94it/s] 4it [00:00, 8.61it/s] 6it [00:00, 8.63it/s] 7it [00:00, 8.93it/s] 8it [00:00, 9.18it/s] 10it [00:01, 6.66it/s] 12it [00:01, 7.64it/s] 14it [00:01, 8.05it/s] 16it [00:01, 8.62it/s] 18it [00:02, 9.04it/s] 19it [00:02, 8.87it/s] 21it [00:02, 9.26it/s] 22it [00:02, 9.40it/s] 24it [00:02, 9.64it/s] 25it [00:02, 9.37it/s] 27it [00:03, 9.62it/s] 28it [00:03, 9.70it/s] 30it [00:03, 9.50it/s] 31it [00:03, 9.60it/s] 32it [00:03, 9.67it/s] 33it [00:03, 9.74it/s] 34it [00:03, 9.34it/s] 36it [00:04, 9.61it/s] 38it [00:04, 9.43it/s] 40it [00:04, 9.62it/s] 41it [00:04, 9.69it/s] 43it [00:04, 9.52it/s] 44it [00:04, 9.59it/s] 45it [00:04, 9.31it/s] 46it [00:05, 9.46it/s] 48it [00:05, 9.70it/s] 50it [00:05, 9.83it/s]2025-05-26 04:48:37,364 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 9277.7939 | mean log_px -0.0837 | KL -3565.87 + 51it [00:05, 9.87it/s] 52it [00:05, 9.48it/s] 53it [00:05, 9.51it/s] 55it [00:06, 9.29it/s] 56it [00:06, 9.42it/s] 58it [00:06, 9.64it/s] 60it [00:06, 9.40it/s] 62it [00:06, 9.61it/s] 64it [00:06, 9.75it/s] 65it [00:07, 9.79it/s] 66it [00:07, 9.82it/s] 68it [00:07, 9.48it/s] 70it [00:07, 9.67it/s] 72it [00:07, 9.51it/s] 73it [00:07, 9.59it/s] 74it [00:08, 9.65it/s] 76it [00:08, 9.78it/s] 77it [00:08, 9.80it/s] 79it [00:08, 9.59it/s] 80it [00:08, 9.66it/s] 82it [00:08, 9.78it/s] 83it [00:08, 9.45it/s] 85it [00:09, 9.68it/s] 86it [00:09, 9.74it/s] 87it [00:09, 9.78it/s] 88it [00:09, 9.43it/s] 90it [00:09, 9.69it/s] 91it [00:09, 9.73it/s] 92it [00:09, 9.38it/s] 93it [00:09, 9.06it/s] 95it [00:10, 9.44it/s] 97it [00:10, 9.67it/s] 98it [00:10, 9.70it/s] 99it [00:10, 9.76it/s] 100it [00:10, 9.80it/s]2025-05-26 04:48:42,568 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 11751.0801 | mean log_px -0.1212 | KL -3566.18 + 101it [00:10, 9.84it/s] 102it [00:10, 9.75it/s] 104it [00:11, 9.50it/s] 105it [00:11, 9.60it/s] 106it [00:11, 9.69it/s] 108it [00:11, 9.85it/s] 109it [00:11, 9.51it/s] 110it [00:11, 9.61it/s] 112it [00:11, 9.78it/s] 113it [00:12, 9.32it/s] 114it [00:12, 9.46it/s] 116it [00:12, 9.67it/s] 117it [00:12, 9.26it/s] 119it [00:12, 9.54it/s] 120it [00:12, 9.63it/s] 121it [00:12, 9.23it/s] 122it [00:13, 9.40it/s] 124it [00:13, 9.64it/s] 126it [00:13, 9.79it/s] 127it [00:13, 9.82it/s] 129it [00:13, 9.91it/s] 130it [00:13, 9.56it/s] 132it [00:14, 9.73it/s] 134it [00:14, 9.83it/s] 135it [00:14, 9.52it/s] 136it [00:14, 9.61it/s] 138it [00:14, 9.76it/s] 139it [00:14, 9.42it/s] 140it [00:14, 9.54it/s] 141it [00:14, 9.63it/s] 142it [00:15, 9.69it/s] 143it [00:15, 9.76it/s] 144it [00:15, 9.80it/s] 146it [00:15, 9.49it/s] 148it [00:15, 9.68it/s] 150it [00:15, 9.50it/s]2025-05-26 04:48:47,776 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 10209.6055 | mean log_px -0.0996 | KL -3564.47 + 151it [00:16, 9.58it/s] 153it [00:16, 9.75it/s] 154it [00:16, 9.80it/s] 155it [00:16, 9.81it/s] 156it [00:16, 9.42it/s] 157it [00:16, 9.54it/s] 158it [00:16, 9.64it/s] 159it [00:16, 9.72it/s] 160it [00:16, 9.32it/s] 162it [00:17, 9.61it/s] 163it [00:17, 9.69it/s] 164it [00:17, 9.72it/s] 165it [00:17, 9.79it/s] 166it [00:17, 9.38it/s] 168it [00:17, 9.67it/s] 170it [00:17, 9.49it/s] 171it [00:18, 9.58it/s] 172it [00:18, 9.67it/s] 174it [00:18, 9.47it/s] 176it [00:18, 9.67it/s] 178it [00:18, 9.78it/s] 179it [00:18, 9.49it/s] 180it [00:19, 9.58it/s] 182it [00:19, 9.75it/s] 183it [00:19, 9.45it/s] 184it [00:19, 9.55it/s] 186it [00:19, 9.74it/s] 187it [00:19, 9.78it/s] 188it [00:19, 9.32it/s] 190it [00:20, 9.19it/s] 191it [00:20, 9.34it/s] 192it [00:20, 9.49it/s] 193it [00:20, 9.61it/s] 194it [00:20, 9.70it/s] 195it [00:20, 9.38it/s] 196it [00:20, 9.44it/s] +2025-05-26 04:48:52,573 - INFO - Epoch: 16, Objective: tensor([10027.8145], device='cuda:0', grad_fn=), Loss: 0.09540171176195145, KL/n: 72.8223648071289 + 0it [00:00, ?it/s]2025-05-26 04:48:52,847 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 10231.7510 | mean log_px -0.0985 | KL -3565.85 + 1it [00:00, 4.68it/s] 2it [00:00, 6.80it/s] 4it [00:00, 8.55it/s] 5it [00:00, 8.54it/s] 6it [00:00, 8.94it/s] 7it [00:00, 9.22it/s] 8it [00:00, 9.44it/s] 10it [00:01, 9.23it/s] 12it [00:01, 9.51it/s] 13it [00:01, 9.55it/s] 14it [00:01, 9.57it/s] 16it [00:01, 9.74it/s] 17it [00:01, 9.33it/s] 18it [00:01, 9.46it/s] 20it [00:02, 9.70it/s] 22it [00:02, 9.36it/s] 23it [00:02, 9.37it/s] 24it [00:02, 9.45it/s] 25it [00:02, 9.46it/s] 26it [00:02, 9.15it/s] 27it [00:02, 9.36it/s] 28it [00:03, 9.48it/s] 29it [00:03, 9.16it/s] 30it [00:03, 9.37it/s] 31it [00:03, 9.50it/s] 32it [00:03, 9.03it/s] 33it [00:03, 9.21it/s] 34it [00:03, 9.35it/s] 35it [00:03, 9.39it/s] 36it [00:03, 9.33it/s] 37it [00:04, 8.85it/s] 38it [00:04, 9.07it/s] 39it [00:04, 9.28it/s] 40it [00:04, 9.42it/s] 41it [00:04, 9.01it/s] 42it [00:04, 9.25it/s] 44it [00:04, 9.19it/s] 45it [00:04, 9.32it/s] 46it [00:04, 9.43it/s] 47it [00:05, 9.03it/s] 48it [00:05, 9.26it/s] 49it [00:05, 9.46it/s]2025-05-26 04:48:58,180 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 8144.4380 | mean log_px -0.0670 | KL -3562.43 + 51it [00:05, 9.21it/s] 52it [00:05, 9.37it/s] 53it [00:05, 9.52it/s] 54it [00:05, 9.64it/s] 55it [00:05, 9.72it/s] 56it [00:06, 9.31it/s] 58it [00:06, 9.60it/s] 59it [00:06, 9.68it/s] 60it [00:06, 9.32it/s] 61it [00:06, 9.45it/s] 62it [00:06, 9.56it/s] 63it [00:06, 9.67it/s] 64it [00:06, 9.13it/s] 66it [00:07, 9.47it/s] 67it [00:07, 9.57it/s] 68it [00:07, 9.14it/s] 69it [00:07, 9.34it/s] 70it [00:07, 9.51it/s] 71it [00:07, 9.64it/s] 72it [00:07, 9.10it/s] 73it [00:07, 9.28it/s] 74it [00:07, 9.44it/s] 75it [00:08, 9.58it/s] 76it [00:08, 9.09it/s] 77it [00:08, 9.33it/s] 78it [00:08, 9.44it/s] 79it [00:08, 9.44it/s] 80it [00:08, 9.09it/s] 81it [00:08, 8.79it/s] 82it [00:08, 9.05it/s] 83it [00:08, 9.26it/s] 84it [00:09, 9.46it/s] 85it [00:09, 9.00it/s] 86it [00:09, 9.23it/s] 87it [00:09, 9.42it/s] 88it [00:09, 9.58it/s] 90it [00:09, 9.68it/s] 92it [00:09, 9.81it/s] 94it [00:10, 9.85it/s] 95it [00:10, 9.87it/s] 96it [00:10, 9.41it/s] 97it [00:10, 9.53it/s] 98it [00:10, 9.60it/s] 100it [00:10, 9.75it/s]2025-05-26 04:49:03,470 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 8396.8623 | mean log_px -0.0690 | KL -3563.99 + 101it [00:10, 9.29it/s] 102it [00:10, 9.44it/s] 103it [00:11, 9.56it/s] 104it [00:11, 9.64it/s] 105it [00:11, 9.73it/s] 106it [00:11, 9.79it/s] 107it [00:11, 9.85it/s] 108it [00:11, 9.85it/s] 109it [00:11, 9.89it/s] 110it [00:11, 9.40it/s] 111it [00:11, 9.57it/s] 112it [00:11, 9.65it/s] 113it [00:12, 9.17it/s] 114it [00:12, 9.37it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.66it/s] 117it [00:12, 9.28it/s] 118it [00:12, 9.44it/s] 120it [00:12, 9.70it/s] 121it [00:12, 9.33it/s] 123it [00:13, 9.59it/s] 124it [00:13, 9.66it/s] 126it [00:13, 9.79it/s] 127it [00:13, 9.83it/s] 128it [00:13, 9.85it/s] 129it [00:13, 9.87it/s] 130it [00:13, 9.90it/s] 131it [00:13, 9.90it/s] 132it [00:14, 9.90it/s] 133it [00:14, 9.90it/s] 134it [00:14, 9.90it/s] 135it [00:14, 9.93it/s] 136it [00:14, 9.89it/s] 137it [00:14, 9.92it/s] 138it [00:14, 9.89it/s] 139it [00:14, 9.92it/s] 140it [00:14, 9.93it/s] 141it [00:14, 9.91it/s] 142it [00:15, 9.89it/s] 143it [00:15, 9.89it/s] 144it [00:15, 9.91it/s] 145it [00:15, 9.94it/s] 146it [00:15, 9.92it/s] 147it [00:15, 9.92it/s] 148it [00:15, 9.40it/s] 149it [00:15, 9.57it/s] 150it [00:15, 9.65it/s]2025-05-26 04:49:08,623 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 9258.7881 | mean log_px -0.0835 | KL -3569.38 + 151it [00:15, 9.10it/s] 152it [00:16, 9.32it/s] 153it [00:16, 9.51it/s] 154it [00:16, 9.65it/s] 155it [00:16, 9.73it/s] 156it [00:16, 9.80it/s] 158it [00:16, 9.89it/s] 160it [00:16, 9.94it/s] 162it [00:17, 9.69it/s] 163it [00:17, 9.73it/s] 164it [00:17, 9.78it/s] 165it [00:17, 9.82it/s] 166it [00:17, 9.83it/s] 168it [00:17, 9.92it/s] 170it [00:17, 9.96it/s] 171it [00:18, 9.50it/s] 172it [00:18, 9.59it/s] 174it [00:18, 9.77it/s] 175it [00:18, 9.79it/s] 176it [00:18, 9.83it/s] 177it [00:18, 9.86it/s] 178it [00:18, 9.88it/s] 179it [00:18, 9.90it/s] 180it [00:18, 9.85it/s] 181it [00:19, 9.88it/s] 182it [00:19, 9.87it/s] 184it [00:19, 9.94it/s] 186it [00:19, 9.97it/s] 187it [00:19, 9.92it/s] 188it [00:19, 9.48it/s] 189it [00:19, 9.57it/s] 190it [00:19, 9.67it/s] 192it [00:20, 9.83it/s] 194it [00:20, 9.90it/s] 195it [00:20, 9.59it/s] 196it [00:20, 9.35it/s] 196it [00:20, 9.49it/s] +2025-05-26 04:49:13,350 - INFO - Epoch: 17, Objective: tensor([9598.7822], device='cuda:0', grad_fn=), Loss: 0.08933060616254807, KL/n: 72.83203125 + 0it [00:00, ?it/s]2025-05-26 04:49:13,817 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 12348.8164 | mean log_px -0.1254 | KL -3569.31 + 1it [00:00, 5.28it/s] 2it [00:00, 6.76it/s] 4it [00:00, 8.50it/s] 6it [00:00, 9.15it/s] 8it [00:00, 9.15it/s] 10it [00:01, 9.47it/s] 12it [00:01, 9.29it/s] 14it [00:01, 9.52it/s] 16it [00:01, 9.68it/s] 18it [00:01, 9.80it/s] 20it [00:02, 9.87it/s] 22it [00:02, 9.92it/s] 24it [00:02, 9.96it/s] 26it [00:02, 10.00it/s] 28it [00:02, 10.02it/s] 30it [00:03, 10.00it/s] 32it [00:03, 10.00it/s] 33it [00:03, 9.85it/s] 34it [00:03, 9.52it/s] 36it [00:03, 9.70it/s] 38it [00:03, 9.83it/s] 40it [00:04, 9.89it/s] 42it [00:04, 9.94it/s] 44it [00:04, 9.99it/s] 46it [00:04, 10.00it/s] 48it [00:04, 10.02it/s] 50it [00:05, 10.01it/s]2025-05-26 04:49:18,896 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 8044.7241 | mean log_px -0.0678 | KL -3567.06 + 51it [00:05, 9.51it/s] 52it [00:05, 9.60it/s] 53it [00:05, 9.59it/s] 54it [00:05, 9.28it/s] 56it [00:05, 9.57it/s] 58it [00:06, 9.71it/s] 59it [00:06, 9.63it/s] 60it [00:06, 9.23it/s] 61it [00:06, 9.39it/s] 62it [00:06, 9.51it/s] 63it [00:06, 9.60it/s] 64it [00:06, 9.13it/s] 65it [00:06, 9.24it/s] 66it [00:06, 9.43it/s] 67it [00:06, 9.56it/s] 68it [00:07, 9.10it/s] 70it [00:07, 9.54it/s] 72it [00:07, 9.32it/s] 74it [00:07, 9.38it/s] 76it [00:07, 9.28it/s] 78it [00:08, 9.53it/s] 80it [00:08, 9.45it/s] 82it [00:08, 9.65it/s] 84it [00:08, 9.53it/s] 86it [00:08, 9.69it/s] 88it [00:09, 9.56it/s] 89it [00:09, 9.62it/s] 91it [00:09, 9.49it/s] 93it [00:09, 9.70it/s] 95it [00:09, 9.48it/s] 97it [00:10, 9.67it/s] 99it [00:10, 9.54it/s]2025-05-26 04:49:24,168 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 8123.0947 | mean log_px -0.0684 | KL -3570.99 + 101it [00:10, 9.69it/s] 103it [00:10, 9.55it/s] 105it [00:10, 9.73it/s] 107it [00:11, 9.59it/s] 108it [00:11, 9.63it/s] 110it [00:11, 9.50it/s] 111it [00:11, 9.55it/s] 113it [00:11, 9.76it/s] 115it [00:12, 9.52it/s] 117it [00:12, 9.71it/s] 119it [00:12, 9.57it/s] 121it [00:12, 9.74it/s] 122it [00:12, 9.49it/s] 124it [00:12, 9.71it/s] 126it [00:13, 9.47it/s] 128it [00:13, 9.66it/s] 129it [00:13, 9.42it/s] 131it [00:13, 9.65it/s] 133it [00:13, 9.81it/s] 134it [00:13, 9.45it/s] 136it [00:14, 9.69it/s] 138it [00:14, 9.70it/s] 139it [00:14, 9.11it/s] 140it [00:14, 9.27it/s] 142it [00:14, 9.54it/s] 143it [00:14, 9.61it/s] 144it [00:15, 9.66it/s] 145it [00:15, 9.71it/s] 146it [00:15, 9.76it/s] 148it [00:15, 9.85it/s] 149it [00:15, 9.88it/s] 150it [00:15, 9.82it/s]2025-05-26 04:49:29,366 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 6793.8252 | mean log_px -0.0610 | KL -3563.42 + 151it [00:15, 9.30it/s] 152it [00:15, 9.42it/s] 153it [00:15, 9.33it/s] 154it [00:16, 9.50it/s] 155it [00:16, 8.96it/s] 156it [00:16, 9.24it/s] 158it [00:16, 9.09it/s] 159it [00:16, 9.30it/s] 160it [00:16, 9.47it/s] 161it [00:16, 9.09it/s] 163it [00:17, 9.52it/s] 164it [00:17, 9.18it/s] 166it [00:17, 9.53it/s] 167it [00:17, 9.19it/s] 169it [00:17, 9.54it/s] 171it [00:17, 9.75it/s] 172it [00:18, 9.39it/s] 174it [00:18, 9.64it/s] 176it [00:18, 9.43it/s] 178it [00:18, 9.65it/s] 180it [00:18, 9.46it/s] 182it [00:19, 9.65it/s] 184it [00:19, 9.79it/s] 185it [00:19, 9.46it/s] 187it [00:19, 9.66it/s] 189it [00:19, 9.45it/s] 191it [00:19, 9.65it/s] 193it [00:20, 9.46it/s] 195it [00:20, 9.42it/s] 196it [00:20, 9.20it/s] 196it [00:20, 9.52it/s] +2025-05-26 04:49:34,262 - INFO - Epoch: 18, Objective: tensor([8188.5557], device='cuda:0', grad_fn=), Loss: 0.07669003307819366, KL/n: 72.82756805419922 + 0it [00:00, ?it/s]2025-05-26 04:49:34,539 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 6962.9434 | mean log_px -0.0530 | KL -3566.80 + 1it [00:00, 5.26it/s] 2it [00:00, 7.27it/s] 3it [00:00, 7.68it/s] 4it [00:00, 8.37it/s] 6it [00:00, 8.70it/s] 8it [00:00, 9.23it/s] 10it [00:01, 9.14it/s] 12it [00:01, 9.44it/s] 13it [00:01, 9.25it/s] 14it [00:01, 9.40it/s] 16it [00:01, 9.63it/s] 17it [00:01, 9.37it/s] 19it [00:02, 9.62it/s] 21it [00:02, 9.46it/s] 22it [00:02, 9.53it/s] 24it [00:02, 9.72it/s] 26it [00:02, 9.52it/s] 28it [00:03, 9.69it/s] 30it [00:03, 9.45it/s] 32it [00:03, 9.59it/s] 34it [00:03, 9.73it/s] 36it [00:03, 9.57it/s] 38it [00:04, 9.71it/s] 40it [00:04, 9.56it/s] 41it [00:04, 9.63it/s] 43it [00:04, 9.77it/s] 44it [00:04, 9.48it/s] 46it [00:04, 9.69it/s] 48it [00:05, 9.53it/s] 49it [00:05, 9.61it/s]2025-05-26 04:49:39,766 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 11381.5762 | mean log_px -0.1166 | KL -3569.48 + 51it [00:05, 9.39it/s] 52it [00:05, 9.50it/s] 54it [00:05, 9.70it/s] 56it [00:05, 9.76it/s] 57it [00:06, 9.74it/s] 58it [00:06, 9.72it/s] 59it [00:06, 9.69it/s] 60it [00:06, 9.65it/s] 61it [00:06, 9.67it/s] 62it [00:06, 9.73it/s] 63it [00:06, 9.30it/s] 64it [00:06, 9.36it/s] 65it [00:06, 9.53it/s] 66it [00:06, 9.66it/s] 68it [00:07, 9.83it/s] 69it [00:07, 9.45it/s] 70it [00:07, 9.57it/s] 72it [00:07, 9.77it/s] 73it [00:07, 9.32it/s] 75it [00:07, 9.60it/s] 77it [00:08, 9.76it/s] 79it [00:08, 9.58it/s] 81it [00:08, 9.75it/s] 83it [00:08, 9.58it/s] 85it [00:08, 9.74it/s] 87it [00:09, 9.58it/s] 89it [00:09, 9.73it/s] 91it [00:09, 9.58it/s] 93it [00:09, 9.73it/s] 94it [00:09, 9.49it/s] 96it [00:10, 9.64it/s] 97it [00:10, 9.16it/s] 98it [00:10, 9.32it/s] 100it [00:10, 9.20it/s]2025-05-26 04:49:45,004 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 8565.3213 | mean log_px -0.0776 | KL -3569.59 + 101it [00:10, 9.34it/s] 102it [00:10, 9.03it/s] 103it [00:10, 9.23it/s] 104it [00:10, 9.42it/s] 106it [00:11, 9.22it/s] 107it [00:11, 9.37it/s] 108it [00:11, 9.51it/s] 109it [00:11, 9.62it/s] 110it [00:11, 9.16it/s] 112it [00:11, 9.50it/s] 113it [00:11, 9.61it/s] 114it [00:12, 9.19it/s] 115it [00:12, 9.39it/s] 116it [00:12, 9.55it/s] 117it [00:12, 9.65it/s] 118it [00:12, 9.14it/s] 120it [00:12, 9.52it/s] 121it [00:12, 9.63it/s] 122it [00:12, 9.20it/s] 124it [00:13, 9.54it/s] 125it [00:13, 9.19it/s] 126it [00:13, 9.38it/s] 128it [00:13, 9.32it/s] 130it [00:13, 9.59it/s] 132it [00:13, 9.45it/s] 134it [00:14, 9.64it/s] 135it [00:14, 9.40it/s] 137it [00:14, 9.61it/s] 139it [00:14, 9.46it/s] 140it [00:14, 9.55it/s] 142it [00:14, 9.72it/s] 144it [00:15, 9.55it/s] 146it [00:15, 9.72it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.57it/s] 149it [00:15, 9.67it/s]2025-05-26 04:49:50,266 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 7441.7295 | mean log_px -0.0628 | KL -3567.16 + 151it [00:15, 9.39it/s] 152it [00:16, 9.51it/s] 154it [00:16, 9.71it/s] 156it [00:16, 9.83it/s] 157it [00:16, 9.52it/s] 158it [00:16, 9.57it/s] 160it [00:16, 9.75it/s] 162it [00:17, 9.54it/s] 164it [00:17, 9.70it/s] 166it [00:17, 9.47it/s] 167it [00:17, 9.56it/s] 168it [00:17, 9.64it/s] 170it [00:17, 9.79it/s] 172it [00:18, 9.58it/s] 173it [00:18, 9.54it/s] 174it [00:18, 9.56it/s] 175it [00:18, 9.55it/s] 176it [00:18, 9.59it/s] 177it [00:18, 9.67it/s] 178it [00:18, 9.69it/s] 179it [00:18, 9.73it/s] 180it [00:18, 9.73it/s] 181it [00:19, 9.74it/s] 182it [00:19, 9.79it/s] 183it [00:19, 9.80it/s] 184it [00:19, 9.81it/s] 185it [00:19, 9.82it/s] 186it [00:19, 9.84it/s] 187it [00:19, 9.85it/s] 188it [00:19, 9.82it/s] 189it [00:19, 9.83it/s] 190it [00:19, 9.83it/s] 191it [00:20, 9.84it/s] 192it [00:20, 9.79it/s] 193it [00:20, 9.82it/s] 194it [00:20, 9.84it/s] 195it [00:20, 8.84it/s] 196it [00:20, 9.49it/s] +2025-05-26 04:49:55,047 - INFO - Epoch: 19, Objective: tensor([7893.3765], device='cuda:0', grad_fn=), Loss: 0.061493679881095886, KL/n: 72.83820343017578 + 0it [00:00, ?it/s]2025-05-26 04:49:55,500 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 6628.0117 | mean log_px -0.0495 | KL -3568.11 + 1it [00:00, 5.44it/s] 2it [00:00, 6.75it/s] 4it [00:00, 8.49it/s] 5it [00:00, 8.89it/s] 6it [00:00, 8.64it/s] 8it [00:00, 9.23it/s] 10it [00:01, 9.14it/s] 11it [00:01, 9.29it/s] 12it [00:01, 9.43it/s] 13it [00:01, 9.54it/s] 14it [00:01, 9.12it/s] 15it [00:01, 9.34it/s] 16it [00:01, 8.95it/s] 18it [00:02, 9.38it/s] 19it [00:02, 9.51it/s] 20it [00:02, 9.11it/s] 22it [00:02, 9.49it/s] 23it [00:02, 9.14it/s] 24it [00:02, 9.34it/s] 26it [00:02, 9.62it/s] 27it [00:02, 9.37it/s] 29it [00:03, 9.63it/s] 30it [00:03, 9.35it/s] 32it [00:03, 9.61it/s] 33it [00:03, 9.34it/s] 35it [00:03, 9.22it/s] 36it [00:03, 9.34it/s] 37it [00:04, 9.37it/s] 38it [00:04, 9.32it/s] 39it [00:04, 8.98it/s] 40it [00:04, 9.20it/s] 41it [00:04, 9.38it/s] 42it [00:04, 8.96it/s] 43it [00:04, 9.22it/s] 44it [00:04, 8.86it/s] 45it [00:04, 9.15it/s] 46it [00:05, 9.34it/s] 47it [00:05, 9.49it/s] 48it [00:05, 9.02it/s] 49it [00:05, 9.29it/s] 50it [00:05, 9.47it/s]2025-05-26 04:50:00,856 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 7019.3750 | mean log_px -0.0534 | KL -3567.79 + 51it [00:05, 9.60it/s] 52it [00:05, 9.10it/s] 54it [00:05, 9.52it/s] 56it [00:06, 9.30it/s] 58it [00:06, 9.48it/s] 59it [00:06, 9.56it/s] 60it [00:06, 9.08it/s] 62it [00:06, 9.44it/s] 64it [00:06, 9.67it/s] 66it [00:07, 9.49it/s] 67it [00:07, 9.39it/s] 68it [00:07, 9.46it/s] 69it [00:07, 9.54it/s] 71it [00:07, 9.76it/s] 72it [00:07, 9.81it/s] 74it [00:07, 9.58it/s] 76it [00:08, 9.78it/s] 77it [00:08, 9.50it/s] 79it [00:08, 9.71it/s] 80it [00:08, 9.76it/s] 81it [00:08, 9.73it/s] 82it [00:08, 9.27it/s] 84it [00:08, 9.61it/s] 86it [00:09, 9.80it/s] 87it [00:09, 9.51it/s] 89it [00:09, 9.73it/s] 90it [00:09, 9.44it/s] 91it [00:09, 9.56it/s] 92it [00:09, 9.62it/s] 93it [00:09, 9.66it/s] 95it [00:10, 9.84it/s] 96it [00:10, 9.49it/s] 97it [00:10, 9.61it/s] 99it [00:10, 9.36it/s]2025-05-26 04:50:06,088 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 9756.4814 | mean log_px -0.0918 | KL -3565.89 + 101it [00:10, 9.60it/s] 102it [00:10, 9.65it/s] 104it [00:11, 9.81it/s] 105it [00:11, 9.50it/s] 106it [00:11, 9.57it/s] 108it [00:11, 9.77it/s] 109it [00:11, 9.74it/s] 111it [00:11, 9.53it/s] 113it [00:12, 9.74it/s] 115it [00:12, 9.56it/s] 117it [00:12, 9.73it/s] 118it [00:12, 9.39it/s] 119it [00:12, 9.48it/s] 121it [00:12, 9.73it/s] 123it [00:13, 9.85it/s] 124it [00:13, 9.49it/s] 125it [00:13, 9.57it/s] 127it [00:13, 9.79it/s] 128it [00:13, 9.48it/s] 130it [00:13, 9.72it/s] 131it [00:13, 9.44it/s] 133it [00:14, 9.70it/s] 135it [00:14, 9.77it/s] 136it [00:14, 9.41it/s] 137it [00:14, 9.53it/s] 139it [00:14, 9.76it/s] 140it [00:14, 9.46it/s] 142it [00:15, 9.71it/s] 143it [00:15, 9.43it/s] 145it [00:15, 9.69it/s] 147it [00:15, 9.54it/s] 149it [00:15, 9.73it/s]2025-05-26 04:50:11,268 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 6741.2627 | mean log_px -0.0465 | KL -3565.47 + 151it [00:15, 9.50it/s] 153it [00:16, 9.69it/s] 155it [00:16, 9.55it/s] 156it [00:16, 9.62it/s] 158it [00:16, 9.79it/s] 159it [00:16, 9.43it/s] 161it [00:17, 9.66it/s] 163it [00:17, 9.53it/s] 165it [00:17, 9.69it/s] 167it [00:17, 9.55it/s] 168it [00:17, 9.62it/s] 170it [00:17, 9.79it/s] 172it [00:18, 9.61it/s] 174it [00:18, 9.77it/s] 176it [00:18, 9.54it/s] 178it [00:18, 9.72it/s] 179it [00:18, 9.48it/s] 181it [00:19, 9.70it/s] 182it [00:19, 9.45it/s] 184it [00:19, 9.68it/s] 186it [00:19, 9.54it/s] 188it [00:19, 9.72it/s] 189it [00:19, 9.48it/s] 190it [00:20, 9.58it/s] 191it [00:20, 9.62it/s] 192it [00:20, 9.32it/s] 194it [00:20, 9.65it/s] 195it [00:20, 8.93it/s] 196it [00:20, 9.46it/s] +2025-05-26 04:50:16,083 - INFO - Epoch: 20, Objective: tensor([5954.1396], device='cuda:0', grad_fn=), Loss: 0.034850478172302246, KL/n: 72.82156372070312 + 0it [00:00, ?it/s]2025-05-26 04:50:16,359 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 7638.6367 | mean log_px -0.0598 | KL -3567.85 + 1it [00:00, 5.32it/s] 2it [00:00, 6.66it/s] 4it [00:00, 8.50it/s] 5it [00:00, 8.91it/s] 6it [00:00, 8.78it/s] 8it [00:00, 9.38it/s] 9it [00:01, 9.17it/s] 11it [00:01, 9.55it/s] 12it [00:01, 9.29it/s] 14it [00:01, 9.62it/s] 15it [00:01, 9.28it/s] 17it [00:01, 9.59it/s] 19it [00:02, 9.48it/s] 21it [00:02, 9.70it/s] 23it [00:02, 9.57it/s] 25it [00:02, 9.75it/s] 27it [00:02, 9.59it/s] 29it [00:03, 9.74it/s] 31it [00:03, 9.59it/s] 33it [00:03, 9.75it/s] 34it [00:03, 9.44it/s] 36it [00:03, 9.67it/s] 37it [00:03, 9.42it/s] 39it [00:04, 9.68it/s] 40it [00:04, 9.41it/s] 42it [00:04, 9.66it/s] 44it [00:04, 9.53it/s] 46it [00:04, 9.73it/s] 48it [00:05, 9.59it/s] 50it [00:05, 9.76it/s]2025-05-26 04:50:21,565 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 12824.7617 | mean log_px -0.1392 | KL -3568.71 + 51it [00:05, 9.45it/s] 53it [00:05, 9.68it/s] 54it [00:05, 9.34it/s] 56it [00:05, 9.62it/s] 58it [00:06, 9.79it/s] 59it [00:06, 9.52it/s] 61it [00:06, 9.74it/s] 63it [00:06, 9.58it/s] 65it [00:06, 9.75it/s] 66it [00:06, 9.40it/s] 68it [00:07, 9.64it/s] 70it [00:07, 9.52it/s] 72it [00:07, 9.72it/s] 73it [00:07, 9.40it/s] 75it [00:07, 9.66it/s] 76it [00:08, 9.70it/s] 78it [00:08, 9.56it/s] 80it [00:08, 9.76it/s] 81it [00:08, 9.50it/s] 83it [00:08, 9.72it/s] 85it [00:08, 9.57it/s] 87it [00:09, 9.75it/s] 88it [00:09, 9.49it/s] 90it [00:09, 9.70it/s] 92it [00:09, 9.49it/s] 94it [00:09, 9.69it/s] 96it [00:10, 9.55it/s] 98it [00:10, 9.73it/s] 99it [00:10, 9.48it/s]2025-05-26 04:50:26,778 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 9816.6523 | mean log_px -0.1053 | KL -3570.17 + 101it [00:10, 9.65it/s] 102it [00:10, 9.22it/s] 104it [00:10, 9.22it/s] 106it [00:11, 9.49it/s] 108it [00:11, 9.69it/s] 110it [00:11, 9.83it/s] 112it [00:11, 9.93it/s] 114it [00:11, 10.00it/s] 116it [00:12, 10.03it/s] 118it [00:12, 10.07it/s] 120it [00:12, 10.09it/s] 122it [00:12, 9.75it/s] 124it [00:12, 9.85it/s] 126it [00:13, 9.94it/s] 128it [00:13, 9.99it/s] 130it [00:13, 10.03it/s] 132it [00:13, 10.06it/s] 134it [00:13, 10.09it/s] 136it [00:14, 10.10it/s] 138it [00:14, 10.11it/s] 140it [00:14, 10.04it/s] 142it [00:14, 9.56it/s] 143it [00:14, 9.62it/s] 144it [00:14, 9.69it/s] 146it [00:15, 9.82it/s] 148it [00:15, 9.92it/s] 150it [00:15, 9.96it/s]2025-05-26 04:50:31,836 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 6365.2271 | mean log_px -0.0422 | KL -3569.45 + 151it [00:15, 9.55it/s] 152it [00:15, 9.62it/s] 154it [00:15, 9.78it/s] 156it [00:16, 9.91it/s] 158it [00:16, 9.99it/s] 160it [00:16, 9.66it/s] 162it [00:16, 9.81it/s] 164it [00:16, 9.91it/s] 166it [00:17, 9.97it/s] 167it [00:17, 9.61it/s] 169it [00:17, 9.78it/s] 171it [00:17, 9.89it/s] 173it [00:17, 9.97it/s] 175it [00:18, 10.02it/s] 177it [00:18, 10.06it/s] 179it [00:18, 9.67it/s] 181it [00:18, 9.80it/s] 183it [00:18, 9.91it/s] 185it [00:19, 9.99it/s] 187it [00:19, 10.03it/s] 189it [00:19, 10.07it/s] 191it [00:19, 9.74it/s] 193it [00:19, 9.87it/s] 195it [00:20, 9.69it/s] 196it [00:20, 9.66it/s] +2025-05-26 04:50:36,511 - INFO - Epoch: 21, Objective: tensor([6160.0498], device='cuda:0', grad_fn=), Loss: 0.040021877735853195, KL/n: 72.79065704345703 + 0it [00:00, ?it/s]2025-05-26 04:50:36,969 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 9817.3037 | mean log_px -0.0940 | KL -3564.62 + 1it [00:00, 4.72it/s] 3it [00:00, 7.80it/s] 5it [00:00, 8.81it/s] 6it [00:00, 9.09it/s] 8it [00:00, 9.50it/s] 10it [00:01, 9.71it/s] 12it [00:01, 9.83it/s] 13it [00:01, 9.79it/s] 14it [00:01, 9.32it/s] 16it [00:01, 9.60it/s] 18it [00:01, 9.76it/s] 19it [00:02, 9.70it/s] 20it [00:02, 9.76it/s] 22it [00:02, 9.88it/s] 24it [00:02, 9.97it/s] 26it [00:02, 10.00it/s] 28it [00:02, 10.02it/s] 29it [00:03, 9.97it/s] 30it [00:03, 9.97it/s] 31it [00:03, 9.97it/s] 32it [00:03, 9.97it/s] 33it [00:03, 9.96it/s] 34it [00:03, 9.94it/s] 35it [00:03, 9.84it/s] 36it [00:03, 9.84it/s] 37it [00:03, 9.87it/s] 38it [00:03, 9.87it/s] 39it [00:04, 9.87it/s] 40it [00:04, 9.88it/s] 42it [00:04, 9.95it/s] 44it [00:04, 9.99it/s] 46it [00:04, 10.01it/s] 47it [00:04, 9.97it/s] 48it [00:04, 9.97it/s] 50it [00:05, 9.77it/s]2025-05-26 04:50:42,043 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 8459.5879 | mean log_px -0.0763 | KL -3567.08 + 51it [00:05, 9.45it/s] 52it [00:05, 9.57it/s] 53it [00:05, 9.63it/s] 54it [00:05, 9.70it/s] 55it [00:05, 9.74it/s] 56it [00:05, 9.31it/s] 58it [00:05, 9.62it/s] 59it [00:06, 9.70it/s] 61it [00:06, 9.84it/s] 63it [00:06, 9.92it/s] 64it [00:06, 9.92it/s] 66it [00:06, 9.98it/s] 68it [00:06, 10.01it/s] 70it [00:07, 10.03it/s] 72it [00:07, 10.03it/s] 74it [00:07, 9.65it/s] 75it [00:07, 9.71it/s] 77it [00:07, 9.83it/s] 78it [00:08, 9.86it/s] 80it [00:08, 9.92it/s] 82it [00:08, 9.96it/s] 83it [00:08, 9.54it/s] 84it [00:08, 9.63it/s] 85it [00:08, 9.72it/s] 86it [00:08, 9.79it/s] 88it [00:09, 9.90it/s] 90it [00:09, 9.95it/s] 92it [00:09, 9.99it/s] 93it [00:09, 9.56it/s] 95it [00:09, 9.74it/s] 96it [00:09, 9.78it/s] 98it [00:10, 9.86it/s] 100it [00:10, 9.92it/s]2025-05-26 04:50:47,141 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 9265.9893 | mean log_px -0.0819 | KL -3570.15 + 101it [00:10, 9.50it/s] 103it [00:10, 9.69it/s] 105it [00:10, 9.82it/s] 106it [00:10, 9.85it/s] 108it [00:11, 9.52it/s] 109it [00:11, 9.61it/s] 110it [00:11, 9.67it/s] 111it [00:11, 9.69it/s] 112it [00:11, 9.72it/s] 113it [00:11, 9.78it/s] 114it [00:11, 9.79it/s] 115it [00:11, 9.85it/s] 116it [00:11, 9.86it/s] 117it [00:12, 9.26it/s] 118it [00:12, 9.43it/s] 120it [00:12, 9.60it/s] 121it [00:12, 9.65it/s] 122it [00:12, 9.72it/s] 124it [00:12, 9.31it/s] 125it [00:12, 9.46it/s] 127it [00:13, 9.68it/s] 128it [00:13, 9.39it/s] 130it [00:13, 9.63it/s] 132it [00:13, 9.78it/s] 134it [00:13, 9.87it/s] 136it [00:13, 9.93it/s] 138it [00:14, 9.97it/s] 140it [00:14, 10.00it/s] 142it [00:14, 10.02it/s] 144it [00:14, 10.03it/s] 146it [00:14, 10.03it/s] 148it [00:15, 10.03it/s] 150it [00:15, 10.04it/s]2025-05-26 04:50:52,258 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 8519.6299 | mean log_px -0.0768 | KL -3566.00 + 152it [00:15, 9.70it/s] 154it [00:15, 9.80it/s] 156it [00:16, 9.55it/s] 158it [00:16, 9.69it/s] 160it [00:16, 9.80it/s] 161it [00:16, 9.44it/s] 162it [00:16, 9.53it/s] 164it [00:16, 9.71it/s] 166it [00:17, 9.82it/s] 168it [00:17, 9.89it/s] 169it [00:17, 9.90it/s] 170it [00:17, 9.91it/s] 172it [00:17, 9.96it/s] 174it [00:17, 9.60it/s] 175it [00:17, 9.66it/s] 176it [00:18, 9.72it/s] 178it [00:18, 9.85it/s] 180it [00:18, 9.92it/s] 182it [00:18, 9.96it/s] 184it [00:18, 9.99it/s] 186it [00:19, 9.65it/s] 188it [00:19, 9.75it/s] 190it [00:19, 9.85it/s] 192it [00:19, 9.91it/s] 194it [00:19, 9.62it/s] 195it [00:20, 9.40it/s] 196it [00:20, 9.23it/s] 196it [00:20, 9.70it/s] +2025-05-26 04:50:57,022 - INFO - Epoch: 22, Objective: tensor([8000.1289], device='cuda:0', grad_fn=), Loss: 0.06485095620155334, KL/n: 72.75353240966797 + 0it [00:00, ?it/s]2025-05-26 04:50:57,302 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 10706.0791 | mean log_px -0.1055 | KL -3565.08 + 1it [00:00, 5.15it/s] 2it [00:00, 6.54it/s] 4it [00:00, 8.35it/s] 5it [00:00, 8.31it/s] 6it [00:00, 8.72it/s] 7it [00:00, 8.99it/s] 8it [00:00, 8.65it/s] 9it [00:01, 9.00it/s] 10it [00:01, 9.27it/s] 12it [00:01, 9.60it/s] 14it [00:01, 9.35it/s] 16it [00:01, 9.59it/s] 18it [00:02, 9.39it/s] 20it [00:02, 9.58it/s] 22it [00:02, 9.71it/s] 23it [00:02, 9.70it/s] 24it [00:02, 9.76it/s] 26it [00:02, 9.86it/s] 27it [00:02, 9.89it/s] 28it [00:03, 9.51it/s] 30it [00:03, 9.71it/s] 31it [00:03, 9.77it/s] 32it [00:03, 9.82it/s] 33it [00:03, 9.34it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.46it/s] 36it [00:03, 9.55it/s] 38it [00:04, 9.76it/s] 40it [00:04, 9.89it/s] 42it [00:04, 9.95it/s] 44it [00:04, 9.95it/s] 45it [00:04, 9.93it/s] 46it [00:04, 9.93it/s] 47it [00:04, 9.84it/s] 48it [00:05, 9.68it/s] 49it [00:05, 9.62it/s] 50it [00:05, 9.69it/s]2025-05-26 04:51:02,498 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 6445.8760 | mean log_px -0.0427 | KL -3562.69 + 51it [00:05, 9.18it/s] 52it [00:05, 9.35it/s] 54it [00:05, 9.64it/s] 55it [00:05, 9.71it/s] 56it [00:05, 9.22it/s] 57it [00:06, 9.42it/s] 58it [00:06, 9.57it/s] 59it [00:06, 9.67it/s] 61it [00:06, 9.46it/s] 62it [00:06, 9.58it/s] 64it [00:06, 9.75it/s] 66it [00:06, 9.87it/s] 68it [00:07, 9.93it/s] 70it [00:07, 9.98it/s] 72it [00:07, 10.00it/s] 74it [00:07, 10.03it/s] 76it [00:07, 10.02it/s] 78it [00:08, 10.03it/s] 80it [00:08, 10.03it/s] 82it [00:08, 10.03it/s] 84it [00:08, 9.75it/s] 86it [00:08, 9.84it/s] 87it [00:09, 9.86it/s] 88it [00:09, 9.89it/s] 90it [00:09, 9.95it/s] 92it [00:09, 9.99it/s] 94it [00:09, 9.99it/s] 96it [00:09, 10.01it/s] 98it [00:10, 10.02it/s] 100it [00:10, 9.84it/s]2025-05-26 04:51:07,582 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 9278.5117 | mean log_px -0.0849 | KL -3567.39 + 101it [00:10, 9.53it/s] 103it [00:10, 9.71it/s] 105it [00:10, 9.82it/s] 107it [00:11, 9.89it/s] 109it [00:11, 9.95it/s] 111it [00:11, 9.98it/s] 113it [00:11, 10.02it/s] 114it [00:11, 10.01it/s] 116it [00:11, 10.02it/s] 118it [00:12, 10.03it/s] 120it [00:12, 10.04it/s] 122it [00:12, 10.04it/s] 124it [00:12, 10.04it/s] 126it [00:12, 10.05it/s] 128it [00:13, 9.78it/s] 130it [00:13, 9.86it/s] 132it [00:13, 9.91it/s] 134it [00:13, 9.95it/s] 136it [00:13, 9.99it/s] 138it [00:14, 10.01it/s] 140it [00:14, 10.02it/s] 142it [00:14, 10.02it/s] 144it [00:14, 9.62it/s] 146it [00:15, 9.72it/s] 147it [00:15, 9.70it/s] 148it [00:15, 9.38it/s] 150it [00:15, 9.62it/s]2025-05-26 04:51:12,649 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 9398.9590 | mean log_px -0.0833 | KL -3566.49 + 151it [00:15, 9.26it/s] 152it [00:15, 9.41it/s] 153it [00:15, 9.55it/s] 154it [00:15, 9.65it/s] 156it [00:16, 9.80it/s] 158it [00:16, 9.90it/s] 160it [00:16, 9.95it/s] 162it [00:16, 9.60it/s] 163it [00:16, 9.66it/s] 164it [00:16, 9.73it/s] 166it [00:17, 9.85it/s] 168it [00:17, 9.92it/s] 170it [00:17, 9.96it/s] 171it [00:17, 9.97it/s] 172it [00:17, 9.97it/s] 174it [00:17, 9.99it/s] 176it [00:18, 10.00it/s] 178it [00:18, 10.02it/s] 180it [00:18, 10.03it/s] 182it [00:18, 10.04it/s] 184it [00:18, 10.05it/s] 186it [00:19, 10.04it/s] 188it [00:19, 10.04it/s] 190it [00:19, 10.04it/s] 192it [00:19, 10.03it/s] 194it [00:19, 10.04it/s] 196it [00:20, 9.49it/s] 196it [00:20, 9.72it/s] +2025-05-26 04:51:17,316 - INFO - Epoch: 23, Objective: tensor([7036.1016], device='cuda:0', grad_fn=), Loss: 0.05605386570096016, KL/n: 72.70604705810547 + 0it [00:00, ?it/s]2025-05-26 04:51:17,771 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 10053.7881 | mean log_px -0.0965 | KL -3562.36 + 1it [00:00, 5.33it/s] 2it [00:00, 6.68it/s] 4it [00:00, 8.48it/s] 6it [00:00, 9.16it/s] 8it [00:00, 9.52it/s] 10it [00:01, 9.72it/s] 12it [00:01, 9.79it/s] 14it [00:01, 9.88it/s] 16it [00:01, 9.94it/s] 18it [00:01, 9.99it/s] 20it [00:02, 10.01it/s] 22it [00:02, 10.03it/s] 24it [00:02, 9.70it/s] 26it [00:02, 9.80it/s] 27it [00:02, 9.83it/s] 28it [00:02, 9.51it/s] 29it [00:03, 9.61it/s] 30it [00:03, 9.69it/s] 31it [00:03, 9.76it/s] 32it [00:03, 9.81it/s] 34it [00:03, 9.94it/s] 36it [00:03, 9.98it/s] 38it [00:03, 10.01it/s] 40it [00:04, 9.65it/s] 42it [00:04, 9.77it/s] 44it [00:04, 9.86it/s] 46it [00:04, 9.93it/s] 48it [00:04, 9.98it/s] 50it [00:05, 10.01it/s]2025-05-26 04:51:22,835 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 7944.3613 | mean log_px -0.0672 | KL -3565.10 + 52it [00:05, 9.68it/s] 54it [00:05, 9.79it/s] 56it [00:05, 9.88it/s] 58it [00:05, 9.92it/s] 59it [00:06, 9.56it/s] 60it [00:06, 9.65it/s] 62it [00:06, 9.78it/s] 64it [00:06, 9.85it/s] 65it [00:06, 9.88it/s] 66it [00:06, 9.90it/s] 68it [00:06, 9.93it/s] 69it [00:07, 9.89it/s] 70it [00:07, 9.40it/s] 71it [00:07, 9.55it/s] 72it [00:07, 9.66it/s] 74it [00:07, 9.83it/s] 76it [00:07, 9.91it/s] 78it [00:08, 9.97it/s] 80it [00:08, 10.01it/s] 81it [00:08, 10.01it/s] 83it [00:08, 10.04it/s] 85it [00:08, 10.05it/s] 87it [00:08, 10.05it/s] 89it [00:09, 10.01it/s] 91it [00:09, 9.53it/s] 92it [00:09, 9.60it/s] 94it [00:09, 9.75it/s] 95it [00:09, 9.47it/s] 96it [00:09, 9.58it/s] 98it [00:10, 9.75it/s] 99it [00:10, 9.80it/s]2025-05-26 04:51:27,943 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 6554.0537 | mean log_px -0.0452 | KL -3559.28 + 101it [00:10, 9.47it/s] 102it [00:10, 9.58it/s] 104it [00:10, 9.75it/s] 106it [00:10, 9.87it/s] 108it [00:11, 9.94it/s] 110it [00:11, 9.98it/s] 112it [00:11, 10.02it/s] 114it [00:11, 10.03it/s] 116it [00:11, 10.04it/s] 118it [00:12, 10.05it/s] 120it [00:12, 10.06it/s] 122it [00:12, 10.06it/s] 124it [00:12, 10.06it/s] 126it [00:12, 10.06it/s] 128it [00:13, 10.06it/s] 130it [00:13, 10.05it/s] 132it [00:13, 10.07it/s] 134it [00:13, 10.07it/s] 136it [00:13, 10.09it/s] 138it [00:14, 10.08it/s] 140it [00:14, 10.07it/s] 142it [00:14, 10.06it/s] 144it [00:14, 10.06it/s] 146it [00:14, 10.07it/s] 148it [00:15, 10.06it/s] 150it [00:15, 10.06it/s]2025-05-26 04:51:32,938 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 11166.3877 | mean log_px -0.1161 | KL -3563.05 + 152it [00:15, 9.63it/s] 154it [00:15, 9.75it/s] 156it [00:15, 9.84it/s] 157it [00:15, 9.74it/s] 158it [00:16, 9.62it/s] 159it [00:16, 9.56it/s] 160it [00:16, 9.62it/s] 161it [00:16, 9.69it/s] 162it [00:16, 9.76it/s] 163it [00:16, 9.80it/s] 164it [00:16, 9.79it/s] 165it [00:16, 9.84it/s] 166it [00:16, 9.86it/s] 167it [00:17, 9.88it/s] 168it [00:17, 9.86it/s] 169it [00:17, 9.83it/s] 170it [00:17, 9.83it/s] 171it [00:17, 9.87it/s] 172it [00:17, 9.89it/s] 173it [00:17, 9.20it/s] 174it [00:17, 9.40it/s] 176it [00:17, 9.69it/s] 177it [00:18, 9.26it/s] 178it [00:18, 9.44it/s] 180it [00:18, 9.70it/s] 182it [00:18, 9.83it/s] 184it [00:18, 9.91it/s] 186it [00:18, 9.95it/s] 187it [00:19, 9.62it/s] 188it [00:19, 9.69it/s] 189it [00:19, 9.75it/s] 190it [00:19, 9.80it/s] 192it [00:19, 9.89it/s] 194it [00:19, 9.94it/s] 195it [00:19, 9.62it/s] 196it [00:20, 9.38it/s] 196it [00:20, 9.76it/s] +2025-05-26 04:51:37,699 - INFO - Epoch: 24, Objective: tensor([7781.2070], device='cuda:0', grad_fn=), Loss: 0.06895510107278824, KL/n: 72.64373779296875 + 0it [00:00, ?it/s]2025-05-26 04:51:37,998 - INFO - [Epoch 025 | Batch 0000] IWAE-loss 5908.9863 | mean log_px -0.0345 | KL -3553.46 + 1it [00:00, 4.85it/s] 3it [00:00, 7.93it/s] 5it [00:00, 8.92it/s] 7it [00:00, 9.41it/s] 9it [00:00, 9.67it/s] 11it [00:01, 9.84it/s] 13it [00:01, 9.93it/s] 15it [00:01, 9.99it/s] 17it [00:01, 9.69it/s] 19it [00:02, 9.83it/s] 21it [00:02, 9.91it/s] 23it [00:02, 9.98it/s] 25it [00:02, 10.02it/s] 27it [00:02, 10.06it/s] 29it [00:02, 10.08it/s] 31it [00:03, 10.10it/s] 33it [00:03, 10.10it/s] 35it [00:03, 10.12it/s] 37it [00:03, 10.10it/s] 39it [00:03, 10.10it/s] 41it [00:04, 10.11it/s] 43it [00:04, 9.76it/s] 44it [00:04, 9.79it/s] 46it [00:04, 9.88it/s] 47it [00:04, 9.89it/s] 48it [00:04, 9.87it/s] 50it [00:05, 9.63it/s]2025-05-26 04:51:43,010 - INFO - [Epoch 025 | Batch 0050] IWAE-loss 5141.8364 | mean log_px -0.0226 | KL -3558.55 + 51it [00:05, 9.69it/s] 53it [00:05, 9.86it/s] 55it [00:05, 9.96it/s] 57it [00:05, 10.02it/s] 59it [00:06, 10.05it/s] 61it [00:06, 10.08it/s] 63it [00:06, 9.69it/s] 64it [00:06, 9.74it/s] 66it [00:06, 9.86it/s] 68it [00:06, 9.94it/s] 70it [00:07, 9.98it/s] 72it [00:07, 10.02it/s] 74it [00:07, 10.05it/s] 76it [00:07, 9.74it/s] 78it [00:07, 9.85it/s] 80it [00:08, 9.94it/s] 81it [00:08, 9.65it/s] 83it [00:08, 9.80it/s] 85it [00:08, 9.91it/s] 86it [00:08, 9.52it/s] 87it [00:08, 9.51it/s] 88it [00:08, 9.59it/s] 89it [00:09, 9.67it/s] 90it [00:09, 9.73it/s] 92it [00:09, 9.88it/s] 94it [00:09, 9.96it/s] 96it [00:09, 10.00it/s] 98it [00:09, 10.04it/s] 100it [00:10, 10.05it/s]2025-05-26 04:51:48,061 - INFO - [Epoch 025 | Batch 0100] IWAE-loss 6209.9375 | mean log_px -0.0399 | KL -3555.98 + 102it [00:10, 9.71it/s] 104it [00:10, 9.79it/s] 105it [00:10, 9.32it/s] 106it [00:10, 9.22it/s] 107it [00:10, 9.34it/s] 108it [00:11, 9.46it/s] 109it [00:11, 9.57it/s] 110it [00:11, 9.65it/s] 111it [00:11, 9.29it/s] 112it [00:11, 9.46it/s] 113it [00:11, 9.59it/s] 114it [00:11, 9.67it/s] 115it [00:11, 9.12it/s] 116it [00:11, 9.31it/s] 117it [00:11, 9.50it/s] 118it [00:12, 9.64it/s] 120it [00:12, 9.73it/s] 121it [00:12, 9.78it/s] 123it [00:12, 9.91it/s] 125it [00:12, 9.99it/s] 126it [00:12, 9.64it/s] 128it [00:13, 9.41it/s] 130it [00:13, 9.63it/s] 132it [00:13, 9.43it/s] 134it [00:13, 9.65it/s] 135it [00:13, 9.35it/s] 137it [00:14, 9.61it/s] 139it [00:14, 9.78it/s] 141it [00:14, 9.89it/s] 143it [00:14, 9.98it/s] 145it [00:14, 10.03it/s] 147it [00:15, 10.07it/s] 149it [00:15, 10.10it/s]2025-05-26 04:51:53,234 - INFO - [Epoch 025 | Batch 0150] IWAE-loss 8218.2256 | mean log_px -0.0712 | KL -3553.84 + 151it [00:15, 9.75it/s] 153it [00:15, 9.86it/s] 155it [00:15, 9.94it/s] 157it [00:16, 10.00it/s] 159it [00:16, 10.06it/s] 161it [00:16, 9.81it/s] 163it [00:16, 9.92it/s] 165it [00:16, 9.99it/s] 167it [00:17, 10.04it/s] 169it [00:17, 10.07it/s] 171it [00:17, 10.09it/s] 173it [00:17, 10.11it/s] 175it [00:17, 9.78it/s] 177it [00:18, 9.89it/s] 179it [00:18, 9.96it/s] 181it [00:18, 10.02it/s] 183it [00:18, 10.06it/s] 185it [00:18, 9.73it/s] 186it [00:18, 9.77it/s] 188it [00:19, 9.89it/s] 189it [00:19, 9.51it/s] 191it [00:19, 9.72it/s] 193it [00:19, 9.85it/s] 195it [00:19, 9.68it/s] 196it [00:20, 9.47it/s] 196it [00:20, 9.76it/s] +2025-05-26 04:51:57,912 - INFO - Epoch: 25, Objective: tensor([8688.2051], device='cuda:0', grad_fn=), Loss: 0.08251015841960907, KL/n: 72.58772277832031 + 0it [00:00, ?it/s]2025-05-26 04:51:58,345 - INFO - [Epoch 026 | Batch 0000] IWAE-loss 7151.1875 | mean log_px -0.0637 | KL -3554.05 + 1it [00:00, 5.49it/s] 3it [00:00, 8.25it/s] 4it [00:00, 8.78it/s] 6it [00:00, 9.37it/s] 8it [00:00, 9.62it/s] 10it [00:01, 9.76it/s] 12it [00:01, 9.86it/s] 14it [00:01, 9.92it/s] 15it [00:01, 9.93it/s] 16it [00:01, 9.94it/s] 17it [00:01, 9.95it/s] 18it [00:01, 9.95it/s] 20it [00:02, 9.98it/s] 21it [00:02, 9.58it/s] 23it [00:02, 9.76it/s] 24it [00:02, 9.81it/s] 26it [00:02, 9.89it/s] 28it [00:02, 9.93it/s] 30it [00:03, 9.95it/s] 31it [00:03, 9.54it/s] 32it [00:03, 9.63it/s] 34it [00:03, 9.80it/s] 35it [00:03, 9.82it/s] 36it [00:03, 9.85it/s] 38it [00:03, 9.93it/s] 39it [00:04, 9.94it/s] 40it [00:04, 9.94it/s] 42it [00:04, 9.98it/s] 44it [00:04, 10.00it/s] 46it [00:04, 10.02it/s] 48it [00:04, 10.02it/s] 50it [00:05, 10.03it/s]2025-05-26 04:52:03,405 - INFO - [Epoch 026 | Batch 0050] IWAE-loss 8084.2090 | mean log_px -0.0655 | KL -3553.26 + 52it [00:05, 9.66it/s] 53it [00:05, 9.72it/s] 54it [00:05, 9.76it/s] 55it [00:05, 9.81it/s] 56it [00:05, 9.85it/s] 58it [00:05, 9.92it/s] 60it [00:06, 9.96it/s] 62it [00:06, 9.98it/s] 64it [00:06, 10.00it/s] 66it [00:06, 10.00it/s] 68it [00:06, 9.44it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.61it/s] 72it [00:07, 9.77it/s] 74it [00:07, 9.86it/s] 75it [00:07, 9.89it/s] 76it [00:07, 9.91it/s] 78it [00:07, 9.97it/s] 79it [00:08, 9.57it/s] 80it [00:08, 9.59it/s] 81it [00:08, 9.54it/s] 82it [00:08, 9.12it/s] 83it [00:08, 8.72it/s] 84it [00:08, 8.98it/s] 86it [00:08, 9.42it/s] 87it [00:08, 9.55it/s] 88it [00:09, 9.64it/s] 90it [00:09, 9.36it/s] 92it [00:09, 9.61it/s] 94it [00:09, 9.76it/s] 96it [00:09, 9.86it/s] 98it [00:10, 9.92it/s] 100it [00:10, 9.96it/s]2025-05-26 04:52:08,564 - INFO - [Epoch 026 | Batch 0100] IWAE-loss 6382.7183 | mean log_px -0.0501 | KL -3556.70 + 101it [00:10, 9.54it/s] 102it [00:10, 9.56it/s] 104it [00:10, 9.74it/s] 106it [00:10, 9.85it/s] 108it [00:11, 9.91it/s] 110it [00:11, 9.95it/s] 111it [00:11, 9.86it/s] 112it [00:11, 9.51it/s] 114it [00:11, 9.70it/s] 116it [00:11, 9.82it/s] 118it [00:12, 9.90it/s] 120it [00:12, 9.78it/s] 121it [00:12, 9.42it/s] 122it [00:12, 9.49it/s] 123it [00:12, 9.54it/s] 124it [00:12, 9.65it/s] 126it [00:12, 9.78it/s] 127it [00:13, 9.83it/s] 129it [00:13, 9.91it/s] 130it [00:13, 9.93it/s] 131it [00:13, 9.28it/s] 132it [00:13, 9.44it/s] 133it [00:13, 9.58it/s] 134it [00:13, 9.67it/s] 136it [00:13, 9.84it/s] 137it [00:14, 9.46it/s] 138it [00:14, 9.59it/s] 140it [00:14, 9.76it/s] 142it [00:14, 9.83it/s] 144it [00:14, 9.90it/s] 146it [00:15, 9.95it/s] 148it [00:15, 9.99it/s] 150it [00:15, 10.02it/s]2025-05-26 04:52:13,694 - INFO - [Epoch 026 | Batch 0150] IWAE-loss 8474.0977 | mean log_px -0.0783 | KL -3551.70 + 151it [00:15, 9.59it/s] 153it [00:15, 9.74it/s] 155it [00:15, 9.85it/s] 157it [00:16, 9.91it/s] 158it [00:16, 9.60it/s] 160it [00:16, 9.68it/s] 161it [00:16, 9.71it/s] 162it [00:16, 9.74it/s] 163it [00:16, 9.75it/s] 164it [00:16, 9.80it/s] 166it [00:17, 9.90it/s] 168it [00:17, 9.94it/s] 169it [00:17, 9.94it/s] 170it [00:17, 9.95it/s] 172it [00:17, 9.99it/s] 173it [00:17, 9.78it/s] 174it [00:17, 9.43it/s] 175it [00:17, 9.57it/s] 176it [00:18, 9.65it/s] 177it [00:18, 9.74it/s] 178it [00:18, 9.80it/s] 179it [00:18, 9.86it/s] 180it [00:18, 9.85it/s] 181it [00:18, 9.79it/s] 182it [00:18, 9.33it/s] 184it [00:18, 9.65it/s] 186it [00:19, 9.80it/s] 188it [00:19, 9.89it/s] 190it [00:19, 9.57it/s] 192it [00:19, 9.72it/s] 194it [00:19, 9.83it/s] 195it [00:20, 9.57it/s] 196it [00:20, 9.35it/s] 196it [00:20, 9.69it/s] +2025-05-26 04:52:18,449 - INFO - Epoch: 26, Objective: tensor([10124.8457], device='cuda:0', grad_fn=), Loss: 0.10262526571750641, KL/n: 72.52192687988281 + 0it [00:00, ?it/s]2025-05-26 04:52:18,731 - INFO - [Epoch 027 | Batch 0000] IWAE-loss 5660.2915 | mean log_px -0.0403 | KL -3550.19 + 1it [00:00, 5.12it/s] 2it [00:00, 6.67it/s] 4it [00:00, 8.53it/s] 6it [00:00, 9.23it/s] 7it [00:00, 9.06it/s] 9it [00:01, 9.49it/s] 11it [00:01, 9.73it/s] 13it [00:01, 9.88it/s] 15it [00:01, 9.98it/s] 17it [00:01, 10.03it/s] 19it [00:02, 10.06it/s] 21it [00:02, 10.09it/s] 23it [00:02, 10.05it/s] 25it [00:02, 9.97it/s] 27it [00:02, 10.03it/s] 29it [00:03, 10.06it/s] 31it [00:03, 10.07it/s] 33it [00:03, 10.09it/s] 35it [00:03, 9.83it/s] 37it [00:03, 9.59it/s] 39it [00:04, 9.73it/s] 41it [00:04, 9.86it/s] 43it [00:04, 9.95it/s] 45it [00:04, 10.01it/s] 47it [00:04, 10.05it/s] 49it [00:05, 10.09it/s]2025-05-26 04:52:23,751 - INFO - [Epoch 027 | Batch 0050] IWAE-loss 7041.8789 | mean log_px -0.0514 | KL -3547.65 + 51it [00:05, 9.74it/s] 53it [00:05, 9.86it/s] 55it [00:05, 9.95it/s] 56it [00:05, 9.66it/s] 58it [00:05, 9.82it/s] 60it [00:06, 9.57it/s] 62it [00:06, 9.74it/s] 64it [00:06, 9.87it/s] 66it [00:06, 9.95it/s] 68it [00:06, 10.02it/s] 70it [00:07, 10.06it/s] 72it [00:07, 9.74it/s] 74it [00:07, 9.84it/s] 76it [00:07, 9.94it/s] 78it [00:07, 10.00it/s] 80it [00:08, 9.66it/s] 82it [00:08, 9.79it/s] 83it [00:08, 9.81it/s] 85it [00:08, 9.90it/s] 86it [00:08, 9.90it/s] 88it [00:09, 9.65it/s] 90it [00:09, 9.80it/s] 92it [00:09, 9.92it/s] 94it [00:09, 9.99it/s] 96it [00:09, 10.04it/s] 98it [00:09, 10.06it/s] 100it [00:10, 9.74it/s]2025-05-26 04:52:28,845 - INFO - [Epoch 027 | Batch 0100] IWAE-loss 7957.1924 | mean log_px -0.0696 | KL -3551.78 + 102it [00:10, 9.84it/s] 104it [00:10, 9.93it/s] 106it [00:10, 9.99it/s] 108it [00:10, 10.04it/s] 110it [00:11, 10.09it/s] 112it [00:11, 10.10it/s] 114it [00:11, 10.12it/s] 116it [00:11, 10.13it/s] 118it [00:11, 10.12it/s] 120it [00:12, 9.79it/s] 121it [00:12, 9.82it/s] 123it [00:12, 9.93it/s] 125it [00:12, 9.99it/s] 127it [00:12, 10.04it/s] 129it [00:13, 10.05it/s] 131it [00:13, 10.09it/s] 133it [00:13, 10.12it/s] 135it [00:13, 10.14it/s] 137it [00:13, 10.10it/s] 139it [00:14, 10.05it/s] 141it [00:14, 10.09it/s] 143it [00:14, 9.98it/s] 144it [00:14, 9.69it/s] 146it [00:14, 9.84it/s] 148it [00:14, 9.94it/s] 150it [00:15, 9.72it/s]2025-05-26 04:52:33,850 - INFO - [Epoch 027 | Batch 0150] IWAE-loss 7002.5981 | mean log_px -0.0568 | KL -3547.20 + 151it [00:15, 9.75it/s] 153it [00:15, 9.86it/s] 155it [00:15, 9.95it/s] 157it [00:15, 10.03it/s] 159it [00:16, 9.71it/s] 161it [00:16, 9.83it/s] 163it [00:16, 9.92it/s] 164it [00:16, 9.86it/s] 165it [00:16, 9.57it/s] 167it [00:16, 9.78it/s] 169it [00:17, 9.54it/s] 171it [00:17, 9.72it/s] 173it [00:17, 9.86it/s] 175it [00:17, 9.96it/s] 177it [00:17, 9.90it/s] 178it [00:18, 9.77it/s] 179it [00:18, 9.16it/s] 180it [00:18, 9.31it/s] 181it [00:18, 9.45it/s] 182it [00:18, 9.58it/s] 183it [00:18, 9.67it/s] 184it [00:18, 9.73it/s] 185it [00:18, 9.80it/s] 186it [00:18, 9.83it/s] 187it [00:19, 9.88it/s] 188it [00:19, 9.90it/s] 189it [00:19, 9.87it/s] 191it [00:19, 9.98it/s] 193it [00:19, 10.06it/s] 195it [00:19, 9.78it/s] 196it [00:19, 9.53it/s] 196it [00:19, 9.81it/s] +2025-05-26 04:52:38,564 - INFO - Epoch: 27, Objective: tensor([5026.2368], device='cuda:0', grad_fn=), Loss: 0.021482713520526886, KL/n: 72.46076965332031 + 0it [00:00, ?it/s]2025-05-26 04:52:39,019 - INFO - [Epoch 028 | Batch 0000] IWAE-loss 6144.6147 | mean log_px -0.0405 | KL -3548.91 + 1it [00:00, 5.40it/s] 2it [00:00, 6.83it/s] 4it [00:00, 8.54it/s] 5it [00:00, 8.95it/s] 6it [00:00, 8.56it/s] 8it [00:00, 9.17it/s] 9it [00:01, 9.34it/s] 10it [00:01, 9.48it/s] 12it [00:01, 9.71it/s] 13it [00:01, 9.78it/s] 14it [00:01, 9.82it/s] 15it [00:01, 9.84it/s] 16it [00:01, 9.86it/s] 17it [00:01, 9.32it/s] 18it [00:01, 9.44it/s] 20it [00:02, 9.72it/s] 21it [00:02, 9.78it/s] 22it [00:02, 9.79it/s] 23it [00:02, 9.84it/s] 24it [00:02, 9.87it/s] 26it [00:02, 9.95it/s] 27it [00:02, 9.93it/s] 28it [00:02, 9.90it/s] 29it [00:03, 9.86it/s] 30it [00:03, 9.88it/s] 32it [00:03, 9.89it/s] 33it [00:03, 9.91it/s] 35it [00:03, 9.96it/s] 36it [00:03, 9.95it/s] 37it [00:03, 9.48it/s] 38it [00:03, 9.56it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.70it/s] 41it [00:04, 9.22it/s] 42it [00:04, 9.41it/s] 43it [00:04, 9.56it/s] 44it [00:04, 9.65it/s] 45it [00:04, 9.15it/s] 46it [00:04, 9.37it/s] 47it [00:04, 9.41it/s] 48it [00:05, 9.51it/s] 49it [00:05, 9.05it/s] 50it [00:05, 9.28it/s]2025-05-26 04:52:44,213 - INFO - [Epoch 028 | Batch 0050] IWAE-loss 7022.5996 | mean log_px -0.0538 | KL -3548.01 + 51it [00:05, 9.46it/s] 52it [00:05, 9.60it/s] 53it [00:05, 9.14it/s] 54it [00:05, 9.34it/s] 55it [00:05, 9.51it/s] 56it [00:05, 9.62it/s] 57it [00:06, 9.13it/s] 58it [00:06, 9.33it/s] 60it [00:06, 9.65it/s] 61it [00:06, 9.24it/s] 62it [00:06, 9.41it/s] 63it [00:06, 9.55it/s] 64it [00:06, 9.63it/s] 65it [00:06, 9.15it/s] 66it [00:06, 9.34it/s] 67it [00:07, 9.48it/s] 68it [00:07, 9.60it/s] 69it [00:07, 9.12it/s] 70it [00:07, 9.32it/s] 71it [00:07, 9.49it/s] 72it [00:07, 9.05it/s] 73it [00:07, 9.27it/s] 74it [00:07, 9.47it/s] 75it [00:07, 9.55it/s] 76it [00:08, 9.04it/s] 77it [00:08, 9.30it/s] 78it [00:08, 9.48it/s] 80it [00:08, 9.34it/s] 81it [00:08, 9.49it/s] 82it [00:08, 9.58it/s] 83it [00:08, 9.24it/s] 84it [00:08, 9.42it/s] 85it [00:08, 9.54it/s] 86it [00:09, 9.04it/s] 87it [00:09, 9.30it/s] 88it [00:09, 9.48it/s] 89it [00:09, 9.61it/s] 90it [00:09, 9.58it/s] 91it [00:09, 9.09it/s] 92it [00:09, 9.30it/s] 93it [00:09, 9.43it/s] 94it [00:09, 9.53it/s] 95it [00:10, 9.05it/s] 96it [00:10, 9.28it/s] 97it [00:10, 9.44it/s] 98it [00:10, 9.56it/s] 99it [00:10, 9.07it/s] 100it [00:10, 9.29it/s]2025-05-26 04:52:49,548 - INFO - [Epoch 028 | Batch 0100] IWAE-loss 7795.5220 | mean log_px -0.0668 | KL -3546.89 + 101it [00:10, 9.45it/s] 102it [00:10, 9.58it/s] 103it [00:10, 9.06it/s] 104it [00:11, 9.29it/s] 106it [00:11, 9.62it/s] 107it [00:11, 9.20it/s] 108it [00:11, 9.37it/s] 109it [00:11, 9.51it/s] 110it [00:11, 9.62it/s] 112it [00:11, 9.42it/s] 114it [00:12, 9.67it/s] 115it [00:12, 9.36it/s] 116it [00:12, 9.50it/s] 118it [00:12, 9.71it/s] 120it [00:12, 9.83it/s] 121it [00:12, 9.42it/s] 122it [00:12, 9.54it/s] 123it [00:13, 9.64it/s] 124it [00:13, 9.16it/s] 125it [00:13, 9.36it/s] 127it [00:13, 9.67it/s] 129it [00:13, 9.82it/s] 130it [00:13, 9.85it/s] 131it [00:13, 9.46it/s] 132it [00:13, 9.54it/s] 134it [00:14, 9.75it/s] 135it [00:14, 9.33it/s] 136it [00:14, 9.48it/s] 138it [00:14, 9.69it/s] 139it [00:14, 9.75it/s] 140it [00:14, 9.80it/s] 142it [00:14, 9.90it/s] 143it [00:15, 9.90it/s] 144it [00:15, 9.92it/s] 145it [00:15, 9.39it/s] 146it [00:15, 9.52it/s] 147it [00:15, 9.60it/s] 148it [00:15, 9.68it/s] 149it [00:15, 9.77it/s] 150it [00:15, 9.78it/s]2025-05-26 04:52:54,754 - INFO - [Epoch 028 | Batch 0150] IWAE-loss 6129.2549 | mean log_px -0.0445 | KL -3552.00 + 151it [00:15, 9.21it/s] 152it [00:16, 9.43it/s] 153it [00:16, 9.59it/s] 154it [00:16, 9.70it/s] 155it [00:16, 9.77it/s] 156it [00:16, 9.69it/s] 157it [00:16, 9.74it/s] 158it [00:16, 9.81it/s] 159it [00:16, 9.86it/s] 160it [00:16, 9.87it/s] 161it [00:16, 9.90it/s] 162it [00:17, 9.90it/s] 163it [00:17, 9.91it/s] 164it [00:17, 9.91it/s] 166it [00:17, 9.97it/s] 168it [00:17, 9.98it/s] 169it [00:17, 9.95it/s] 170it [00:17, 9.90it/s] 171it [00:17, 9.68it/s] 172it [00:18, 9.19it/s] 174it [00:18, 9.52it/s] 175it [00:18, 9.60it/s] 176it [00:18, 9.65it/s] 177it [00:18, 9.73it/s] 178it [00:18, 9.78it/s] 180it [00:18, 9.87it/s] 181it [00:18, 9.89it/s] 182it [00:19, 9.71it/s] 183it [00:19, 9.33it/s] 184it [00:19, 9.50it/s] 185it [00:19, 9.58it/s] 186it [00:19, 9.10it/s] 187it [00:19, 9.34it/s] 188it [00:19, 9.46it/s] 190it [00:19, 9.73it/s] 192it [00:20, 9.85it/s] 193it [00:20, 9.87it/s] 194it [00:20, 9.89it/s] 195it [00:20, 9.52it/s] 196it [00:20, 9.50it/s] +2025-05-26 04:52:59,504 - INFO - Epoch: 28, Objective: tensor([7316.0479], device='cuda:0', grad_fn=), Loss: 0.06041298806667328, KL/n: 72.37413787841797 + 0it [00:00, ?it/s]2025-05-26 04:52:59,780 - INFO - [Epoch 029 | Batch 0000] IWAE-loss 5790.9482 | mean log_px -0.0366 | KL -3544.11 + 1it [00:00, 4.70it/s] 3it [00:00, 7.79it/s] 5it [00:00, 8.83it/s] 7it [00:00, 9.34it/s] 8it [00:00, 9.45it/s] 9it [00:01, 9.05it/s] 11it [00:01, 9.46it/s] 13it [00:01, 9.70it/s] 15it [00:01, 9.83it/s] 17it [00:01, 9.92it/s] 19it [00:02, 9.98it/s] 21it [00:02, 9.76it/s] 22it [00:02, 9.73it/s] 24it [00:02, 9.84it/s] 26it [00:02, 9.91it/s] 28it [00:02, 9.96it/s] 30it [00:03, 9.98it/s] 32it [00:03, 10.01it/s] 34it [00:03, 10.04it/s] 36it [00:03, 9.70it/s] 38it [00:03, 9.82it/s] 40it [00:04, 9.91it/s] 42it [00:04, 9.69it/s] 44it [00:04, 9.81it/s] 46it [00:04, 9.89it/s] 48it [00:04, 9.90it/s] 49it [00:05, 9.79it/s] 50it [00:05, 9.45it/s]2025-05-26 04:53:04,887 - INFO - [Epoch 029 | Batch 0050] IWAE-loss 8045.6401 | mean log_px -0.0730 | KL -3546.79 + 51it [00:05, 9.54it/s] 53it [00:05, 9.75it/s] 55it [00:05, 9.87it/s] 57it [00:05, 9.95it/s] 59it [00:06, 10.00it/s] 61it [00:06, 9.67it/s] 62it [00:06, 9.72it/s] 64it [00:06, 9.84it/s] 66it [00:06, 9.93it/s] 68it [00:07, 9.94it/s] 69it [00:07, 9.86it/s] 70it [00:07, 9.53it/s] 72it [00:07, 9.74it/s] 74it [00:07, 9.86it/s] 75it [00:07, 9.47it/s] 77it [00:07, 9.68it/s] 78it [00:08, 9.74it/s] 79it [00:08, 9.33it/s] 80it [00:08, 9.18it/s] 81it [00:08, 9.21it/s] 82it [00:08, 9.15it/s] 83it [00:08, 9.35it/s] 84it [00:08, 9.49it/s] 85it [00:08, 9.61it/s] 86it [00:08, 9.25it/s] 87it [00:09, 9.44it/s] 88it [00:09, 9.58it/s] 89it [00:09, 9.66it/s] 90it [00:09, 9.72it/s] 91it [00:09, 9.76it/s] 92it [00:09, 9.18it/s] 94it [00:09, 9.57it/s] 96it [00:09, 9.76it/s] 98it [00:10, 9.87it/s] 100it [00:10, 9.94it/s]2025-05-26 04:53:10,040 - INFO - [Epoch 029 | Batch 0100] IWAE-loss 7717.3555 | mean log_px -0.0658 | KL -3546.15 + 101it [00:10, 9.53it/s] 102it [00:10, 9.62it/s] 104it [00:10, 9.80it/s] 106it [00:10, 9.90it/s] 108it [00:11, 9.97it/s] 110it [00:11, 10.01it/s] 112it [00:11, 10.04it/s] 114it [00:11, 10.06it/s] 116it [00:11, 10.07it/s] 118it [00:12, 9.99it/s] 119it [00:12, 9.61it/s] 121it [00:12, 9.76it/s] 122it [00:12, 9.80it/s] 123it [00:12, 9.83it/s] 124it [00:12, 9.34it/s] 125it [00:12, 9.48it/s] 126it [00:13, 9.42it/s] 127it [00:13, 9.32it/s] 128it [00:13, 9.00it/s] 130it [00:13, 9.45it/s] 132it [00:13, 9.68it/s] 134it [00:13, 9.84it/s] 136it [00:14, 9.93it/s] 138it [00:14, 9.58it/s] 140it [00:14, 9.73it/s] 142it [00:14, 9.84it/s] 144it [00:14, 9.59it/s] 146it [00:15, 9.74it/s] 148it [00:15, 9.86it/s] 150it [00:15, 9.93it/s]2025-05-26 04:53:15,166 - INFO - [Epoch 029 | Batch 0150] IWAE-loss 9115.5293 | mean log_px -0.0874 | KL -3541.34 + 151it [00:15, 9.55it/s] 153it [00:15, 9.74it/s] 155it [00:15, 9.86it/s] 157it [00:16, 9.95it/s] 159it [00:16, 9.99it/s] 161it [00:16, 10.02it/s] 163it [00:16, 10.05it/s] 165it [00:16, 10.06it/s] 167it [00:17, 10.07it/s] 169it [00:17, 10.06it/s] 171it [00:17, 10.08it/s] 173it [00:17, 9.96it/s] 174it [00:17, 9.67it/s] 176it [00:18, 9.80it/s] 178it [00:18, 9.89it/s] 179it [00:18, 9.85it/s] 180it [00:18, 9.84it/s] 182it [00:18, 9.87it/s] 183it [00:18, 9.86it/s] 184it [00:18, 9.87it/s] 185it [00:19, 9.85it/s] 186it [00:19, 9.77it/s] 187it [00:19, 9.80it/s] 188it [00:19, 9.79it/s] 189it [00:19, 9.78it/s] 190it [00:19, 9.77it/s] 191it [00:19, 9.80it/s] 192it [00:19, 9.82it/s] 193it [00:19, 9.84it/s] 194it [00:19, 9.84it/s] 195it [00:20, 9.42it/s] 196it [00:20, 9.17it/s] 196it [00:20, 9.69it/s] +2025-05-26 04:53:19,851 - INFO - Epoch: 29, Objective: tensor([7595.7744], device='cuda:0', grad_fn=), Loss: 0.06281988322734833, KL/n: 72.2783432006836 + 0it [00:00, ?it/s]2025-05-26 04:53:20,301 - INFO - [Epoch 030 | Batch 0000] IWAE-loss 7184.0381 | mean log_px -0.0520 | KL -3540.00 + 1it [00:00, 5.57it/s] 2it [00:00, 6.98it/s] 4it [00:00, 8.70it/s] 5it [00:00, 8.54it/s] 7it [00:00, 9.20it/s] 9it [00:01, 9.54it/s] 11it [00:01, 9.75it/s] 13it [00:01, 9.89it/s] 15it [00:01, 9.97it/s] 17it [00:01, 10.01it/s] 19it [00:01, 10.03it/s] 21it [00:02, 10.06it/s] 23it [00:02, 10.08it/s] 25it [00:02, 10.09it/s] 27it [00:02, 9.88it/s] 29it [00:03, 9.96it/s] 31it [00:03, 10.00it/s] 33it [00:03, 10.04it/s] 35it [00:03, 10.08it/s] 37it [00:03, 9.87it/s] 39it [00:04, 9.95it/s] 41it [00:04, 10.00it/s] 43it [00:04, 10.04it/s] 45it [00:04, 10.06it/s] 47it [00:04, 10.07it/s] 49it [00:04, 10.07it/s]2025-05-26 04:53:25,314 - INFO - [Epoch 030 | Batch 0050] IWAE-loss 5986.0142 | mean log_px -0.0354 | KL -3537.95 + 51it [00:05, 9.73it/s] 53it [00:05, 9.86it/s] 55it [00:05, 9.61it/s] 57it [00:05, 9.76it/s] 59it [00:06, 9.87it/s] 61it [00:06, 9.95it/s] 63it [00:06, 10.01it/s] 65it [00:06, 9.73it/s] 66it [00:06, 9.77it/s] 68it [00:06, 9.51it/s] 70it [00:07, 9.68it/s] 72it [00:07, 9.81it/s] 73it [00:07, 9.83it/s] 74it [00:07, 9.86it/s] 76it [00:07, 9.97it/s] 78it [00:07, 10.04it/s] 80it [00:08, 10.06it/s] 82it [00:08, 10.08it/s] 84it [00:08, 10.08it/s] 86it [00:08, 10.10it/s] 88it [00:08, 10.11it/s] 90it [00:09, 10.09it/s] 92it [00:09, 10.03it/s] 94it [00:09, 10.05it/s] 96it [00:09, 10.04it/s] 98it [00:09, 9.98it/s] 100it [00:10, 10.04it/s]2025-05-26 04:53:30,362 - INFO - [Epoch 030 | Batch 0100] IWAE-loss 5398.5059 | mean log_px -0.0280 | KL -3539.20 + 102it [00:10, 9.72it/s] 104it [00:10, 9.84it/s] 106it [00:10, 9.92it/s] 107it [00:10, 9.56it/s] 109it [00:11, 9.75it/s] 110it [00:11, 9.79it/s] 112it [00:11, 9.52it/s] 114it [00:11, 9.70it/s] 116it [00:11, 9.84it/s] 118it [00:11, 9.93it/s] 120it [00:12, 9.97it/s] 121it [00:12, 9.96it/s] 122it [00:12, 9.48it/s] 123it [00:12, 9.54it/s] 124it [00:12, 9.56it/s] 125it [00:12, 9.63it/s] 126it [00:12, 9.71it/s] 128it [00:13, 9.86it/s] 130it [00:13, 9.97it/s] 132it [00:13, 10.03it/s] 134it [00:13, 10.07it/s] 136it [00:13, 10.09it/s] 138it [00:14, 10.12it/s] 140it [00:14, 10.13it/s] 142it [00:14, 10.14it/s] 144it [00:14, 10.11it/s] 146it [00:14, 10.12it/s] 148it [00:15, 9.84it/s] 150it [00:15, 9.93it/s]2025-05-26 04:53:35,433 - INFO - [Epoch 030 | Batch 0150] IWAE-loss 8095.3145 | mean log_px -0.0698 | KL -3535.73 + 151it [00:15, 9.57it/s] 153it [00:15, 9.76it/s] 155it [00:15, 9.88it/s] 156it [00:15, 9.51it/s] 158it [00:16, 9.73it/s] 160it [00:16, 9.87it/s] 162it [00:16, 9.96it/s] 164it [00:16, 9.66it/s] 166it [00:16, 9.79it/s] 168it [00:17, 9.89it/s] 170it [00:17, 9.76it/s] 172it [00:17, 9.88it/s] 174it [00:17, 9.95it/s] 176it [00:17, 10.00it/s] 178it [00:18, 10.04it/s] 180it [00:18, 10.07it/s] 182it [00:18, 10.09it/s] 184it [00:18, 10.11it/s] 186it [00:18, 9.78it/s] 188it [00:19, 9.81it/s] 189it [00:19, 9.42it/s] 190it [00:19, 9.43it/s] 191it [00:19, 9.54it/s] 192it [00:19, 9.63it/s] 193it [00:19, 9.71it/s] 194it [00:19, 9.20it/s] 195it [00:19, 8.98it/s] 196it [00:20, 9.80it/s] +2025-05-26 04:53:40,170 - INFO - Epoch: 30, Objective: tensor([8346.3223], device='cuda:0', grad_fn=), Loss: 0.08652433753013611, KL/n: 72.18109130859375 + 0it [00:00, ?it/s]2025-05-26 04:53:40,444 - INFO - [Epoch 031 | Batch 0000] IWAE-loss 7981.7705 | mean log_px -0.0697 | KL -3537.61 + 1it [00:00, 4.83it/s] 2it [00:00, 6.88it/s] 4it [00:00, 8.00it/s] 5it [00:00, 8.51it/s] 6it [00:00, 8.89it/s] 8it [00:00, 8.96it/s] 10it [00:01, 9.35it/s] 12it [00:01, 9.22it/s] 13it [00:01, 9.36it/s] 15it [00:01, 9.61it/s] 16it [00:01, 9.24it/s] 17it [00:01, 9.39it/s] 18it [00:02, 9.49it/s] 20it [00:02, 9.72it/s] 22it [00:02, 9.84it/s] 23it [00:02, 9.87it/s] 24it [00:02, 9.89it/s] 25it [00:02, 9.91it/s] 27it [00:02, 9.51it/s] 28it [00:03, 9.61it/s] 30it [00:03, 9.78it/s] 31it [00:03, 9.82it/s] 33it [00:03, 9.91it/s] 34it [00:03, 9.93it/s] 35it [00:03, 9.44it/s] 36it [00:03, 9.57it/s] 37it [00:03, 9.63it/s] 38it [00:04, 9.67it/s] 40it [00:04, 9.82it/s] 41it [00:04, 9.84it/s] 42it [00:04, 9.85it/s] 43it [00:04, 9.28it/s] 44it [00:04, 9.44it/s] 46it [00:04, 9.68it/s] 47it [00:04, 9.71it/s] 48it [00:05, 9.78it/s] 50it [00:05, 9.89it/s]2025-05-26 04:53:45,642 - INFO - [Epoch 031 | Batch 0050] IWAE-loss 7131.4248 | mean log_px -0.0549 | KL -3539.47 + 51it [00:05, 9.43it/s] 53it [00:05, 9.66it/s] 55it [00:05, 9.80it/s] 57it [00:06, 9.89it/s] 58it [00:06, 9.91it/s] 60it [00:06, 9.94it/s] 62it [00:06, 9.67it/s] 63it [00:06, 9.72it/s] 65it [00:06, 9.85it/s] 66it [00:06, 9.87it/s] 67it [00:07, 9.88it/s] 68it [00:07, 9.56it/s] 70it [00:07, 9.74it/s] 72it [00:07, 9.85it/s] 74it [00:07, 9.54it/s] 75it [00:07, 9.62it/s] 77it [00:08, 9.77it/s] 78it [00:08, 9.81it/s] 80it [00:08, 9.49it/s] 81it [00:08, 9.58it/s] 83it [00:08, 9.75it/s] 84it [00:08, 9.80it/s] 85it [00:08, 9.85it/s] 86it [00:09, 9.35it/s] 88it [00:09, 9.63it/s] 90it [00:09, 9.79it/s] 91it [00:09, 9.38it/s] 92it [00:09, 9.51it/s] 93it [00:09, 9.62it/s] 94it [00:09, 9.72it/s] 96it [00:10, 9.87it/s] 98it [00:10, 9.94it/s] 100it [00:10, 9.88it/s]2025-05-26 04:53:50,784 - INFO - [Epoch 031 | Batch 0100] IWAE-loss 6414.5449 | mean log_px -0.0424 | KL -3538.34 + 101it [00:10, 9.46it/s] 102it [00:10, 9.57it/s] 104it [00:10, 9.74it/s] 106it [00:11, 9.83it/s] 107it [00:11, 9.81it/s] 108it [00:11, 9.84it/s] 109it [00:11, 9.88it/s] 110it [00:11, 9.89it/s] 111it [00:11, 9.56it/s] 112it [00:11, 9.68it/s] 113it [00:11, 9.19it/s] 114it [00:11, 9.39it/s] 115it [00:11, 9.32it/s] 116it [00:12, 9.35it/s] 117it [00:12, 9.36it/s] 118it [00:12, 8.84it/s] 119it [00:12, 9.10it/s] 120it [00:12, 9.31it/s] 121it [00:12, 9.02it/s] 123it [00:12, 9.47it/s] 124it [00:12, 9.18it/s] 126it [00:13, 9.52it/s] 128it [00:13, 9.71it/s] 130it [00:13, 9.82it/s] 132it [00:13, 9.54it/s] 134it [00:13, 9.69it/s] 136it [00:14, 9.81it/s] 137it [00:14, 9.39it/s] 138it [00:14, 9.48it/s] 139it [00:14, 9.57it/s] 140it [00:14, 9.58it/s] 141it [00:14, 9.21it/s] 142it [00:14, 9.39it/s] 143it [00:14, 9.54it/s] 144it [00:15, 9.66it/s] 145it [00:15, 9.75it/s] 146it [00:15, 9.82it/s] 147it [00:15, 9.85it/s] 148it [00:15, 9.89it/s] 149it [00:15, 9.60it/s] 150it [00:15, 9.11it/s]2025-05-26 04:53:56,048 - INFO - [Epoch 031 | Batch 0150] IWAE-loss 7563.3599 | mean log_px -0.0640 | KL -3531.75 + 151it [00:15, 9.32it/s] 152it [00:15, 9.51it/s] 154it [00:16, 9.75it/s] 155it [00:16, 9.79it/s] 156it [00:16, 9.72it/s] 157it [00:16, 9.74it/s] 158it [00:16, 9.23it/s] 159it [00:16, 9.43it/s] 160it [00:16, 9.57it/s] 162it [00:16, 9.76it/s] 163it [00:17, 9.79it/s] 164it [00:17, 9.43it/s] 165it [00:17, 9.57it/s] 167it [00:17, 9.77it/s] 168it [00:17, 9.82it/s] 170it [00:17, 9.47it/s] 171it [00:17, 9.57it/s] 172it [00:17, 9.67it/s] 174it [00:18, 9.80it/s] 176it [00:18, 9.89it/s] 177it [00:18, 9.46it/s] 178it [00:18, 9.52it/s] 180it [00:18, 9.71it/s] 182it [00:18, 9.84it/s] 183it [00:19, 9.82it/s] 184it [00:19, 9.45it/s] 186it [00:19, 9.68it/s] 188it [00:19, 9.79it/s] 190it [00:19, 9.57it/s] 191it [00:19, 9.64it/s] 192it [00:20, 9.67it/s] 193it [00:20, 9.69it/s] 194it [00:20, 9.76it/s] 195it [00:20, 9.42it/s] 196it [00:20, 9.06it/s] 196it [00:20, 9.55it/s] +2025-05-26 04:54:00,825 - INFO - Epoch: 31, Objective: tensor([6049.7988], device='cuda:0', grad_fn=), Loss: 0.03925026208162308, KL/n: 72.08685302734375 + 0it [00:00, ?it/s]2025-05-26 04:54:01,275 - INFO - [Epoch 032 | Batch 0000] IWAE-loss 5750.3301 | mean log_px -0.0349 | KL -3535.57 + 1it [00:00, 5.40it/s] 2it [00:00, 6.77it/s] 3it [00:00, 7.93it/s] 4it [00:00, 8.37it/s] 5it [00:00, 8.26it/s] 6it [00:00, 8.76it/s] 7it [00:00, 9.08it/s] 8it [00:00, 9.33it/s] 10it [00:01, 9.66it/s] 12it [00:01, 9.82it/s] 13it [00:01, 9.85it/s] 14it [00:01, 9.87it/s] 15it [00:01, 9.38it/s] 16it [00:01, 9.54it/s] 18it [00:01, 9.77it/s] 20it [00:02, 9.86it/s] 22it [00:02, 9.94it/s] 24it [00:02, 9.60it/s] 25it [00:02, 9.58it/s] 26it [00:02, 9.63it/s] 27it [00:02, 9.67it/s] 28it [00:02, 9.75it/s] 29it [00:03, 9.76it/s] 30it [00:03, 9.21it/s] 31it [00:03, 9.41it/s] 33it [00:03, 9.68it/s] 35it [00:03, 9.82it/s] 37it [00:03, 9.91it/s] 39it [00:04, 9.96it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.61it/s] 42it [00:04, 9.67it/s] 44it [00:04, 9.79it/s] 45it [00:04, 9.83it/s] 46it [00:04, 9.86it/s] 48it [00:05, 9.88it/s] 49it [00:05, 9.90it/s] 50it [00:05, 9.93it/s]2025-05-26 04:54:06,438 - INFO - [Epoch 032 | Batch 0050] IWAE-loss 5072.8218 | mean log_px -0.0260 | KL -3529.07 + 51it [00:05, 9.36it/s] 52it [00:05, 9.50it/s] 53it [00:05, 9.62it/s] 54it [00:05, 9.72it/s] 55it [00:05, 9.27it/s] 56it [00:05, 9.46it/s] 58it [00:06, 9.70it/s] 60it [00:06, 9.51it/s] 62it [00:06, 9.68it/s] 63it [00:06, 9.73it/s] 64it [00:06, 9.78it/s] 66it [00:06, 9.87it/s] 67it [00:07, 9.89it/s] 68it [00:07, 9.90it/s] 70it [00:07, 9.96it/s] 71it [00:07, 9.96it/s] 72it [00:07, 9.96it/s] 73it [00:07, 9.95it/s] 74it [00:07, 9.67it/s] 75it [00:07, 9.33it/s] 77it [00:08, 9.64it/s] 78it [00:08, 9.72it/s] 80it [00:08, 9.85it/s] 82it [00:08, 9.92it/s] 84it [00:08, 9.96it/s] 85it [00:08, 9.97it/s] 86it [00:08, 9.50it/s] 88it [00:09, 9.68it/s] 90it [00:09, 9.80it/s] 91it [00:09, 9.83it/s] 92it [00:09, 9.38it/s] 93it [00:09, 9.33it/s] 94it [00:09, 9.38it/s] 95it [00:09, 9.52it/s] 96it [00:09, 9.62it/s] 97it [00:10, 9.73it/s] 98it [00:10, 9.80it/s] 99it [00:10, 9.84it/s] 100it [00:10, 9.88it/s]2025-05-26 04:54:11,591 - INFO - [Epoch 032 | Batch 0100] IWAE-loss 6324.5918 | mean log_px -0.0521 | KL -3526.06 + 101it [00:10, 9.29it/s] 102it [00:10, 9.48it/s] 103it [00:10, 9.62it/s] 104it [00:10, 9.08it/s] 105it [00:10, 9.32it/s] 106it [00:11, 9.49it/s] 108it [00:11, 9.72it/s] 109it [00:11, 9.78it/s] 110it [00:11, 9.79it/s] 111it [00:11, 9.84it/s] 112it [00:11, 9.86it/s] 114it [00:11, 9.97it/s] 115it [00:11, 9.97it/s] 116it [00:12, 9.95it/s] 117it [00:12, 9.95it/s] 118it [00:12, 9.95it/s] 120it [00:12, 9.98it/s] 122it [00:12, 10.00it/s] 124it [00:12, 10.00it/s] 125it [00:12, 9.56it/s] 126it [00:13, 9.64it/s] 128it [00:13, 9.79it/s] 130it [00:13, 9.88it/s] 131it [00:13, 9.89it/s] 133it [00:13, 9.97it/s] 135it [00:13, 9.95it/s] 136it [00:14, 9.90it/s] 137it [00:14, 9.89it/s] 138it [00:14, 9.92it/s] 140it [00:14, 9.62it/s] 142it [00:14, 9.79it/s] 143it [00:14, 9.83it/s] 144it [00:14, 9.86it/s] 145it [00:14, 9.89it/s] 146it [00:15, 9.91it/s] 148it [00:15, 9.95it/s] 150it [00:15, 10.00it/s]2025-05-26 04:54:16,685 - INFO - [Epoch 032 | Batch 0150] IWAE-loss 7815.7627 | mean log_px -0.0678 | KL -3526.52 + 151it [00:15, 9.53it/s] 152it [00:15, 9.60it/s] 153it [00:15, 9.70it/s] 154it [00:15, 9.77it/s] 156it [00:16, 9.40it/s] 158it [00:16, 9.65it/s] 160it [00:16, 9.79it/s] 161it [00:16, 9.83it/s] 162it [00:16, 9.85it/s] 164it [00:16, 9.50it/s] 165it [00:17, 9.60it/s] 166it [00:17, 9.69it/s] 167it [00:17, 9.76it/s] 168it [00:17, 9.78it/s] 169it [00:17, 9.83it/s] 171it [00:17, 9.93it/s] 173it [00:17, 10.00it/s] 174it [00:17, 9.98it/s] 176it [00:18, 10.01it/s] 178it [00:18, 10.01it/s] 180it [00:18, 9.63it/s] 182it [00:18, 9.77it/s] 183it [00:18, 9.80it/s] 185it [00:19, 9.90it/s] 186it [00:19, 9.91it/s] 187it [00:19, 9.93it/s] 189it [00:19, 9.98it/s] 190it [00:19, 9.61it/s] 191it [00:19, 9.69it/s] 192it [00:19, 9.75it/s] 193it [00:19, 9.78it/s] 195it [00:20, 9.19it/s] 196it [00:20, 9.66it/s] +2025-05-26 04:54:21,428 - INFO - Epoch: 32, Objective: tensor([5291.6196], device='cuda:0', grad_fn=), Loss: 0.03124961443245411, KL/n: 71.98877716064453 + 0it [00:00, ?it/s]2025-05-26 04:54:21,699 - INFO - [Epoch 033 | Batch 0000] IWAE-loss 5486.5654 | mean log_px -0.0308 | KL -3528.38 + 1it [00:00, 5.51it/s] 2it [00:00, 6.92it/s] 4it [00:00, 8.60it/s] 6it [00:00, 8.87it/s] 8it [00:00, 9.32it/s] 9it [00:01, 9.42it/s] 11it [00:01, 9.67it/s] 13it [00:01, 9.81it/s] 14it [00:01, 9.85it/s] 16it [00:01, 9.92it/s] 18it [00:01, 9.98it/s] 20it [00:02, 10.00it/s] 21it [00:02, 9.60it/s] 22it [00:02, 9.68it/s] 23it [00:02, 9.75it/s] 24it [00:02, 9.29it/s] 26it [00:02, 9.58it/s] 28it [00:02, 9.74it/s] 30it [00:03, 9.84it/s] 31it [00:03, 9.52it/s] 32it [00:03, 9.62it/s] 34it [00:03, 9.78it/s] 36it [00:03, 9.87it/s] 38it [00:03, 9.94it/s] 40it [00:04, 9.96it/s] 41it [00:04, 9.55it/s] 42it [00:04, 9.64it/s] 43it [00:04, 9.71it/s] 44it [00:04, 9.77it/s] 46it [00:04, 9.88it/s] 47it [00:04, 9.84it/s] 49it [00:05, 9.91it/s] 50it [00:05, 9.93it/s]2025-05-26 04:54:26,817 - INFO - [Epoch 033 | Batch 0050] IWAE-loss 5826.6826 | mean log_px -0.0356 | KL -3525.49 + 51it [00:05, 9.40it/s] 53it [00:05, 9.65it/s] 55it [00:05, 9.79it/s] 56it [00:05, 9.83it/s] 58it [00:06, 9.50it/s] 59it [00:06, 9.60it/s] 60it [00:06, 9.69it/s] 62it [00:06, 9.49it/s] 63it [00:06, 9.49it/s] 65it [00:06, 9.70it/s] 67it [00:06, 9.85it/s] 68it [00:07, 9.87it/s] 70it [00:07, 9.94it/s] 71it [00:07, 9.86it/s] 72it [00:07, 9.88it/s] 74it [00:07, 9.94it/s] 76it [00:07, 9.97it/s] 78it [00:08, 10.01it/s] 80it [00:08, 9.66it/s] 82it [00:08, 9.78it/s] 84it [00:08, 9.86it/s] 86it [00:08, 9.91it/s] 88it [00:09, 9.94it/s] 90it [00:09, 9.97it/s] 91it [00:09, 9.66it/s] 92it [00:09, 9.73it/s] 94it [00:09, 9.84it/s] 96it [00:09, 9.90it/s] 98it [00:10, 9.95it/s] 100it [00:10, 9.98it/s]2025-05-26 04:54:31,917 - INFO - [Epoch 033 | Batch 0100] IWAE-loss 7603.5825 | mean log_px -0.0618 | KL -3521.97 + 101it [00:10, 9.57it/s] 102it [00:10, 9.64it/s] 104it [00:10, 9.79it/s] 106it [00:10, 9.51it/s] 108it [00:11, 9.68it/s] 110it [00:11, 9.78it/s] 112it [00:11, 9.85it/s] 114it [00:11, 9.91it/s] 116it [00:11, 9.96it/s] 118it [00:12, 9.98it/s] 120it [00:12, 10.01it/s] 122it [00:12, 9.75it/s] 123it [00:12, 9.79it/s] 124it [00:12, 9.83it/s] 126it [00:12, 9.92it/s] 128it [00:13, 9.97it/s] 130it [00:13, 10.00it/s] 132it [00:13, 10.01it/s] 134it [00:13, 10.02it/s] 136it [00:13, 10.03it/s] 138it [00:14, 9.75it/s] 140it [00:14, 9.84it/s] 141it [00:14, 9.49it/s] 142it [00:14, 9.58it/s] 144it [00:14, 9.74it/s] 145it [00:14, 9.79it/s] 146it [00:14, 9.84it/s] 148it [00:15, 9.92it/s] 149it [00:15, 9.58it/s] 150it [00:15, 9.66it/s]2025-05-26 04:54:37,024 - INFO - [Epoch 033 | Batch 0150] IWAE-loss 5245.3364 | mean log_px -0.0273 | KL -3525.40 + 151it [00:15, 9.70it/s] 153it [00:15, 9.39it/s] 154it [00:15, 9.52it/s] 156it [00:16, 9.71it/s] 158it [00:16, 9.36it/s] 159it [00:16, 9.47it/s] 160it [00:16, 9.58it/s] 161it [00:16, 9.18it/s] 162it [00:16, 9.27it/s] 163it [00:16, 9.43it/s] 164it [00:16, 9.58it/s] 165it [00:16, 9.68it/s] 166it [00:17, 9.74it/s] 168it [00:17, 9.87it/s] 170it [00:17, 9.94it/s] 171it [00:17, 9.87it/s] 172it [00:17, 9.47it/s] 174it [00:17, 9.69it/s] 176it [00:18, 9.81it/s] 178it [00:18, 9.88it/s] 180it [00:18, 9.57it/s] 182it [00:18, 9.72it/s] 184it [00:18, 9.82it/s] 186it [00:19, 9.89it/s] 187it [00:19, 9.89it/s] 188it [00:19, 9.91it/s] 190it [00:19, 9.96it/s] 192it [00:19, 9.99it/s] 193it [00:19, 9.98it/s] 194it [00:19, 9.60it/s] 195it [00:20, 9.29it/s] 196it [00:20, 9.69it/s] +2025-05-26 04:54:41,780 - INFO - Epoch: 33, Objective: tensor([9180.2832], device='cuda:0', grad_fn=), Loss: 0.08810441941022873, KL/n: 71.89595794677734 + 0it [00:00, ?it/s]2025-05-26 04:54:42,252 - INFO - [Epoch 034 | Batch 0000] IWAE-loss 7107.1201 | mean log_px -0.0598 | KL -3525.40 + 1it [00:00, 2.51it/s] 2it [00:00, 4.42it/s] 3it [00:00, 5.88it/s] 4it [00:00, 6.57it/s] 5it [00:00, 7.46it/s] 6it [00:00, 8.13it/s] 7it [00:01, 8.61it/s] 8it [00:01, 8.43it/s] 9it [00:01, 8.80it/s] 10it [00:01, 8.99it/s] 11it [00:01, 9.02it/s] 12it [00:01, 8.51it/s] 13it [00:01, 8.89it/s] 14it [00:01, 9.15it/s] 15it [00:01, 9.39it/s] 16it [00:02, 8.96it/s] 17it [00:02, 9.22it/s] 18it [00:02, 9.41it/s] 19it [00:02, 9.54it/s] 20it [00:02, 9.04it/s] 21it [00:02, 9.29it/s] 22it [00:02, 9.43it/s] 23it [00:02, 9.57it/s] 24it [00:02, 9.09it/s] 25it [00:02, 9.24it/s] 26it [00:03, 9.33it/s] 27it [00:03, 9.49it/s] 28it [00:03, 9.04it/s] 29it [00:03, 9.28it/s] 30it [00:03, 9.45it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.08it/s] 33it [00:03, 9.33it/s] 34it [00:03, 9.49it/s] 35it [00:04, 9.61it/s] 36it [00:04, 9.23it/s] 38it [00:04, 9.60it/s] 40it [00:04, 9.45it/s] 42it [00:04, 9.67it/s] 43it [00:04, 9.29it/s] 44it [00:05, 9.44it/s] 46it [00:05, 9.67it/s] 47it [00:05, 9.29it/s] 48it [00:05, 9.43it/s] 50it [00:05, 9.68it/s]2025-05-26 04:54:47,614 - INFO - [Epoch 034 | Batch 0050] IWAE-loss 5209.7563 | mean log_px -0.0287 | KL -3518.90 + 52it [00:05, 9.41it/s] 54it [00:06, 9.62it/s] 55it [00:06, 9.69it/s] 56it [00:06, 9.75it/s] 58it [00:06, 9.87it/s] 59it [00:06, 9.53it/s] 61it [00:06, 9.73it/s] 62it [00:06, 9.78it/s] 64it [00:07, 9.55it/s] 66it [00:07, 9.64it/s] 67it [00:07, 9.70it/s] 69it [00:07, 9.50it/s] 70it [00:07, 9.59it/s] 72it [00:07, 9.33it/s] 73it [00:08, 9.40it/s] 74it [00:08, 9.46it/s] 75it [00:08, 9.50it/s] 76it [00:08, 9.56it/s] 77it [00:08, 9.61it/s] 79it [00:08, 9.81it/s] 80it [00:08, 9.84it/s] 82it [00:08, 9.93it/s] 83it [00:09, 9.58it/s] 84it [00:09, 9.68it/s] 86it [00:09, 9.83it/s] 88it [00:09, 9.59it/s] 90it [00:09, 9.74it/s] 91it [00:09, 9.37it/s] 93it [00:10, 9.59it/s] 94it [00:10, 9.66it/s] 96it [00:10, 9.79it/s] 98it [00:10, 9.57it/s] 99it [00:10, 9.63it/s] 100it [00:10, 9.70it/s]2025-05-26 04:54:52,807 - INFO - [Epoch 034 | Batch 0100] IWAE-loss 6808.0835 | mean log_px -0.0500 | KL -3514.93 + 101it [00:10, 9.74it/s] 102it [00:11, 9.26it/s] 104it [00:11, 9.56it/s] 105it [00:11, 9.66it/s] 106it [00:11, 9.72it/s] 107it [00:11, 9.35it/s] 108it [00:11, 9.50it/s] 110it [00:11, 9.27it/s] 111it [00:11, 9.43it/s] 112it [00:12, 9.56it/s] 113it [00:12, 9.66it/s] 115it [00:12, 9.81it/s] 116it [00:12, 9.85it/s] 118it [00:12, 9.88it/s] 119it [00:12, 9.91it/s] 120it [00:12, 9.52it/s] 121it [00:13, 9.64it/s] 122it [00:13, 9.72it/s] 124it [00:13, 9.50it/s] 126it [00:13, 9.71it/s] 128it [00:13, 9.53it/s] 129it [00:13, 9.57it/s] 131it [00:14, 9.74it/s] 133it [00:14, 9.55it/s] 134it [00:14, 9.63it/s] 136it [00:14, 9.77it/s] 137it [00:14, 9.48it/s] 138it [00:14, 9.58it/s] 139it [00:14, 9.68it/s] 140it [00:14, 9.74it/s] 142it [00:15, 9.50it/s] 144it [00:15, 9.70it/s] 145it [00:15, 9.74it/s] 146it [00:15, 9.40it/s] 148it [00:15, 9.66it/s] 149it [00:15, 9.36it/s] 150it [00:16, 9.50it/s]2025-05-26 04:54:58,018 - INFO - [Epoch 034 | Batch 0150] IWAE-loss 7905.4756 | mean log_px -0.0700 | KL -3521.38 + 151it [00:16, 9.62it/s] 152it [00:16, 9.71it/s] 154it [00:16, 9.82it/s] 155it [00:16, 9.48it/s] 157it [00:16, 9.71it/s] 158it [00:16, 9.77it/s] 159it [00:16, 9.36it/s] 160it [00:17, 9.51it/s] 162it [00:17, 9.73it/s] 164it [00:17, 9.52it/s] 166it [00:17, 9.68it/s] 168it [00:17, 9.43it/s] 170it [00:18, 9.61it/s] 172it [00:18, 9.72it/s] 174it [00:18, 9.82it/s] 175it [00:18, 9.55it/s] 176it [00:18, 9.55it/s] 177it [00:18, 9.64it/s] 179it [00:19, 9.80it/s] 180it [00:19, 9.46it/s] 181it [00:19, 9.57it/s] 182it [00:19, 9.64it/s] 183it [00:19, 9.63it/s] 184it [00:19, 9.58it/s] 185it [00:19, 9.67it/s] 186it [00:19, 9.76it/s] 187it [00:19, 9.19it/s] 188it [00:19, 9.42it/s] 189it [00:20, 9.57it/s] 190it [00:20, 9.52it/s] 191it [00:20, 8.92it/s] 192it [00:20, 9.14it/s] 193it [00:20, 9.30it/s] 194it [00:20, 8.91it/s] 195it [00:20, 8.80it/s] 196it [00:20, 9.36it/s] +2025-05-26 04:55:02,859 - INFO - Epoch: 34, Objective: tensor([7032.6973], device='cuda:0', grad_fn=), Loss: 0.05743390694260597, KL/n: 71.76044464111328 + 0it [00:00, ?it/s]2025-05-26 04:55:03,143 - INFO - [Epoch 035 | Batch 0000] IWAE-loss 5518.7554 | mean log_px -0.0321 | KL -3518.21 + 1it [00:00, 4.48it/s] 2it [00:00, 6.57it/s] 4it [00:00, 7.96it/s] 6it [00:00, 8.84it/s] 8it [00:00, 8.93it/s] 10it [00:01, 9.31it/s] 12it [00:01, 9.57it/s] 13it [00:01, 9.27it/s] 15it [00:01, 9.55it/s] 17it [00:01, 9.37it/s] 19it [00:02, 9.60it/s] 21it [00:02, 9.76it/s] 22it [00:02, 9.42it/s] 24it [00:02, 9.64it/s] 26it [00:02, 9.42it/s] 28it [00:03, 9.62it/s] 30it [00:03, 9.43it/s] 32it [00:03, 9.63it/s] 34it [00:03, 9.45it/s] 36it [00:03, 9.61it/s] 38it [00:04, 9.43it/s] 40it [00:04, 9.62it/s] 42it [00:04, 9.43it/s] 44it [00:04, 9.63it/s] 46it [00:04, 9.44it/s] 48it [00:05, 9.63it/s] 50it [00:05, 9.36it/s]2025-05-26 04:55:08,412 - INFO - [Epoch 035 | Batch 0050] IWAE-loss 10205.3838 | mean log_px -0.0955 | KL -3515.78 + 51it [00:05, 9.46it/s] 53it [00:05, 9.67it/s] 54it [00:05, 9.43it/s] 56it [00:05, 9.65it/s] 57it [00:06, 9.40it/s] 59it [00:06, 9.66it/s] 61it [00:06, 9.52it/s] 62it [00:06, 9.54it/s] 63it [00:06, 9.52it/s] 64it [00:06, 9.26it/s] 66it [00:07, 9.59it/s] 68it [00:07, 9.79it/s] 70it [00:07, 9.61it/s] 72it [00:07, 9.74it/s] 74it [00:07, 9.58it/s] 76it [00:08, 9.75it/s] 78it [00:08, 9.60it/s] 80it [00:08, 9.77it/s] 81it [00:08, 9.53it/s] 82it [00:08, 9.56it/s] 84it [00:08, 9.65it/s] 86it [00:09, 9.78it/s] 87it [00:09, 9.51it/s] 88it [00:09, 9.40it/s] 89it [00:09, 9.52it/s] 90it [00:09, 9.63it/s] 92it [00:09, 9.84it/s] 93it [00:09, 9.41it/s] 95it [00:10, 9.68it/s] 97it [00:10, 9.53it/s] 99it [00:10, 9.72it/s] 100it [00:10, 9.46it/s]2025-05-26 04:55:13,616 - INFO - [Epoch 035 | Batch 0100] IWAE-loss 7475.6548 | mean log_px -0.0570 | KL -3514.94 + 102it [00:10, 9.68it/s] 104it [00:10, 9.58it/s] 106it [00:11, 9.75it/s] 108it [00:11, 9.59it/s] 110it [00:11, 9.76it/s] 112it [00:11, 9.74it/s] 113it [00:11, 9.41it/s] 114it [00:12, 9.41it/s] 115it [00:12, 9.52it/s] 116it [00:12, 9.60it/s] 117it [00:12, 9.68it/s] 118it [00:12, 9.74it/s] 119it [00:12, 9.80it/s] 120it [00:12, 9.84it/s] 121it [00:12, 9.87it/s] 122it [00:12, 9.40it/s] 124it [00:13, 9.62it/s] 125it [00:13, 9.70it/s] 126it [00:13, 9.36it/s] 128it [00:13, 9.68it/s] 129it [00:13, 9.38it/s] 131it [00:13, 9.67it/s] 133it [00:13, 9.52it/s] 135it [00:14, 9.72it/s] 136it [00:14, 9.46it/s] 138it [00:14, 9.71it/s] 140it [00:14, 9.55it/s] 142it [00:14, 9.74it/s] 143it [00:15, 9.41it/s] 145it [00:15, 9.65it/s] 147it [00:15, 9.79it/s] 148it [00:15, 9.51it/s] 150it [00:15, 9.74it/s]2025-05-26 04:55:18,800 - INFO - [Epoch 035 | Batch 0150] IWAE-loss 5995.6523 | mean log_px -0.0361 | KL -3514.44 + 152it [00:15, 9.57it/s] 154it [00:16, 9.75it/s] 156it [00:16, 9.59it/s] 158it [00:16, 9.75it/s] 159it [00:16, 9.52it/s] 161it [00:16, 9.72it/s] 162it [00:17, 9.47it/s] 164it [00:17, 9.70it/s] 165it [00:17, 9.44it/s] 167it [00:17, 9.69it/s] 168it [00:17, 9.42it/s] 170it [00:17, 9.68it/s] 172it [00:18, 9.52it/s] 174it [00:18, 9.72it/s] 175it [00:18, 9.46it/s] 177it [00:18, 9.71it/s] 178it [00:18, 9.44it/s] 180it [00:18, 9.67it/s] 182it [00:19, 9.47it/s] 184it [00:19, 9.68it/s] 186it [00:19, 9.55it/s] 188it [00:19, 9.71it/s] 190it [00:19, 9.56it/s] 192it [00:20, 9.73it/s] 193it [00:20, 9.50it/s] 195it [00:20, 9.45it/s] 196it [00:20, 9.51it/s] +2025-05-26 04:55:23,596 - INFO - Epoch: 35, Objective: tensor([5837.2930], device='cuda:0', grad_fn=), Loss: 0.03758452087640762, KL/n: 71.64217376708984 + 0it [00:00, ?it/s]2025-05-26 04:55:24,044 - INFO - [Epoch 036 | Batch 0000] IWAE-loss 5874.6455 | mean log_px -0.0372 | KL -3509.21 + 1it [00:00, 4.78it/s] 3it [00:00, 7.82it/s] 4it [00:00, 7.87it/s] 6it [00:00, 8.82it/s] 7it [00:00, 9.09it/s] 8it [00:00, 8.83it/s] 10it [00:01, 9.31it/s] 11it [00:01, 9.01it/s] 13it [00:01, 9.43it/s] 14it [00:01, 9.54it/s] 15it [00:01, 9.18it/s] 17it [00:01, 9.53it/s] 18it [00:01, 9.62it/s] 19it [00:02, 9.26it/s] 21it [00:02, 9.58it/s] 22it [00:02, 9.32it/s] 24it [00:02, 9.60it/s] 25it [00:02, 9.35it/s] 26it [00:02, 9.49it/s] 27it [00:02, 9.34it/s] 28it [00:03, 9.09it/s] 30it [00:03, 9.49it/s] 31it [00:03, 9.60it/s] 32it [00:03, 9.69it/s] 34it [00:03, 9.83it/s] 36it [00:03, 9.56it/s] 37it [00:03, 9.64it/s] 38it [00:04, 9.70it/s] 40it [00:04, 9.50it/s] 42it [00:04, 9.69it/s] 44it [00:04, 9.55it/s] 46it [00:04, 9.72it/s] 48it [00:05, 9.55it/s] 49it [00:05, 9.62it/s]2025-05-26 04:55:29,308 - INFO - [Epoch 036 | Batch 0050] IWAE-loss 5224.4829 | mean log_px -0.0283 | KL -3501.39 + 51it [00:05, 9.40it/s] 53it [00:05, 9.61it/s] 55it [00:05, 9.75it/s] 57it [00:06, 9.56it/s] 59it [00:06, 9.71it/s] 61it [00:06, 9.54it/s] 63it [00:06, 9.69it/s] 65it [00:06, 9.53it/s] 67it [00:07, 9.69it/s] 69it [00:07, 9.54it/s] 70it [00:07, 9.61it/s] 72it [00:07, 9.76it/s] 74it [00:07, 9.55it/s] 76it [00:08, 9.70it/s] 77it [00:08, 9.37it/s] 78it [00:08, 9.49it/s] 80it [00:08, 9.69it/s] 82it [00:08, 9.80it/s] 83it [00:08, 9.84it/s] 84it [00:08, 9.39it/s] 86it [00:09, 9.64it/s] 88it [00:09, 9.78it/s] 89it [00:09, 9.49it/s] 90it [00:09, 9.58it/s] 92it [00:09, 9.76it/s] 94it [00:09, 9.47it/s] 96it [00:10, 9.65it/s] 98it [00:10, 9.78it/s] 99it [00:10, 9.50it/s] 100it [00:10, 9.60it/s]2025-05-26 04:55:34,513 - INFO - [Epoch 036 | Batch 0100] IWAE-loss 8589.2041 | mean log_px -0.0804 | KL -3509.35 + 101it [00:10, 9.67it/s] 102it [00:10, 9.29it/s] 103it [00:10, 9.43it/s] 104it [00:10, 9.53it/s] 105it [00:11, 9.45it/s] 106it [00:11, 9.10it/s] 107it [00:11, 9.33it/s] 108it [00:11, 9.46it/s] 109it [00:11, 9.59it/s] 110it [00:11, 9.22it/s] 111it [00:11, 9.34it/s] 112it [00:11, 9.50it/s] 113it [00:11, 8.96it/s] 114it [00:12, 9.21it/s] 115it [00:12, 8.87it/s] 116it [00:12, 9.16it/s] 117it [00:12, 9.31it/s] 118it [00:12, 9.40it/s] 119it [00:12, 8.99it/s] 120it [00:12, 9.27it/s] 121it [00:12, 9.45it/s] 122it [00:12, 8.99it/s] 124it [00:13, 9.44it/s] 125it [00:13, 9.08it/s] 127it [00:13, 9.46it/s] 128it [00:13, 9.56it/s] 129it [00:13, 9.24it/s] 130it [00:13, 9.36it/s] 131it [00:13, 9.52it/s] 132it [00:13, 9.59it/s] 133it [00:14, 9.67it/s] 134it [00:14, 9.18it/s] 136it [00:14, 9.54it/s] 138it [00:14, 9.72it/s] 140it [00:14, 9.83it/s] 141it [00:14, 9.51it/s] 142it [00:15, 9.57it/s] 143it [00:15, 9.66it/s] 144it [00:15, 9.74it/s] 146it [00:15, 9.50it/s] 148it [00:15, 9.69it/s] 149it [00:15, 9.75it/s] 150it [00:15, 9.32it/s]2025-05-26 04:55:39,830 - INFO - [Epoch 036 | Batch 0150] IWAE-loss 5136.7231 | mean log_px -0.0261 | KL -3499.86 + 151it [00:15, 9.44it/s] 152it [00:16, 9.58it/s] 154it [00:16, 9.77it/s] 156it [00:16, 9.55it/s] 158it [00:16, 9.72it/s] 160it [00:16, 9.55it/s] 162it [00:17, 9.71it/s] 163it [00:17, 9.76it/s] 164it [00:17, 9.68it/s] 165it [00:17, 9.39it/s] 166it [00:17, 9.51it/s] 167it [00:17, 9.62it/s] 168it [00:17, 9.70it/s] 169it [00:17, 9.78it/s] 170it [00:17, 9.24it/s] 172it [00:18, 9.56it/s] 174it [00:18, 9.73it/s] 176it [00:18, 9.84it/s] 177it [00:18, 9.52it/s] 178it [00:18, 9.53it/s] 179it [00:18, 9.64it/s] 181it [00:19, 9.81it/s] 182it [00:19, 9.47it/s] 184it [00:19, 9.70it/s] 186it [00:19, 9.51it/s] 187it [00:19, 9.51it/s] 188it [00:19, 9.41it/s] 189it [00:19, 9.04it/s] 190it [00:20, 9.11it/s] 191it [00:20, 8.81it/s] 192it [00:20, 8.96it/s] 194it [00:20, 8.98it/s] 195it [00:20, 8.88it/s] 196it [00:20, 9.43it/s] +2025-05-26 04:55:44,685 - INFO - Epoch: 36, Objective: tensor([6148.1465], device='cuda:0', grad_fn=), Loss: 0.04331137239933014, KL/n: 71.53656005859375 + 0it [00:00, ?it/s]2025-05-26 04:55:44,958 - INFO - [Epoch 037 | Batch 0000] IWAE-loss 5157.5024 | mean log_px -0.0263 | KL -3506.90 + 1it [00:00, 4.71it/s] 2it [00:00, 6.76it/s] 4it [00:00, 8.00it/s] 6it [00:00, 8.84it/s] 8it [00:00, 8.91it/s] 9it [00:01, 9.11it/s] 11it [00:01, 9.08it/s] 12it [00:01, 9.13it/s] 13it [00:01, 9.17it/s] 14it [00:01, 9.11it/s] 15it [00:01, 9.33it/s] 16it [00:01, 9.47it/s] 18it [00:02, 9.72it/s] 19it [00:02, 9.77it/s] 20it [00:02, 9.82it/s] 22it [00:02, 9.90it/s] 23it [00:02, 9.91it/s] 24it [00:02, 9.54it/s] 25it [00:02, 9.40it/s] 27it [00:02, 9.68it/s] 28it [00:03, 9.68it/s] 29it [00:03, 9.71it/s] 31it [00:03, 9.40it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.63it/s] 34it [00:03, 9.71it/s] 36it [00:03, 9.84it/s] 37it [00:03, 9.87it/s] 38it [00:04, 9.89it/s] 40it [00:04, 9.94it/s] 42it [00:04, 9.55it/s] 43it [00:04, 9.64it/s] 45it [00:04, 9.79it/s] 47it [00:04, 9.87it/s] 48it [00:05, 9.89it/s] 50it [00:05, 9.93it/s]2025-05-26 04:55:50,161 - INFO - [Epoch 037 | Batch 0050] IWAE-loss 6418.6987 | mean log_px -0.0469 | KL -3502.43 + 51it [00:05, 9.94it/s] 52it [00:05, 9.95it/s] 54it [00:05, 9.98it/s] 55it [00:05, 9.97it/s] 56it [00:05, 9.97it/s] 58it [00:06, 9.99it/s] 60it [00:06, 10.01it/s] 62it [00:06, 10.03it/s] 64it [00:06, 9.66it/s] 66it [00:06, 9.78it/s] 68it [00:07, 9.86it/s] 70it [00:07, 9.92it/s] 72it [00:07, 9.96it/s] 74it [00:07, 9.98it/s] 75it [00:07, 9.99it/s] 77it [00:08, 10.01it/s] 79it [00:08, 10.01it/s] 81it [00:08, 10.03it/s] 83it [00:08, 10.04it/s] 85it [00:08, 10.03it/s] 87it [00:08, 10.04it/s] 89it [00:09, 10.04it/s] 91it [00:09, 10.03it/s] 93it [00:09, 10.02it/s] 95it [00:09, 10.02it/s] 97it [00:09, 10.03it/s] 99it [00:10, 10.04it/s]2025-05-26 04:55:55,168 - INFO - [Epoch 037 | Batch 0100] IWAE-loss 5038.2764 | mean log_px -0.0247 | KL -3498.83 + 101it [00:10, 10.03it/s] 103it [00:10, 10.03it/s] 105it [00:10, 10.04it/s] 107it [00:11, 9.65it/s] 108it [00:11, 9.70it/s] 110it [00:11, 9.82it/s] 112it [00:11, 9.89it/s] 114it [00:11, 9.94it/s] 115it [00:11, 9.94it/s] 116it [00:11, 9.95it/s] 117it [00:12, 9.44it/s] 118it [00:12, 9.57it/s] 119it [00:12, 9.66it/s] 121it [00:12, 9.81it/s] 122it [00:12, 9.84it/s] 124it [00:12, 9.92it/s] 126it [00:12, 9.95it/s] 128it [00:13, 9.98it/s] 130it [00:13, 9.99it/s] 132it [00:13, 10.01it/s] 133it [00:13, 10.00it/s] 134it [00:13, 9.96it/s] 135it [00:13, 9.96it/s] 137it [00:14, 10.00it/s] 138it [00:14, 9.99it/s] 140it [00:14, 10.01it/s] 141it [00:14, 10.01it/s] 142it [00:14, 9.90it/s] 143it [00:14, 9.88it/s] 144it [00:14, 9.89it/s] 146it [00:14, 9.92it/s] 147it [00:15, 9.86it/s] 148it [00:15, 9.87it/s] 149it [00:15, 9.89it/s] 150it [00:15, 9.91it/s]2025-05-26 04:56:00,228 - INFO - [Epoch 037 | Batch 0150] IWAE-loss 6093.8408 | mean log_px -0.0371 | KL -3496.12 + 151it [00:15, 9.91it/s] 153it [00:15, 9.97it/s] 154it [00:15, 9.96it/s] 156it [00:15, 10.00it/s] 158it [00:16, 10.01it/s] 160it [00:16, 10.01it/s] 162it [00:16, 10.03it/s] 164it [00:16, 9.98it/s] 166it [00:16, 10.01it/s] 168it [00:17, 10.02it/s] 170it [00:17, 10.02it/s] 172it [00:17, 10.02it/s] 174it [00:17, 10.03it/s] 176it [00:17, 10.03it/s] 178it [00:18, 10.03it/s] 180it [00:18, 10.03it/s] 182it [00:18, 10.03it/s] 184it [00:18, 10.03it/s] 186it [00:18, 10.04it/s] 188it [00:19, 10.04it/s] 190it [00:19, 9.69it/s] 192it [00:19, 9.79it/s] 194it [00:19, 9.85it/s] 195it [00:19, 9.60it/s] 196it [00:20, 9.78it/s] +2025-05-26 04:56:04,851 - INFO - Epoch: 37, Objective: tensor([7495.4062], device='cuda:0', grad_fn=), Loss: 0.06337570399045944, KL/n: 71.414794921875 + 0it [00:00, ?it/s]2025-05-26 04:56:05,308 - INFO - [Epoch 038 | Batch 0000] IWAE-loss 8049.1758 | mean log_px -0.0730 | KL -3499.70 + 1it [00:00, 4.66it/s] 2it [00:00, 6.73it/s] 4it [00:00, 8.47it/s] 6it [00:00, 9.14it/s] 8it [00:00, 9.49it/s] 10it [00:01, 9.66it/s] 12it [00:01, 9.78it/s] 14it [00:01, 9.84it/s] 15it [00:01, 9.87it/s] 16it [00:01, 9.88it/s] 18it [00:01, 9.93it/s] 20it [00:02, 9.98it/s] 21it [00:02, 9.97it/s] 22it [00:02, 9.96it/s] 23it [00:02, 9.96it/s] 24it [00:02, 9.95it/s] 25it [00:02, 9.96it/s] 26it [00:02, 9.95it/s] 27it [00:02, 9.91it/s] 28it [00:02, 9.91it/s] 30it [00:03, 9.96it/s] 32it [00:03, 10.00it/s] 33it [00:03, 9.99it/s] 34it [00:03, 9.98it/s] 35it [00:03, 9.97it/s] 36it [00:03, 9.97it/s] 37it [00:03, 9.97it/s] 38it [00:03, 9.96it/s] 39it [00:04, 9.97it/s] 40it [00:04, 9.97it/s] 42it [00:04, 10.00it/s] 44it [00:04, 10.01it/s] 45it [00:04, 10.00it/s] 46it [00:04, 9.98it/s] 48it [00:04, 9.99it/s] 50it [00:05, 10.01it/s]2025-05-26 04:56:10,344 - INFO - [Epoch 038 | Batch 0050] IWAE-loss 5952.2158 | mean log_px -0.0410 | KL -3503.08 + 52it [00:05, 9.98it/s] 54it [00:05, 10.00it/s] 56it [00:05, 9.93it/s] 57it [00:05, 9.92it/s] 58it [00:05, 9.93it/s] 60it [00:06, 9.96it/s] 62it [00:06, 9.98it/s] 63it [00:06, 9.97it/s] 64it [00:06, 9.94it/s] 65it [00:06, 9.94it/s] 66it [00:06, 9.94it/s] 68it [00:06, 10.01it/s] 70it [00:07, 10.01it/s] 71it [00:07, 9.99it/s] 72it [00:07, 9.98it/s] 73it [00:07, 9.98it/s] 74it [00:07, 9.97it/s] 76it [00:07, 9.97it/s] 78it [00:07, 9.98it/s] 80it [00:08, 10.00it/s] 82it [00:08, 10.00it/s] 83it [00:08, 9.99it/s] 85it [00:08, 10.01it/s] 87it [00:08, 10.02it/s] 89it [00:09, 10.03it/s] 91it [00:09, 10.02it/s] 93it [00:09, 9.58it/s] 94it [00:09, 9.64it/s] 95it [00:09, 9.69it/s] 97it [00:09, 9.82it/s] 98it [00:09, 9.85it/s] 100it [00:10, 9.92it/s]2025-05-26 04:56:15,379 - INFO - [Epoch 038 | Batch 0100] IWAE-loss 7382.7646 | mean log_px -0.0584 | KL -3494.08 + 101it [00:10, 9.48it/s] 102it [00:10, 9.57it/s] 104it [00:10, 9.78it/s] 105it [00:10, 9.34it/s] 106it [00:10, 9.49it/s] 107it [00:10, 9.61it/s] 108it [00:11, 9.71it/s] 110it [00:11, 9.85it/s] 112it [00:11, 9.93it/s] 113it [00:11, 9.56it/s] 114it [00:11, 9.65it/s] 115it [00:11, 9.73it/s] 116it [00:11, 9.79it/s] 118it [00:12, 9.50it/s] 120it [00:12, 9.69it/s] 122it [00:12, 9.20it/s] 123it [00:12, 9.16it/s] 124it [00:12, 9.15it/s] 125it [00:12, 9.16it/s] 126it [00:12, 8.70it/s] 127it [00:13, 8.82it/s] 128it [00:13, 8.94it/s] 129it [00:13, 8.63it/s] 130it [00:13, 8.89it/s] 131it [00:13, 9.14it/s] 132it [00:13, 9.29it/s] 133it [00:13, 9.44it/s] 134it [00:13, 9.53it/s] 136it [00:13, 9.76it/s] 138it [00:14, 9.87it/s] 140it [00:14, 9.94it/s] 142it [00:14, 9.97it/s] 144it [00:14, 9.99it/s] 146it [00:14, 10.02it/s] 148it [00:15, 10.01it/s] 150it [00:15, 10.04it/s]2025-05-26 04:56:20,610 - INFO - [Epoch 038 | Batch 0150] IWAE-loss 5241.9893 | mean log_px -0.0268 | KL -3495.52 + 152it [00:15, 10.02it/s] 154it [00:15, 10.01it/s] 156it [00:15, 10.00it/s] 158it [00:16, 9.99it/s] 160it [00:16, 9.99it/s] 162it [00:16, 10.00it/s] 164it [00:16, 10.01it/s] 166it [00:16, 9.93it/s] 167it [00:17, 9.90it/s] 168it [00:17, 9.89it/s] 170it [00:17, 9.95it/s] 172it [00:17, 10.00it/s] 174it [00:17, 10.03it/s] 176it [00:17, 10.02it/s] 178it [00:18, 10.02it/s] 180it [00:18, 10.03it/s] 182it [00:18, 10.02it/s] 184it [00:18, 10.03it/s] 186it [00:18, 10.05it/s] 188it [00:19, 10.03it/s] 190it [00:19, 10.04it/s] 192it [00:19, 9.58it/s] 194it [00:19, 9.71it/s] 195it [00:19, 9.11it/s] 196it [00:20, 9.74it/s] +2025-05-26 04:56:25,284 - INFO - Epoch: 38, Objective: tensor([6876.5137], device='cuda:0', grad_fn=), Loss: 0.05297667905688286, KL/n: 71.28185272216797 + 0it [00:00, ?it/s]2025-05-26 04:56:25,566 - INFO - [Epoch 039 | Batch 0000] IWAE-loss 6343.7041 | mean log_px -0.0524 | KL -3491.50 + 1it [00:00, 5.16it/s] 2it [00:00, 7.18it/s] 4it [00:00, 8.75it/s] 6it [00:00, 9.31it/s] 8it [00:00, 9.59it/s] 10it [00:01, 9.75it/s] 12it [00:01, 9.78it/s] 13it [00:01, 9.81it/s] 14it [00:01, 9.83it/s] 16it [00:01, 9.91it/s] 18it [00:01, 9.93it/s] 20it [00:02, 9.97it/s] 22it [00:02, 9.99it/s] 24it [00:02, 10.01it/s] 26it [00:02, 10.02it/s] 28it [00:02, 10.02it/s] 30it [00:03, 10.04it/s] 32it [00:03, 10.05it/s] 34it [00:03, 10.03it/s] 36it [00:03, 10.02it/s] 38it [00:03, 10.03it/s] 40it [00:04, 10.04it/s] 42it [00:04, 10.02it/s] 44it [00:04, 10.03it/s] 46it [00:04, 9.80it/s] 48it [00:04, 9.86it/s] 49it [00:05, 9.86it/s] 50it [00:05, 9.85it/s]2025-05-26 04:56:30,581 - INFO - [Epoch 039 | Batch 0050] IWAE-loss 5679.2578 | mean log_px -0.0351 | KL -3490.73 + 51it [00:05, 9.87it/s] 52it [00:05, 9.88it/s] 54it [00:05, 9.94it/s] 55it [00:05, 9.94it/s] 56it [00:05, 9.95it/s] 57it [00:05, 9.96it/s] 58it [00:05, 9.95it/s] 59it [00:06, 9.96it/s] 60it [00:06, 9.94it/s] 61it [00:06, 9.94it/s] 62it [00:06, 9.95it/s] 64it [00:06, 9.98it/s] 65it [00:06, 9.85it/s] 66it [00:06, 9.84it/s] 68it [00:06, 9.92it/s] 70it [00:07, 9.96it/s] 72it [00:07, 9.99it/s] 73it [00:07, 9.96it/s] 75it [00:07, 10.00it/s] 76it [00:07, 9.99it/s] 78it [00:07, 10.00it/s] 79it [00:08, 9.99it/s] 80it [00:08, 9.82it/s] 81it [00:08, 9.82it/s] 82it [00:08, 9.81it/s] 83it [00:08, 9.80it/s] 84it [00:08, 9.79it/s] 85it [00:08, 9.82it/s] 86it [00:08, 9.80it/s] 87it [00:08, 9.82it/s] 88it [00:08, 9.59it/s] 89it [00:09, 9.56it/s] 90it [00:09, 9.28it/s] 91it [00:09, 9.13it/s] 92it [00:09, 9.36it/s] 93it [00:09, 9.49it/s] 94it [00:09, 9.60it/s] 95it [00:09, 9.64it/s] 96it [00:09, 9.70it/s] 97it [00:09, 9.76it/s] 98it [00:09, 9.79it/s] 100it [00:10, 9.84it/s]2025-05-26 04:56:35,670 - INFO - [Epoch 039 | Batch 0100] IWAE-loss 5635.9746 | mean log_px -0.0364 | KL -3484.96 + 101it [00:10, 9.81it/s] 102it [00:10, 9.85it/s] 103it [00:10, 9.85it/s] 104it [00:10, 9.83it/s] 105it [00:10, 9.84it/s] 107it [00:10, 9.88it/s] 108it [00:11, 9.91it/s] 109it [00:11, 9.89it/s] 110it [00:11, 9.85it/s] 111it [00:11, 9.85it/s] 112it [00:11, 9.82it/s] 114it [00:11, 9.87it/s] 115it [00:11, 9.90it/s] 117it [00:11, 9.97it/s] 118it [00:12, 9.93it/s] 119it [00:12, 9.92it/s] 120it [00:12, 9.92it/s] 121it [00:12, 9.90it/s] 122it [00:12, 9.91it/s] 123it [00:12, 9.91it/s] 124it [00:12, 9.90it/s] 125it [00:12, 9.87it/s] 126it [00:12, 9.88it/s] 127it [00:12, 9.84it/s] 129it [00:13, 9.70it/s] 130it [00:13, 9.76it/s] 131it [00:13, 9.81it/s] 132it [00:13, 9.28it/s] 133it [00:13, 9.45it/s] 134it [00:13, 9.59it/s] 135it [00:13, 9.68it/s] 136it [00:13, 9.74it/s] 137it [00:13, 9.79it/s] 138it [00:14, 9.81it/s] 139it [00:14, 9.68it/s] 140it [00:14, 9.72it/s] 141it [00:14, 9.78it/s] 142it [00:14, 9.81it/s] 143it [00:14, 9.85it/s] 144it [00:14, 9.88it/s] 145it [00:14, 9.90it/s] 146it [00:14, 9.91it/s] 148it [00:15, 9.98it/s] 149it [00:15, 9.98it/s] 150it [00:15, 9.97it/s]2025-05-26 04:56:40,754 - INFO - [Epoch 039 | Batch 0150] IWAE-loss 6551.1885 | mean log_px -0.0438 | KL -3480.69 + 151it [00:15, 9.96it/s] 152it [00:15, 9.94it/s] 153it [00:15, 9.95it/s] 154it [00:15, 9.94it/s] 155it [00:15, 9.95it/s] 157it [00:15, 9.98it/s] 158it [00:16, 9.96it/s] 159it [00:16, 9.94it/s] 160it [00:16, 9.87it/s] 161it [00:16, 9.89it/s] 162it [00:16, 9.89it/s] 163it [00:16, 9.86it/s] 165it [00:16, 9.92it/s] 166it [00:16, 9.84it/s] 167it [00:16, 9.87it/s] 168it [00:17, 9.90it/s] 169it [00:17, 9.89it/s] 170it [00:17, 9.84it/s] 171it [00:17, 9.82it/s] 172it [00:17, 9.79it/s] 173it [00:17, 9.84it/s] 174it [00:17, 9.83it/s] 175it [00:17, 9.87it/s] 176it [00:17, 9.88it/s] 177it [00:18, 9.89it/s] 178it [00:18, 9.81it/s] 179it [00:18, 9.83it/s] 180it [00:18, 9.82it/s] 181it [00:18, 9.85it/s] 182it [00:18, 9.82it/s] 183it [00:18, 9.87it/s] 184it [00:18, 9.81it/s] 185it [00:18, 9.80it/s] 186it [00:18, 9.80it/s] 187it [00:19, 9.76it/s] 188it [00:19, 9.79it/s] 189it [00:19, 9.82it/s] 190it [00:19, 9.80it/s] 191it [00:19, 9.86it/s] 192it [00:19, 9.76it/s] 193it [00:19, 9.67it/s] 194it [00:19, 9.67it/s] 195it [00:19, 9.26it/s] 196it [00:20, 9.79it/s] +2025-05-26 04:56:45,441 - INFO - Epoch: 39, Objective: tensor([6474.6235], device='cuda:0', grad_fn=), Loss: 0.045537568628787994, KL/n: 71.1382827758789 + 0it [00:00, ?it/s]2025-05-26 04:56:45,899 - INFO - [Epoch 040 | Batch 0000] IWAE-loss 7672.9946 | mean log_px -0.0628 | KL -3483.29 + 1it [00:00, 5.28it/s] 2it [00:00, 7.26it/s] 3it [00:00, 8.25it/s] 4it [00:00, 8.80it/s] 5it [00:00, 9.06it/s] 6it [00:00, 9.07it/s] 7it [00:00, 9.18it/s] 8it [00:00, 9.22it/s] 9it [00:01, 9.41it/s] 10it [00:01, 9.55it/s] 12it [00:01, 9.71it/s] 13it [00:01, 9.71it/s] 14it [00:01, 9.71it/s] 15it [00:01, 9.76it/s] 16it [00:01, 9.78it/s] 17it [00:01, 9.83it/s] 18it [00:01, 9.85it/s] 19it [00:02, 9.86it/s] 20it [00:02, 9.84it/s] 21it [00:02, 9.88it/s] 22it [00:02, 9.82it/s] 23it [00:02, 9.87it/s] 24it [00:02, 9.87it/s] 26it [00:02, 9.94it/s] 28it [00:02, 9.61it/s] 29it [00:03, 9.68it/s] 30it [00:03, 9.58it/s] 31it [00:03, 9.55it/s] 32it [00:03, 9.40it/s] 33it [00:03, 9.50it/s] 34it [00:03, 9.62it/s] 35it [00:03, 9.69it/s] 36it [00:03, 9.72it/s] 38it [00:03, 9.87it/s] 40it [00:04, 9.92it/s] 42it [00:04, 9.94it/s] 44it [00:04, 9.66it/s] 45it [00:04, 9.68it/s] 46it [00:04, 9.73it/s] 47it [00:04, 9.71it/s] 48it [00:05, 9.73it/s] 49it [00:05, 9.79it/s] 50it [00:05, 9.82it/s]2025-05-26 04:56:51,034 - INFO - [Epoch 040 | Batch 0050] IWAE-loss 5287.8018 | mean log_px -0.0307 | KL -3482.75 + 51it [00:05, 9.85it/s] 53it [00:05, 9.94it/s] 55it [00:05, 9.97it/s] 56it [00:05, 9.95it/s] 57it [00:05, 9.95it/s] 58it [00:06, 9.91it/s] 59it [00:06, 9.92it/s] 60it [00:06, 9.92it/s] 62it [00:06, 9.95it/s] 63it [00:06, 9.42it/s] 64it [00:06, 9.55it/s] 65it [00:06, 9.65it/s] 66it [00:06, 9.74it/s] 68it [00:07, 9.38it/s] 70it [00:07, 9.62it/s] 71it [00:07, 9.66it/s] 72it [00:07, 9.33it/s] 73it [00:07, 9.46it/s] 74it [00:07, 9.58it/s] 75it [00:07, 9.65it/s] 76it [00:07, 9.71it/s] 77it [00:08, 9.73it/s] 78it [00:08, 9.41it/s] 79it [00:08, 9.55it/s] 80it [00:08, 9.66it/s] 81it [00:08, 9.74it/s] 82it [00:08, 9.76it/s] 83it [00:08, 9.22it/s] 84it [00:08, 9.40it/s] 85it [00:08, 9.57it/s] 86it [00:08, 9.67it/s] 87it [00:09, 9.77it/s] 88it [00:09, 9.80it/s] 90it [00:09, 9.89it/s] 92it [00:09, 9.95it/s] 93it [00:09, 9.94it/s] 94it [00:09, 9.93it/s] 95it [00:09, 9.49it/s] 96it [00:09, 9.60it/s] 97it [00:10, 9.63it/s] 98it [00:10, 9.69it/s] 99it [00:10, 9.76it/s] 100it [00:10, 9.78it/s]2025-05-26 04:56:56,189 - INFO - [Epoch 040 | Batch 0100] IWAE-loss 6247.6255 | mean log_px -0.0492 | KL -3478.28 + 101it [00:10, 9.23it/s] 102it [00:10, 9.21it/s] 103it [00:10, 9.32it/s] 104it [00:10, 9.47it/s] 105it [00:10, 9.58it/s] 106it [00:11, 9.68it/s] 107it [00:11, 9.73it/s] 108it [00:11, 9.80it/s] 109it [00:11, 9.84it/s] 110it [00:11, 9.88it/s] 111it [00:11, 9.89it/s] 112it [00:11, 9.89it/s] 113it [00:11, 9.90it/s] 114it [00:11, 9.88it/s] 116it [00:12, 9.94it/s] 117it [00:12, 9.95it/s] 118it [00:12, 9.94it/s] 119it [00:12, 9.94it/s] 120it [00:12, 9.95it/s] 121it [00:12, 9.49it/s] 122it [00:12, 9.61it/s] 123it [00:12, 9.71it/s] 124it [00:12, 9.77it/s] 125it [00:12, 9.83it/s] 126it [00:13, 9.39it/s] 127it [00:13, 9.56it/s] 129it [00:13, 9.39it/s] 130it [00:13, 9.50it/s] 131it [00:13, 9.59it/s] 132it [00:13, 9.67it/s] 134it [00:13, 9.82it/s] 135it [00:13, 9.85it/s] 136it [00:14, 9.88it/s] 137it [00:14, 9.90it/s] 138it [00:14, 9.88it/s] 139it [00:14, 9.27it/s] 140it [00:14, 9.46it/s] 142it [00:14, 9.70it/s] 143it [00:14, 9.76it/s] 144it [00:14, 9.78it/s] 145it [00:15, 9.84it/s] 146it [00:15, 9.83it/s] 148it [00:15, 9.91it/s] 149it [00:15, 9.92it/s] 150it [00:15, 9.94it/s]2025-05-26 04:57:01,330 - INFO - [Epoch 040 | Batch 0150] IWAE-loss 6392.1655 | mean log_px -0.0420 | KL -3472.99 + 151it [00:15, 9.36it/s] 152it [00:15, 9.51it/s] 153it [00:15, 9.63it/s] 154it [00:15, 9.71it/s] 155it [00:16, 9.26it/s] 156it [00:16, 9.43it/s] 157it [00:16, 9.58it/s] 158it [00:16, 9.66it/s] 159it [00:16, 9.72it/s] 160it [00:16, 9.28it/s] 161it [00:16, 9.48it/s] 162it [00:16, 9.56it/s] 163it [00:16, 9.67it/s] 164it [00:17, 9.25it/s] 165it [00:17, 9.45it/s] 166it [00:17, 9.60it/s] 167it [00:17, 9.70it/s] 168it [00:17, 9.15it/s] 169it [00:17, 9.38it/s] 170it [00:17, 9.53it/s] 171it [00:17, 9.65it/s] 172it [00:17, 9.74it/s] 173it [00:17, 9.30it/s] 174it [00:18, 9.47it/s] 176it [00:18, 9.71it/s] 177it [00:18, 9.78it/s] 178it [00:18, 9.81it/s] 180it [00:18, 9.90it/s] 182it [00:18, 9.95it/s] 184it [00:19, 9.98it/s] 186it [00:19, 9.99it/s] 187it [00:19, 9.99it/s] 189it [00:19, 10.00it/s] 190it [00:19, 9.98it/s] 191it [00:19, 9.98it/s] 192it [00:19, 9.98it/s] 193it [00:19, 9.96it/s] 194it [00:20, 9.95it/s] 195it [00:20, 9.52it/s] 196it [00:20, 9.64it/s] +2025-05-26 04:57:06,091 - INFO - Epoch: 40, Objective: tensor([5746.3809], device='cuda:0', grad_fn=), Loss: 0.034290388226509094, KL/n: 70.98202514648438 + 0it [00:00, ?it/s]2025-05-26 04:57:06,383 - INFO - [Epoch 041 | Batch 0000] IWAE-loss 5749.5537 | mean log_px -0.0346 | KL -3479.12 + 1it [00:00, 4.46it/s] 3it [00:00, 7.61it/s] 5it [00:00, 8.40it/s] 7it [00:00, 8.66it/s] 9it [00:01, 9.16it/s] 11it [00:01, 9.46it/s] 13it [00:01, 9.68it/s] 14it [00:01, 9.70it/s] 15it [00:01, 9.73it/s] 17it [00:01, 9.87it/s] 19it [00:02, 9.96it/s] 21it [00:02, 10.00it/s] 23it [00:02, 10.05it/s] 25it [00:02, 10.07it/s] 27it [00:02, 10.08it/s] 29it [00:03, 10.10it/s] 31it [00:03, 10.10it/s] 33it [00:03, 10.12it/s] 35it [00:03, 9.89it/s] 36it [00:03, 9.91it/s] 38it [00:03, 9.98it/s] 40it [00:04, 10.02it/s] 42it [00:04, 10.05it/s] 44it [00:04, 10.08it/s] 46it [00:04, 10.09it/s] 48it [00:04, 10.10it/s] 50it [00:05, 10.10it/s]2025-05-26 04:57:11,415 - INFO - [Epoch 041 | Batch 0050] IWAE-loss 5837.0518 | mean log_px -0.0380 | KL -3473.68 + 52it [00:05, 10.09it/s] 54it [00:05, 10.09it/s] 56it [00:05, 9.86it/s] 58it [00:05, 9.93it/s] 59it [00:06, 9.94it/s] 60it [00:06, 9.93it/s] 62it [00:06, 9.98it/s] 64it [00:06, 10.01it/s] 66it [00:06, 10.05it/s] 68it [00:06, 10.06it/s] 70it [00:07, 10.07it/s] 72it [00:07, 10.09it/s] 74it [00:07, 10.09it/s] 76it [00:07, 10.09it/s] 78it [00:07, 10.09it/s] 80it [00:08, 10.09it/s] 82it [00:08, 10.11it/s] 84it [00:08, 10.02it/s] 86it [00:08, 10.05it/s] 88it [00:08, 10.07it/s] 90it [00:09, 10.09it/s] 92it [00:09, 10.10it/s] 94it [00:09, 10.11it/s] 96it [00:09, 10.11it/s] 98it [00:09, 10.11it/s] 100it [00:10, 9.84it/s]2025-05-26 04:57:16,407 - INFO - [Epoch 041 | Batch 0100] IWAE-loss 5281.2070 | mean log_px -0.0259 | KL -3478.21 + 102it [00:10, 9.91it/s] 104it [00:10, 9.98it/s] 105it [00:10, 9.98it/s] 107it [00:10, 10.03it/s] 109it [00:11, 10.06it/s] 111it [00:11, 10.07it/s] 113it [00:11, 10.10it/s] 115it [00:11, 10.10it/s] 117it [00:11, 10.11it/s] 119it [00:12, 10.10it/s] 121it [00:12, 10.05it/s] 123it [00:12, 10.08it/s] 125it [00:12, 10.09it/s] 127it [00:12, 10.10it/s] 129it [00:13, 9.70it/s] 130it [00:13, 9.75it/s] 132it [00:13, 9.87it/s] 134it [00:13, 9.95it/s] 135it [00:13, 9.47it/s] 136it [00:13, 9.54it/s] 138it [00:13, 9.75it/s] 140it [00:14, 9.32it/s] 141it [00:14, 9.29it/s] 142it [00:14, 9.35it/s] 144it [00:14, 9.62it/s] 146it [00:14, 9.79it/s] 148it [00:15, 9.53it/s] 150it [00:15, 9.71it/s]2025-05-26 04:57:21,488 - INFO - [Epoch 041 | Batch 0150] IWAE-loss 5604.3018 | mean log_px -0.0409 | KL -3472.15 + 152it [00:15, 9.45it/s] 154it [00:15, 9.64it/s] 156it [00:15, 9.78it/s] 158it [00:16, 9.87it/s] 160it [00:16, 9.68it/s] 162it [00:16, 9.81it/s] 164it [00:16, 9.90it/s] 166it [00:16, 9.96it/s] 168it [00:17, 10.02it/s] 170it [00:17, 9.98it/s] 171it [00:17, 9.69it/s] 173it [00:17, 9.83it/s] 175it [00:17, 9.92it/s] 176it [00:17, 9.71it/s] 177it [00:17, 9.18it/s] 178it [00:18, 9.17it/s] 179it [00:18, 9.25it/s] 180it [00:18, 9.32it/s] 181it [00:18, 9.39it/s] 182it [00:18, 9.44it/s] 183it [00:18, 9.49it/s] 184it [00:18, 9.50it/s] 185it [00:18, 9.54it/s] 186it [00:18, 9.55it/s] 187it [00:19, 9.59it/s] 188it [00:19, 8.99it/s] 189it [00:19, 9.11it/s] 190it [00:19, 9.26it/s] 191it [00:19, 9.32it/s] 192it [00:19, 9.39it/s] 193it [00:19, 9.38it/s] 194it [00:19, 9.39it/s] 195it [00:19, 8.84it/s] 196it [00:20, 9.08it/s] 196it [00:20, 9.76it/s] +2025-05-26 04:57:26,309 - INFO - Epoch: 41, Objective: tensor([4431.4009], device='cuda:0', grad_fn=), Loss: 0.017086666077375412, KL/n: 70.84024810791016 + 0it [00:00, ?it/s]2025-05-26 04:57:26,765 - INFO - [Epoch 042 | Batch 0000] IWAE-loss 7730.5332 | mean log_px -0.0675 | KL -3471.14 + 1it [00:00, 4.83it/s] 2it [00:00, 6.73it/s] 3it [00:00, 7.79it/s] 4it [00:00, 7.79it/s] 5it [00:00, 8.37it/s] 6it [00:00, 8.69it/s] 7it [00:00, 8.94it/s] 8it [00:00, 9.11it/s] 9it [00:01, 9.26it/s] 10it [00:01, 9.28it/s] 11it [00:01, 9.38it/s] 12it [00:01, 9.42it/s] 13it [00:01, 9.51it/s] 14it [00:01, 9.45it/s] 15it [00:01, 9.49it/s] 16it [00:01, 9.53it/s] 17it [00:01, 9.52it/s] 18it [00:02, 9.47it/s] 19it [00:02, 9.55it/s] 20it [00:02, 8.99it/s] 21it [00:02, 9.17it/s] 22it [00:02, 9.25it/s] 23it [00:02, 9.31it/s] 24it [00:02, 9.37it/s] 25it [00:02, 8.86it/s] 26it [00:02, 9.06it/s] 27it [00:03, 9.19it/s] 28it [00:03, 9.27it/s] 29it [00:03, 9.37it/s] 30it [00:03, 9.40it/s] 31it [00:03, 9.48it/s] 32it [00:03, 9.48it/s] 33it [00:03, 9.53it/s] 34it [00:03, 9.51it/s] 35it [00:03, 8.97it/s] 36it [00:03, 9.05it/s] 37it [00:04, 9.23it/s] 38it [00:04, 9.35it/s] 39it [00:04, 9.34it/s] 40it [00:04, 9.39it/s] 41it [00:04, 9.45it/s] 42it [00:04, 9.46it/s] 43it [00:04, 9.51it/s] 44it [00:04, 8.91it/s] 45it [00:04, 9.07it/s] 46it [00:05, 9.20it/s] 47it [00:05, 9.30it/s] 48it [00:05, 9.28it/s] 49it [00:05, 9.36it/s] 50it [00:05, 9.40it/s]2025-05-26 04:57:32,155 - INFO - [Epoch 042 | Batch 0050] IWAE-loss 6543.3037 | mean log_px -0.0493 | KL -3464.77 + 51it [00:05, 9.38it/s] 52it [00:05, 9.43it/s] 53it [00:05, 9.39it/s] 54it [00:05, 8.91it/s] 55it [00:06, 9.12it/s] 56it [00:06, 9.20it/s] 57it [00:06, 9.31it/s] 58it [00:06, 9.36it/s] 59it [00:06, 9.41it/s] 60it [00:06, 9.46it/s] 61it [00:06, 9.49it/s] 62it [00:06, 8.96it/s] 63it [00:06, 9.12it/s] 64it [00:06, 9.25it/s] 65it [00:07, 9.28it/s] 66it [00:07, 9.30it/s] 67it [00:07, 9.36it/s] 68it [00:07, 9.42it/s] 69it [00:07, 9.43it/s] 70it [00:07, 9.45it/s] 71it [00:07, 9.39it/s] 72it [00:07, 8.90it/s] 73it [00:07, 9.11it/s] 74it [00:08, 9.24it/s] 75it [00:08, 9.29it/s] 76it [00:08, 9.35it/s] 77it [00:08, 9.41it/s] 78it [00:08, 9.44it/s] 79it [00:08, 8.80it/s] 80it [00:08, 8.69it/s] 81it [00:08, 8.84it/s] 82it [00:08, 9.01it/s] 83it [00:09, 9.17it/s] 84it [00:09, 9.26it/s] 85it [00:09, 9.38it/s] 86it [00:09, 9.44it/s] 87it [00:09, 9.48it/s] 88it [00:09, 9.51it/s] 89it [00:09, 9.52it/s] 90it [00:09, 9.50it/s] 91it [00:09, 8.97it/s] 92it [00:10, 9.09it/s] 93it [00:10, 9.22it/s] 94it [00:10, 8.96it/s] 95it [00:10, 9.07it/s] 96it [00:10, 9.18it/s] 97it [00:10, 9.30it/s] 98it [00:10, 8.83it/s] 99it [00:10, 9.05it/s] 100it [00:10, 9.19it/s]2025-05-26 04:57:37,579 - INFO - [Epoch 042 | Batch 0100] IWAE-loss 4768.8535 | mean log_px -0.0224 | KL -3467.10 + 101it [00:11, 9.24it/s] 102it [00:11, 9.32it/s] 103it [00:11, 9.32it/s] 104it [00:11, 9.35it/s] 105it [00:11, 9.38it/s] 106it [00:11, 9.42it/s] 107it [00:11, 9.48it/s] 108it [00:11, 9.49it/s] 109it [00:11, 9.49it/s] 110it [00:11, 9.51it/s] 111it [00:12, 9.50it/s] 112it [00:12, 9.50it/s] 113it [00:12, 9.51it/s] 114it [00:12, 9.50it/s] 115it [00:12, 9.52it/s] 116it [00:12, 9.52it/s] 117it [00:12, 8.98it/s] 118it [00:12, 9.15it/s] 119it [00:12, 9.26it/s] 120it [00:13, 9.15it/s] 121it [00:13, 9.21it/s] 122it [00:13, 9.31it/s] 123it [00:13, 9.38it/s] 124it [00:13, 9.35it/s] 125it [00:13, 9.36it/s] 126it [00:13, 9.38it/s] 127it [00:13, 9.42it/s] 128it [00:13, 9.45it/s] 129it [00:13, 9.47it/s] 130it [00:14, 9.49it/s] 131it [00:14, 9.47it/s] 132it [00:14, 9.01it/s] 133it [00:14, 9.18it/s] 134it [00:14, 9.32it/s] 135it [00:14, 9.41it/s] 136it [00:14, 8.95it/s] 137it [00:14, 9.09it/s] 138it [00:14, 9.21it/s] 139it [00:15, 9.16it/s] 140it [00:15, 9.28it/s] 141it [00:15, 8.79it/s] 142it [00:15, 9.01it/s] 143it [00:15, 9.18it/s] 144it [00:15, 9.26it/s] 145it [00:15, 9.34it/s] 146it [00:15, 9.40it/s] 147it [00:15, 9.47it/s] 148it [00:16, 8.99it/s] 149it [00:16, 9.12it/s] 150it [00:16, 9.23it/s]2025-05-26 04:57:42,955 - INFO - [Epoch 042 | Batch 0150] IWAE-loss 5339.9580 | mean log_px -0.0337 | KL -3464.08 + 151it [00:16, 9.26it/s] 152it [00:16, 9.32it/s] 153it [00:16, 9.40it/s] 154it [00:16, 9.39it/s] 155it [00:16, 9.43it/s] 156it [00:16, 9.45it/s] 157it [00:17, 9.47it/s] 158it [00:17, 9.49it/s] 159it [00:17, 9.48it/s] 160it [00:17, 9.50it/s] 161it [00:17, 9.50it/s] 162it [00:17, 9.53it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.47it/s] 165it [00:17, 9.53it/s] 166it [00:17, 9.52it/s] 167it [00:18, 9.52it/s] 168it [00:18, 9.54it/s] 169it [00:18, 9.52it/s] 170it [00:18, 9.45it/s] 171it [00:18, 9.47it/s] 172it [00:18, 9.48it/s] 173it [00:18, 9.46it/s] 174it [00:18, 9.49it/s] 175it [00:18, 9.54it/s] 176it [00:19, 9.53it/s] 177it [00:19, 9.00it/s] 178it [00:19, 9.12it/s] 179it [00:19, 9.21it/s] 180it [00:19, 9.27it/s] 181it [00:19, 9.38it/s] 182it [00:19, 9.43it/s] 183it [00:19, 9.41it/s] 184it [00:19, 9.45it/s] 185it [00:19, 9.44it/s] 186it [00:20, 9.45it/s] 187it [00:20, 8.94it/s] 188it [00:20, 9.11it/s] 189it [00:20, 9.22it/s] 190it [00:20, 9.23it/s] 191it [00:20, 9.33it/s] 192it [00:20, 9.38it/s] 193it [00:20, 9.41it/s] 194it [00:20, 9.41it/s] 195it [00:21, 8.85it/s] 196it [00:21, 9.02it/s] 196it [00:21, 9.22it/s] +2025-05-26 04:57:47,869 - INFO - Epoch: 42, Objective: tensor([5298.1240], device='cuda:0', grad_fn=), Loss: 0.0280563123524189, KL/n: 70.67806243896484 + 0it [00:00, ?it/s]2025-05-26 04:57:48,164 - INFO - [Epoch 043 | Batch 0000] IWAE-loss 4510.7559 | mean log_px -0.0216 | KL -3460.82 + 1it [00:00, 4.37it/s] 2it [00:00, 6.46it/s] 3it [00:00, 7.63it/s] 4it [00:00, 8.27it/s] 5it [00:00, 8.79it/s] 6it [00:00, 9.04it/s] 7it [00:00, 8.63it/s] 8it [00:00, 8.89it/s] 9it [00:01, 9.11it/s] 10it [00:01, 9.25it/s] 11it [00:01, 9.41it/s] 12it [00:01, 9.46it/s] 13it [00:01, 9.49it/s] 14it [00:01, 9.49it/s] 15it [00:01, 9.49it/s] 16it [00:01, 9.08it/s] 17it [00:01, 9.24it/s] 18it [00:02, 9.34it/s] 19it [00:02, 9.42it/s] 20it [00:02, 9.49it/s] 21it [00:02, 8.93it/s] 22it [00:02, 9.10it/s] 23it [00:02, 9.29it/s] 24it [00:02, 9.36it/s] 25it [00:02, 9.41it/s] 26it [00:02, 9.01it/s] 27it [00:03, 9.19it/s] 28it [00:03, 9.24it/s] 29it [00:03, 9.19it/s] 30it [00:03, 9.30it/s] 31it [00:03, 9.42it/s] 32it [00:03, 9.45it/s] 33it [00:03, 9.46it/s] 34it [00:03, 9.43it/s] 35it [00:03, 8.63it/s] 36it [00:04, 8.66it/s] 37it [00:04, 8.87it/s] 38it [00:04, 9.09it/s] 39it [00:04, 9.21it/s] 40it [00:04, 9.31it/s] 41it [00:04, 9.37it/s] 42it [00:04, 9.37it/s] 43it [00:04, 9.38it/s] 44it [00:04, 8.79it/s] 45it [00:04, 8.94it/s] 46it [00:05, 9.10it/s] 47it [00:05, 9.20it/s] 48it [00:05, 8.74it/s] 49it [00:05, 8.69it/s] 50it [00:05, 8.96it/s]2025-05-26 04:57:53,611 - INFO - [Epoch 043 | Batch 0050] IWAE-loss 4645.6123 | mean log_px -0.0196 | KL -3460.41 + 51it [00:05, 9.13it/s] 52it [00:05, 9.27it/s] 53it [00:05, 9.29it/s] 54it [00:05, 9.36it/s] 55it [00:06, 9.44it/s] 56it [00:06, 9.49it/s] 57it [00:06, 9.54it/s] 58it [00:06, 9.53it/s] 59it [00:06, 9.53it/s] 60it [00:06, 9.57it/s] 61it [00:06, 9.59it/s] 62it [00:06, 9.61it/s] 63it [00:06, 9.60it/s] 64it [00:07, 9.03it/s] 65it [00:07, 9.21it/s] 66it [00:07, 9.30it/s] 67it [00:07, 9.39it/s] 68it [00:07, 9.46it/s] 69it [00:07, 9.49it/s] 70it [00:07, 9.52it/s] 71it [00:07, 9.07it/s] 72it [00:07, 9.21it/s] 73it [00:07, 9.35it/s] 74it [00:08, 9.39it/s] 75it [00:08, 9.43it/s] 76it [00:08, 8.93it/s] 77it [00:08, 9.06it/s] 78it [00:08, 9.18it/s] 79it [00:08, 9.30it/s] 80it [00:08, 9.38it/s] 81it [00:08, 9.08it/s] 82it [00:08, 9.20it/s] 83it [00:09, 9.19it/s] 84it [00:09, 8.72it/s] 85it [00:09, 8.86it/s] 86it [00:09, 9.11it/s] 87it [00:09, 9.25it/s] 88it [00:09, 9.37it/s] 89it [00:09, 9.46it/s] 90it [00:09, 9.51it/s] 91it [00:09, 9.51it/s] 92it [00:10, 9.51it/s] 93it [00:10, 9.54it/s] 94it [00:10, 9.57it/s] 95it [00:10, 9.05it/s] 96it [00:10, 9.14it/s] 97it [00:10, 9.29it/s] 98it [00:10, 9.36it/s] 99it [00:10, 9.44it/s] 100it [00:10, 9.50it/s]2025-05-26 04:57:58,959 - INFO - [Epoch 043 | Batch 0100] IWAE-loss 7542.3433 | mean log_px -0.0583 | KL -3461.22 + 101it [00:10, 9.59it/s] 102it [00:11, 9.62it/s] 103it [00:11, 9.60it/s] 104it [00:11, 9.01it/s] 105it [00:11, 9.20it/s] 106it [00:11, 9.31it/s] 107it [00:11, 9.43it/s] 108it [00:11, 9.46it/s] 109it [00:11, 9.52it/s] 110it [00:11, 9.56it/s] 111it [00:12, 9.59it/s] 112it [00:12, 9.60it/s] 113it [00:12, 9.02it/s] 114it [00:12, 9.20it/s] 115it [00:12, 9.35it/s] 116it [00:12, 9.43it/s] 117it [00:12, 9.47it/s] 118it [00:12, 9.52it/s] 119it [00:12, 9.15it/s] 120it [00:13, 9.26it/s] 121it [00:13, 9.38it/s] 122it [00:13, 9.44it/s] 123it [00:13, 8.94it/s] 124it [00:13, 9.08it/s] 125it [00:13, 9.25it/s] 126it [00:13, 9.37it/s] 127it [00:13, 9.39it/s] 128it [00:13, 9.46it/s] 129it [00:13, 9.47it/s] 130it [00:14, 9.08it/s] 131it [00:14, 9.25it/s] 132it [00:14, 9.32it/s] 133it [00:14, 9.44it/s] 134it [00:14, 9.51it/s] 135it [00:14, 9.52it/s] 136it [00:14, 9.53it/s] 137it [00:14, 9.03it/s] 138it [00:14, 9.20it/s] 139it [00:15, 9.25it/s] 140it [00:15, 9.34it/s] 141it [00:15, 9.45it/s] 142it [00:15, 9.52it/s] 143it [00:15, 9.58it/s] 144it [00:15, 9.55it/s] 145it [00:15, 9.57it/s] 146it [00:15, 9.59it/s] 147it [00:15, 9.59it/s] 148it [00:16, 9.59it/s] 149it [00:16, 9.57it/s] 150it [00:16, 9.57it/s]2025-05-26 04:58:04,283 - INFO - [Epoch 043 | Batch 0150] IWAE-loss 4443.6572 | mean log_px -0.0191 | KL -3451.98 + 151it [00:16, 9.60it/s] 152it [00:16, 9.57it/s] 153it [00:16, 9.61it/s] 154it [00:16, 9.61it/s] 155it [00:16, 9.25it/s] 156it [00:16, 9.03it/s] 157it [00:16, 8.87it/s] 158it [00:17, 9.06it/s] 159it [00:17, 9.24it/s] 160it [00:17, 9.36it/s] 161it [00:17, 9.42it/s] 162it [00:17, 9.47it/s] 163it [00:17, 9.53it/s] 164it [00:17, 9.57it/s] 165it [00:17, 9.62it/s] 166it [00:17, 9.61it/s] 167it [00:18, 9.62it/s] 168it [00:18, 9.65it/s] 169it [00:18, 9.66it/s] 170it [00:18, 9.61it/s] 171it [00:18, 9.62it/s] 172it [00:18, 9.59it/s] 173it [00:18, 9.63it/s] 174it [00:18, 9.64it/s] 175it [00:18, 9.03it/s] 176it [00:18, 9.20it/s] 177it [00:19, 9.30it/s] 178it [00:19, 9.28it/s] 179it [00:19, 9.37it/s] 180it [00:19, 9.32it/s] 181it [00:19, 8.89it/s] 182it [00:19, 9.04it/s] 183it [00:19, 9.21it/s] 184it [00:19, 9.32it/s] 185it [00:19, 9.41it/s] 186it [00:20, 9.48it/s] 187it [00:20, 9.51it/s] 188it [00:20, 9.53it/s] 189it [00:20, 9.53it/s] 190it [00:20, 9.50it/s] 191it [00:20, 9.55it/s] 192it [00:20, 9.58it/s] 193it [00:20, 9.63it/s] 194it [00:20, 9.02it/s] 195it [00:21, 8.61it/s] 196it [00:21, 8.88it/s] 196it [00:21, 9.25it/s] +2025-05-26 04:58:09,204 - INFO - Epoch: 43, Objective: tensor([4990.5254], device='cuda:0', grad_fn=), Loss: 0.022801268845796585, KL/n: 70.53202056884766 + 0it [00:00, ?it/s]2025-05-26 04:58:09,669 - INFO - [Epoch 044 | Batch 0000] IWAE-loss 8241.9609 | mean log_px -0.0746 | KL -3451.67 + 1it [00:00, 5.37it/s] 2it [00:00, 6.80it/s] 3it [00:00, 7.93it/s] 4it [00:00, 8.59it/s] 5it [00:00, 9.04it/s] 6it [00:00, 9.31it/s] 7it [00:00, 9.46it/s] 8it [00:00, 9.56it/s] 9it [00:01, 9.67it/s] 10it [00:01, 9.72it/s] 11it [00:01, 9.78it/s] 12it [00:01, 9.81it/s] 13it [00:01, 9.84it/s] 14it [00:01, 9.82it/s] 15it [00:01, 9.84it/s] 16it [00:01, 9.84it/s] 17it [00:01, 9.88it/s] 18it [00:01, 9.88it/s] 19it [00:02, 9.91it/s] 20it [00:02, 9.90it/s] 21it [00:02, 9.90it/s] 22it [00:02, 9.51it/s] 23it [00:02, 9.62it/s] 24it [00:02, 9.67it/s] 25it [00:02, 9.74it/s] 26it [00:02, 9.76it/s] 27it [00:02, 9.78it/s] 28it [00:02, 9.74it/s] 29it [00:03, 9.80it/s] 30it [00:03, 9.81it/s] 31it [00:03, 9.82it/s] 32it [00:03, 9.28it/s] 33it [00:03, 9.45it/s] 34it [00:03, 9.57it/s] 35it [00:03, 9.67it/s] 36it [00:03, 9.72it/s] 37it [00:03, 9.76it/s] 38it [00:03, 9.77it/s] 39it [00:04, 9.79it/s] 40it [00:04, 9.78it/s] 41it [00:04, 9.81it/s] 42it [00:04, 9.81it/s] 43it [00:04, 9.81it/s] 44it [00:04, 9.82it/s] 45it [00:04, 9.81it/s] 46it [00:04, 9.83it/s] 47it [00:04, 9.86it/s] 48it [00:05, 9.85it/s] 49it [00:05, 9.87it/s] 50it [00:05, 9.87it/s]2025-05-26 04:58:14,795 - INFO - [Epoch 044 | Batch 0050] IWAE-loss 8636.9531 | mean log_px -0.0781 | KL -3454.60 + 51it [00:05, 9.25it/s] 52it [00:05, 9.43it/s] 53it [00:05, 9.57it/s] 54it [00:05, 9.67it/s] 55it [00:05, 9.74it/s] 56it [00:05, 9.78it/s] 57it [00:05, 9.20it/s] 58it [00:06, 9.39it/s] 59it [00:06, 9.53it/s] 60it [00:06, 9.62it/s] 61it [00:06, 9.71it/s] 62it [00:06, 9.76it/s] 63it [00:06, 9.80it/s] 64it [00:06, 9.83it/s] 65it [00:06, 9.65it/s] 66it [00:06, 9.59it/s] 67it [00:06, 9.61it/s] 68it [00:07, 9.68it/s] 69it [00:07, 9.73it/s] 70it [00:07, 9.75it/s] 71it [00:07, 9.15it/s] 72it [00:07, 9.33it/s] 73it [00:07, 9.48it/s] 74it [00:07, 8.99it/s] 75it [00:07, 9.24it/s] 76it [00:07, 9.40it/s] 77it [00:08, 9.55it/s] 78it [00:08, 9.63it/s] 79it [00:08, 9.19it/s] 80it [00:08, 9.37it/s] 81it [00:08, 9.52it/s] 82it [00:08, 9.62it/s] 83it [00:08, 9.71it/s] 84it [00:08, 9.73it/s] 85it [00:08, 9.75it/s] 86it [00:08, 9.81it/s] 87it [00:09, 9.83it/s] 88it [00:09, 9.82it/s] 89it [00:09, 9.84it/s] 90it [00:09, 9.22it/s] 91it [00:09, 9.41it/s] 92it [00:09, 9.53it/s] 93it [00:09, 9.63it/s] 94it [00:09, 9.69it/s] 95it [00:09, 9.76it/s] 96it [00:10, 9.80it/s] 97it [00:10, 9.83it/s] 98it [00:10, 9.84it/s] 99it [00:10, 9.85it/s] 100it [00:10, 9.85it/s]2025-05-26 04:58:20,010 - INFO - [Epoch 044 | Batch 0100] IWAE-loss 4468.0703 | mean log_px -0.0182 | KL -3448.35 + 101it [00:10, 9.82it/s] 102it [00:10, 9.81it/s] 103it [00:10, 9.82it/s] 104it [00:10, 9.82it/s] 105it [00:10, 9.86it/s] 106it [00:11, 9.86it/s] 107it [00:11, 9.85it/s] 108it [00:11, 9.86it/s] 109it [00:11, 9.24it/s] 110it [00:11, 9.41it/s] 111it [00:11, 9.55it/s] 112it [00:11, 9.65it/s] 113it [00:11, 9.72it/s] 114it [00:11, 9.16it/s] 115it [00:11, 9.37it/s] 116it [00:12, 9.51it/s] 117it [00:12, 9.62it/s] 118it [00:12, 9.69it/s] 119it [00:12, 9.74it/s] 120it [00:12, 9.75it/s] 121it [00:12, 9.79it/s] 122it [00:12, 9.80it/s] 123it [00:12, 9.63it/s] 124it [00:12, 9.70it/s] 125it [00:13, 9.76it/s] 126it [00:13, 9.80it/s] 127it [00:13, 9.85it/s] 128it [00:13, 9.79it/s] 129it [00:13, 9.20it/s] 130it [00:13, 9.38it/s] 131it [00:13, 9.34it/s] 132it [00:13, 9.23it/s] 133it [00:13, 8.96it/s] 134it [00:13, 9.19it/s] 135it [00:14, 9.37it/s] 136it [00:14, 9.50it/s] 137it [00:14, 9.57it/s] 138it [00:14, 9.50it/s] 139it [00:14, 9.58it/s] 140it [00:14, 9.61it/s] 141it [00:14, 9.04it/s] 142it [00:14, 9.15it/s] 143it [00:14, 9.18it/s] 144it [00:15, 9.29it/s] 145it [00:15, 9.40it/s] 146it [00:15, 9.44it/s] 147it [00:15, 8.90it/s] 148it [00:15, 9.08it/s] 149it [00:15, 9.25it/s] 150it [00:15, 9.36it/s]2025-05-26 04:58:25,285 - INFO - [Epoch 044 | Batch 0150] IWAE-loss 5638.1201 | mean log_px -0.0363 | KL -3448.95 + 151it [00:15, 9.41it/s] 152it [00:15, 9.46it/s] 153it [00:16, 9.47it/s] 154it [00:16, 9.57it/s] 155it [00:16, 9.63it/s] 156it [00:16, 9.70it/s] 157it [00:16, 9.75it/s] 158it [00:16, 9.75it/s] 159it [00:16, 9.80it/s] 160it [00:16, 9.80it/s] 161it [00:16, 9.75it/s] 162it [00:16, 9.77it/s] 163it [00:17, 9.79it/s] 164it [00:17, 9.77it/s] 165it [00:17, 9.79it/s] 166it [00:17, 9.23it/s] 167it [00:17, 9.43it/s] 168it [00:17, 9.55it/s] 169it [00:17, 9.65it/s] 170it [00:17, 9.67it/s] 171it [00:17, 9.09it/s] 172it [00:17, 9.25it/s] 173it [00:18, 9.31it/s] 174it [00:18, 9.47it/s] 175it [00:18, 9.59it/s] 176it [00:18, 9.65it/s] 177it [00:18, 9.64it/s] 178it [00:18, 9.69it/s] 179it [00:18, 9.73it/s] 180it [00:18, 9.69it/s] 181it [00:18, 9.72it/s] 182it [00:19, 9.76it/s] 183it [00:19, 9.32it/s] 184it [00:19, 9.49it/s] 185it [00:19, 9.60it/s] 186it [00:19, 9.66it/s] 187it [00:19, 9.72it/s] 188it [00:19, 9.74it/s] 189it [00:19, 9.77it/s] 190it [00:19, 9.78it/s] 191it [00:19, 9.78it/s] 192it [00:20, 9.79it/s] 193it [00:20, 9.49it/s] 194it [00:20, 9.47it/s] 195it [00:20, 9.15it/s] 196it [00:20, 9.54it/s] +2025-05-26 04:58:30,078 - INFO - Epoch: 44, Objective: tensor([5709.1240], device='cuda:0', grad_fn=), Loss: 0.03686925023794174, KL/n: 70.38143920898438 + 0it [00:00, ?it/s]2025-05-26 04:58:30,347 - INFO - [Epoch 045 | Batch 0000] IWAE-loss 6154.7354 | mean log_px -0.0426 | KL -3452.68 + 1it [00:00, 4.75it/s] 2it [00:00, 6.81it/s] 3it [00:00, 7.91it/s] 4it [00:00, 8.59it/s] 5it [00:00, 8.99it/s] 6it [00:00, 9.22it/s] 7it [00:00, 9.45it/s] 8it [00:00, 9.59it/s] 9it [00:01, 9.71it/s] 10it [00:01, 9.77it/s] 11it [00:01, 9.82it/s] 12it [00:01, 9.85it/s] 13it [00:01, 9.87it/s] 14it [00:01, 9.87it/s] 16it [00:01, 9.91it/s] 17it [00:01, 9.93it/s] 18it [00:01, 9.90it/s] 19it [00:02, 9.81it/s] 20it [00:02, 9.81it/s] 21it [00:02, 9.85it/s] 22it [00:02, 9.87it/s] 23it [00:02, 9.89it/s] 24it [00:02, 9.90it/s] 25it [00:02, 9.90it/s] 26it [00:02, 9.89it/s] 27it [00:02, 9.92it/s] 28it [00:02, 9.92it/s] 29it [00:03, 9.94it/s] 30it [00:03, 9.93it/s] 31it [00:03, 9.94it/s] 32it [00:03, 9.94it/s] 33it [00:03, 9.42it/s] 34it [00:03, 9.57it/s] 35it [00:03, 9.67it/s] 36it [00:03, 9.74it/s] 37it [00:03, 9.80it/s] 38it [00:03, 9.83it/s] 39it [00:04, 9.86it/s] 40it [00:04, 9.88it/s] 41it [00:04, 9.89it/s] 42it [00:04, 9.88it/s] 43it [00:04, 9.89it/s] 44it [00:04, 9.89it/s] 45it [00:04, 9.89it/s] 46it [00:04, 9.89it/s] 47it [00:04, 9.91it/s] 48it [00:04, 9.85it/s] 49it [00:05, 9.71it/s] 50it [00:05, 9.72it/s]2025-05-26 04:58:35,456 - INFO - [Epoch 045 | Batch 0050] IWAE-loss 4413.5903 | mean log_px -0.0159 | KL -3443.76 + 51it [00:05, 9.11it/s] 52it [00:05, 9.29it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.59it/s] 55it [00:05, 9.61it/s] 56it [00:05, 9.63it/s] 57it [00:05, 9.06it/s] 58it [00:06, 9.29it/s] 59it [00:06, 9.46it/s] 60it [00:06, 9.59it/s] 61it [00:06, 9.69it/s] 62it [00:06, 9.75it/s] 63it [00:06, 9.81it/s] 64it [00:06, 9.40it/s] 65it [00:06, 9.56it/s] 66it [00:06, 9.66it/s] 67it [00:06, 9.73it/s] 68it [00:07, 9.77it/s] 69it [00:07, 9.81it/s] 70it [00:07, 9.83it/s] 71it [00:07, 9.86it/s] 72it [00:07, 9.24it/s] 73it [00:07, 9.44it/s] 74it [00:07, 9.58it/s] 75it [00:07, 9.66it/s] 76it [00:07, 9.72it/s] 77it [00:08, 9.14it/s] 78it [00:08, 9.33it/s] 79it [00:08, 9.46it/s] 80it [00:08, 9.57it/s] 81it [00:08, 9.69it/s] 82it [00:08, 9.74it/s] 83it [00:08, 9.80it/s] 84it [00:08, 9.83it/s] 85it [00:08, 9.70it/s] 86it [00:08, 9.72it/s] 87it [00:09, 9.78it/s] 88it [00:09, 9.19it/s] 89it [00:09, 9.41it/s] 90it [00:09, 9.55it/s] 91it [00:09, 9.65it/s] 92it [00:09, 9.71it/s] 93it [00:09, 9.76it/s] 94it [00:09, 9.78it/s] 95it [00:09, 9.83it/s] 96it [00:09, 9.85it/s] 97it [00:10, 9.86it/s] 98it [00:10, 9.34it/s] 99it [00:10, 9.48it/s] 100it [00:10, 9.51it/s]2025-05-26 04:58:40,679 - INFO - [Epoch 045 | Batch 0100] IWAE-loss 5534.2393 | mean log_px -0.0361 | KL -3439.78 + 101it [00:10, 8.99it/s] 102it [00:10, 9.24it/s] 103it [00:10, 8.83it/s] 104it [00:10, 9.12it/s] 105it [00:10, 9.36it/s] 106it [00:11, 9.51it/s] 107it [00:11, 9.64it/s] 108it [00:11, 9.71it/s] 109it [00:11, 9.79it/s] 110it [00:11, 9.79it/s] 111it [00:11, 9.83it/s] 112it [00:11, 9.84it/s] 113it [00:11, 9.87it/s] 114it [00:11, 9.24it/s] 115it [00:11, 9.43it/s] 116it [00:12, 9.54it/s] 117it [00:12, 9.63it/s] 118it [00:12, 9.71it/s] 119it [00:12, 9.78it/s] 120it [00:12, 9.81it/s] 121it [00:12, 9.84it/s] 122it [00:12, 9.15it/s] 123it [00:12, 9.27it/s] 124it [00:12, 9.37it/s] 125it [00:13, 9.47it/s] 126it [00:13, 9.02it/s] 127it [00:13, 9.25it/s] 128it [00:13, 9.43it/s] 129it [00:13, 9.57it/s] 130it [00:13, 9.66it/s] 131it [00:13, 9.74it/s] 132it [00:13, 9.28it/s] 133it [00:13, 9.48it/s] 134it [00:13, 9.60it/s] 135it [00:14, 9.67it/s] 136it [00:14, 9.70it/s] 137it [00:14, 9.75it/s] 138it [00:14, 9.80it/s] 139it [00:14, 9.21it/s] 140it [00:14, 9.40it/s] 141it [00:14, 9.54it/s] 142it [00:14, 9.62it/s] 143it [00:14, 9.71it/s] 144it [00:15, 9.73it/s] 145it [00:15, 9.78it/s] 146it [00:15, 9.31it/s] 147it [00:15, 9.50it/s] 148it [00:15, 9.61it/s] 149it [00:15, 9.72it/s] 150it [00:15, 9.77it/s]2025-05-26 04:58:45,921 - INFO - [Epoch 045 | Batch 0150] IWAE-loss 5436.4814 | mean log_px -0.0340 | KL -3438.98 + 151it [00:15, 9.19it/s] 152it [00:15, 9.39it/s] 153it [00:15, 9.54it/s] 154it [00:16, 9.65it/s] 155it [00:16, 9.69it/s] 156it [00:16, 9.77it/s] 157it [00:16, 9.83it/s] 158it [00:16, 9.85it/s] 159it [00:16, 9.88it/s] 160it [00:16, 9.88it/s] 161it [00:16, 9.91it/s] 162it [00:16, 9.91it/s] 163it [00:16, 9.92it/s] 164it [00:17, 9.91it/s] 165it [00:17, 9.92it/s] 166it [00:17, 9.90it/s] 167it [00:17, 9.93it/s] 168it [00:17, 9.91it/s] 169it [00:17, 9.91it/s] 170it [00:17, 9.89it/s] 171it [00:17, 9.91it/s] 172it [00:17, 9.91it/s] 173it [00:17, 9.92it/s] 174it [00:18, 9.91it/s] 175it [00:18, 9.89it/s] 176it [00:18, 9.90it/s] 177it [00:18, 9.89it/s] 178it [00:18, 9.87it/s] 179it [00:18, 9.89it/s] 180it [00:18, 9.83it/s] 181it [00:18, 9.87it/s] 182it [00:18, 9.82it/s] 183it [00:19, 9.83it/s] 184it [00:19, 9.24it/s] 185it [00:19, 9.43it/s] 186it [00:19, 9.56it/s] 187it [00:19, 9.60it/s] 188it [00:19, 9.68it/s] 189it [00:19, 9.72it/s] 190it [00:19, 9.73it/s] 191it [00:19, 9.79it/s] 192it [00:19, 9.75it/s] 193it [00:20, 9.80it/s] 194it [00:20, 9.75it/s] 195it [00:20, 8.48it/s] 196it [00:20, 8.85it/s] 196it [00:20, 9.58it/s] +2025-05-26 04:58:50,674 - INFO - Epoch: 45, Objective: tensor([5079.6650], device='cuda:0', grad_fn=), Loss: 0.031979966908693314, KL/n: 70.21158599853516 + 0it [00:00, ?it/s]2025-05-26 04:58:51,147 - INFO - [Epoch 046 | Batch 0000] IWAE-loss 4801.6733 | mean log_px -0.0225 | KL -3436.86 + 1it [00:00, 2.63it/s] 2it [00:00, 4.38it/s] 3it [00:00, 5.88it/s] 4it [00:00, 7.00it/s] 5it [00:00, 7.82it/s] 6it [00:00, 8.41it/s] 7it [00:01, 8.82it/s] 8it [00:01, 9.11it/s] 9it [00:01, 8.76it/s] 10it [00:01, 9.07it/s] 11it [00:01, 9.33it/s] 12it [00:01, 9.49it/s] 13it [00:01, 9.63it/s] 14it [00:01, 9.69it/s] 15it [00:01, 9.76it/s] 16it [00:01, 9.78it/s] 17it [00:02, 9.82it/s] 18it [00:02, 9.83it/s] 19it [00:02, 9.86it/s] 20it [00:02, 9.87it/s] 21it [00:02, 9.88it/s] 22it [00:02, 9.36it/s] 23it [00:02, 9.51it/s] 24it [00:02, 9.57it/s] 25it [00:02, 9.66it/s] 26it [00:02, 9.71it/s] 27it [00:03, 9.77it/s] 28it [00:03, 9.79it/s] 29it [00:03, 9.20it/s] 30it [00:03, 9.36it/s] 31it [00:03, 9.44it/s] 32it [00:03, 9.56it/s] 33it [00:03, 9.61it/s] 34it [00:03, 9.41it/s] 35it [00:03, 9.42it/s] 36it [00:04, 9.23it/s] 37it [00:04, 8.96it/s] 38it [00:04, 8.98it/s] 39it [00:04, 9.23it/s] 40it [00:04, 9.39it/s] 41it [00:04, 9.55it/s] 42it [00:04, 9.64it/s] 43it [00:04, 9.70it/s] 44it [00:04, 9.74it/s] 45it [00:04, 9.80it/s] 46it [00:05, 9.82it/s] 47it [00:05, 9.80it/s] 48it [00:05, 9.15it/s] 49it [00:05, 9.30it/s] 50it [00:05, 9.43it/s]2025-05-26 04:58:56,388 - INFO - [Epoch 046 | Batch 0050] IWAE-loss 4658.3813 | mean log_px -0.0175 | KL -3431.65 + 51it [00:05, 9.53it/s] 52it [00:05, 9.04it/s] 53it [00:05, 9.25it/s] 54it [00:05, 9.37it/s] 55it [00:06, 9.01it/s] 56it [00:06, 9.20it/s] 57it [00:06, 8.71it/s] 58it [00:06, 9.01it/s] 59it [00:06, 9.22it/s] 60it [00:06, 9.36it/s] 61it [00:06, 8.94it/s] 62it [00:06, 9.21it/s] 63it [00:06, 9.40it/s] 64it [00:07, 9.53it/s] 65it [00:07, 9.05it/s] 66it [00:07, 9.27it/s] 67it [00:07, 9.45it/s] 68it [00:07, 9.55it/s] 69it [00:07, 9.06it/s] 70it [00:07, 9.29it/s] 71it [00:07, 9.45it/s] 72it [00:07, 9.55it/s] 73it [00:08, 9.08it/s] 74it [00:08, 9.29it/s] 75it [00:08, 9.48it/s] 76it [00:08, 9.59it/s] 77it [00:08, 9.10it/s] 78it [00:08, 9.31it/s] 79it [00:08, 9.46it/s] 80it [00:08, 9.57it/s] 81it [00:08, 9.08it/s] 82it [00:08, 9.30it/s] 83it [00:09, 9.47it/s] 84it [00:09, 9.57it/s] 85it [00:09, 9.06it/s] 86it [00:09, 9.29it/s] 87it [00:09, 9.45it/s] 88it [00:09, 9.55it/s] 89it [00:09, 9.07it/s] 90it [00:09, 9.28it/s] 91it [00:09, 9.44it/s] 92it [00:10, 9.55it/s] 93it [00:10, 9.03it/s] 94it [00:10, 9.26it/s] 95it [00:10, 9.45it/s] 96it [00:10, 9.57it/s] 97it [00:10, 9.04it/s] 98it [00:10, 9.21it/s] 99it [00:10, 9.34it/s] 100it [00:10, 9.48it/s]2025-05-26 04:59:01,768 - INFO - [Epoch 046 | Batch 0100] IWAE-loss 5551.6338 | mean log_px -0.0332 | KL -3436.21 + 101it [00:11, 8.98it/s] 102it [00:11, 9.18it/s] 103it [00:11, 9.37it/s] 104it [00:11, 9.53it/s] 105it [00:11, 9.65it/s] 106it [00:11, 9.71it/s] 107it [00:11, 9.26it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.59it/s] 110it [00:11, 9.69it/s] 111it [00:12, 9.77it/s] 112it [00:12, 9.33it/s] 113it [00:12, 9.51it/s] 114it [00:12, 9.63it/s] 115it [00:12, 9.13it/s] 116it [00:12, 9.34it/s] 117it [00:12, 9.50it/s] 118it [00:12, 9.61it/s] 119it [00:12, 9.71it/s] 120it [00:13, 9.76it/s] 121it [00:13, 9.81it/s] 122it [00:13, 9.21it/s] 123it [00:13, 9.41it/s] 124it [00:13, 9.56it/s] 125it [00:13, 9.66it/s] 126it [00:13, 9.69it/s] 127it [00:13, 9.76it/s] 128it [00:13, 9.79it/s] 129it [00:13, 9.83it/s] 130it [00:14, 9.82it/s] 131it [00:14, 9.77it/s] 132it [00:14, 9.79it/s] 133it [00:14, 9.83it/s] 134it [00:14, 9.83it/s] 135it [00:14, 9.75it/s] 136it [00:14, 9.75it/s] 137it [00:14, 9.71it/s] 138it [00:14, 9.73it/s] 139it [00:14, 9.73it/s] 140it [00:15, 9.73it/s] 141it [00:15, 9.75it/s] 142it [00:15, 9.76it/s] 143it [00:15, 9.74it/s] 144it [00:15, 9.77it/s] 145it [00:15, 9.82it/s] 146it [00:15, 9.84it/s] 147it [00:15, 9.86it/s] 148it [00:15, 9.86it/s] 149it [00:15, 9.87it/s] 150it [00:16, 9.84it/s]2025-05-26 04:59:06,948 - INFO - [Epoch 046 | Batch 0150] IWAE-loss 5915.6621 | mean log_px -0.0405 | KL -3435.87 + 151it [00:16, 9.22it/s] 152it [00:16, 9.42it/s] 153it [00:16, 9.55it/s] 154it [00:16, 9.63it/s] 155it [00:16, 9.72it/s] 156it [00:16, 9.76it/s] 157it [00:16, 9.81it/s] 158it [00:16, 9.83it/s] 159it [00:17, 9.86it/s] 160it [00:17, 9.86it/s] 161it [00:17, 9.89it/s] 162it [00:17, 9.89it/s] 163it [00:17, 9.91it/s] 164it [00:17, 9.92it/s] 165it [00:17, 9.92it/s] 166it [00:17, 9.90it/s] 167it [00:17, 9.28it/s] 168it [00:17, 9.45it/s] 169it [00:18, 9.59it/s] 170it [00:18, 9.68it/s] 171it [00:18, 9.75it/s] 172it [00:18, 9.80it/s] 173it [00:18, 9.82it/s] 174it [00:18, 9.83it/s] 175it [00:18, 9.86it/s] 176it [00:18, 9.87it/s] 177it [00:18, 9.89it/s] 178it [00:18, 9.88it/s] 179it [00:19, 9.89it/s] 180it [00:19, 9.87it/s] 181it [00:19, 9.89it/s] 182it [00:19, 9.88it/s] 183it [00:19, 9.89it/s] 184it [00:19, 9.82it/s] 185it [00:19, 9.86it/s] 186it [00:19, 9.87it/s] 187it [00:19, 9.87it/s] 188it [00:19, 9.88it/s] 189it [00:20, 9.90it/s] 190it [00:20, 9.87it/s] 191it [00:20, 9.89it/s] 192it [00:20, 9.89it/s] 193it [00:20, 9.91it/s] 194it [00:20, 9.91it/s] 195it [00:20, 9.44it/s] 196it [00:20, 9.16it/s] 196it [00:20, 9.39it/s] +2025-05-26 04:59:11,680 - INFO - Epoch: 46, Objective: tensor([5599.3286], device='cuda:0', grad_fn=), Loss: 0.028604112565517426, KL/n: 70.04393768310547 + 0it [00:00, ?it/s]2025-05-26 04:59:11,968 - INFO - [Epoch 047 | Batch 0000] IWAE-loss 6606.0967 | mean log_px -0.0507 | KL -3426.96 + 1it [00:00, 5.13it/s] 2it [00:00, 6.55it/s] 3it [00:00, 7.69it/s] 4it [00:00, 8.41it/s] 5it [00:00, 8.90it/s] 6it [00:00, 9.21it/s] 7it [00:00, 8.95it/s] 8it [00:00, 9.24it/s] 10it [00:01, 9.58it/s] 11it [00:01, 9.68it/s] 12it [00:01, 9.63it/s] 13it [00:01, 9.69it/s] 14it [00:01, 9.74it/s] 15it [00:01, 9.81it/s] 16it [00:01, 9.36it/s] 17it [00:01, 9.52it/s] 18it [00:01, 9.63it/s] 19it [00:02, 9.72it/s] 20it [00:02, 9.78it/s] 21it [00:02, 9.85it/s] 22it [00:02, 9.87it/s] 23it [00:02, 9.90it/s] 24it [00:02, 9.90it/s] 25it [00:02, 9.92it/s] 26it [00:02, 9.93it/s] 27it [00:02, 9.94it/s] 28it [00:02, 9.94it/s] 29it [00:03, 9.96it/s] 30it [00:03, 9.94it/s] 31it [00:03, 9.95it/s] 32it [00:03, 9.94it/s] 33it [00:03, 9.96it/s] 34it [00:03, 9.93it/s] 35it [00:03, 9.94it/s] 36it [00:03, 9.92it/s] 37it [00:03, 9.94it/s] 38it [00:03, 9.94it/s] 39it [00:04, 9.93it/s] 40it [00:04, 9.94it/s] 41it [00:04, 9.94it/s] 42it [00:04, 9.94it/s] 43it [00:04, 9.95it/s] 44it [00:04, 9.94it/s] 45it [00:04, 9.95it/s] 46it [00:04, 9.92it/s] 47it [00:04, 9.93it/s] 48it [00:04, 9.91it/s] 49it [00:05, 9.91it/s] 50it [00:05, 9.91it/s]2025-05-26 04:59:17,070 - INFO - [Epoch 047 | Batch 0050] IWAE-loss 5071.6953 | mean log_px -0.0309 | KL -3429.48 + 51it [00:05, 9.26it/s] 52it [00:05, 9.44it/s] 53it [00:05, 9.58it/s] 54it [00:05, 9.67it/s] 55it [00:05, 9.75it/s] 56it [00:05, 9.80it/s] 57it [00:05, 9.85it/s] 58it [00:06, 9.87it/s] 60it [00:06, 9.93it/s] 61it [00:06, 9.94it/s] 62it [00:06, 9.94it/s] 63it [00:06, 9.94it/s] 64it [00:06, 9.92it/s] 65it [00:06, 9.92it/s] 66it [00:06, 9.92it/s] 67it [00:06, 9.92it/s] 68it [00:07, 9.71it/s] 69it [00:07, 9.30it/s] 70it [00:07, 9.45it/s] 71it [00:07, 9.58it/s] 72it [00:07, 9.67it/s] 73it [00:07, 9.75it/s] 74it [00:07, 9.71it/s] 75it [00:07, 9.11it/s] 76it [00:07, 9.08it/s] 77it [00:08, 9.11it/s] 78it [00:08, 9.33it/s] 79it [00:08, 8.91it/s] 80it [00:08, 9.18it/s] 81it [00:08, 9.39it/s] 82it [00:08, 9.54it/s] 83it [00:08, 9.67it/s] 84it [00:08, 9.73it/s] 85it [00:08, 9.55it/s] 86it [00:08, 8.73it/s] 87it [00:09, 8.74it/s] 88it [00:09, 8.93it/s] 89it [00:09, 9.17it/s] 90it [00:09, 8.83it/s] 91it [00:09, 9.13it/s] 92it [00:09, 9.34it/s] 93it [00:09, 9.51it/s] 94it [00:09, 9.13it/s] 95it [00:09, 9.36it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.65it/s] 98it [00:10, 9.72it/s] 99it [00:10, 9.78it/s] 100it [00:10, 9.19it/s]2025-05-26 04:59:22,358 - INFO - [Epoch 047 | Batch 0100] IWAE-loss 4540.6260 | mean log_px -0.0246 | KL -3428.07 + 101it [00:10, 9.37it/s] 102it [00:10, 9.51it/s] 103it [00:10, 9.62it/s] 104it [00:10, 9.10it/s] 105it [00:11, 9.32it/s] 106it [00:11, 9.46it/s] 107it [00:11, 9.59it/s] 108it [00:11, 9.09it/s] 109it [00:11, 9.33it/s] 110it [00:11, 9.49it/s] 111it [00:11, 9.61it/s] 112it [00:11, 9.21it/s] 113it [00:11, 9.39it/s] 114it [00:11, 9.52it/s] 115it [00:12, 9.63it/s] 116it [00:12, 9.11it/s] 117it [00:12, 9.33it/s] 118it [00:12, 9.44it/s] 119it [00:12, 9.57it/s] 120it [00:12, 9.05it/s] 121it [00:12, 9.02it/s] 122it [00:12, 9.11it/s] 123it [00:12, 9.30it/s] 124it [00:13, 8.87it/s] 125it [00:13, 9.17it/s] 126it [00:13, 9.39it/s] 127it [00:13, 9.55it/s] 128it [00:13, 9.65it/s] 129it [00:13, 9.74it/s] 130it [00:13, 9.29it/s] 131it [00:13, 9.47it/s] 132it [00:13, 9.60it/s] 133it [00:13, 9.70it/s] 134it [00:14, 9.77it/s] 135it [00:14, 9.82it/s] 136it [00:14, 9.85it/s] 137it [00:14, 9.83it/s] 138it [00:14, 9.13it/s] 139it [00:14, 9.04it/s] 140it [00:14, 9.16it/s] 141it [00:14, 9.27it/s] 142it [00:14, 9.34it/s] 143it [00:15, 9.09it/s] 144it [00:15, 9.22it/s] 145it [00:15, 9.31it/s] 146it [00:15, 9.38it/s] 147it [00:15, 9.42it/s] 148it [00:15, 9.44it/s] 149it [00:15, 9.35it/s] 150it [00:15, 9.22it/s]2025-05-26 04:59:27,687 - INFO - [Epoch 047 | Batch 0150] IWAE-loss 4956.0400 | mean log_px -0.0260 | KL -3420.03 + 151it [00:15, 9.44it/s] 152it [00:16, 9.54it/s] 153it [00:16, 9.65it/s] 154it [00:16, 9.31it/s] 155it [00:16, 9.49it/s] 156it [00:16, 9.63it/s] 157it [00:16, 9.74it/s] 158it [00:16, 9.81it/s] 160it [00:16, 9.90it/s] 161it [00:16, 9.93it/s] 162it [00:17, 9.94it/s] 163it [00:17, 9.95it/s] 164it [00:17, 9.96it/s] 166it [00:17, 9.98it/s] 168it [00:17, 9.99it/s] 170it [00:17, 9.99it/s] 172it [00:18, 9.99it/s] 174it [00:18, 10.00it/s] 175it [00:18, 9.99it/s] 176it [00:18, 9.98it/s] 177it [00:18, 9.58it/s] 178it [00:18, 9.66it/s] 179it [00:18, 9.74it/s] 180it [00:18, 9.79it/s] 181it [00:18, 9.82it/s] 182it [00:19, 9.86it/s] 184it [00:19, 9.92it/s] 186it [00:19, 9.96it/s] 188it [00:19, 9.97it/s] 190it [00:19, 9.98it/s] 192it [00:20, 10.00it/s] 193it [00:20, 9.58it/s] 194it [00:20, 9.66it/s] 195it [00:20, 9.37it/s] 196it [00:20, 9.54it/s] +2025-05-26 04:59:32,367 - INFO - Epoch: 47, Objective: tensor([5860.7812], device='cuda:0', grad_fn=), Loss: 0.03282099589705467, KL/n: 69.88233184814453 + 0it [00:00, ?it/s]2025-05-26 04:59:32,648 - INFO - [Epoch 048 | Batch 0000] IWAE-loss 4398.5654 | mean log_px -0.0148 | KL -3425.91 + 1it [00:00, 4.51it/s] 2it [00:00, 6.58it/s] 4it [00:00, 8.38it/s] 6it [00:00, 9.09it/s] 8it [00:00, 9.44it/s] 10it [00:01, 9.62it/s] 11it [00:01, 9.28it/s] 12it [00:01, 9.42it/s] 13it [00:01, 9.53it/s] 14it [00:01, 9.63it/s] 15it [00:01, 9.19it/s] 16it [00:01, 9.38it/s] 17it [00:01, 9.54it/s] 18it [00:01, 9.63it/s] 19it [00:02, 9.15it/s] 20it [00:02, 9.35it/s] 22it [00:02, 9.53it/s] 23it [00:02, 6.71it/s] 24it [00:02, 7.33it/s] 26it [00:02, 8.27it/s] 28it [00:03, 8.53it/s] 29it [00:03, 8.80it/s] 30it [00:03, 8.95it/s] 31it [00:03, 9.12it/s] 32it [00:03, 9.33it/s] 33it [00:03, 9.50it/s] 34it [00:03, 9.62it/s] 35it [00:03, 9.72it/s] 36it [00:04, 9.79it/s] 37it [00:04, 9.83it/s] 38it [00:04, 9.86it/s] 39it [00:04, 9.37it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.66it/s] 42it [00:04, 9.74it/s] 44it [00:04, 9.86it/s] 45it [00:04, 9.89it/s] 46it [00:05, 9.90it/s] 47it [00:05, 9.92it/s] 48it [00:05, 9.92it/s] 50it [00:05, 9.96it/s]2025-05-26 04:59:37,999 - INFO - [Epoch 048 | Batch 0050] IWAE-loss 5411.3506 | mean log_px -0.0329 | KL -3426.38 + 51it [00:05, 9.97it/s] 52it [00:05, 9.97it/s] 53it [00:05, 9.96it/s] 54it [00:05, 9.94it/s] 55it [00:05, 9.95it/s] 56it [00:06, 9.95it/s] 57it [00:06, 9.96it/s] 58it [00:06, 9.95it/s] 59it [00:06, 9.96it/s] 60it [00:06, 9.94it/s] 61it [00:06, 9.96it/s] 62it [00:06, 9.95it/s] 63it [00:06, 9.95it/s] 64it [00:06, 9.94it/s] 65it [00:06, 9.95it/s] 66it [00:07, 9.96it/s] 67it [00:07, 9.32it/s] 68it [00:07, 9.50it/s] 70it [00:07, 9.72it/s] 72it [00:07, 9.84it/s] 73it [00:07, 9.84it/s] 74it [00:07, 9.87it/s] 75it [00:07, 9.90it/s] 76it [00:08, 9.91it/s] 77it [00:08, 9.93it/s] 78it [00:08, 9.33it/s] 79it [00:08, 9.50it/s] 80it [00:08, 9.62it/s] 81it [00:08, 9.73it/s] 82it [00:08, 9.78it/s] 83it [00:08, 9.84it/s] 84it [00:08, 9.86it/s] 85it [00:09, 9.90it/s] 86it [00:09, 9.91it/s] 87it [00:09, 9.90it/s] 88it [00:09, 9.89it/s] 90it [00:09, 9.63it/s] 91it [00:09, 9.71it/s] 92it [00:09, 9.77it/s] 93it [00:09, 9.80it/s] 94it [00:09, 9.84it/s] 95it [00:10, 9.86it/s] 96it [00:10, 9.87it/s] 97it [00:10, 9.90it/s] 98it [00:10, 9.91it/s] 100it [00:10, 9.95it/s]2025-05-26 04:59:43,084 - INFO - [Epoch 048 | Batch 0100] IWAE-loss 5481.2749 | mean log_px -0.0403 | KL -3417.41 + 101it [00:10, 9.95it/s] 102it [00:10, 9.95it/s] 103it [00:10, 9.96it/s] 104it [00:10, 9.95it/s] 106it [00:11, 9.97it/s] 107it [00:11, 9.98it/s] 108it [00:11, 9.97it/s] 109it [00:11, 9.92it/s] 110it [00:11, 9.42it/s] 111it [00:11, 9.55it/s] 112it [00:11, 9.67it/s] 113it [00:11, 9.75it/s] 114it [00:11, 9.81it/s] 115it [00:12, 9.81it/s] 116it [00:12, 9.65it/s] 117it [00:12, 9.60it/s] 118it [00:12, 9.69it/s] 119it [00:12, 9.73it/s] 120it [00:12, 9.79it/s] 122it [00:12, 9.89it/s] 124it [00:12, 9.90it/s] 125it [00:13, 9.81it/s] 126it [00:13, 9.30it/s] 127it [00:13, 9.45it/s] 128it [00:13, 9.59it/s] 129it [00:13, 9.69it/s] 130it [00:13, 9.76it/s] 131it [00:13, 9.22it/s] 132it [00:13, 9.42it/s] 133it [00:13, 9.58it/s] 134it [00:14, 9.68it/s] 135it [00:14, 9.75it/s] 136it [00:14, 9.79it/s] 137it [00:14, 9.77it/s] 138it [00:14, 9.20it/s] 139it [00:14, 9.41it/s] 140it [00:14, 9.54it/s] 141it [00:14, 9.67it/s] 142it [00:14, 9.75it/s] 143it [00:14, 9.65it/s] 144it [00:15, 9.72it/s] 145it [00:15, 9.80it/s] 146it [00:15, 9.84it/s] 147it [00:15, 9.89it/s] 148it [00:15, 9.91it/s] 149it [00:15, 9.31it/s] 150it [00:15, 9.47it/s]2025-05-26 04:59:48,251 - INFO - [Epoch 048 | Batch 0150] IWAE-loss 4167.0127 | mean log_px -0.0108 | KL -3420.06 + 151it [00:15, 9.58it/s] 152it [00:15, 9.67it/s] 153it [00:15, 9.76it/s] 154it [00:16, 9.80it/s] 155it [00:16, 9.85it/s] 156it [00:16, 9.87it/s] 157it [00:16, 9.89it/s] 158it [00:16, 9.91it/s] 159it [00:16, 9.93it/s] 160it [00:16, 9.93it/s] 161it [00:16, 9.95it/s] 162it [00:16, 9.32it/s] 163it [00:17, 9.49it/s] 164it [00:17, 9.63it/s] 165it [00:17, 9.73it/s] 166it [00:17, 9.79it/s] 167it [00:17, 9.23it/s] 168it [00:17, 9.44it/s] 169it [00:17, 9.60it/s] 170it [00:17, 9.70it/s] 171it [00:17, 9.78it/s] 172it [00:17, 9.83it/s] 173it [00:18, 9.88it/s] 174it [00:18, 9.90it/s] 175it [00:18, 9.92it/s] 176it [00:18, 9.92it/s] 177it [00:18, 9.93it/s] 178it [00:18, 9.92it/s] 179it [00:18, 9.94it/s] 180it [00:18, 9.94it/s] 181it [00:18, 9.96it/s] 182it [00:18, 9.95it/s] 183it [00:19, 9.96it/s] 184it [00:19, 9.94it/s] 185it [00:19, 9.95it/s] 186it [00:19, 9.63it/s] 187it [00:19, 9.24it/s] 188it [00:19, 9.44it/s] 189it [00:19, 9.59it/s] 190it [00:19, 9.69it/s] 191it [00:19, 9.77it/s] 192it [00:19, 9.83it/s] 194it [00:20, 9.90it/s] 195it [00:20, 9.53it/s] 196it [00:20, 9.17it/s] 196it [00:20, 9.56it/s] +2025-05-26 04:59:52,990 - INFO - Epoch: 48, Objective: tensor([5577.5146], device='cuda:0', grad_fn=), Loss: 0.034665796905756, KL/n: 69.71744537353516 + 0it [00:00, ?it/s]2025-05-26 04:59:53,268 - INFO - [Epoch 049 | Batch 0000] IWAE-loss 4387.7876 | mean log_px -0.0154 | KL -3415.77 + 1it [00:00, 5.38it/s] 2it [00:00, 7.33it/s] 3it [00:00, 8.33it/s] 4it [00:00, 8.88it/s] 5it [00:00, 9.22it/s] 6it [00:00, 9.43it/s] 7it [00:00, 9.59it/s] 8it [00:00, 9.68it/s] 10it [00:01, 9.80it/s] 11it [00:01, 9.84it/s] 12it [00:01, 9.85it/s] 14it [00:01, 9.87it/s] 15it [00:01, 9.90it/s] 16it [00:01, 9.90it/s] 18it [00:01, 9.93it/s] 19it [00:02, 9.92it/s] 20it [00:02, 9.90it/s] 21it [00:02, 9.92it/s] 22it [00:02, 9.90it/s] 23it [00:02, 9.91it/s] 24it [00:02, 9.88it/s] 25it [00:02, 9.28it/s] 26it [00:02, 9.46it/s] 27it [00:02, 9.60it/s] 28it [00:02, 9.69it/s] 29it [00:03, 9.78it/s] 30it [00:03, 9.81it/s] 31it [00:03, 9.87it/s] 32it [00:03, 9.89it/s] 33it [00:03, 9.91it/s] 34it [00:03, 9.83it/s] 35it [00:03, 9.86it/s] 36it [00:03, 9.47it/s] 37it [00:03, 9.60it/s] 38it [00:03, 9.09it/s] 39it [00:04, 9.33it/s] 40it [00:04, 9.48it/s] 41it [00:04, 9.59it/s] 42it [00:04, 9.65it/s] 43it [00:04, 9.72it/s] 44it [00:04, 8.98it/s] 45it [00:04, 8.92it/s] 46it [00:04, 9.13it/s] 47it [00:04, 9.34it/s] 48it [00:05, 9.48it/s] 49it [00:05, 9.62it/s] 50it [00:05, 9.70it/s]2025-05-26 04:59:58,425 - INFO - [Epoch 049 | Batch 0050] IWAE-loss 6286.7646 | mean log_px -0.0480 | KL -3411.50 + 51it [00:05, 9.15it/s] 52it [00:05, 9.38it/s] 53it [00:05, 9.54it/s] 54it [00:05, 9.63it/s] 55it [00:05, 9.71it/s] 56it [00:05, 9.76it/s] 57it [00:05, 9.82it/s] 58it [00:06, 9.83it/s] 59it [00:06, 9.80it/s] 60it [00:06, 9.72it/s] 61it [00:06, 9.75it/s] 62it [00:06, 9.79it/s] 63it [00:06, 9.84it/s] 64it [00:06, 9.85it/s] 65it [00:06, 9.83it/s] 66it [00:06, 9.80it/s] 67it [00:07, 9.17it/s] 68it [00:07, 9.34it/s] 69it [00:07, 9.49it/s] 70it [00:07, 9.61it/s] 71it [00:07, 9.66it/s] 72it [00:07, 9.72it/s] 73it [00:07, 9.75it/s] 74it [00:07, 9.79it/s] 75it [00:07, 9.83it/s] 76it [00:07, 9.86it/s] 77it [00:08, 9.88it/s] 78it [00:08, 9.85it/s] 79it [00:08, 9.86it/s] 80it [00:08, 9.86it/s] 81it [00:08, 9.75it/s] 82it [00:08, 9.75it/s] 83it [00:08, 9.49it/s] 84it [00:08, 9.10it/s] 85it [00:08, 9.30it/s] 86it [00:08, 9.46it/s] 87it [00:09, 9.59it/s] 88it [00:09, 9.65it/s] 89it [00:09, 9.63it/s] 90it [00:09, 8.81it/s] 91it [00:09, 9.06it/s] 92it [00:09, 9.22it/s] 93it [00:09, 9.40it/s] 94it [00:09, 9.51it/s] 95it [00:09, 9.65it/s] 96it [00:10, 9.66it/s] 97it [00:10, 9.66it/s] 98it [00:10, 9.66it/s] 99it [00:10, 9.68it/s] 100it [00:10, 9.70it/s]2025-05-26 05:00:03,632 - INFO - [Epoch 049 | Batch 0100] IWAE-loss 6288.9609 | mean log_px -0.0417 | KL -3411.01 + 101it [00:10, 9.12it/s] 102it [00:10, 9.34it/s] 103it [00:10, 9.52it/s] 104it [00:10, 9.63it/s] 105it [00:10, 9.71it/s] 106it [00:11, 9.75it/s] 107it [00:11, 9.80it/s] 108it [00:11, 9.82it/s] 109it [00:11, 9.85it/s] 110it [00:11, 9.86it/s] 111it [00:11, 9.88it/s] 112it [00:11, 9.87it/s] 113it [00:11, 9.88it/s] 114it [00:11, 9.88it/s] 115it [00:11, 9.90it/s] 116it [00:12, 9.90it/s] 117it [00:12, 9.86it/s] 118it [00:12, 9.85it/s] 119it [00:12, 9.86it/s] 120it [00:12, 9.23it/s] 121it [00:12, 9.43it/s] 122it [00:12, 9.54it/s] 123it [00:12, 9.65it/s] 124it [00:12, 9.69it/s] 125it [00:13, 9.74it/s] 126it [00:13, 9.17it/s] 127it [00:13, 9.32it/s] 128it [00:13, 9.49it/s] 129it [00:13, 9.63it/s] 130it [00:13, 9.71it/s] 131it [00:13, 9.75it/s] 132it [00:13, 9.78it/s] 133it [00:13, 9.83it/s] 134it [00:13, 9.86it/s] 135it [00:14, 9.87it/s] 136it [00:14, 9.86it/s] 137it [00:14, 9.89it/s] 138it [00:14, 9.87it/s] 139it [00:14, 9.89it/s] 140it [00:14, 9.87it/s] 141it [00:14, 9.90it/s] 142it [00:14, 9.88it/s] 143it [00:14, 9.91it/s] 144it [00:14, 9.90it/s] 145it [00:15, 9.90it/s] 146it [00:15, 9.90it/s] 147it [00:15, 9.92it/s] 148it [00:15, 9.92it/s] 149it [00:15, 9.26it/s] 150it [00:15, 9.44it/s]2025-05-26 05:00:08,783 - INFO - [Epoch 049 | Batch 0150] IWAE-loss 5174.5752 | mean log_px -0.0317 | KL -3409.79 + 151it [00:15, 9.52it/s] 152it [00:15, 9.58it/s] 153it [00:15, 9.65it/s] 154it [00:16, 9.72it/s] 155it [00:16, 9.64it/s] 156it [00:16, 9.57it/s] 157it [00:16, 9.57it/s] 158it [00:16, 9.48it/s] 159it [00:16, 9.49it/s] 160it [00:16, 9.61it/s] 161it [00:16, 9.70it/s] 162it [00:16, 9.69it/s] 163it [00:16, 9.74it/s] 164it [00:17, 9.80it/s] 165it [00:17, 9.83it/s] 166it [00:17, 9.22it/s] 167it [00:17, 9.42it/s] 168it [00:17, 9.45it/s] 169it [00:17, 9.53it/s] 170it [00:17, 9.49it/s] 171it [00:17, 9.44it/s] 172it [00:17, 9.36it/s] 173it [00:18, 9.47it/s] 174it [00:18, 9.55it/s] 175it [00:18, 9.61it/s] 176it [00:18, 9.50it/s] 177it [00:18, 9.40it/s] 178it [00:18, 9.05it/s] 179it [00:18, 9.29it/s] 180it [00:18, 9.47it/s] 181it [00:18, 9.60it/s] 182it [00:18, 9.68it/s] 183it [00:19, 9.75it/s] 184it [00:19, 9.73it/s] 185it [00:19, 9.72it/s] 186it [00:19, 9.76it/s] 187it [00:19, 9.80it/s] 188it [00:19, 9.78it/s] 189it [00:19, 9.79it/s] 190it [00:19, 9.78it/s] 191it [00:19, 9.82it/s] 192it [00:19, 9.84it/s] 193it [00:20, 9.85it/s] 194it [00:20, 9.80it/s] 195it [00:20, 9.37it/s] 196it [00:20, 8.98it/s] 196it [00:20, 9.58it/s] +2025-05-26 05:00:13,594 - INFO - Epoch: 49, Objective: tensor([5592.1567], device='cuda:0', grad_fn=), Loss: 0.03624124079942703, KL/n: 69.54737854003906 + 0it [00:00, ?it/s]2025-05-26 05:00:13,872 - INFO - [Epoch 050 | Batch 0000] IWAE-loss 4820.5073 | mean log_px -0.0246 | KL -3407.40 + 1it [00:00, 5.39it/s] 2it [00:00, 6.82it/s] 3it [00:00, 7.97it/s] 4it [00:00, 8.65it/s] 5it [00:00, 9.07it/s] 6it [00:00, 9.31it/s] 8it [00:00, 9.64it/s] 9it [00:01, 9.72it/s] 10it [00:01, 9.77it/s] 11it [00:01, 9.83it/s] 12it [00:01, 9.86it/s] 14it [00:01, 6.99it/s] 15it [00:01, 7.28it/s] 16it [00:01, 7.81it/s] 17it [00:02, 8.30it/s] 18it [00:02, 8.69it/s] 19it [00:02, 8.94it/s] 20it [00:02, 9.20it/s] 21it [00:02, 8.86it/s] 22it [00:02, 9.14it/s] 23it [00:02, 9.37it/s] 24it [00:02, 9.53it/s] 26it [00:02, 9.74it/s] 27it [00:03, 9.79it/s] 28it [00:03, 9.76it/s] 29it [00:03, 9.21it/s] 30it [00:03, 9.39it/s] 32it [00:03, 9.65it/s] 33it [00:03, 9.71it/s] 34it [00:03, 9.12it/s] 35it [00:03, 9.29it/s] 36it [00:04, 9.45it/s] 37it [00:04, 9.59it/s] 38it [00:04, 9.67it/s] 39it [00:04, 9.76it/s] 40it [00:04, 9.80it/s] 41it [00:04, 9.85it/s] 42it [00:04, 9.81it/s] 43it [00:04, 9.86it/s] 44it [00:04, 9.88it/s] 45it [00:04, 9.90it/s] 46it [00:05, 9.92it/s] 47it [00:05, 9.19it/s] 48it [00:05, 9.39it/s] 49it [00:05, 9.56it/s] 50it [00:05, 9.66it/s]2025-05-26 05:00:19,241 - INFO - [Epoch 050 | Batch 0050] IWAE-loss 6266.3530 | mean log_px -0.0450 | KL -3405.55 + 51it [00:05, 9.12it/s] 52it [00:05, 9.34it/s] 53it [00:05, 9.51it/s] 54it [00:05, 9.63it/s] 55it [00:05, 9.71it/s] 56it [00:06, 9.78it/s] 57it [00:06, 9.82it/s] 58it [00:06, 9.86it/s] 59it [00:06, 9.88it/s] 60it [00:06, 9.88it/s] 61it [00:06, 9.85it/s] 62it [00:06, 9.87it/s] 63it [00:06, 9.90it/s] 64it [00:06, 9.27it/s] 66it [00:07, 9.58it/s] 67it [00:07, 9.67it/s] 68it [00:07, 9.72it/s] 69it [00:07, 9.77it/s] 70it [00:07, 9.80it/s] 71it [00:07, 9.83it/s] 72it [00:07, 9.84it/s] 73it [00:07, 9.88it/s] 74it [00:07, 9.90it/s] 75it [00:08, 9.92it/s] 76it [00:08, 9.92it/s] 77it [00:08, 9.93it/s] 78it [00:08, 9.92it/s] 79it [00:08, 9.92it/s] 80it [00:08, 9.84it/s] 81it [00:08, 9.67it/s] 82it [00:08, 9.73it/s] 83it [00:08, 9.79it/s] 84it [00:08, 9.81it/s] 85it [00:09, 9.86it/s] 86it [00:09, 9.85it/s] 87it [00:09, 9.89it/s] 88it [00:09, 9.90it/s] 89it [00:09, 9.92it/s] 90it [00:09, 9.92it/s] 91it [00:09, 9.94it/s] 92it [00:09, 9.93it/s] 93it [00:09, 9.94it/s] 94it [00:09, 9.93it/s] 95it [00:10, 9.93it/s] 96it [00:10, 9.91it/s] 97it [00:10, 9.93it/s] 98it [00:10, 9.93it/s] 99it [00:10, 9.92it/s] 100it [00:10, 9.90it/s]2025-05-26 05:00:24,338 - INFO - [Epoch 050 | Batch 0100] IWAE-loss 5081.3320 | mean log_px -0.0248 | KL -3404.80 + 101it [00:10, 9.28it/s] 102it [00:10, 9.47it/s] 103it [00:10, 9.61it/s] 104it [00:10, 9.67it/s] 105it [00:11, 9.73it/s] 106it [00:11, 9.77it/s] 107it [00:11, 9.81it/s] 108it [00:11, 9.82it/s] 109it [00:11, 9.79it/s] 110it [00:11, 9.82it/s] 111it [00:11, 9.86it/s] 112it [00:11, 9.86it/s] 113it [00:11, 9.89it/s] 114it [00:11, 9.89it/s] 115it [00:12, 9.91it/s] 116it [00:12, 9.91it/s] 117it [00:12, 9.91it/s] 118it [00:12, 9.91it/s] 119it [00:12, 9.90it/s] 120it [00:12, 9.89it/s] 121it [00:12, 9.90it/s] 122it [00:12, 9.90it/s] 123it [00:12, 9.89it/s] 124it [00:12, 9.89it/s] 125it [00:13, 9.87it/s] 126it [00:13, 9.85it/s] 127it [00:13, 9.39it/s] 128it [00:13, 9.53it/s] 129it [00:13, 9.63it/s] 130it [00:13, 9.65it/s] 131it [00:13, 9.24it/s] 132it [00:13, 9.41it/s] 133it [00:13, 9.57it/s] 134it [00:14, 9.67it/s] 135it [00:14, 9.74it/s] 136it [00:14, 9.78it/s] 137it [00:14, 9.84it/s] 138it [00:14, 9.86it/s] 139it [00:14, 9.87it/s] 140it [00:14, 9.88it/s] 141it [00:14, 9.83it/s] 142it [00:14, 9.53it/s] 143it [00:14, 8.84it/s] 144it [00:15, 9.04it/s] 145it [00:15, 9.22it/s] 146it [00:15, 9.31it/s] 147it [00:15, 8.90it/s] 148it [00:15, 9.09it/s] 149it [00:15, 9.25it/s] 150it [00:15, 8.84it/s]2025-05-26 05:00:29,562 - INFO - [Epoch 050 | Batch 0150] IWAE-loss 5562.5117 | mean log_px -0.0343 | KL -3396.77 + 151it [00:15, 9.02it/s] 152it [00:15, 9.17it/s] 153it [00:16, 8.77it/s] 154it [00:16, 8.93it/s] 155it [00:16, 8.92it/s] 156it [00:16, 8.88it/s] 157it [00:16, 8.64it/s] 158it [00:16, 8.89it/s] 159it [00:16, 9.12it/s] 160it [00:16, 9.23it/s] 161it [00:16, 9.32it/s] 162it [00:17, 9.40it/s] 163it [00:17, 9.48it/s] 164it [00:17, 9.50it/s] 165it [00:17, 9.53it/s] 166it [00:17, 9.54it/s] 167it [00:17, 9.54it/s] 168it [00:17, 9.58it/s] 169it [00:17, 9.54it/s] 170it [00:17, 9.50it/s] 171it [00:18, 9.47it/s] 172it [00:18, 9.35it/s] 173it [00:18, 9.41it/s] 174it [00:18, 9.50it/s] 175it [00:18, 9.58it/s] 176it [00:18, 9.05it/s] 177it [00:18, 9.18it/s] 178it [00:18, 9.27it/s] 179it [00:18, 9.32it/s] 180it [00:18, 9.39it/s] 181it [00:19, 8.94it/s] 182it [00:19, 9.12it/s] 183it [00:19, 9.25it/s] 184it [00:19, 9.38it/s] 185it [00:19, 9.41it/s] 186it [00:19, 9.42it/s] 187it [00:19, 9.46it/s] 188it [00:19, 9.50it/s] 189it [00:19, 9.39it/s] 190it [00:20, 9.49it/s] 191it [00:20, 9.50it/s] 192it [00:20, 9.49it/s] 193it [00:20, 9.48it/s] 194it [00:20, 9.52it/s] 195it [00:20, 8.45it/s] 196it [00:20, 8.73it/s] 196it [00:20, 9.42it/s] +2025-05-26 05:00:34,534 - INFO - Epoch: 50, Objective: tensor([5149.9160], device='cuda:0', grad_fn=), Loss: 0.02591179683804512, KL/n: 69.36389923095703 + 0it [00:00, ?it/s]2025-05-26 05:00:34,820 - INFO - [Epoch 051 | Batch 0000] IWAE-loss 4607.3794 | mean log_px -0.0298 | KL -3396.73 + 1it [00:00, 5.12it/s] 2it [00:00, 6.95it/s] 3it [00:00, 7.94it/s] 4it [00:00, 8.51it/s] 5it [00:00, 8.85it/s] 6it [00:00, 9.07it/s] 7it [00:00, 9.20it/s] 8it [00:00, 9.30it/s] 9it [00:01, 9.33it/s] 10it [00:01, 9.38it/s] 11it [00:01, 9.45it/s] 12it [00:01, 9.44it/s] 13it [00:01, 9.47it/s] 14it [00:01, 9.50it/s] 15it [00:01, 9.57it/s] 16it [00:01, 9.54it/s] 17it [00:01, 9.56it/s] 18it [00:01, 9.60it/s] 19it [00:02, 9.60it/s] 20it [00:02, 9.39it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.46it/s] 23it [00:02, 9.54it/s] 24it [00:02, 9.53it/s] 25it [00:02, 9.55it/s] 26it [00:02, 9.54it/s] 27it [00:02, 9.54it/s] 28it [00:03, 9.52it/s] 29it [00:03, 9.53it/s] 30it [00:03, 9.52it/s] 31it [00:03, 9.55it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.54it/s] 34it [00:03, 9.34it/s] 35it [00:03, 9.37it/s] 36it [00:03, 9.42it/s] 37it [00:03, 9.46it/s] 38it [00:04, 9.47it/s] 39it [00:04, 9.50it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.50it/s] 42it [00:04, 9.49it/s] 43it [00:04, 9.53it/s] 44it [00:04, 9.46it/s] 45it [00:04, 9.47it/s] 46it [00:04, 9.48it/s] 47it [00:05, 9.49it/s] 48it [00:05, 9.49it/s] 49it [00:05, 9.48it/s] 50it [00:05, 9.45it/s]2025-05-26 05:00:40,085 - INFO - [Epoch 051 | Batch 0050] IWAE-loss 4357.4595 | mean log_px -0.0165 | KL -3393.12 + 51it [00:05, 9.44it/s] 52it [00:05, 9.47it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.47it/s] 55it [00:05, 9.51it/s] 56it [00:05, 9.52it/s] 57it [00:06, 9.49it/s] 58it [00:06, 9.49it/s] 59it [00:06, 9.49it/s] 60it [00:06, 9.22it/s] 61it [00:06, 9.33it/s] 62it [00:06, 9.35it/s] 63it [00:06, 9.42it/s] 64it [00:06, 9.43it/s] 65it [00:06, 9.44it/s] 66it [00:07, 9.48it/s] 67it [00:07, 9.45it/s] 68it [00:07, 9.45it/s] 69it [00:07, 9.49it/s] 70it [00:07, 9.48it/s] 71it [00:07, 9.52it/s] 72it [00:07, 9.48it/s] 73it [00:07, 9.49it/s] 74it [00:07, 9.48it/s] 75it [00:07, 9.50it/s] 76it [00:08, 9.50it/s] 77it [00:08, 9.49it/s] 78it [00:08, 9.48it/s] 79it [00:08, 9.51it/s] 80it [00:08, 9.56it/s] 81it [00:08, 9.54it/s] 82it [00:08, 9.52it/s] 83it [00:08, 9.53it/s] 84it [00:08, 9.48it/s] 85it [00:09, 9.51it/s] 86it [00:09, 9.53it/s] 87it [00:09, 9.56it/s] 88it [00:09, 9.54it/s] 89it [00:09, 9.55it/s] 90it [00:09, 9.52it/s] 91it [00:09, 9.57it/s] 92it [00:09, 9.53it/s] 93it [00:09, 9.54it/s] 94it [00:09, 9.55it/s] 95it [00:10, 9.56it/s] 96it [00:10, 9.51it/s] 97it [00:10, 9.57it/s] 98it [00:10, 9.62it/s] 99it [00:10, 9.49it/s] 100it [00:10, 9.55it/s]2025-05-26 05:00:45,350 - INFO - [Epoch 051 | Batch 0100] IWAE-loss 4766.6494 | mean log_px -0.0259 | KL -3393.81 + 101it [00:10, 9.56it/s] 102it [00:10, 9.50it/s] 103it [00:10, 9.54it/s] 104it [00:11, 9.57it/s] 105it [00:11, 9.54it/s] 106it [00:11, 9.52it/s] 107it [00:11, 9.51it/s] 108it [00:11, 9.51it/s] 109it [00:11, 9.53it/s] 110it [00:11, 9.32it/s] 111it [00:11, 9.40it/s] 112it [00:11, 9.44it/s] 113it [00:11, 9.49it/s] 114it [00:12, 9.54it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.35it/s] 117it [00:12, 9.42it/s] 118it [00:12, 9.45it/s] 119it [00:12, 9.51it/s] 120it [00:12, 9.48it/s] 121it [00:12, 9.48it/s] 122it [00:12, 9.50it/s] 123it [00:13, 9.49it/s] 124it [00:13, 9.51it/s] 125it [00:13, 9.50it/s] 126it [00:13, 9.56it/s] 127it [00:13, 9.56it/s] 128it [00:13, 9.55it/s] 129it [00:13, 9.52it/s] 130it [00:13, 9.52it/s] 131it [00:13, 9.54it/s] 132it [00:13, 9.53it/s] 133it [00:14, 9.56it/s] 134it [00:14, 9.50it/s] 135it [00:14, 9.54it/s] 136it [00:14, 9.56it/s] 137it [00:14, 9.60it/s] 138it [00:14, 9.55it/s] 139it [00:14, 9.60it/s] 140it [00:14, 9.58it/s] 141it [00:14, 9.61it/s] 142it [00:15, 9.55it/s] 143it [00:15, 9.50it/s] 144it [00:15, 9.53it/s] 145it [00:15, 9.49it/s] 146it [00:15, 9.51it/s] 147it [00:15, 8.98it/s] 148it [00:15, 9.05it/s] 149it [00:15, 9.18it/s] 150it [00:15, 9.31it/s]2025-05-26 05:00:50,629 - INFO - [Epoch 051 | Batch 0150] IWAE-loss 5195.3750 | mean log_px -0.0258 | KL -3389.90 + 151it [00:16, 9.40it/s] 152it [00:16, 9.44it/s] 153it [00:16, 9.44it/s] 154it [00:16, 9.06it/s] 155it [00:16, 9.18it/s] 156it [00:16, 9.28it/s] 157it [00:16, 9.36it/s] 158it [00:16, 9.42it/s] 159it [00:16, 8.94it/s] 160it [00:16, 9.11it/s] 161it [00:17, 9.24it/s] 162it [00:17, 9.33it/s] 163it [00:17, 9.40it/s] 164it [00:17, 9.45it/s] 165it [00:17, 9.50it/s] 166it [00:17, 9.52it/s] 167it [00:17, 9.53it/s] 168it [00:17, 9.53it/s] 169it [00:17, 9.48it/s] 170it [00:18, 9.56it/s] 171it [00:18, 9.54it/s] 172it [00:18, 9.50it/s] 173it [00:18, 9.51it/s] 174it [00:18, 9.48it/s] 175it [00:18, 8.99it/s] 176it [00:18, 9.15it/s] 177it [00:18, 9.25it/s] 178it [00:18, 9.33it/s] 179it [00:19, 9.34it/s] 180it [00:19, 9.41it/s] 181it [00:19, 9.47it/s] 182it [00:19, 9.49it/s] 183it [00:19, 9.51it/s] 184it [00:19, 9.51it/s] 185it [00:19, 8.97it/s] 186it [00:19, 9.15it/s] 187it [00:19, 9.25it/s] 188it [00:19, 9.27it/s] 189it [00:20, 9.39it/s] 190it [00:20, 9.48it/s] 191it [00:20, 9.45it/s] 192it [00:20, 9.48it/s] 193it [00:20, 9.53it/s] 194it [00:20, 9.55it/s] 195it [00:20, 8.95it/s] 196it [00:20, 9.17it/s] 196it [00:20, 9.39it/s] +2025-05-26 05:00:55,549 - INFO - Epoch: 51, Objective: tensor([5151.0229], device='cuda:0', grad_fn=), Loss: 0.03177899122238159, KL/n: 69.16956329345703 + 0it [00:00, ?it/s]2025-05-26 05:00:55,828 - INFO - [Epoch 052 | Batch 0000] IWAE-loss 4369.1685 | mean log_px -0.0140 | KL -3385.86 + 1it [00:00, 4.73it/s] 2it [00:00, 6.71it/s] 3it [00:00, 7.73it/s] 4it [00:00, 8.32it/s] 5it [00:00, 8.18it/s] 6it [00:00, 8.55it/s] 7it [00:00, 8.85it/s] 8it [00:00, 8.93it/s] 9it [00:01, 9.13it/s] 10it [00:01, 8.67it/s] 11it [00:01, 8.88it/s] 12it [00:01, 9.04it/s] 13it [00:01, 9.17it/s] 14it [00:01, 5.81it/s] 15it [00:01, 6.57it/s] 16it [00:02, 7.24it/s] 17it [00:02, 7.79it/s] 18it [00:02, 8.23it/s] 19it [00:02, 8.54it/s] 20it [00:02, 8.80it/s] 21it [00:02, 8.52it/s] 22it [00:02, 8.76it/s] 23it [00:02, 8.98it/s] 24it [00:02, 9.10it/s] 25it [00:03, 8.69it/s] 26it [00:03, 8.87it/s] 27it [00:03, 9.05it/s] 28it [00:03, 9.14it/s] 29it [00:03, 8.76it/s] 30it [00:03, 9.00it/s] 31it [00:03, 9.19it/s] 32it [00:03, 9.32it/s] 33it [00:03, 9.34it/s] 34it [00:04, 9.30it/s] 35it [00:04, 8.94it/s] 36it [00:04, 9.08it/s] 37it [00:04, 9.24it/s] 38it [00:04, 9.32it/s] 39it [00:04, 8.84it/s] 40it [00:04, 9.02it/s] 41it [00:04, 9.13it/s] 42it [00:04, 9.24it/s] 43it [00:05, 9.33it/s] 44it [00:05, 9.30it/s] 45it [00:05, 9.36it/s] 46it [00:05, 8.89it/s] 47it [00:05, 9.05it/s] 48it [00:05, 9.09it/s] 49it [00:05, 9.10it/s] 50it [00:05, 8.39it/s]2025-05-26 05:01:01,563 - INFO - [Epoch 052 | Batch 0050] IWAE-loss 4918.5332 | mean log_px -0.0245 | KL -3388.32 + 51it [00:05, 8.66it/s] 52it [00:06, 8.92it/s] 53it [00:06, 9.12it/s] 54it [00:06, 9.23it/s] 55it [00:06, 9.35it/s] 56it [00:06, 8.95it/s] 57it [00:06, 9.15it/s] 58it [00:06, 9.26it/s] 59it [00:06, 9.34it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.43it/s] 62it [00:07, 8.86it/s] 63it [00:07, 9.05it/s] 64it [00:07, 9.01it/s] 65it [00:07, 9.10it/s] 66it [00:07, 9.21it/s] 67it [00:07, 9.31it/s] 68it [00:07, 9.33it/s] 69it [00:07, 9.34it/s] 70it [00:07, 9.38it/s] 71it [00:08, 9.35it/s] 72it [00:08, 9.34it/s] 73it [00:08, 9.40it/s] 74it [00:08, 9.40it/s] 75it [00:08, 9.45it/s] 76it [00:08, 8.99it/s] 77it [00:08, 9.13it/s] 78it [00:08, 9.18it/s] 79it [00:08, 9.14it/s] 80it [00:09, 9.23it/s] 81it [00:09, 9.36it/s] 82it [00:09, 8.97it/s] 83it [00:09, 9.03it/s] 84it [00:09, 9.14it/s] 85it [00:09, 9.26it/s] 86it [00:09, 9.26it/s] 87it [00:09, 9.30it/s] 88it [00:09, 9.39it/s] 89it [00:10, 9.45it/s] 90it [00:10, 9.44it/s] 91it [00:10, 9.45it/s] 92it [00:10, 9.50it/s] 93it [00:10, 9.52it/s] 94it [00:10, 8.98it/s] 95it [00:10, 9.18it/s] 96it [00:10, 9.22it/s] 97it [00:10, 9.30it/s] 98it [00:10, 9.31it/s] 99it [00:11, 9.37it/s] 100it [00:11, 9.39it/s]2025-05-26 05:01:06,947 - INFO - [Epoch 052 | Batch 0100] IWAE-loss 4805.5391 | mean log_px -0.0203 | KL -3385.52 + 101it [00:11, 8.98it/s] 102it [00:11, 9.10it/s] 103it [00:11, 9.21it/s] 104it [00:11, 9.29it/s] 105it [00:11, 9.35it/s] 106it [00:11, 9.38it/s] 107it [00:11, 9.41it/s] 108it [00:12, 9.37it/s] 109it [00:12, 9.42it/s] 110it [00:12, 9.47it/s] 111it [00:12, 9.35it/s] 112it [00:12, 8.97it/s] 113it [00:12, 9.09it/s] 114it [00:12, 9.20it/s] 115it [00:12, 9.27it/s] 116it [00:12, 9.29it/s] 117it [00:13, 9.32it/s] 118it [00:13, 9.34it/s] 119it [00:13, 9.39it/s] 120it [00:13, 8.98it/s] 121it [00:13, 9.18it/s] 122it [00:13, 9.21it/s] 123it [00:13, 9.36it/s] 124it [00:13, 9.36it/s] 125it [00:13, 9.40it/s] 126it [00:14, 9.43it/s] 127it [00:14, 9.47it/s] 128it [00:14, 9.47it/s] 129it [00:14, 9.49it/s] 130it [00:14, 9.47it/s] 131it [00:14, 9.48it/s] 132it [00:14, 8.95it/s] 133it [00:14, 9.07it/s] 134it [00:14, 9.20it/s] 135it [00:14, 9.34it/s] 136it [00:15, 9.37it/s] 137it [00:15, 9.41it/s] 138it [00:15, 9.44it/s] 139it [00:15, 9.47it/s] 140it [00:15, 9.45it/s] 141it [00:15, 9.50it/s] 142it [00:15, 9.46it/s] 143it [00:15, 9.45it/s] 144it [00:15, 9.47it/s] 145it [00:16, 9.03it/s] 146it [00:16, 9.13it/s] 147it [00:16, 9.25it/s] 148it [00:16, 9.29it/s] 149it [00:16, 8.84it/s] 150it [00:16, 9.01it/s]2025-05-26 05:01:12,339 - INFO - [Epoch 052 | Batch 0150] IWAE-loss 5867.5352 | mean log_px -0.0419 | KL -3378.72 + 151it [00:16, 9.18it/s] 152it [00:16, 9.30it/s] 153it [00:16, 9.39it/s] 154it [00:17, 9.46it/s] 155it [00:17, 9.53it/s] 156it [00:17, 9.51it/s] 157it [00:17, 9.57it/s] 158it [00:17, 9.11it/s] 159it [00:17, 9.23it/s] 160it [00:17, 9.24it/s] 161it [00:17, 9.34it/s] 162it [00:17, 9.35it/s] 163it [00:17, 9.35it/s] 164it [00:18, 9.41it/s] 165it [00:18, 9.43it/s] 166it [00:18, 9.46it/s] 167it [00:18, 9.47it/s] 168it [00:18, 9.51it/s] 169it [00:18, 8.96it/s] 170it [00:18, 9.12it/s] 171it [00:18, 9.23it/s] 172it [00:18, 9.34it/s] 173it [00:19, 9.37it/s] 174it [00:19, 9.43it/s] 175it [00:19, 9.46it/s] 176it [00:19, 9.47it/s] 177it [00:19, 8.96it/s] 178it [00:19, 9.15it/s] 179it [00:19, 9.26it/s] 180it [00:19, 9.32it/s] 181it [00:19, 9.36it/s] 182it [00:20, 9.45it/s] 183it [00:20, 9.45it/s] 184it [00:20, 9.45it/s] 185it [00:20, 9.49it/s] 186it [00:20, 9.48it/s] 187it [00:20, 9.53it/s] 188it [00:20, 8.98it/s] 189it [00:20, 9.14it/s] 190it [00:20, 9.21it/s] 191it [00:20, 9.28it/s] 192it [00:21, 9.33it/s] 193it [00:21, 9.35it/s] 194it [00:21, 9.38it/s] 195it [00:21, 8.83it/s] 196it [00:21, 9.10it/s] 196it [00:21, 9.08it/s] +2025-05-26 05:01:17,277 - INFO - Epoch: 52, Objective: tensor([5528.3022], device='cuda:0', grad_fn=), Loss: 0.03874513879418373, KL/n: 69.0050048828125 + 0it [00:00, ?it/s]2025-05-26 05:01:17,547 - INFO - [Epoch 053 | Batch 0000] IWAE-loss 5155.4536 | mean log_px -0.0254 | KL -3377.25 + 1it [00:00, 4.73it/s] 2it [00:00, 6.32it/s] 3it [00:00, 7.50it/s] 4it [00:00, 8.12it/s] 5it [00:00, 8.53it/s] 6it [00:00, 8.81it/s] 7it [00:00, 8.92it/s] 8it [00:00, 9.09it/s] 9it [00:01, 9.19it/s] 10it [00:01, 9.25it/s] 11it [00:01, 9.32it/s] 12it [00:01, 9.42it/s] 13it [00:01, 9.46it/s] 14it [00:01, 9.44it/s] 15it [00:01, 9.43it/s] 16it [00:01, 9.44it/s] 17it [00:01, 9.47it/s] 18it [00:02, 9.40it/s] 19it [00:02, 9.42it/s] 20it [00:02, 9.46it/s] 21it [00:02, 9.43it/s] 22it [00:02, 9.43it/s] 23it [00:02, 9.43it/s] 24it [00:02, 9.44it/s] 25it [00:02, 9.42it/s] 26it [00:02, 9.43it/s] 27it [00:02, 9.45it/s] 28it [00:03, 9.48it/s] 29it [00:03, 9.49it/s] 30it [00:03, 9.53it/s] 31it [00:03, 9.52it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.44it/s] 34it [00:03, 9.46it/s] 35it [00:03, 9.45it/s] 36it [00:03, 9.39it/s] 37it [00:04, 9.40it/s] 38it [00:04, 9.42it/s] 39it [00:04, 9.45it/s] 40it [00:04, 9.46it/s] 41it [00:04, 9.47it/s] 42it [00:04, 9.44it/s] 43it [00:04, 8.87it/s] 44it [00:04, 9.15it/s] 45it [00:04, 9.34it/s] 46it [00:05, 9.31it/s] 47it [00:05, 9.37it/s] 48it [00:05, 9.43it/s] 49it [00:05, 9.46it/s] 50it [00:05, 9.44it/s]2025-05-26 05:01:22,898 - INFO - [Epoch 053 | Batch 0050] IWAE-loss 4669.8696 | mean log_px -0.0194 | KL -3377.31 + 51it [00:05, 9.40it/s] 52it [00:05, 9.43it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.49it/s] 55it [00:05, 9.48it/s] 56it [00:06, 9.51it/s] 57it [00:06, 9.52it/s] 58it [00:06, 9.49it/s] 59it [00:06, 9.49it/s] 60it [00:06, 9.48it/s] 61it [00:06, 9.43it/s] 62it [00:06, 9.41it/s] 63it [00:06, 9.45it/s] 64it [00:06, 9.44it/s] 65it [00:07, 9.48it/s] 66it [00:07, 9.47it/s] 67it [00:07, 9.36it/s] 68it [00:07, 9.43it/s] 69it [00:07, 9.44it/s] 70it [00:07, 9.50it/s] 71it [00:07, 9.50it/s] 72it [00:07, 9.51it/s] 73it [00:07, 9.51it/s] 74it [00:07, 9.50it/s] 75it [00:08, 9.52it/s] 76it [00:08, 9.51it/s] 77it [00:08, 9.53it/s] 78it [00:08, 9.49it/s] 79it [00:08, 9.49it/s] 80it [00:08, 9.51it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.59it/s] 83it [00:08, 9.59it/s] 84it [00:09, 9.54it/s] 85it [00:09, 9.52it/s] 86it [00:09, 9.48it/s] 87it [00:09, 9.56it/s] 88it [00:09, 9.16it/s] 89it [00:09, 9.29it/s] 90it [00:09, 8.97it/s] 91it [00:09, 9.13it/s] 92it [00:09, 9.19it/s] 93it [00:10, 8.94it/s] 94it [00:10, 9.08it/s] 95it [00:10, 9.18it/s] 96it [00:10, 9.27it/s] 97it [00:10, 9.31it/s] 98it [00:10, 9.35it/s] 99it [00:10, 9.40it/s] 100it [00:10, 9.42it/s]2025-05-26 05:01:28,209 - INFO - [Epoch 053 | Batch 0100] IWAE-loss 5013.9473 | mean log_px -0.0243 | KL -3370.79 + 101it [00:10, 9.43it/s] 102it [00:10, 9.45it/s] 103it [00:11, 9.39it/s] 104it [00:11, 9.42it/s] 105it [00:11, 9.45it/s] 106it [00:11, 9.45it/s] 107it [00:11, 9.42it/s] 108it [00:11, 9.42it/s] 109it [00:11, 9.48it/s] 110it [00:11, 9.48it/s] 111it [00:11, 9.50it/s] 112it [00:12, 9.46it/s] 113it [00:12, 9.48it/s] 114it [00:12, 9.49it/s] 115it [00:12, 9.51it/s] 116it [00:12, 9.49it/s] 117it [00:12, 9.55it/s] 118it [00:12, 9.50it/s] 119it [00:12, 9.49it/s] 120it [00:12, 9.47it/s] 121it [00:12, 9.46it/s] 122it [00:13, 9.42it/s] 123it [00:13, 9.42it/s] 124it [00:13, 9.38it/s] 125it [00:13, 9.36it/s] 126it [00:13, 9.39it/s] 127it [00:13, 9.45it/s] 128it [00:13, 9.43it/s] 129it [00:13, 9.43it/s] 130it [00:13, 9.44it/s] 131it [00:14, 9.43it/s] 132it [00:14, 9.45it/s] 133it [00:14, 9.02it/s] 134it [00:14, 9.14it/s] 135it [00:14, 9.22it/s] 136it [00:14, 9.29it/s] 137it [00:14, 8.86it/s] 138it [00:14, 9.03it/s] 139it [00:14, 9.14it/s] 140it [00:15, 9.21it/s] 141it [00:15, 9.30it/s] 142it [00:15, 9.23it/s] 143it [00:15, 9.07it/s] 144it [00:15, 9.02it/s] 145it [00:15, 9.12it/s] 146it [00:15, 9.27it/s] 147it [00:15, 9.34it/s] 148it [00:15, 9.44it/s] 149it [00:15, 9.52it/s] 150it [00:16, 9.55it/s]2025-05-26 05:01:33,547 - INFO - [Epoch 053 | Batch 0150] IWAE-loss 5491.2100 | mean log_px -0.0358 | KL -3374.70 + 151it [00:16, 9.57it/s] 152it [00:16, 9.59it/s] 153it [00:16, 9.61it/s] 154it [00:16, 9.60it/s] 155it [00:16, 9.61it/s] 156it [00:16, 9.57it/s] 157it [00:16, 9.56it/s] 158it [00:16, 9.53it/s] 159it [00:17, 9.51it/s] 160it [00:17, 9.50it/s] 161it [00:17, 9.56it/s] 162it [00:17, 9.61it/s] 163it [00:17, 9.57it/s] 164it [00:17, 9.57it/s] 165it [00:17, 9.55it/s] 166it [00:17, 9.54it/s] 167it [00:17, 9.58it/s] 168it [00:17, 9.59it/s] 169it [00:18, 9.57it/s] 170it [00:18, 9.41it/s] 171it [00:18, 9.20it/s] 172it [00:18, 9.21it/s] 173it [00:18, 9.35it/s] 174it [00:18, 9.41it/s] 175it [00:18, 9.49it/s] 176it [00:18, 9.51it/s] 177it [00:18, 9.54it/s] 178it [00:19, 9.58it/s] 179it [00:19, 9.57it/s] 180it [00:19, 9.56it/s] 181it [00:19, 9.59it/s] 182it [00:19, 9.49it/s] 183it [00:19, 9.32it/s] 184it [00:19, 9.39it/s] 185it [00:19, 9.40it/s] 186it [00:19, 9.44it/s] 187it [00:19, 9.50it/s] 188it [00:20, 9.52it/s] 189it [00:20, 9.53it/s] 190it [00:20, 9.53it/s] 191it [00:20, 9.55it/s] 192it [00:20, 9.59it/s] 193it [00:20, 9.56it/s] 194it [00:20, 9.56it/s] 195it [00:20, 8.92it/s] 196it [00:20, 8.98it/s] 196it [00:21, 9.33it/s] +2025-05-26 05:01:38,409 - INFO - Epoch: 53, Objective: tensor([5285.0635], device='cuda:0', grad_fn=), Loss: 0.031190963461995125, KL/n: 68.80663299560547 + 0it [00:00, ?it/s]2025-05-26 05:01:38,666 - INFO - [Epoch 054 | Batch 0000] IWAE-loss 4559.8145 | mean log_px -0.0225 | KL -3372.25 + 1it [00:00, 6.04it/s] 2it [00:00, 7.68it/s] 3it [00:00, 8.33it/s] 4it [00:00, 8.71it/s] 5it [00:00, 8.95it/s] 6it [00:00, 9.07it/s] 7it [00:00, 9.13it/s] 8it [00:00, 9.13it/s] 9it [00:01, 9.18it/s] 10it [00:01, 9.19it/s] 11it [00:01, 9.22it/s] 12it [00:01, 9.25it/s] 13it [00:01, 9.33it/s] 14it [00:01, 9.37it/s] 15it [00:01, 9.40it/s] 16it [00:01, 9.35it/s] 17it [00:01, 9.32it/s] 18it [00:01, 9.38it/s] 19it [00:02, 9.40it/s] 20it [00:02, 9.39it/s] 21it [00:02, 9.43it/s] 22it [00:02, 9.43it/s] 23it [00:02, 9.41it/s] 24it [00:02, 9.41it/s] 25it [00:02, 9.50it/s] 26it [00:02, 9.47it/s] 27it [00:02, 9.46it/s] 28it [00:03, 6.23it/s] 29it [00:03, 6.84it/s] 30it [00:03, 7.47it/s] 31it [00:03, 7.85it/s] 32it [00:03, 8.22it/s] 33it [00:03, 8.53it/s] 34it [00:03, 8.84it/s] 35it [00:03, 8.83it/s] 36it [00:04, 9.05it/s] 37it [00:04, 9.23it/s] 38it [00:04, 9.27it/s] 39it [00:04, 9.31it/s] 40it [00:04, 9.35it/s] 41it [00:04, 9.38it/s] 42it [00:04, 9.45it/s] 43it [00:04, 9.43it/s] 44it [00:04, 9.45it/s] 45it [00:05, 9.46it/s] 46it [00:05, 9.45it/s] 47it [00:05, 9.47it/s] 48it [00:05, 9.47it/s] 49it [00:05, 9.49it/s] 50it [00:05, 9.48it/s]2025-05-26 05:01:44,176 - INFO - [Epoch 054 | Batch 0050] IWAE-loss 4990.6138 | mean log_px -0.0290 | KL -3365.03 + 51it [00:05, 9.48it/s] 52it [00:05, 9.49it/s] 53it [00:05, 9.48it/s] 54it [00:05, 9.47it/s] 55it [00:06, 9.43it/s] 56it [00:06, 9.45it/s] 57it [00:06, 9.46it/s] 58it [00:06, 9.42it/s] 59it [00:06, 9.45it/s] 60it [00:06, 9.47it/s] 61it [00:06, 9.41it/s] 62it [00:06, 9.42it/s] 63it [00:06, 9.41it/s] 64it [00:07, 9.42it/s] 65it [00:07, 9.41it/s] 66it [00:07, 9.35it/s] 67it [00:07, 9.42it/s] 68it [00:07, 9.44it/s] 69it [00:07, 9.43it/s] 70it [00:07, 9.22it/s] 71it [00:07, 9.30it/s] 72it [00:07, 9.32it/s] 73it [00:08, 9.34it/s] 74it [00:08, 9.32it/s] 75it [00:08, 9.28it/s] 76it [00:08, 9.26it/s] 77it [00:08, 9.30it/s] 78it [00:08, 9.31it/s] 79it [00:08, 9.28it/s] 80it [00:08, 9.27it/s] 81it [00:08, 9.28it/s] 82it [00:08, 9.24it/s] 83it [00:09, 9.35it/s] 84it [00:09, 9.39it/s] 85it [00:09, 9.32it/s] 86it [00:09, 9.35it/s] 87it [00:09, 9.41it/s] 88it [00:09, 9.35it/s] 89it [00:09, 9.32it/s] 90it [00:09, 9.19it/s] 91it [00:09, 9.16it/s] 92it [00:10, 9.14it/s] 93it [00:10, 9.12it/s] 94it [00:10, 9.15it/s] 95it [00:10, 9.18it/s] 96it [00:10, 9.25it/s] 97it [00:10, 9.39it/s] 98it [00:10, 9.32it/s] 99it [00:10, 9.32it/s] 100it [00:10, 9.28it/s]2025-05-26 05:01:49,539 - INFO - [Epoch 054 | Batch 0100] IWAE-loss 5274.8164 | mean log_px -0.0305 | KL -3364.53 + 101it [00:11, 9.20it/s] 102it [00:11, 9.21it/s] 103it [00:11, 9.28it/s] 104it [00:11, 9.26it/s] 105it [00:11, 9.23it/s] 106it [00:11, 9.15it/s] 107it [00:11, 9.15it/s] 108it [00:11, 9.19it/s] 109it [00:11, 9.25it/s] 110it [00:12, 9.30it/s] 111it [00:12, 9.30it/s] 112it [00:12, 9.28it/s] 113it [00:12, 9.25it/s] 114it [00:12, 9.17it/s] 115it [00:12, 9.24it/s] 116it [00:12, 9.28it/s] 117it [00:12, 9.30it/s] 118it [00:12, 9.29it/s] 119it [00:12, 9.22it/s] 120it [00:13, 9.18it/s] 121it [00:13, 9.27it/s] 122it [00:13, 9.28it/s] 123it [00:13, 9.30it/s] 124it [00:13, 9.28it/s] 125it [00:13, 9.25it/s] 126it [00:13, 9.27it/s] 127it [00:13, 9.24it/s] 128it [00:13, 9.23it/s] 129it [00:14, 9.14it/s] 130it [00:14, 9.18it/s] 131it [00:14, 9.16it/s] 132it [00:14, 9.18it/s] 133it [00:14, 9.25it/s] 134it [00:14, 9.25it/s] 135it [00:14, 9.27it/s] 136it [00:14, 9.30it/s] 137it [00:14, 9.37it/s] 138it [00:15, 9.27it/s] 139it [00:15, 9.32it/s] 140it [00:15, 9.33it/s] 141it [00:15, 9.25it/s] 142it [00:15, 9.24it/s] 143it [00:15, 9.31it/s] 144it [00:15, 9.35it/s] 145it [00:15, 9.36it/s] 146it [00:15, 9.44it/s] 147it [00:15, 9.43it/s] 148it [00:16, 9.43it/s] 149it [00:16, 9.40it/s] 150it [00:16, 9.45it/s]2025-05-26 05:01:54,924 - INFO - [Epoch 054 | Batch 0150] IWAE-loss 4747.6250 | mean log_px -0.0197 | KL -3364.11 + 151it [00:16, 9.48it/s] 152it [00:16, 9.43it/s] 153it [00:16, 9.42it/s] 154it [00:16, 9.41it/s] 155it [00:16, 9.42it/s] 156it [00:16, 9.45it/s] 157it [00:17, 9.44it/s] 158it [00:17, 9.23it/s] 159it [00:17, 9.28it/s] 160it [00:17, 9.32it/s] 161it [00:17, 9.35it/s] 162it [00:17, 9.42it/s] 163it [00:17, 9.44it/s] 164it [00:17, 9.48it/s] 165it [00:17, 9.52it/s] 166it [00:18, 9.50it/s] 167it [00:18, 9.50it/s] 168it [00:18, 9.49it/s] 169it [00:18, 9.29it/s] 170it [00:18, 9.18it/s] 171it [00:18, 9.24it/s] 172it [00:18, 9.32it/s] 173it [00:18, 9.36it/s] 174it [00:18, 9.43it/s] 175it [00:18, 9.38it/s] 176it [00:19, 9.40it/s] 177it [00:19, 9.43it/s] 178it [00:19, 9.45it/s] 179it [00:19, 9.46it/s] 180it [00:19, 9.45it/s] 181it [00:19, 9.41it/s] 182it [00:19, 9.41it/s] 183it [00:19, 9.44it/s] 184it [00:19, 9.47it/s] 185it [00:20, 9.46it/s] 186it [00:20, 9.46it/s] 187it [00:20, 9.53it/s] 188it [00:20, 9.51it/s] 189it [00:20, 9.56it/s] 190it [00:20, 9.54it/s] 191it [00:20, 9.54it/s] 192it [00:20, 9.52it/s] 193it [00:20, 9.53it/s] 194it [00:20, 9.56it/s] 195it [00:21, 8.90it/s] 196it [00:21, 9.06it/s] 196it [00:21, 9.21it/s] +2025-05-26 05:01:59,827 - INFO - Epoch: 54, Objective: tensor([5742.4844], device='cuda:0', grad_fn=), Loss: 0.04035816341638565, KL/n: 68.60377502441406 + 0it [00:00, ?it/s]2025-05-26 05:02:00,110 - INFO - [Epoch 055 | Batch 0000] IWAE-loss 4954.8682 | mean log_px -0.0264 | KL -3363.76 + 1it [00:00, 5.21it/s] 2it [00:00, 7.10it/s] 3it [00:00, 8.02it/s] 4it [00:00, 8.56it/s] 5it [00:00, 8.89it/s] 6it [00:00, 9.05it/s] 7it [00:00, 9.25it/s] 8it [00:00, 9.34it/s] 9it [00:01, 8.86it/s] 10it [00:01, 9.03it/s] 11it [00:01, 9.15it/s] 12it [00:01, 9.27it/s] 13it [00:01, 9.31it/s] 14it [00:01, 9.40it/s] 15it [00:01, 9.42it/s] 16it [00:01, 9.41it/s] 17it [00:01, 9.45it/s] 18it [00:02, 9.50it/s] 19it [00:02, 9.50it/s] 20it [00:02, 9.52it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.50it/s] 23it [00:02, 9.54it/s] 24it [00:02, 9.51it/s] 25it [00:02, 9.50it/s] 26it [00:02, 9.49it/s] 27it [00:02, 9.56it/s] 28it [00:03, 9.00it/s] 29it [00:03, 9.19it/s] 30it [00:03, 9.33it/s] 31it [00:03, 9.43it/s] 32it [00:03, 9.47it/s] 33it [00:03, 9.53it/s] 34it [00:03, 8.98it/s] 35it [00:03, 9.12it/s] 36it [00:03, 9.24it/s] 37it [00:04, 8.81it/s] 38it [00:04, 8.88it/s] 39it [00:04, 8.94it/s] 40it [00:04, 8.90it/s] 41it [00:04, 8.88it/s] 42it [00:04, 8.98it/s] 43it [00:04, 9.09it/s] 44it [00:04, 8.99it/s] 45it [00:04, 9.09it/s] 46it [00:05, 8.67it/s] 47it [00:05, 8.91it/s] 48it [00:05, 8.94it/s] 49it [00:05, 9.05it/s] 50it [00:05, 8.98it/s]2025-05-26 05:02:05,523 - INFO - [Epoch 055 | Batch 0050] IWAE-loss 5218.8096 | mean log_px -0.0286 | KL -3357.67 + 51it [00:05, 9.17it/s] 52it [00:05, 8.58it/s] 53it [00:05, 8.87it/s] 54it [00:05, 9.07it/s] 55it [00:06, 9.17it/s] 56it [00:06, 9.27it/s] 57it [00:06, 9.33it/s] 58it [00:06, 9.32it/s] 59it [00:06, 9.38it/s] 60it [00:06, 9.41it/s] 61it [00:06, 9.48it/s] 62it [00:06, 9.50it/s] 63it [00:06, 9.48it/s] 64it [00:07, 9.43it/s] 65it [00:07, 9.48it/s] 66it [00:07, 9.53it/s] 67it [00:07, 9.54it/s] 68it [00:07, 9.50it/s] 69it [00:07, 9.53it/s] 70it [00:07, 9.50it/s] 71it [00:07, 9.53it/s] 72it [00:07, 9.56it/s] 73it [00:07, 9.61it/s] 74it [00:08, 9.02it/s] 75it [00:08, 9.17it/s] 76it [00:08, 9.27it/s] 77it [00:08, 9.31it/s] 78it [00:08, 8.83it/s] 79it [00:08, 8.98it/s] 80it [00:08, 9.15it/s] 81it [00:08, 9.23it/s] 82it [00:08, 8.79it/s] 83it [00:09, 9.00it/s] 84it [00:09, 8.92it/s] 85it [00:09, 9.00it/s] 86it [00:09, 9.08it/s] 87it [00:09, 9.09it/s] 88it [00:09, 9.12it/s] 89it [00:09, 9.17it/s] 90it [00:09, 8.64it/s] 91it [00:09, 8.75it/s] 92it [00:10, 8.83it/s] 93it [00:10, 8.97it/s] 94it [00:10, 9.05it/s] 95it [00:10, 9.05it/s] 96it [00:10, 8.66it/s] 97it [00:10, 8.81it/s] 98it [00:10, 8.96it/s] 99it [00:10, 9.06it/s] 100it [00:10, 9.06it/s]2025-05-26 05:02:10,986 - INFO - [Epoch 055 | Batch 0100] IWAE-loss 5689.7671 | mean log_px -0.0453 | KL -3352.47 + 101it [00:11, 9.12it/s] 102it [00:11, 9.29it/s] 103it [00:11, 9.28it/s] 104it [00:11, 9.35it/s] 105it [00:11, 8.83it/s] 106it [00:11, 9.05it/s] 107it [00:11, 9.05it/s] 108it [00:11, 9.07it/s] 109it [00:11, 9.13it/s] 110it [00:12, 8.66it/s] 111it [00:12, 8.85it/s] 112it [00:12, 9.08it/s] 113it [00:12, 9.13it/s] 114it [00:12, 9.12it/s] 115it [00:12, 9.22it/s] 116it [00:12, 8.79it/s] 117it [00:12, 8.87it/s] 118it [00:12, 8.97it/s] 119it [00:13, 9.05it/s] 120it [00:13, 8.56it/s] 121it [00:13, 8.72it/s] 122it [00:13, 8.91it/s] 123it [00:13, 9.07it/s] 124it [00:13, 9.08it/s] 125it [00:13, 9.19it/s] 126it [00:13, 9.19it/s] 127it [00:13, 8.78it/s] 128it [00:14, 9.03it/s] 129it [00:14, 9.24it/s] 130it [00:14, 9.39it/s] 131it [00:14, 9.50it/s] 132it [00:14, 9.43it/s] 133it [00:14, 9.47it/s] 134it [00:14, 9.43it/s] 135it [00:14, 9.30it/s] 136it [00:14, 9.33it/s] 137it [00:15, 9.37it/s] 138it [00:15, 9.32it/s] 139it [00:15, 9.34it/s] 140it [00:15, 9.37it/s] 141it [00:15, 8.91it/s] 142it [00:15, 9.01it/s] 143it [00:15, 9.14it/s] 144it [00:15, 9.24it/s] 145it [00:15, 8.81it/s] 146it [00:16, 9.02it/s] 147it [00:16, 9.15it/s] 148it [00:16, 8.75it/s] 149it [00:16, 8.96it/s] 150it [00:16, 9.04it/s]2025-05-26 05:02:16,482 - INFO - [Epoch 055 | Batch 0150] IWAE-loss 5461.5342 | mean log_px -0.0355 | KL -3352.60 + 151it [00:16, 9.16it/s] 152it [00:16, 9.23it/s] 153it [00:16, 9.29it/s] 154it [00:16, 9.34it/s] 155it [00:16, 9.36it/s] 156it [00:17, 9.35it/s] 157it [00:17, 9.28it/s] 158it [00:17, 9.30it/s] 159it [00:17, 8.77it/s] 160it [00:17, 8.90it/s] 161it [00:17, 9.05it/s] 162it [00:17, 9.13it/s] 163it [00:17, 8.69it/s] 164it [00:17, 8.85it/s] 165it [00:18, 9.02it/s] 166it [00:18, 9.17it/s] 167it [00:18, 8.94it/s] 168it [00:18, 9.05it/s] 169it [00:18, 9.19it/s] 170it [00:18, 9.24it/s] 171it [00:18, 9.29it/s] 172it [00:18, 9.34it/s] 173it [00:18, 9.41it/s] 174it [00:19, 9.57it/s] 175it [00:19, 9.69it/s] 176it [00:19, 9.76it/s] 178it [00:19, 9.90it/s] 180it [00:19, 9.61it/s] 181it [00:19, 9.69it/s] 182it [00:19, 9.76it/s] 184it [00:20, 9.52it/s] 186it [00:20, 9.71it/s] 188it [00:20, 9.80it/s] 189it [00:20, 9.51it/s] 190it [00:20, 9.59it/s] 192it [00:20, 9.75it/s] 193it [00:21, 9.44it/s] 195it [00:21, 9.27it/s] 196it [00:21, 9.15it/s] +2025-05-26 05:02:21,373 - INFO - Epoch: 55, Objective: tensor([5165.6812], device='cuda:0', grad_fn=), Loss: 0.03494435176253319, KL/n: 68.38105010986328 + 0it [00:00, ?it/s]2025-05-26 05:02:21,643 - INFO - [Epoch 056 | Batch 0000] IWAE-loss 4359.5181 | mean log_px -0.0144 | KL -3346.51 + 1it [00:00, 4.76it/s] 3it [00:00, 7.85it/s] 4it [00:00, 7.97it/s] 6it [00:00, 8.94it/s] 7it [00:00, 8.83it/s] 9it [00:01, 9.36it/s] 10it [00:01, 9.09it/s] 12it [00:01, 9.50it/s] 14it [00:01, 9.43it/s] 16it [00:01, 9.68it/s] 18it [00:01, 9.54it/s] 20it [00:02, 9.73it/s] 22it [00:02, 9.87it/s] 24it [00:02, 9.96it/s] 26it [00:02, 10.01it/s] 28it [00:02, 10.04it/s] 30it [00:03, 10.08it/s] 32it [00:03, 10.09it/s] 34it [00:03, 10.05it/s] 36it [00:03, 10.08it/s] 38it [00:03, 10.11it/s] 40it [00:04, 10.12it/s] 42it [00:04, 10.13it/s] 44it [00:04, 7.88it/s] 45it [00:04, 7.99it/s] 47it [00:05, 8.55it/s] 48it [00:05, 8.78it/s] 50it [00:05, 8.93it/s]2025-05-26 05:02:26,932 - INFO - [Epoch 056 | Batch 0050] IWAE-loss 7072.4180 | mean log_px -0.0646 | KL -3344.14 + 52it [00:05, 9.28it/s] 54it [00:05, 9.55it/s] 56it [00:05, 9.73it/s] 58it [00:06, 9.86it/s] 60it [00:06, 9.97it/s] 62it [00:06, 10.02it/s] 64it [00:06, 10.07it/s] 66it [00:06, 10.09it/s] 68it [00:07, 10.03it/s] 70it [00:07, 10.05it/s] 72it [00:07, 10.10it/s] 74it [00:07, 10.13it/s] 76it [00:07, 10.15it/s] 78it [00:08, 10.17it/s] 80it [00:08, 10.17it/s] 82it [00:08, 10.16it/s] 84it [00:08, 10.17it/s] 86it [00:08, 10.11it/s] 88it [00:09, 10.04it/s] 90it [00:09, 9.80it/s] 92it [00:09, 9.90it/s] 94it [00:09, 9.98it/s] 96it [00:09, 10.02it/s] 98it [00:10, 10.06it/s] 100it [00:10, 9.82it/s]2025-05-26 05:02:31,905 - INFO - [Epoch 056 | Batch 0100] IWAE-loss 4897.2031 | mean log_px -0.0227 | KL -3343.42 + 102it [00:10, 9.89it/s] 104it [00:10, 9.96it/s] 106it [00:10, 10.02it/s] 108it [00:11, 10.05it/s] 110it [00:11, 9.81it/s] 112it [00:11, 9.91it/s] 114it [00:11, 9.99it/s] 116it [00:11, 10.03it/s] 118it [00:12, 9.72it/s] 120it [00:12, 9.83it/s] 122it [00:12, 9.93it/s] 124it [00:12, 10.01it/s] 126it [00:12, 10.05it/s] 128it [00:13, 10.08it/s] 130it [00:13, 10.10it/s] 132it [00:13, 10.09it/s] 134it [00:13, 9.99it/s] 135it [00:13, 9.51it/s] 136it [00:13, 9.40it/s] 137it [00:14, 9.43it/s] 138it [00:14, 9.48it/s] 139it [00:14, 9.60it/s] 140it [00:14, 9.69it/s] 142it [00:14, 9.83it/s] 144it [00:14, 9.49it/s] 146it [00:15, 9.68it/s] 148it [00:15, 9.81it/s] 150it [00:15, 9.90it/s]2025-05-26 05:02:36,975 - INFO - [Epoch 056 | Batch 0150] IWAE-loss 4315.8975 | mean log_px -0.0143 | KL -3342.45 + 151it [00:15, 9.52it/s] 153it [00:15, 9.73it/s] 155it [00:15, 9.87it/s] 157it [00:16, 9.94it/s] 158it [00:16, 9.54it/s] 160it [00:16, 9.74it/s] 162it [00:16, 9.88it/s] 164it [00:16, 9.96it/s] 166it [00:17, 10.03it/s] 168it [00:17, 10.06it/s] 170it [00:17, 10.08it/s] 172it [00:17, 10.10it/s] 174it [00:17, 10.12it/s] 176it [00:18, 10.12it/s] 178it [00:18, 10.04it/s] 180it [00:18, 10.08it/s] 182it [00:18, 9.96it/s] 184it [00:18, 10.01it/s] 186it [00:19, 10.06it/s] 188it [00:19, 10.08it/s] 190it [00:19, 9.75it/s] 191it [00:19, 9.78it/s] 193it [00:19, 9.90it/s] 195it [00:19, 9.70it/s] 196it [00:20, 9.48it/s] 196it [00:20, 9.73it/s] +2025-05-26 05:02:41,637 - INFO - Epoch: 56, Objective: tensor([5050.2954], device='cuda:0', grad_fn=), Loss: 0.02728617750108242, KL/n: 68.18730926513672 + 0it [00:00, ?it/s]2025-05-26 05:02:41,908 - INFO - [Epoch 057 | Batch 0000] IWAE-loss 4560.9824 | mean log_px -0.0185 | KL -3340.02 + 1it [00:00, 5.47it/s] 2it [00:00, 6.88it/s] 4it [00:00, 8.58it/s] 5it [00:00, 8.44it/s] 6it [00:00, 8.85it/s] 8it [00:00, 9.37it/s] 10it [00:01, 9.63it/s] 12it [00:01, 9.78it/s] 14it [00:01, 9.86it/s] 16it [00:01, 9.92it/s] 17it [00:01, 9.93it/s] 18it [00:01, 9.93it/s] 20it [00:02, 9.97it/s] 21it [00:02, 9.96it/s] 22it [00:02, 9.97it/s] 24it [00:02, 9.98it/s] 25it [00:02, 9.98it/s] 26it [00:02, 9.97it/s] 28it [00:02, 9.98it/s] 29it [00:03, 9.98it/s] 31it [00:03, 10.03it/s] 33it [00:03, 9.99it/s] 34it [00:03, 9.99it/s] 35it [00:03, 9.51it/s] 36it [00:03, 9.62it/s] 38it [00:03, 9.78it/s] 40it [00:04, 9.88it/s] 42it [00:04, 9.94it/s] 44it [00:04, 9.98it/s] 46it [00:04, 9.98it/s] 47it [00:04, 9.98it/s] 49it [00:05, 10.02it/s] 50it [00:05, 9.96it/s]2025-05-26 05:02:46,970 - INFO - [Epoch 057 | Batch 0050] IWAE-loss 4015.7031 | mean log_px -0.0109 | KL -3334.84 + 51it [00:05, 9.49it/s] 53it [00:05, 9.71it/s] 54it [00:05, 9.77it/s] 56it [00:05, 9.86it/s] 57it [00:05, 9.88it/s] 59it [00:06, 9.96it/s] 60it [00:06, 9.97it/s] 62it [00:06, 9.99it/s] 63it [00:06, 9.99it/s] 64it [00:06, 9.98it/s] 66it [00:06, 10.01it/s] 68it [00:06, 10.02it/s] 70it [00:07, 9.62it/s] 72it [00:07, 9.76it/s] 74it [00:07, 9.87it/s] 76it [00:07, 9.92it/s] 77it [00:07, 9.93it/s] 79it [00:08, 9.98it/s] 80it [00:08, 9.98it/s] 82it [00:08, 10.00it/s] 84it [00:08, 10.01it/s] 86it [00:08, 10.02it/s] 88it [00:08, 10.02it/s] 90it [00:09, 10.00it/s] 92it [00:09, 10.01it/s] 94it [00:09, 10.01it/s] 96it [00:09, 9.92it/s] 97it [00:09, 9.53it/s] 98it [00:10, 9.61it/s] 100it [00:10, 9.77it/s]2025-05-26 05:02:52,033 - INFO - [Epoch 057 | Batch 0100] IWAE-loss 4555.8833 | mean log_px -0.0193 | KL -3332.19 + 101it [00:10, 9.37it/s] 102it [00:10, 9.50it/s] 104it [00:10, 9.73it/s] 106it [00:10, 9.82it/s] 107it [00:10, 9.86it/s] 108it [00:11, 9.89it/s] 110it [00:11, 9.95it/s] 111it [00:11, 9.94it/s] 112it [00:11, 9.93it/s] 113it [00:11, 9.94it/s] 114it [00:11, 9.95it/s] 115it [00:11, 9.95it/s] 117it [00:11, 9.99it/s] 119it [00:12, 10.01it/s] 120it [00:12, 9.99it/s] 122it [00:12, 9.60it/s] 124it [00:12, 9.76it/s] 125it [00:12, 9.80it/s] 127it [00:12, 9.91it/s] 128it [00:13, 9.92it/s] 130it [00:13, 9.96it/s] 132it [00:13, 9.99it/s] 133it [00:13, 9.99it/s] 134it [00:13, 9.98it/s] 136it [00:13, 9.99it/s] 138it [00:14, 10.01it/s] 140it [00:14, 10.02it/s] 142it [00:14, 10.00it/s] 144it [00:14, 10.02it/s] 146it [00:14, 10.02it/s] 148it [00:15, 9.98it/s] 149it [00:15, 9.98it/s] 150it [00:15, 9.72it/s]2025-05-26 05:02:57,091 - INFO - [Epoch 057 | Batch 0150] IWAE-loss 4984.7964 | mean log_px -0.0261 | KL -3333.72 + 151it [00:15, 9.70it/s] 153it [00:15, 9.84it/s] 155it [00:15, 9.91it/s] 156it [00:15, 9.50it/s] 157it [00:15, 9.47it/s] 158it [00:16, 9.22it/s] 159it [00:16, 9.18it/s] 160it [00:16, 9.14it/s] 161it [00:16, 9.33it/s] 163it [00:16, 9.64it/s] 165it [00:16, 9.80it/s] 166it [00:16, 9.83it/s] 168it [00:17, 9.90it/s] 170it [00:17, 9.96it/s] 171it [00:17, 9.96it/s] 173it [00:17, 9.98it/s] 174it [00:17, 9.98it/s] 176it [00:17, 9.98it/s] 177it [00:18, 9.97it/s] 179it [00:18, 10.00it/s] 180it [00:18, 9.99it/s] 181it [00:18, 9.99it/s] 182it [00:18, 9.97it/s] 184it [00:18, 10.01it/s] 186it [00:18, 10.00it/s] 187it [00:19, 10.00it/s] 188it [00:19, 10.00it/s] 189it [00:19, 9.98it/s] 190it [00:19, 9.96it/s] 192it [00:19, 9.99it/s] 193it [00:19, 9.95it/s] 194it [00:19, 9.75it/s] 195it [00:19, 9.38it/s] 196it [00:19, 9.17it/s] 196it [00:20, 9.78it/s] +2025-05-26 05:03:01,798 - INFO - Epoch: 57, Objective: tensor([5603.3149], device='cuda:0', grad_fn=), Loss: 0.03557281568646431, KL/n: 67.98454284667969 + 0it [00:00, ?it/s]2025-05-26 05:03:02,067 - INFO - [Epoch 058 | Batch 0000] IWAE-loss 4603.7197 | mean log_px -0.0217 | KL -3329.28 + 1it [00:00, 5.50it/s] 2it [00:00, 6.94it/s] 4it [00:00, 8.67it/s] 6it [00:00, 9.31it/s] 8it [00:00, 9.64it/s] 9it [00:00, 9.62it/s] 11it [00:01, 9.83it/s] 13it [00:01, 9.95it/s] 14it [00:01, 9.52it/s] 16it [00:01, 9.74it/s] 18it [00:01, 9.88it/s] 20it [00:02, 9.98it/s] 22it [00:02, 10.04it/s] 24it [00:02, 9.78it/s] 25it [00:02, 9.78it/s] 27it [00:02, 9.45it/s] 29it [00:03, 9.67it/s] 31it [00:03, 9.81it/s] 33it [00:03, 9.92it/s] 35it [00:03, 9.99it/s] 36it [00:03, 9.98it/s] 38it [00:03, 10.05it/s] 40it [00:04, 10.08it/s] 42it [00:04, 9.74it/s] 44it [00:04, 9.86it/s] 46it [00:04, 9.94it/s] 47it [00:04, 9.89it/s] 48it [00:05, 6.80it/s] 50it [00:05, 7.73it/s]2025-05-26 05:03:07,352 - INFO - [Epoch 058 | Batch 0050] IWAE-loss 4924.8784 | mean log_px -0.0293 | KL -3323.80 + 51it [00:05, 7.82it/s] 53it [00:05, 8.55it/s] 55it [00:05, 9.04it/s] 57it [00:06, 9.34it/s] 59it [00:06, 9.57it/s] 61it [00:06, 9.74it/s] 63it [00:06, 9.58it/s] 65it [00:06, 9.74it/s] 67it [00:07, 9.86it/s] 69it [00:07, 9.95it/s] 71it [00:07, 10.01it/s] 73it [00:07, 10.05it/s] 75it [00:07, 10.08it/s] 77it [00:08, 10.10it/s] 79it [00:08, 10.13it/s] 81it [00:08, 10.14it/s] 83it [00:08, 10.14it/s] 85it [00:08, 10.15it/s] 87it [00:09, 10.13it/s] 89it [00:09, 10.14it/s] 91it [00:09, 10.14it/s] 93it [00:09, 10.15it/s] 95it [00:09, 10.13it/s] 97it [00:10, 10.13it/s] 99it [00:10, 9.86it/s] 100it [00:10, 9.89it/s]2025-05-26 05:03:12,347 - INFO - [Epoch 058 | Batch 0100] IWAE-loss 4599.8813 | mean log_px -0.0212 | KL -3328.67 + 101it [00:10, 9.50it/s] 103it [00:10, 9.72it/s] 105it [00:10, 9.87it/s] 107it [00:11, 9.93it/s] 109it [00:11, 9.98it/s] 110it [00:11, 9.98it/s] 112it [00:11, 10.03it/s] 114it [00:11, 9.70it/s] 116it [00:11, 9.83it/s] 118it [00:12, 9.92it/s] 119it [00:12, 9.54it/s] 120it [00:12, 9.58it/s] 122it [00:12, 9.69it/s] 124it [00:12, 9.83it/s] 126it [00:13, 9.94it/s] 127it [00:13, 9.70it/s] 128it [00:13, 9.42it/s] 130it [00:13, 9.69it/s] 132it [00:13, 9.85it/s] 134it [00:13, 9.95it/s] 136it [00:14, 10.02it/s] 138it [00:14, 10.06it/s] 140it [00:14, 10.10it/s] 142it [00:14, 10.11it/s] 144it [00:14, 10.11it/s] 146it [00:15, 9.76it/s] 148it [00:15, 9.87it/s] 150it [00:15, 9.95it/s]2025-05-26 05:03:17,419 - INFO - [Epoch 058 | Batch 0150] IWAE-loss 4261.2881 | mean log_px -0.0143 | KL -3324.48 + 151it [00:15, 9.57it/s] 153it [00:15, 9.76it/s] 155it [00:15, 9.89it/s] 157it [00:16, 9.97it/s] 159it [00:16, 10.02it/s] 161it [00:16, 10.06it/s] 163it [00:16, 10.08it/s] 165it [00:16, 10.09it/s] 167it [00:17, 10.10it/s] 169it [00:17, 10.10it/s] 171it [00:17, 9.84it/s] 173it [00:17, 9.93it/s] 175it [00:17, 10.00it/s] 177it [00:18, 10.02it/s] 179it [00:18, 10.06it/s] 181it [00:18, 10.09it/s] 183it [00:18, 10.10it/s] 185it [00:18, 10.12it/s] 187it [00:19, 10.13it/s] 189it [00:19, 10.14it/s] 191it [00:19, 10.14it/s] 193it [00:19, 10.14it/s] 195it [00:19, 9.71it/s] 196it [00:20, 9.39it/s] 196it [00:20, 9.74it/s] +2025-05-26 05:03:22,058 - INFO - Epoch: 58, Objective: tensor([4525.3076], device='cuda:0', grad_fn=), Loss: 0.021634532138705254, KL/n: 67.80258178710938 + 0it [00:00, ?it/s]2025-05-26 05:03:22,317 - INFO - [Epoch 059 | Batch 0000] IWAE-loss 4513.4170 | mean log_px -0.0270 | KL -3325.71 + 1it [00:00, 6.09it/s] 2it [00:00, 7.86it/s] 3it [00:00, 7.98it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.96it/s] 6it [00:00, 9.14it/s] 7it [00:00, 8.62it/s] 8it [00:00, 8.90it/s] 9it [00:01, 9.05it/s] 10it [00:01, 9.22it/s] 11it [00:01, 9.37it/s] 13it [00:01, 9.70it/s] 15it [00:01, 9.51it/s] 17it [00:01, 9.73it/s] 19it [00:02, 9.86it/s] 21it [00:02, 9.94it/s] 23it [00:02, 9.98it/s] 25it [00:02, 10.02it/s] 27it [00:02, 9.69it/s] 29it [00:03, 9.82it/s] 30it [00:03, 9.83it/s] 31it [00:03, 9.44it/s] 32it [00:03, 9.45it/s] 33it [00:03, 9.55it/s] 35it [00:03, 9.76it/s] 37it [00:03, 9.89it/s] 39it [00:04, 9.96it/s] 40it [00:04, 9.64it/s] 42it [00:04, 9.80it/s] 43it [00:04, 9.83it/s] 44it [00:04, 9.87it/s] 46it [00:04, 9.95it/s] 48it [00:05, 10.01it/s] 50it [00:05, 10.01it/s]2025-05-26 05:03:27,461 - INFO - [Epoch 059 | Batch 0050] IWAE-loss 4204.3833 | mean log_px -0.0140 | KL -3318.27 + 52it [00:05, 10.02it/s] 54it [00:05, 10.06it/s] 56it [00:05, 10.08it/s] 58it [00:05, 10.08it/s] 60it [00:06, 10.07it/s] 62it [00:06, 9.76it/s] 64it [00:06, 9.86it/s] 65it [00:06, 9.51it/s] 67it [00:06, 9.66it/s] 69it [00:07, 9.81it/s] 71it [00:07, 9.85it/s] 72it [00:07, 9.86it/s] 74it [00:07, 9.95it/s] 76it [00:07, 9.72it/s] 78it [00:08, 9.85it/s] 79it [00:08, 9.57it/s] 81it [00:08, 9.75it/s] 82it [00:08, 9.47it/s] 83it [00:08, 9.58it/s] 85it [00:08, 9.78it/s] 87it [00:08, 9.58it/s] 88it [00:09, 9.66it/s] 90it [00:09, 9.51it/s] 92it [00:09, 9.71it/s] 94it [00:09, 9.56it/s] 96it [00:09, 9.72it/s] 98it [00:10, 9.57it/s] 100it [00:10, 9.73it/s]2025-05-26 05:03:32,592 - INFO - [Epoch 059 | Batch 0100] IWAE-loss 4880.2090 | mean log_px -0.0276 | KL -3318.33 + 101it [00:10, 9.77it/s] 102it [00:10, 9.77it/s] 103it [00:10, 9.79it/s] 104it [00:10, 9.82it/s] 105it [00:10, 9.84it/s] 106it [00:10, 9.83it/s] 107it [00:11, 9.85it/s] 108it [00:11, 9.84it/s] 109it [00:11, 9.85it/s] 110it [00:11, 9.83it/s] 111it [00:11, 9.83it/s] 112it [00:11, 9.84it/s] 113it [00:11, 9.86it/s] 114it [00:11, 9.86it/s] 115it [00:11, 9.23it/s] 116it [00:11, 9.42it/s] 117it [00:12, 9.55it/s] 118it [00:12, 9.02it/s] 119it [00:12, 9.27it/s] 120it [00:12, 9.44it/s] 121it [00:12, 9.58it/s] 122it [00:12, 9.66it/s] 123it [00:12, 9.74it/s] 124it [00:12, 9.79it/s] 125it [00:12, 9.85it/s] 126it [00:13, 9.85it/s] 127it [00:13, 9.88it/s] 128it [00:13, 9.88it/s] 129it [00:13, 9.89it/s] 130it [00:13, 9.26it/s] 131it [00:13, 9.46it/s] 132it [00:13, 9.58it/s] 133it [00:13, 9.68it/s] 134it [00:13, 9.73it/s] 135it [00:13, 9.79it/s] 136it [00:14, 9.81it/s] 137it [00:14, 9.84it/s] 138it [00:14, 9.83it/s] 139it [00:14, 9.85it/s] 140it [00:14, 9.22it/s] 141it [00:14, 9.41it/s] 142it [00:14, 9.53it/s] 143it [00:14, 9.64it/s] 144it [00:14, 9.58it/s] 145it [00:14, 9.64it/s] 146it [00:15, 9.71it/s] 147it [00:15, 9.77it/s] 148it [00:15, 9.45it/s] 149it [00:15, 9.12it/s] 150it [00:15, 9.34it/s]2025-05-26 05:03:37,782 - INFO - [Epoch 059 | Batch 0150] IWAE-loss 4119.4390 | mean log_px -0.0125 | KL -3316.20 + 151it [00:15, 9.49it/s] 152it [00:15, 9.60it/s] 153it [00:15, 9.69it/s] 154it [00:15, 9.04it/s] 155it [00:16, 9.11it/s] 156it [00:16, 9.14it/s] 157it [00:16, 9.15it/s] 158it [00:16, 9.21it/s] 159it [00:16, 9.27it/s] 160it [00:16, 9.30it/s] 161it [00:16, 9.33it/s] 162it [00:16, 9.34it/s] 163it [00:16, 9.36it/s] 164it [00:17, 9.37it/s] 165it [00:17, 9.38it/s] 166it [00:17, 9.38it/s] 167it [00:17, 9.38it/s] 168it [00:17, 8.97it/s] 169it [00:17, 9.24it/s] 170it [00:17, 9.44it/s] 171it [00:17, 9.59it/s] 172it [00:17, 9.20it/s] 173it [00:17, 9.41it/s] 174it [00:18, 9.56it/s] 175it [00:18, 9.68it/s] 176it [00:18, 9.76it/s] 177it [00:18, 9.81it/s] 178it [00:18, 9.35it/s] 179it [00:18, 9.51it/s] 180it [00:18, 9.63it/s] 181it [00:18, 9.61it/s] 182it [00:18, 9.70it/s] 183it [00:19, 9.77it/s] 184it [00:19, 9.81it/s] 185it [00:19, 9.85it/s] 186it [00:19, 9.88it/s] 187it [00:19, 9.85it/s] 188it [00:19, 9.86it/s] 189it [00:19, 9.37it/s] 190it [00:19, 9.53it/s] 191it [00:19, 9.65it/s] 192it [00:19, 9.23it/s] 193it [00:20, 9.42it/s] 194it [00:20, 9.56it/s] 195it [00:20, 9.25it/s] 196it [00:20, 9.59it/s] +2025-05-26 05:03:42,633 - INFO - Epoch: 59, Objective: tensor([5065.8369], device='cuda:0', grad_fn=), Loss: 0.029969044029712677, KL/n: 67.60353088378906 + 0it [00:00, ?it/s]2025-05-26 05:03:42,910 - INFO - [Epoch 060 | Batch 0000] IWAE-loss 5187.5234 | mean log_px -0.0315 | KL -3310.47 + 1it [00:00, 4.66it/s] 3it [00:00, 7.75it/s] 4it [00:00, 8.39it/s] 5it [00:00, 8.86it/s] 6it [00:00, 9.18it/s] 7it [00:00, 9.42it/s] 8it [00:00, 9.58it/s] 9it [00:01, 9.70it/s] 11it [00:01, 9.88it/s] 12it [00:01, 9.89it/s] 14it [00:01, 9.94it/s] 16it [00:01, 9.99it/s] 18it [00:01, 10.01it/s] 20it [00:02, 10.01it/s] 22it [00:02, 9.95it/s] 24it [00:02, 9.96it/s] 25it [00:02, 9.96it/s] 26it [00:02, 9.95it/s] 28it [00:02, 9.97it/s] 29it [00:03, 9.95it/s] 30it [00:03, 9.96it/s] 31it [00:03, 9.95it/s] 32it [00:03, 9.95it/s] 34it [00:03, 10.00it/s] 35it [00:03, 9.99it/s] 36it [00:03, 9.98it/s] 37it [00:03, 9.52it/s] 38it [00:03, 9.63it/s] 39it [00:04, 9.73it/s] 40it [00:04, 9.79it/s] 42it [00:04, 6.98it/s] 44it [00:04, 7.91it/s] 45it [00:04, 8.28it/s] 46it [00:04, 8.63it/s] 48it [00:05, 9.17it/s] 50it [00:05, 9.45it/s]2025-05-26 05:03:48,148 - INFO - [Epoch 060 | Batch 0050] IWAE-loss 4562.0859 | mean log_px -0.0215 | KL -3308.93 + 51it [00:05, 9.55it/s] 53it [00:05, 9.73it/s] 54it [00:05, 9.69it/s] 56it [00:05, 9.81it/s] 57it [00:06, 9.40it/s] 58it [00:06, 9.52it/s] 59it [00:06, 9.60it/s] 60it [00:06, 9.67it/s] 61it [00:06, 9.75it/s] 63it [00:06, 9.90it/s] 64it [00:06, 9.92it/s] 66it [00:06, 9.95it/s] 68it [00:07, 9.99it/s] 69it [00:07, 9.98it/s] 70it [00:07, 9.98it/s] 72it [00:07, 9.99it/s] 74it [00:07, 10.01it/s] 76it [00:07, 10.04it/s] 78it [00:08, 10.01it/s] 80it [00:08, 10.02it/s] 82it [00:08, 10.01it/s] 84it [00:08, 10.01it/s] 86it [00:08, 10.02it/s] 88it [00:09, 10.05it/s] 90it [00:09, 10.05it/s] 92it [00:09, 10.03it/s] 94it [00:09, 9.75it/s] 96it [00:09, 9.85it/s] 97it [00:10, 9.48it/s] 99it [00:10, 9.68it/s] 100it [00:10, 9.73it/s]2025-05-26 05:03:53,209 - INFO - [Epoch 060 | Batch 0100] IWAE-loss 4293.2979 | mean log_px -0.0141 | KL -3304.83 + 101it [00:10, 9.77it/s] 102it [00:10, 9.38it/s] 104it [00:10, 9.62it/s] 106it [00:11, 9.77it/s] 108it [00:11, 9.84it/s] 110it [00:11, 9.92it/s] 111it [00:11, 9.92it/s] 113it [00:11, 9.97it/s] 114it [00:11, 9.88it/s] 116it [00:12, 9.97it/s] 117it [00:12, 9.68it/s] 119it [00:12, 9.82it/s] 120it [00:12, 9.84it/s] 122it [00:12, 9.90it/s] 124it [00:12, 9.93it/s] 125it [00:12, 9.49it/s] 127it [00:13, 9.70it/s] 128it [00:13, 9.75it/s] 129it [00:13, 9.80it/s] 130it [00:13, 9.83it/s] 131it [00:13, 9.35it/s] 132it [00:13, 9.52it/s] 133it [00:13, 9.62it/s] 134it [00:13, 9.64it/s] 136it [00:14, 9.80it/s] 138it [00:14, 9.83it/s] 139it [00:14, 9.83it/s] 140it [00:14, 9.83it/s] 141it [00:14, 9.34it/s] 142it [00:14, 9.48it/s] 143it [00:14, 9.59it/s] 144it [00:14, 9.68it/s] 145it [00:15, 9.77it/s] 146it [00:15, 9.81it/s] 147it [00:15, 9.84it/s] 148it [00:15, 9.87it/s] 150it [00:15, 9.95it/s]2025-05-26 05:03:58,329 - INFO - [Epoch 060 | Batch 0150] IWAE-loss 4515.0557 | mean log_px -0.0186 | KL -3300.35 + 151it [00:15, 9.83it/s] 152it [00:15, 9.70it/s] 153it [00:15, 9.23it/s] 154it [00:15, 9.26it/s] 155it [00:16, 9.36it/s] 156it [00:16, 9.36it/s] 157it [00:16, 9.27it/s] 158it [00:16, 9.31it/s] 159it [00:16, 9.31it/s] 160it [00:16, 9.32it/s] 161it [00:16, 9.32it/s] 162it [00:16, 9.31it/s] 163it [00:16, 9.33it/s] 164it [00:17, 9.34it/s] 165it [00:17, 9.33it/s] 166it [00:17, 9.37it/s] 167it [00:17, 9.36it/s] 168it [00:17, 9.37it/s] 169it [00:17, 8.87it/s] 170it [00:17, 9.08it/s] 171it [00:17, 9.15it/s] 172it [00:17, 9.24it/s] 173it [00:17, 9.23it/s] 174it [00:18, 9.29it/s] 175it [00:18, 9.31it/s] 176it [00:18, 9.29it/s] 177it [00:18, 9.37it/s] 178it [00:18, 9.41it/s] 179it [00:18, 9.45it/s] 180it [00:18, 9.42it/s] 181it [00:18, 9.45it/s] 182it [00:18, 9.42it/s] 183it [00:19, 9.44it/s] 184it [00:19, 9.41it/s] 185it [00:19, 9.28it/s] 186it [00:19, 9.33it/s] 187it [00:19, 9.39it/s] 188it [00:19, 9.02it/s] 189it [00:19, 9.16it/s] 190it [00:19, 9.13it/s] 191it [00:19, 9.21it/s] 192it [00:20, 9.30it/s] 193it [00:20, 9.30it/s] 194it [00:20, 9.37it/s] 195it [00:20, 8.81it/s] 196it [00:20, 9.07it/s] 196it [00:20, 9.54it/s] +2025-05-26 05:04:03,305 - INFO - Epoch: 60, Objective: tensor([4183.7256], device='cuda:0', grad_fn=), Loss: 0.01641184277832508, KL/n: 67.38818359375 + 0it [00:00, ?it/s]2025-05-26 05:04:03,575 - INFO - [Epoch 061 | Batch 0000] IWAE-loss 4341.6694 | mean log_px -0.0202 | KL -3302.52 + 1it [00:00, 5.61it/s] 2it [00:00, 7.38it/s] 3it [00:00, 8.25it/s] 4it [00:00, 8.67it/s] 5it [00:00, 8.95it/s] 6it [00:00, 9.06it/s] 7it [00:00, 9.27it/s] 8it [00:00, 9.35it/s] 9it [00:01, 9.39it/s] 10it [00:01, 9.43it/s] 11it [00:01, 9.45it/s] 12it [00:01, 9.48it/s] 13it [00:01, 9.48it/s] 14it [00:01, 9.46it/s] 15it [00:01, 9.47it/s] 16it [00:01, 9.46it/s] 17it [00:01, 9.51it/s] 18it [00:01, 9.52it/s] 19it [00:02, 9.56it/s] 20it [00:02, 9.52it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.50it/s] 23it [00:02, 9.47it/s] 24it [00:02, 9.45it/s] 25it [00:02, 9.49it/s] 26it [00:02, 9.48it/s] 27it [00:02, 9.49it/s] 28it [00:03, 9.47it/s] 29it [00:03, 9.44it/s] 30it [00:03, 9.39it/s] 31it [00:03, 9.43it/s] 32it [00:03, 9.38it/s] 33it [00:03, 9.41it/s] 34it [00:03, 9.40it/s] 35it [00:03, 9.49it/s] 36it [00:03, 9.44it/s] 37it [00:03, 9.48it/s] 38it [00:04, 9.47it/s] 39it [00:04, 9.48it/s] 40it [00:04, 9.49it/s] 41it [00:04, 9.49it/s] 42it [00:04, 9.48it/s] 43it [00:04, 9.45it/s] 44it [00:04, 9.45it/s] 45it [00:04, 9.47it/s] 46it [00:04, 9.48it/s] 47it [00:05, 9.51it/s] 48it [00:05, 9.50it/s] 49it [00:05, 9.51it/s] 50it [00:05, 9.53it/s]2025-05-26 05:04:08,847 - INFO - [Epoch 061 | Batch 0050] IWAE-loss 4877.6030 | mean log_px -0.0282 | KL -3295.02 + 51it [00:05, 9.51it/s] 52it [00:05, 9.50it/s] 53it [00:05, 9.50it/s] 54it [00:05, 9.50it/s] 55it [00:05, 9.51it/s] 56it [00:05, 9.47it/s] 57it [00:06, 9.14it/s] 58it [00:06, 8.95it/s] 59it [00:06, 9.06it/s] 60it [00:06, 9.21it/s] 61it [00:06, 9.35it/s] 62it [00:06, 9.39it/s] 63it [00:06, 9.43it/s] 64it [00:06, 9.46it/s] 65it [00:06, 9.49it/s] 66it [00:07, 9.52it/s] 67it [00:07, 9.54it/s] 68it [00:07, 9.55it/s] 69it [00:07, 9.57it/s] 70it [00:07, 9.51it/s] 71it [00:07, 9.51it/s] 72it [00:07, 9.47it/s] 73it [00:07, 9.48it/s] 74it [00:07, 9.50it/s] 75it [00:08, 9.48it/s] 76it [00:08, 9.51it/s] 77it [00:08, 9.54it/s] 78it [00:08, 9.50it/s] 79it [00:08, 9.49it/s] 80it [00:08, 9.49it/s] 81it [00:08, 9.29it/s] 82it [00:08, 9.34it/s] 83it [00:08, 9.35it/s] 84it [00:08, 9.35it/s] 85it [00:09, 9.41it/s] 86it [00:09, 9.43it/s] 87it [00:09, 9.47it/s] 88it [00:09, 9.46it/s] 89it [00:09, 9.48it/s] 90it [00:09, 9.41it/s] 91it [00:09, 9.40it/s] 92it [00:09, 9.39it/s] 93it [00:09, 9.44it/s] 94it [00:10, 9.44it/s] 95it [00:10, 9.41it/s] 96it [00:10, 9.40it/s] 97it [00:10, 9.43it/s] 98it [00:10, 9.42it/s] 99it [00:10, 9.45it/s] 100it [00:10, 9.45it/s]2025-05-26 05:04:14,154 - INFO - [Epoch 061 | Batch 0100] IWAE-loss 4193.9419 | mean log_px -0.0158 | KL -3287.98 + 101it [00:10, 9.47it/s] 102it [00:10, 9.43it/s] 103it [00:10, 9.47it/s] 104it [00:11, 9.51it/s] 105it [00:11, 9.57it/s] 106it [00:11, 9.64it/s] 107it [00:11, 9.71it/s] 108it [00:11, 9.75it/s] 109it [00:11, 9.72it/s] 110it [00:11, 9.77it/s] 111it [00:11, 9.81it/s] 112it [00:11, 9.82it/s] 113it [00:11, 9.83it/s] 114it [00:12, 9.83it/s] 115it [00:12, 9.85it/s] 116it [00:12, 9.85it/s] 117it [00:12, 9.87it/s] 118it [00:12, 9.87it/s] 119it [00:12, 9.88it/s] 120it [00:12, 9.85it/s] 121it [00:12, 9.87it/s] 122it [00:12, 9.86it/s] 123it [00:13, 9.88it/s] 124it [00:13, 9.87it/s] 125it [00:13, 9.88it/s] 126it [00:13, 9.87it/s] 127it [00:13, 9.87it/s] 128it [00:13, 9.84it/s] 129it [00:13, 9.84it/s] 130it [00:13, 9.84it/s] 131it [00:13, 9.86it/s] 132it [00:13, 9.86it/s] 133it [00:14, 9.85it/s] 134it [00:14, 9.84it/s] 135it [00:14, 9.85it/s] 136it [00:14, 9.86it/s] 137it [00:14, 9.86it/s] 138it [00:14, 9.85it/s] 139it [00:14, 9.86it/s] 140it [00:14, 9.86it/s] 141it [00:14, 9.87it/s] 142it [00:14, 9.87it/s] 143it [00:15, 9.85it/s] 144it [00:15, 9.83it/s] 145it [00:15, 9.84it/s] 146it [00:15, 9.84it/s] 147it [00:15, 9.86it/s] 148it [00:15, 9.80it/s] 149it [00:15, 9.83it/s] 150it [00:15, 9.83it/s]2025-05-26 05:04:19,245 - INFO - [Epoch 061 | Batch 0150] IWAE-loss 4477.5815 | mean log_px -0.0203 | KL -3289.90 + 151it [00:15, 9.84it/s] 152it [00:15, 9.63it/s] 153it [00:16, 9.70it/s] 154it [00:16, 9.66it/s] 155it [00:16, 9.65it/s] 156it [00:16, 9.65it/s] 157it [00:16, 9.73it/s] 158it [00:16, 9.77it/s] 159it [00:16, 9.81it/s] 160it [00:16, 9.83it/s] 161it [00:16, 9.87it/s] 162it [00:16, 9.87it/s] 163it [00:17, 9.88it/s] 164it [00:17, 9.87it/s] 165it [00:17, 9.89it/s] 166it [00:17, 9.88it/s] 167it [00:17, 9.88it/s] 168it [00:17, 9.85it/s] 169it [00:17, 9.87it/s] 170it [00:17, 9.87it/s] 171it [00:17, 9.88it/s] 172it [00:17, 9.89it/s] 173it [00:18, 9.89it/s] 174it [00:18, 9.89it/s] 175it [00:18, 9.86it/s] 176it [00:18, 9.84it/s] 177it [00:18, 9.84it/s] 178it [00:18, 9.84it/s] 179it [00:18, 9.87it/s] 180it [00:18, 9.86it/s] 181it [00:18, 9.88it/s] 182it [00:19, 9.72it/s] 183it [00:19, 9.76it/s] 184it [00:19, 9.79it/s] 185it [00:19, 9.82it/s] 186it [00:19, 9.84it/s] 187it [00:19, 9.85it/s] 188it [00:19, 9.86it/s] 189it [00:19, 9.87it/s] 190it [00:19, 9.87it/s] 191it [00:19, 9.86it/s] 192it [00:20, 9.86it/s] 193it [00:20, 9.89it/s] 194it [00:20, 9.87it/s] 195it [00:20, 8.70it/s] 196it [00:20, 9.55it/s] +2025-05-26 05:04:23,964 - INFO - Epoch: 61, Objective: tensor([6526.4443], device='cuda:0', grad_fn=), Loss: 0.049620795994997025, KL/n: 67.15840148925781 + 0it [00:00, ?it/s]2025-05-26 05:04:24,233 - INFO - [Epoch 062 | Batch 0000] IWAE-loss 4576.0898 | mean log_px -0.0238 | KL -3289.67 + 1it [00:00, 5.50it/s] 2it [00:00, 7.45it/s] 3it [00:00, 8.42it/s] 4it [00:00, 8.93it/s] 5it [00:00, 9.26it/s] 6it [00:00, 9.42it/s] 7it [00:00, 9.58it/s] 8it [00:00, 9.67it/s] 9it [00:00, 9.74it/s] 10it [00:01, 9.77it/s] 11it [00:01, 9.82it/s] 12it [00:01, 9.84it/s] 13it [00:01, 9.85it/s] 14it [00:01, 9.86it/s] 15it [00:01, 9.87it/s] 16it [00:01, 9.87it/s] 17it [00:01, 9.89it/s] 18it [00:01, 9.90it/s] 19it [00:02, 9.90it/s] 20it [00:02, 9.88it/s] 21it [00:02, 9.26it/s] 22it [00:02, 9.44it/s] 23it [00:02, 9.57it/s] 24it [00:02, 9.62it/s] 25it [00:02, 9.23it/s] 26it [00:02, 9.36it/s] 27it [00:02, 9.49it/s] 28it [00:02, 9.55it/s] 29it [00:03, 9.04it/s] 30it [00:03, 9.27it/s] 31it [00:03, 9.45it/s] 32it [00:03, 9.53it/s] 33it [00:03, 9.63it/s] 34it [00:03, 9.69it/s] 35it [00:03, 9.75it/s] 36it [00:03, 9.77it/s] 37it [00:03, 9.80it/s] 38it [00:03, 9.81it/s] 39it [00:04, 9.84it/s] 40it [00:04, 9.85it/s] 41it [00:04, 9.87it/s] 42it [00:04, 9.86it/s] 43it [00:04, 9.88it/s] 44it [00:04, 9.86it/s] 45it [00:04, 9.88it/s] 46it [00:05, 6.04it/s] 47it [00:05, 6.84it/s] 48it [00:05, 7.54it/s] 49it [00:05, 8.13it/s] 50it [00:05, 8.57it/s]2025-05-26 05:04:29,581 - INFO - [Epoch 062 | Batch 0050] IWAE-loss 4915.9707 | mean log_px -0.0268 | KL -3286.16 + 51it [00:05, 8.91it/s] 52it [00:05, 9.17it/s] 53it [00:05, 9.38it/s] 54it [00:05, 9.52it/s] 55it [00:05, 9.64it/s] 56it [00:06, 9.71it/s] 57it [00:06, 9.77it/s] 58it [00:06, 9.79it/s] 59it [00:06, 9.64it/s] 60it [00:06, 9.65it/s] 61it [00:06, 9.72it/s] 62it [00:06, 9.75it/s] 63it [00:06, 9.79it/s] 64it [00:06, 9.80it/s] 65it [00:06, 9.21it/s] 66it [00:07, 9.40it/s] 67it [00:07, 9.55it/s] 68it [00:07, 9.63it/s] 69it [00:07, 9.72it/s] 70it [00:07, 9.75it/s] 71it [00:07, 9.78it/s] 72it [00:07, 9.80it/s] 73it [00:07, 9.83it/s] 74it [00:07, 9.84it/s] 75it [00:07, 9.84it/s] 76it [00:08, 9.84it/s] 77it [00:08, 9.85it/s] 78it [00:08, 9.86it/s] 79it [00:08, 9.88it/s] 80it [00:08, 9.88it/s] 81it [00:08, 9.88it/s] 82it [00:08, 9.87it/s] 83it [00:08, 9.84it/s] 84it [00:08, 9.85it/s] 85it [00:09, 9.24it/s] 86it [00:09, 9.41it/s] 87it [00:09, 9.56it/s] 88it [00:09, 9.64it/s] 89it [00:09, 9.72it/s] 90it [00:09, 9.76it/s] 91it [00:09, 9.80it/s] 92it [00:09, 9.81it/s] 93it [00:09, 9.65it/s] 94it [00:09, 9.64it/s] 95it [00:10, 9.18it/s] 96it [00:10, 9.38it/s] 97it [00:10, 9.52it/s] 98it [00:10, 9.64it/s] 99it [00:10, 9.72it/s] 100it [00:10, 9.76it/s]2025-05-26 05:04:34,729 - INFO - [Epoch 062 | Batch 0100] IWAE-loss 4170.7461 | mean log_px -0.0182 | KL -3282.61 + 101it [00:10, 9.79it/s] 102it [00:10, 9.82it/s] 103it [00:10, 9.86it/s] 104it [00:11, 9.23it/s] 105it [00:11, 9.43it/s] 106it [00:11, 9.57it/s] 107it [00:11, 9.67it/s] 108it [00:11, 9.73it/s] 109it [00:11, 9.78it/s] 110it [00:11, 9.19it/s] 111it [00:11, 9.39it/s] 112it [00:11, 9.53it/s] 113it [00:11, 9.64it/s] 114it [00:12, 9.08it/s] 115it [00:12, 9.32it/s] 116it [00:12, 9.47it/s] 117it [00:12, 9.60it/s] 118it [00:12, 9.66it/s] 119it [00:12, 9.73it/s] 120it [00:12, 9.76it/s] 121it [00:12, 9.23it/s] 122it [00:12, 9.41it/s] 123it [00:12, 9.50it/s] 124it [00:13, 9.12it/s] 125it [00:13, 9.34it/s] 126it [00:13, 9.48it/s] 127it [00:13, 9.59it/s] 128it [00:13, 9.66it/s] 129it [00:13, 9.72it/s] 130it [00:13, 9.75it/s] 131it [00:13, 9.80it/s] 132it [00:13, 9.82it/s] 133it [00:14, 9.83it/s] 134it [00:14, 9.84it/s] 135it [00:14, 9.84it/s] 136it [00:14, 9.84it/s] 137it [00:14, 9.86it/s] 138it [00:14, 9.86it/s] 139it [00:14, 9.87it/s] 140it [00:14, 9.85it/s] 141it [00:14, 9.87it/s] 142it [00:14, 9.25it/s] 143it [00:15, 9.43it/s] 144it [00:15, 9.55it/s] 145it [00:15, 9.66it/s] 146it [00:15, 9.72it/s] 147it [00:15, 9.77it/s] 148it [00:15, 9.79it/s] 149it [00:15, 9.83it/s] 150it [00:15, 9.41it/s]2025-05-26 05:04:39,941 - INFO - [Epoch 062 | Batch 0150] IWAE-loss 4884.0713 | mean log_px -0.0360 | KL -3281.47 + 151it [00:15, 9.54it/s] 152it [00:15, 9.64it/s] 153it [00:16, 9.72it/s] 154it [00:16, 9.77it/s] 155it [00:16, 9.82it/s] 156it [00:16, 9.84it/s] 157it [00:16, 9.86it/s] 158it [00:16, 9.86it/s] 159it [00:16, 9.87it/s] 160it [00:16, 9.86it/s] 161it [00:16, 9.08it/s] 162it [00:17, 9.06it/s] 163it [00:17, 9.14it/s] 164it [00:17, 9.34it/s] 165it [00:17, 9.51it/s] 166it [00:17, 9.62it/s] 167it [00:17, 9.68it/s] 168it [00:17, 9.12it/s] 169it [00:17, 9.34it/s] 170it [00:17, 9.48it/s] 171it [00:17, 9.57it/s] 172it [00:18, 9.66it/s] 173it [00:18, 9.18it/s] 174it [00:18, 9.36it/s] 175it [00:18, 9.52it/s] 176it [00:18, 9.53it/s] 177it [00:18, 9.53it/s] 178it [00:18, 9.56it/s] 179it [00:18, 9.65it/s] 180it [00:18, 9.70it/s] 181it [00:19, 9.58it/s] 182it [00:19, 9.66it/s] 183it [00:19, 9.73it/s] 184it [00:19, 9.77it/s] 185it [00:19, 9.81it/s] 186it [00:19, 9.82it/s] 187it [00:19, 9.84it/s] 188it [00:19, 9.85it/s] 189it [00:19, 9.44it/s] 190it [00:19, 9.55it/s] 191it [00:20, 9.65it/s] 192it [00:20, 9.71it/s] 193it [00:20, 9.77it/s] 194it [00:20, 9.56it/s] 195it [00:20, 8.64it/s] 196it [00:20, 8.74it/s] 196it [00:20, 9.47it/s] +2025-05-26 05:04:44,784 - INFO - Epoch: 62, Objective: tensor([5284.1826], device='cuda:0', grad_fn=), Loss: 0.03511318191885948, KL/n: 66.92284393310547 + 0it [00:00, ?it/s]2025-05-26 05:04:45,055 - INFO - [Epoch 063 | Batch 0000] IWAE-loss 4192.7603 | mean log_px -0.0176 | KL -3279.23 + 1it [00:00, 4.73it/s] 2it [00:00, 6.76it/s] 3it [00:00, 7.66it/s] 4it [00:00, 8.22it/s] 5it [00:00, 8.65it/s] 6it [00:00, 8.92it/s] 7it [00:00, 9.12it/s] 8it [00:00, 9.20it/s] 9it [00:01, 9.31it/s] 10it [00:01, 9.37it/s] 11it [00:01, 9.44it/s] 12it [00:01, 9.48it/s] 13it [00:01, 9.49it/s] 14it [00:01, 9.50it/s] 15it [00:01, 9.49it/s] 16it [00:01, 9.49it/s] 17it [00:01, 9.56it/s] 18it [00:02, 9.57it/s] 19it [00:02, 9.10it/s] 20it [00:02, 9.25it/s] 21it [00:02, 9.36it/s] 22it [00:02, 9.41it/s] 23it [00:02, 9.48it/s] 24it [00:02, 9.50it/s] 25it [00:02, 9.54it/s] 26it [00:02, 9.52it/s] 27it [00:02, 9.55it/s] 28it [00:03, 9.09it/s] 29it [00:03, 9.22it/s] 30it [00:03, 9.35it/s] 31it [00:03, 9.40it/s] 32it [00:03, 9.45it/s] 33it [00:03, 9.48it/s] 34it [00:03, 9.09it/s] 35it [00:03, 9.24it/s] 36it [00:03, 9.32it/s] 37it [00:04, 9.34it/s] 38it [00:04, 9.41it/s] 39it [00:04, 9.50it/s] 40it [00:04, 9.08it/s] 41it [00:04, 9.21it/s] 42it [00:04, 9.28it/s] 43it [00:04, 9.36it/s] 44it [00:04, 9.38it/s] 45it [00:04, 9.48it/s] 46it [00:04, 9.50it/s] 47it [00:05, 9.48it/s] 48it [00:05, 9.47it/s] 49it [00:05, 9.47it/s] 50it [00:05, 9.46it/s]2025-05-26 05:04:50,395 - INFO - [Epoch 063 | Batch 0050] IWAE-loss 4688.5366 | mean log_px -0.0212 | KL -3273.02 + 51it [00:05, 9.51it/s] 52it [00:05, 9.51it/s] 53it [00:05, 9.53it/s] 54it [00:05, 9.53it/s] 55it [00:05, 9.53it/s] 56it [00:06, 9.52it/s] 57it [00:06, 9.58it/s] 58it [00:06, 9.13it/s] 59it [00:06, 9.29it/s] 60it [00:06, 9.34it/s] 61it [00:06, 9.42it/s] 62it [00:06, 9.46it/s] 63it [00:06, 9.49it/s] 64it [00:06, 9.50it/s] 65it [00:07, 9.50it/s] 66it [00:07, 9.52it/s] 67it [00:07, 9.51it/s] 68it [00:07, 9.52it/s] 69it [00:07, 9.10it/s] 70it [00:07, 9.22it/s] 71it [00:07, 9.31it/s] 72it [00:07, 9.36it/s] 73it [00:07, 9.38it/s] 74it [00:07, 9.39it/s] 75it [00:08, 9.41it/s] 76it [00:08, 9.46it/s] 77it [00:08, 9.49it/s] 78it [00:08, 9.47it/s] 79it [00:08, 9.55it/s] 80it [00:08, 9.60it/s] 81it [00:08, 9.15it/s] 82it [00:08, 9.30it/s] 83it [00:08, 9.38it/s] 84it [00:09, 8.90it/s] 85it [00:09, 9.05it/s] 86it [00:09, 9.17it/s] 87it [00:09, 9.29it/s] 88it [00:09, 9.36it/s] 89it [00:09, 9.38it/s] 90it [00:09, 9.42it/s] 91it [00:09, 9.45it/s] 92it [00:09, 9.49it/s] 93it [00:09, 9.54it/s] 94it [00:10, 9.53it/s] 95it [00:10, 9.54it/s] 96it [00:10, 9.55it/s] 97it [00:10, 9.01it/s] 98it [00:10, 9.15it/s] 99it [00:10, 9.23it/s] 100it [00:10, 9.29it/s]2025-05-26 05:04:55,728 - INFO - [Epoch 063 | Batch 0100] IWAE-loss 4749.5503 | mean log_px -0.0224 | KL -3273.87 + 101it [00:10, 9.35it/s] 102it [00:10, 9.39it/s] 103it [00:11, 9.42it/s] 104it [00:11, 9.46it/s] 105it [00:11, 9.49it/s] 106it [00:11, 9.50it/s] 107it [00:11, 9.52it/s] 108it [00:11, 9.49it/s] 109it [00:11, 8.97it/s] 110it [00:11, 9.09it/s] 111it [00:11, 9.13it/s] 112it [00:12, 9.27it/s] 113it [00:12, 9.30it/s] 114it [00:12, 8.96it/s] 115it [00:12, 9.12it/s] 116it [00:12, 9.23it/s] 117it [00:12, 9.32it/s] 118it [00:12, 9.39it/s] 119it [00:12, 9.45it/s] 120it [00:12, 9.48it/s] 121it [00:12, 9.54it/s] 122it [00:13, 9.57it/s] 123it [00:13, 9.52it/s] 124it [00:13, 8.92it/s] 125it [00:13, 9.10it/s] 126it [00:13, 9.22it/s] 127it [00:13, 9.31it/s] 128it [00:13, 9.39it/s] 129it [00:13, 9.44it/s] 130it [00:13, 9.04it/s] 131it [00:14, 9.16it/s] 132it [00:14, 9.31it/s] 133it [00:14, 9.44it/s] 134it [00:14, 9.44it/s] 135it [00:14, 9.46it/s] 136it [00:14, 9.47it/s] 137it [00:14, 9.47it/s] 138it [00:14, 9.55it/s] 139it [00:14, 9.53it/s] 140it [00:15, 9.58it/s] 141it [00:15, 9.59it/s] 142it [00:15, 9.59it/s] 143it [00:15, 9.64it/s] 144it [00:15, 9.60it/s] 145it [00:15, 9.60it/s] 146it [00:15, 9.58it/s] 147it [00:15, 9.60it/s] 148it [00:15, 9.54it/s] 149it [00:15, 9.55it/s] 150it [00:16, 9.54it/s]2025-05-26 05:05:01,047 - INFO - [Epoch 063 | Batch 0150] IWAE-loss 3977.1768 | mean log_px -0.0134 | KL -3273.26 + 151it [00:16, 9.50it/s] 152it [00:16, 9.50it/s] 153it [00:16, 9.49it/s] 154it [00:16, 9.43it/s] 155it [00:16, 8.92it/s] 156it [00:16, 8.94it/s] 157it [00:16, 9.11it/s] 158it [00:16, 9.26it/s] 159it [00:17, 8.85it/s] 160it [00:17, 8.99it/s] 161it [00:17, 9.15it/s] 162it [00:17, 9.14it/s] 163it [00:17, 8.60it/s] 164it [00:17, 8.74it/s] 165it [00:17, 8.97it/s] 166it [00:17, 9.11it/s] 167it [00:17, 8.76it/s] 168it [00:18, 8.95it/s] 169it [00:18, 9.13it/s] 170it [00:18, 9.22it/s] 171it [00:18, 8.82it/s] 172it [00:18, 9.05it/s] 173it [00:18, 9.17it/s] 174it [00:18, 9.26it/s] 175it [00:18, 8.82it/s] 176it [00:18, 8.97it/s] 177it [00:19, 9.10it/s] 178it [00:19, 9.22it/s] 179it [00:19, 8.82it/s] 180it [00:19, 9.06it/s] 181it [00:19, 9.23it/s] 182it [00:19, 9.34it/s] 183it [00:19, 8.85it/s] 184it [00:19, 9.02it/s] 185it [00:19, 9.03it/s] 186it [00:20, 9.15it/s] 187it [00:20, 9.28it/s] 188it [00:20, 8.86it/s] 189it [00:20, 9.05it/s] 190it [00:20, 9.20it/s] 191it [00:20, 9.31it/s] 192it [00:20, 8.90it/s] 193it [00:20, 9.13it/s] 194it [00:20, 9.20it/s] 195it [00:21, 8.75it/s] 196it [00:21, 8.64it/s] 196it [00:21, 9.23it/s] +2025-05-26 05:05:06,147 - INFO - Epoch: 63, Objective: tensor([5113.3408], device='cuda:0', grad_fn=), Loss: 0.03467189148068428, KL/n: 66.71068572998047 + 0it [00:00, ?it/s]2025-05-26 05:05:06,422 - INFO - [Epoch 064 | Batch 0000] IWAE-loss 4048.0391 | mean log_px -0.0111 | KL -3268.86 + 1it [00:00, 5.24it/s] 2it [00:00, 7.13it/s] 3it [00:00, 8.01it/s] 4it [00:00, 8.49it/s] 5it [00:00, 8.82it/s] 6it [00:00, 9.07it/s] 7it [00:00, 8.67it/s] 8it [00:00, 8.97it/s] 9it [00:01, 9.10it/s] 10it [00:01, 9.27it/s] 11it [00:01, 9.40it/s] 12it [00:01, 9.46it/s] 13it [00:01, 9.53it/s] 14it [00:01, 9.53it/s] 15it [00:01, 9.53it/s] 16it [00:01, 9.47it/s] 17it [00:01, 9.51it/s] 18it [00:01, 9.56it/s] 19it [00:02, 9.54it/s] 20it [00:02, 9.56it/s] 21it [00:02, 9.56it/s] 22it [00:02, 9.57it/s] 23it [00:02, 9.59it/s] 24it [00:02, 9.58it/s] 25it [00:02, 9.60it/s] 26it [00:02, 9.60it/s] 27it [00:02, 9.57it/s] 28it [00:03, 9.56it/s] 29it [00:03, 9.57it/s] 30it [00:03, 9.58it/s] 31it [00:03, 9.54it/s] 32it [00:03, 9.37it/s] 33it [00:03, 9.49it/s] 34it [00:03, 9.48it/s] 35it [00:03, 9.44it/s] 36it [00:03, 9.39it/s] 37it [00:03, 9.38it/s] 38it [00:04, 9.34it/s] 39it [00:04, 9.33it/s] 40it [00:04, 9.41it/s] 41it [00:04, 9.43it/s] 42it [00:04, 9.47it/s] 43it [00:04, 9.56it/s] 44it [00:04, 9.59it/s] 45it [00:04, 9.61it/s] 46it [00:04, 9.59it/s] 47it [00:05, 9.49it/s] 48it [00:05, 9.55it/s] 49it [00:05, 9.62it/s] 50it [00:05, 9.59it/s]2025-05-26 05:05:11,692 - INFO - [Epoch 064 | Batch 0050] IWAE-loss 4078.9944 | mean log_px -0.0116 | KL -3263.32 + 51it [00:05, 6.25it/s] 52it [00:05, 6.97it/s] 53it [00:05, 7.58it/s] 54it [00:05, 8.07it/s] 55it [00:06, 8.38it/s] 56it [00:06, 8.56it/s] 57it [00:06, 8.62it/s] 58it [00:06, 8.80it/s] 59it [00:06, 8.97it/s] 60it [00:06, 9.11it/s] 61it [00:06, 9.21it/s] 62it [00:06, 9.29it/s] 63it [00:06, 9.40it/s] 64it [00:07, 9.39it/s] 65it [00:07, 9.39it/s] 66it [00:07, 9.38it/s] 67it [00:07, 9.39it/s] 68it [00:07, 9.44it/s] 69it [00:07, 9.46it/s] 70it [00:07, 9.49it/s] 71it [00:07, 9.48it/s] 72it [00:07, 9.49it/s] 73it [00:07, 9.49it/s] 74it [00:08, 9.52it/s] 75it [00:08, 9.52it/s] 76it [00:08, 9.51it/s] 77it [00:08, 9.57it/s] 78it [00:08, 9.60it/s] 79it [00:08, 9.59it/s] 80it [00:08, 9.58it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.53it/s] 83it [00:09, 9.53it/s] 84it [00:09, 9.50it/s] 85it [00:09, 9.49it/s] 86it [00:09, 9.51it/s] 87it [00:09, 8.99it/s] 88it [00:09, 9.15it/s] 89it [00:09, 9.26it/s] 90it [00:09, 9.33it/s] 91it [00:09, 9.41it/s] 92it [00:09, 9.46it/s] 93it [00:10, 9.48it/s] 94it [00:10, 9.49it/s] 95it [00:10, 9.51it/s] 96it [00:10, 9.51it/s] 97it [00:10, 9.54it/s] 98it [00:10, 9.51it/s] 99it [00:10, 9.52it/s] 100it [00:10, 9.55it/s]2025-05-26 05:05:17,172 - INFO - [Epoch 064 | Batch 0100] IWAE-loss 4177.9673 | mean log_px -0.0192 | KL -3262.71 + 101it [00:10, 9.57it/s] 102it [00:11, 9.57it/s] 103it [00:11, 9.56it/s] 104it [00:11, 9.56it/s] 105it [00:11, 9.59it/s] 106it [00:11, 9.57it/s] 107it [00:11, 9.59it/s] 108it [00:11, 9.56it/s] 109it [00:11, 9.54it/s] 110it [00:11, 9.54it/s] 111it [00:11, 9.56it/s] 112it [00:12, 9.56it/s] 113it [00:12, 9.58it/s] 114it [00:12, 9.51it/s] 115it [00:12, 9.52it/s] 116it [00:12, 9.54it/s] 117it [00:12, 9.56it/s] 118it [00:12, 9.54it/s] 119it [00:12, 9.56it/s] 120it [00:12, 9.60it/s] 121it [00:13, 9.53it/s] 122it [00:13, 9.53it/s] 123it [00:13, 9.48it/s] 124it [00:13, 9.53it/s] 125it [00:13, 9.56it/s] 126it [00:13, 9.55it/s] 127it [00:13, 9.54it/s] 128it [00:13, 9.56it/s] 129it [00:13, 9.55it/s] 130it [00:13, 9.54it/s] 131it [00:14, 9.53it/s] 132it [00:14, 9.50it/s] 133it [00:14, 9.54it/s] 134it [00:14, 9.56it/s] 135it [00:14, 9.56it/s] 136it [00:14, 9.49it/s] 137it [00:14, 9.51it/s] 138it [00:14, 9.50it/s] 139it [00:14, 9.49it/s] 140it [00:15, 9.48it/s] 141it [00:15, 9.51it/s] 142it [00:15, 9.54it/s] 143it [00:15, 9.54it/s] 144it [00:15, 9.50it/s] 145it [00:15, 9.53it/s] 146it [00:15, 9.50it/s] 147it [00:15, 9.56it/s] 148it [00:15, 9.60it/s] 149it [00:15, 9.59it/s] 150it [00:16, 9.58it/s]2025-05-26 05:05:22,411 - INFO - [Epoch 064 | Batch 0150] IWAE-loss 4131.0303 | mean log_px -0.0125 | KL -3256.42 + 151it [00:16, 9.61it/s] 152it [00:16, 9.59it/s] 153it [00:16, 9.57it/s] 154it [00:16, 9.57it/s] 155it [00:16, 9.16it/s] 156it [00:16, 9.25it/s] 157it [00:16, 9.33it/s] 158it [00:16, 9.37it/s] 159it [00:17, 9.44it/s] 160it [00:17, 9.48it/s] 161it [00:17, 9.50it/s] 162it [00:17, 9.53it/s] 163it [00:17, 9.58it/s] 164it [00:17, 9.53it/s] 165it [00:17, 9.58it/s] 166it [00:17, 9.57it/s] 167it [00:17, 9.62it/s] 168it [00:17, 9.56it/s] 169it [00:18, 9.51it/s] 170it [00:18, 9.55it/s] 171it [00:18, 9.54it/s] 172it [00:18, 9.54it/s] 173it [00:18, 9.50it/s] 174it [00:18, 9.50it/s] 175it [00:18, 9.53it/s] 176it [00:18, 9.53it/s] 177it [00:18, 9.53it/s] 178it [00:19, 9.54it/s] 179it [00:19, 9.53it/s] 180it [00:19, 9.56it/s] 181it [00:19, 9.58it/s] 182it [00:19, 9.04it/s] 183it [00:19, 9.15it/s] 184it [00:19, 9.29it/s] 185it [00:19, 9.38it/s] 186it [00:19, 9.42it/s] 187it [00:19, 9.48it/s] 188it [00:20, 9.45it/s] 189it [00:20, 9.45it/s] 190it [00:20, 9.51it/s] 191it [00:20, 9.47it/s] 192it [00:20, 9.49it/s] 193it [00:20, 9.49it/s] 194it [00:20, 9.48it/s] 195it [00:20, 8.38it/s] 196it [00:20, 8.74it/s] 196it [00:21, 9.32it/s] +2025-05-26 05:05:27,300 - INFO - Epoch: 64, Objective: tensor([4486.4854], device='cuda:0', grad_fn=), Loss: 0.017137622460722923, KL/n: 66.45817565917969 + 0it [00:00, ?it/s]2025-05-26 05:05:27,579 - INFO - [Epoch 065 | Batch 0000] IWAE-loss 4915.1265 | mean log_px -0.0304 | KL -3253.02 + 1it [00:00, 5.30it/s] 2it [00:00, 6.71it/s] 3it [00:00, 7.76it/s] 4it [00:00, 8.36it/s] 5it [00:00, 8.71it/s] 6it [00:00, 8.97it/s] 7it [00:00, 9.16it/s] 8it [00:00, 9.27it/s] 9it [00:01, 9.35it/s] 10it [00:01, 9.41it/s] 11it [00:01, 9.45it/s] 12it [00:01, 8.93it/s] 13it [00:01, 9.10it/s] 14it [00:01, 9.23it/s] 15it [00:01, 9.31it/s] 16it [00:01, 9.35it/s] 17it [00:01, 9.40it/s] 18it [00:02, 9.39it/s] 19it [00:02, 9.45it/s] 20it [00:02, 9.50it/s] 21it [00:02, 9.51it/s] 22it [00:02, 9.51it/s] 23it [00:02, 9.52it/s] 24it [00:02, 9.55it/s] 25it [00:02, 9.57it/s] 26it [00:02, 9.61it/s] 27it [00:02, 9.57it/s] 28it [00:03, 9.57it/s] 29it [00:03, 9.54it/s] 30it [00:03, 9.51it/s] 31it [00:03, 8.96it/s] 32it [00:03, 9.09it/s] 33it [00:03, 9.22it/s] 34it [00:03, 9.36it/s] 35it [00:03, 9.44it/s] 36it [00:03, 9.46it/s] 37it [00:04, 9.50it/s] 38it [00:04, 9.51it/s] 39it [00:04, 8.97it/s] 40it [00:04, 9.11it/s] 41it [00:04, 9.23it/s] 42it [00:04, 9.32it/s] 43it [00:04, 9.39it/s] 44it [00:04, 9.46it/s] 45it [00:04, 9.47it/s] 46it [00:04, 9.43it/s] 47it [00:05, 9.46it/s] 48it [00:05, 9.45it/s] 49it [00:05, 9.48it/s] 50it [00:05, 9.46it/s]2025-05-26 05:05:32,909 - INFO - [Epoch 065 | Batch 0050] IWAE-loss 4041.6321 | mean log_px -0.0125 | KL -3247.29 + 51it [00:05, 9.43it/s] 52it [00:05, 9.47it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.48it/s] 55it [00:05, 9.53it/s] 56it [00:06, 9.58it/s] 57it [00:06, 9.57it/s] 58it [00:06, 9.13it/s] 59it [00:06, 9.24it/s] 60it [00:06, 9.33it/s] 61it [00:06, 9.40it/s] 62it [00:06, 9.03it/s] 63it [00:06, 9.23it/s] 64it [00:06, 9.28it/s] 65it [00:07, 9.37it/s] 66it [00:07, 9.39it/s] 67it [00:07, 9.39it/s] 68it [00:07, 9.45it/s] 69it [00:07, 9.53it/s] 70it [00:07, 9.54it/s] 71it [00:07, 9.61it/s] 72it [00:07, 9.61it/s] 73it [00:07, 9.66it/s] 74it [00:07, 9.66it/s] 75it [00:08, 9.68it/s] 76it [00:08, 9.19it/s] 77it [00:08, 9.28it/s] 78it [00:08, 9.33it/s] 79it [00:08, 9.40it/s] 80it [00:08, 9.03it/s] 81it [00:08, 9.16it/s] 82it [00:08, 9.25it/s] 83it [00:08, 8.89it/s] 84it [00:09, 9.08it/s] 85it [00:09, 9.22it/s] 86it [00:09, 9.30it/s] 87it [00:09, 9.44it/s] 88it [00:09, 9.01it/s] 89it [00:09, 9.15it/s] 90it [00:09, 9.24it/s] 91it [00:09, 9.35it/s] 92it [00:09, 9.40it/s] 93it [00:10, 9.03it/s] 94it [00:10, 9.18it/s] 95it [00:10, 9.30it/s] 96it [00:10, 9.38it/s] 97it [00:10, 9.46it/s] 98it [00:10, 9.52it/s] 99it [00:10, 8.99it/s] 100it [00:10, 9.11it/s]2025-05-26 05:05:38,278 - INFO - [Epoch 065 | Batch 0100] IWAE-loss 4149.1934 | mean log_px -0.0150 | KL -3245.47 + 101it [00:10, 9.23it/s] 102it [00:10, 9.32it/s] 103it [00:11, 9.38it/s] 104it [00:11, 9.42it/s] 105it [00:11, 9.48it/s] 106it [00:11, 9.08it/s] 107it [00:11, 9.20it/s] 108it [00:11, 9.33it/s] 109it [00:11, 9.37it/s] 110it [00:11, 9.44it/s] 111it [00:11, 9.46it/s] 112it [00:12, 9.40it/s] 113it [00:12, 9.46it/s] 114it [00:12, 9.07it/s] 115it [00:12, 9.26it/s] 116it [00:12, 9.34it/s] 117it [00:12, 9.42it/s] 118it [00:12, 9.44it/s] 119it [00:12, 9.06it/s] 120it [00:12, 9.19it/s] 121it [00:13, 9.26it/s] 122it [00:13, 9.35it/s] 123it [00:13, 8.99it/s] 124it [00:13, 9.19it/s] 125it [00:13, 9.30it/s] 126it [00:13, 9.41it/s] 127it [00:13, 9.44it/s] 128it [00:13, 9.52it/s] 129it [00:13, 9.55it/s] 130it [00:13, 9.53it/s] 131it [00:14, 9.55it/s] 132it [00:14, 9.57it/s] 133it [00:14, 9.15it/s] 134it [00:14, 9.21it/s] 135it [00:14, 8.87it/s] 136it [00:14, 9.07it/s] 137it [00:14, 9.23it/s] 138it [00:14, 8.90it/s] 139it [00:14, 9.08it/s] 140it [00:15, 9.24it/s] 141it [00:15, 8.90it/s] 142it [00:15, 9.10it/s] 143it [00:15, 9.25it/s] 144it [00:15, 9.34it/s] 145it [00:15, 9.38it/s] 146it [00:15, 9.41it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.44it/s] 149it [00:16, 9.03it/s] 150it [00:16, 9.16it/s]2025-05-26 05:05:43,663 - INFO - [Epoch 065 | Batch 0150] IWAE-loss 5137.2002 | mean log_px -0.0301 | KL -3244.56 + 151it [00:16, 9.23it/s] 152it [00:16, 8.67it/s] 153it [00:16, 8.72it/s] 154it [00:16, 8.83it/s] 155it [00:16, 9.07it/s] 156it [00:16, 9.23it/s] 157it [00:16, 9.34it/s] 158it [00:17, 8.98it/s] 159it [00:17, 9.17it/s] 160it [00:17, 9.25it/s] 161it [00:17, 9.38it/s] 162it [00:17, 9.47it/s] 163it [00:17, 9.52it/s] 164it [00:17, 9.57it/s] 165it [00:17, 9.55it/s] 166it [00:17, 9.52it/s] 167it [00:17, 9.55it/s] 168it [00:18, 9.54it/s] 169it [00:18, 9.55it/s] 170it [00:18, 9.54it/s] 171it [00:18, 9.59it/s] 172it [00:18, 9.63it/s] 173it [00:18, 9.59it/s] 174it [00:18, 9.56it/s] 175it [00:18, 9.56it/s] 176it [00:18, 9.02it/s] 177it [00:19, 9.18it/s] 178it [00:19, 9.29it/s] 179it [00:19, 9.37it/s] 180it [00:19, 9.40it/s] 181it [00:19, 8.75it/s] 182it [00:19, 8.75it/s] 183it [00:19, 8.93it/s] 184it [00:19, 9.08it/s] 185it [00:19, 9.21it/s] 186it [00:20, 9.33it/s] 187it [00:20, 9.35it/s] 188it [00:20, 8.88it/s] 189it [00:20, 9.04it/s] 190it [00:20, 9.22it/s] 191it [00:20, 9.31it/s] 192it [00:20, 9.21it/s] 193it [00:20, 9.25it/s] 194it [00:20, 9.24it/s] 195it [00:21, 8.71it/s] 196it [00:21, 8.97it/s] 196it [00:21, 9.24it/s] +2025-05-26 05:05:48,646 - INFO - Epoch: 65, Objective: tensor([4243.4243], device='cuda:0', grad_fn=), Loss: 0.016095492988824844, KL/n: 66.21897888183594 + 0it [00:00, ?it/s]2025-05-26 05:05:48,917 - INFO - [Epoch 066 | Batch 0000] IWAE-loss 4330.0098 | mean log_px -0.0173 | KL -3242.21 + 1it [00:00, 4.73it/s] 2it [00:00, 6.75it/s] 3it [00:00, 7.82it/s] 4it [00:00, 8.37it/s] 5it [00:00, 8.76it/s] 6it [00:00, 8.97it/s] 7it [00:00, 9.16it/s] 8it [00:00, 9.25it/s] 9it [00:01, 9.30it/s] 10it [00:01, 9.32it/s] 11it [00:01, 9.37it/s] 12it [00:01, 8.89it/s] 13it [00:01, 9.11it/s] 14it [00:01, 9.25it/s] 15it [00:01, 9.37it/s] 16it [00:01, 9.44it/s] 17it [00:01, 9.47it/s] 18it [00:02, 9.52it/s] 19it [00:02, 9.52it/s] 20it [00:02, 9.55it/s] 21it [00:02, 9.59it/s] 22it [00:02, 9.22it/s] 23it [00:02, 9.32it/s] 24it [00:02, 9.36it/s] 25it [00:02, 9.40it/s] 26it [00:02, 9.37it/s] 27it [00:02, 9.42it/s] 28it [00:03, 9.42it/s] 29it [00:03, 9.44it/s] 30it [00:03, 9.12it/s] 31it [00:03, 9.24it/s] 32it [00:03, 9.30it/s] 33it [00:03, 9.33it/s] 34it [00:03, 9.36it/s] 35it [00:03, 9.36it/s] 36it [00:03, 9.38it/s] 37it [00:04, 9.43it/s] 38it [00:04, 8.90it/s] 39it [00:04, 9.09it/s] 40it [00:04, 9.20it/s] 41it [00:04, 9.27it/s] 42it [00:04, 9.34it/s] 43it [00:04, 9.37it/s] 44it [00:04, 9.41it/s] 45it [00:04, 9.44it/s] 46it [00:05, 9.33it/s] 47it [00:05, 9.39it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.52it/s] 50it [00:05, 9.48it/s]2025-05-26 05:05:54,276 - INFO - [Epoch 066 | Batch 0050] IWAE-loss 5074.5923 | mean log_px -0.0331 | KL -3240.32 + 51it [00:05, 9.48it/s] 52it [00:05, 9.53it/s] 53it [00:05, 9.50it/s] 54it [00:05, 9.47it/s] 55it [00:05, 9.12it/s] 56it [00:06, 9.22it/s] 57it [00:06, 9.29it/s] 58it [00:06, 9.35it/s] 59it [00:06, 9.39it/s] 60it [00:06, 9.04it/s] 61it [00:06, 9.17it/s] 62it [00:06, 9.26it/s] 63it [00:06, 9.33it/s] 64it [00:06, 9.39it/s] 65it [00:07, 9.42it/s] 66it [00:07, 9.42it/s] 67it [00:07, 9.46it/s] 68it [00:07, 6.22it/s] 69it [00:07, 6.92it/s] 70it [00:07, 7.52it/s] 71it [00:07, 8.03it/s] 72it [00:07, 8.40it/s] 73it [00:08, 8.42it/s] 74it [00:08, 8.71it/s] 75it [00:08, 8.95it/s] 76it [00:08, 9.09it/s] 77it [00:08, 9.22it/s] 78it [00:08, 9.29it/s] 79it [00:08, 9.37it/s] 80it [00:08, 9.37it/s] 81it [00:08, 9.45it/s] 82it [00:09, 9.45it/s] 83it [00:09, 9.49it/s] 84it [00:09, 9.46it/s] 85it [00:09, 9.47it/s] 86it [00:09, 9.49it/s] 87it [00:09, 9.48it/s] 88it [00:09, 9.44it/s] 89it [00:09, 9.46it/s] 90it [00:09, 9.45it/s] 91it [00:09, 9.45it/s] 92it [00:10, 9.37it/s] 93it [00:10, 9.36it/s] 94it [00:10, 9.07it/s] 95it [00:10, 9.20it/s] 96it [00:10, 9.29it/s] 97it [00:10, 9.34it/s] 98it [00:10, 9.37it/s] 99it [00:10, 9.41it/s] 100it [00:10, 9.39it/s]2025-05-26 05:05:59,794 - INFO - [Epoch 066 | Batch 0100] IWAE-loss 4414.3447 | mean log_px -0.0179 | KL -3239.95 + 101it [00:11, 9.45it/s] 102it [00:11, 9.45it/s] 103it [00:11, 9.48it/s] 104it [00:11, 9.47it/s] 105it [00:11, 9.49it/s] 106it [00:11, 9.49it/s] 107it [00:11, 9.47it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.46it/s] 110it [00:12, 9.46it/s] 111it [00:12, 9.47it/s] 112it [00:12, 9.48it/s] 113it [00:12, 9.51it/s] 114it [00:12, 9.50it/s] 115it [00:12, 9.19it/s] 116it [00:12, 9.31it/s] 117it [00:12, 9.37it/s] 118it [00:12, 9.38it/s] 119it [00:12, 9.32it/s] 120it [00:13, 9.37it/s] 121it [00:13, 9.39it/s] 122it [00:13, 9.45it/s] 123it [00:13, 9.42it/s] 124it [00:13, 9.41it/s] 125it [00:13, 9.41it/s] 126it [00:13, 9.38it/s] 127it [00:13, 9.42it/s] 128it [00:13, 9.46it/s] 129it [00:14, 9.46it/s] 130it [00:14, 9.46it/s] 131it [00:14, 9.44it/s] 132it [00:14, 9.44it/s] 133it [00:14, 9.44it/s] 134it [00:14, 9.42it/s] 135it [00:14, 9.52it/s] 136it [00:14, 9.40it/s] 137it [00:14, 9.32it/s] 138it [00:14, 9.12it/s] 139it [00:15, 8.96it/s] 140it [00:15, 9.10it/s] 141it [00:15, 9.22it/s] 142it [00:15, 9.30it/s] 143it [00:15, 9.36it/s] 144it [00:15, 9.43it/s] 145it [00:15, 9.44it/s] 146it [00:15, 9.44it/s] 147it [00:15, 9.47it/s] 148it [00:16, 9.43it/s] 149it [00:16, 9.44it/s] 150it [00:16, 9.39it/s]2025-05-26 05:06:05,121 - INFO - [Epoch 066 | Batch 0150] IWAE-loss 4754.2173 | mean log_px -0.0265 | KL -3233.78 + 151it [00:16, 9.30it/s] 152it [00:16, 9.39it/s] 153it [00:16, 9.53it/s] 154it [00:16, 9.57it/s] 155it [00:16, 9.62it/s] 156it [00:16, 9.61it/s] 157it [00:17, 9.60it/s] 158it [00:17, 9.53it/s] 159it [00:17, 9.58it/s] 160it [00:17, 9.60it/s] 161it [00:17, 9.62it/s] 162it [00:17, 9.64it/s] 163it [00:17, 9.66it/s] 164it [00:17, 9.67it/s] 165it [00:17, 9.68it/s] 166it [00:17, 9.68it/s] 167it [00:18, 9.69it/s] 168it [00:18, 9.68it/s] 169it [00:18, 9.70it/s] 170it [00:18, 9.68it/s] 171it [00:18, 9.69it/s] 172it [00:18, 9.69it/s] 173it [00:18, 9.77it/s] 174it [00:18, 9.74it/s] 175it [00:18, 9.74it/s] 176it [00:18, 9.72it/s] 177it [00:19, 9.72it/s] 178it [00:19, 9.70it/s] 179it [00:19, 9.71it/s] 180it [00:19, 9.05it/s] 181it [00:19, 9.29it/s] 182it [00:19, 9.46it/s] 183it [00:19, 9.57it/s] 184it [00:19, 9.66it/s] 185it [00:19, 9.70it/s] 186it [00:20, 9.06it/s] 187it [00:20, 9.30it/s] 188it [00:20, 9.46it/s] 189it [00:20, 9.59it/s] 190it [00:20, 9.67it/s] 191it [00:20, 9.74it/s] 192it [00:20, 9.76it/s] 193it [00:20, 9.18it/s] 194it [00:20, 9.35it/s] 195it [00:20, 8.92it/s] 196it [00:21, 9.26it/s] +2025-05-26 05:06:09,936 - INFO - Epoch: 66, Objective: tensor([4165.6123], device='cuda:0', grad_fn=), Loss: 0.015236176550388336, KL/n: 65.961181640625 + 0it [00:00, ?it/s]2025-05-26 05:06:10,217 - INFO - [Epoch 067 | Batch 0000] IWAE-loss 4508.1504 | mean log_px -0.0203 | KL -3233.36 + 1it [00:00, 4.44it/s] 2it [00:00, 6.47it/s] 4it [00:00, 8.32it/s] 5it [00:00, 8.77it/s] 6it [00:00, 9.11it/s] 7it [00:00, 8.75it/s] 8it [00:00, 9.08it/s] 10it [00:01, 9.50it/s] 11it [00:01, 9.60it/s] 13it [00:01, 9.80it/s] 14it [00:01, 9.83it/s] 16it [00:01, 9.91it/s] 17it [00:01, 9.45it/s] 18it [00:01, 9.57it/s] 20it [00:02, 9.74it/s] 21it [00:02, 9.32it/s] 22it [00:02, 9.47it/s] 23it [00:02, 9.60it/s] 24it [00:02, 9.70it/s] 26it [00:02, 9.82it/s] 27it [00:02, 9.86it/s] 29it [00:03, 9.90it/s] 31it [00:03, 9.95it/s] 32it [00:03, 9.95it/s] 34it [00:03, 9.99it/s] 36it [00:03, 10.00it/s] 37it [00:03, 10.00it/s] 38it [00:04, 9.99it/s] 40it [00:04, 10.01it/s] 41it [00:04, 9.43it/s] 42it [00:04, 9.29it/s] 43it [00:04, 9.25it/s] 44it [00:04, 8.84it/s] 45it [00:04, 9.05it/s] 46it [00:04, 9.17it/s] 47it [00:04, 9.23it/s] 48it [00:05, 9.25it/s] 49it [00:05, 9.21it/s] 50it [00:05, 9.18it/s]2025-05-26 05:06:15,455 - INFO - [Epoch 067 | Batch 0050] IWAE-loss 4197.2188 | mean log_px -0.0214 | KL -3226.38 + 51it [00:05, 9.12it/s] 52it [00:05, 9.25it/s] 53it [00:05, 9.32it/s] 54it [00:05, 9.41it/s] 55it [00:05, 9.48it/s] 56it [00:05, 9.51it/s] 57it [00:06, 9.48it/s] 58it [00:06, 9.45it/s] 59it [00:06, 9.47it/s] 60it [00:06, 9.44it/s] 61it [00:06, 9.46it/s] 62it [00:06, 8.93it/s] 63it [00:06, 9.06it/s] 64it [00:06, 9.11it/s] 65it [00:06, 8.56it/s] 66it [00:07, 8.70it/s] 67it [00:07, 8.95it/s] 68it [00:07, 9.13it/s] 69it [00:07, 9.26it/s] 70it [00:07, 9.35it/s] 71it [00:07, 9.42it/s] 72it [00:07, 9.48it/s] 73it [00:07, 9.53it/s] 74it [00:07, 9.55it/s] 75it [00:08, 9.58it/s] 76it [00:08, 9.57it/s] 77it [00:08, 9.58it/s] 78it [00:08, 9.51it/s] 79it [00:08, 9.35it/s] 80it [00:08, 9.42it/s] 81it [00:08, 9.54it/s] 82it [00:08, 9.56it/s] 83it [00:08, 9.64it/s] 84it [00:08, 9.08it/s] 85it [00:09, 9.29it/s] 86it [00:09, 9.43it/s] 87it [00:09, 9.54it/s] 88it [00:09, 9.61it/s] 89it [00:09, 9.66it/s] 90it [00:09, 9.69it/s] 91it [00:09, 9.73it/s] 92it [00:09, 9.73it/s] 93it [00:09, 9.74it/s] 94it [00:10, 9.14it/s] 95it [00:10, 9.31it/s] 96it [00:10, 9.44it/s] 97it [00:10, 9.55it/s] 98it [00:10, 9.61it/s] 99it [00:10, 9.18it/s] 100it [00:10, 9.34it/s]2025-05-26 05:06:20,775 - INFO - [Epoch 067 | Batch 0100] IWAE-loss 4479.0835 | mean log_px -0.0211 | KL -3224.74 + 101it [00:10, 9.44it/s] 102it [00:10, 9.51it/s] 103it [00:10, 9.56it/s] 104it [00:11, 9.56it/s] 105it [00:11, 9.63it/s] 106it [00:11, 9.62it/s] 107it [00:11, 9.68it/s] 108it [00:11, 9.70it/s] 109it [00:11, 9.76it/s] 110it [00:11, 9.76it/s] 111it [00:11, 9.80it/s] 112it [00:11, 9.79it/s] 113it [00:11, 9.72it/s] 114it [00:12, 9.74it/s] 115it [00:12, 9.76it/s] 116it [00:12, 9.14it/s] 117it [00:12, 9.33it/s] 118it [00:12, 9.46it/s] 119it [00:12, 9.55it/s] 120it [00:12, 9.62it/s] 121it [00:12, 9.69it/s] 122it [00:12, 9.72it/s] 123it [00:13, 9.76it/s] 124it [00:13, 9.76it/s] 125it [00:13, 9.79it/s] 126it [00:13, 9.78it/s] 127it [00:13, 9.78it/s] 128it [00:13, 9.77it/s] 129it [00:13, 9.79it/s] 130it [00:13, 9.78it/s] 131it [00:13, 9.78it/s] 132it [00:13, 9.77it/s] 133it [00:14, 9.78it/s] 134it [00:14, 9.78it/s] 135it [00:14, 9.15it/s] 136it [00:14, 9.33it/s] 137it [00:14, 9.44it/s] 138it [00:14, 9.46it/s] 139it [00:14, 9.58it/s] 140it [00:14, 9.57it/s] 141it [00:14, 9.63it/s] 142it [00:15, 9.06it/s] 143it [00:15, 9.29it/s] 144it [00:15, 9.45it/s] 145it [00:15, 9.56it/s] 146it [00:15, 9.63it/s] 147it [00:15, 9.69it/s] 148it [00:15, 9.72it/s] 149it [00:15, 9.74it/s] 150it [00:15, 9.74it/s]2025-05-26 05:06:25,965 - INFO - [Epoch 067 | Batch 0150] IWAE-loss 4168.6562 | mean log_px -0.0179 | KL -3215.23 + 151it [00:15, 9.14it/s] 152it [00:16, 9.29it/s] 153it [00:16, 9.42it/s] 154it [00:16, 9.47it/s] 155it [00:16, 9.53it/s] 156it [00:16, 9.59it/s] 157it [00:16, 9.62it/s] 158it [00:16, 9.53it/s] 159it [00:16, 8.65it/s] 160it [00:16, 8.96it/s] 161it [00:17, 9.24it/s] 162it [00:17, 8.80it/s] 163it [00:17, 9.07it/s] 164it [00:17, 9.31it/s] 165it [00:17, 9.51it/s] 166it [00:17, 9.62it/s] 168it [00:17, 9.43it/s] 169it [00:17, 9.55it/s] 170it [00:17, 9.64it/s] 171it [00:18, 9.71it/s] 172it [00:18, 9.73it/s] 174it [00:18, 9.85it/s] 176it [00:18, 9.56it/s] 178it [00:18, 9.73it/s] 179it [00:18, 9.78it/s] 180it [00:19, 9.83it/s] 181it [00:19, 9.86it/s] 182it [00:19, 9.31it/s] 183it [00:19, 9.44it/s] 185it [00:19, 9.69it/s] 186it [00:19, 9.11it/s] 187it [00:19, 9.26it/s] 188it [00:19, 9.37it/s] 189it [00:19, 9.47it/s] 190it [00:20, 9.58it/s] 191it [00:20, 9.61it/s] 192it [00:20, 9.10it/s] 193it [00:20, 9.32it/s] 194it [00:20, 9.44it/s] 195it [00:20, 9.12it/s] 196it [00:20, 9.43it/s] +2025-05-26 05:06:30,842 - INFO - Epoch: 67, Objective: tensor([4425.1938], device='cuda:0', grad_fn=), Loss: 0.020734276622533798, KL/n: 65.69780731201172 + 0it [00:00, ?it/s]2025-05-26 05:06:31,092 - INFO - [Epoch 068 | Batch 0000] IWAE-loss 4215.6938 | mean log_px -0.0170 | KL -3219.93 + 1it [00:00, 5.32it/s] 2it [00:00, 7.32it/s] 4it [00:00, 8.79it/s] 6it [00:00, 9.33it/s] 7it [00:00, 9.47it/s] 8it [00:00, 9.56it/s] 10it [00:01, 9.24it/s] 11it [00:01, 9.41it/s] 12it [00:01, 9.53it/s] 13it [00:01, 9.63it/s] 14it [00:01, 9.69it/s] 16it [00:01, 9.81it/s] 18it [00:01, 9.89it/s] 19it [00:02, 9.90it/s] 20it [00:02, 9.92it/s] 21it [00:02, 9.90it/s] 22it [00:02, 9.90it/s] 24it [00:02, 9.98it/s] 26it [00:02, 9.99it/s] 27it [00:02, 9.96it/s] 28it [00:02, 9.49it/s] 30it [00:03, 9.70it/s] 31it [00:03, 9.39it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.63it/s] 34it [00:03, 9.71it/s] 35it [00:03, 9.78it/s] 36it [00:03, 9.23it/s] 37it [00:03, 9.25it/s] 38it [00:04, 9.21it/s] 39it [00:04, 8.83it/s] 40it [00:04, 8.91it/s] 41it [00:04, 9.08it/s] 42it [00:04, 9.25it/s] 43it [00:04, 9.44it/s] 44it [00:04, 9.55it/s] 46it [00:04, 9.77it/s] 47it [00:04, 9.79it/s] 48it [00:05, 9.75it/s] 49it [00:05, 9.81it/s]2025-05-26 05:06:36,287 - INFO - [Epoch 068 | Batch 0050] IWAE-loss 4135.7124 | mean log_px -0.0192 | KL -3214.93 + 51it [00:05, 9.45it/s] 53it [00:05, 9.68it/s] 54it [00:05, 9.74it/s] 55it [00:05, 9.74it/s] 56it [00:05, 9.34it/s] 57it [00:05, 9.50it/s] 58it [00:06, 9.61it/s] 60it [00:06, 6.97it/s] 62it [00:06, 7.91it/s] 63it [00:06, 8.28it/s] 64it [00:06, 8.53it/s] 65it [00:06, 8.86it/s] 66it [00:07, 8.73it/s] 68it [00:07, 9.25it/s] 69it [00:07, 9.06it/s] 70it [00:07, 9.02it/s] 72it [00:07, 9.42it/s] 73it [00:07, 9.49it/s] 74it [00:07, 9.57it/s] 76it [00:08, 9.74it/s] 78it [00:08, 9.87it/s] 79it [00:08, 9.89it/s] 80it [00:08, 9.39it/s] 81it [00:08, 9.51it/s] 83it [00:08, 9.70it/s] 84it [00:08, 9.72it/s] 85it [00:09, 9.77it/s] 86it [00:09, 9.74it/s] 87it [00:09, 9.79it/s] 88it [00:09, 9.77it/s] 89it [00:09, 9.84it/s] 90it [00:09, 9.28it/s] 92it [00:09, 9.62it/s] 93it [00:09, 9.70it/s] 94it [00:10, 9.75it/s] 95it [00:10, 9.77it/s] 96it [00:10, 9.74it/s] 98it [00:10, 9.86it/s] 100it [00:10, 9.92it/s]2025-05-26 05:06:41,639 - INFO - [Epoch 068 | Batch 0100] IWAE-loss 4981.6865 | mean log_px -0.0295 | KL -3210.19 + 101it [00:10, 9.92it/s] 103it [00:10, 9.97it/s] 104it [00:11, 9.59it/s] 105it [00:11, 9.66it/s] 106it [00:11, 9.21it/s] 107it [00:11, 9.36it/s] 108it [00:11, 9.50it/s] 109it [00:11, 9.63it/s] 110it [00:11, 9.73it/s] 111it [00:11, 9.79it/s] 112it [00:11, 9.85it/s] 114it [00:12, 9.90it/s] 116it [00:12, 9.94it/s] 117it [00:12, 9.94it/s] 119it [00:12, 9.96it/s] 120it [00:12, 9.60it/s] 122it [00:12, 9.75it/s] 124it [00:13, 9.87it/s] 125it [00:13, 9.90it/s] 127it [00:13, 9.95it/s] 128it [00:13, 9.95it/s] 130it [00:13, 9.95it/s] 132it [00:13, 9.93it/s] 133it [00:13, 9.94it/s] 135it [00:14, 9.98it/s] 136it [00:14, 9.97it/s] 137it [00:14, 9.96it/s] 138it [00:14, 9.94it/s] 140it [00:14, 9.94it/s] 141it [00:14, 9.95it/s] 142it [00:14, 9.94it/s] 143it [00:14, 9.95it/s] 144it [00:15, 9.93it/s] 145it [00:15, 9.94it/s] 146it [00:15, 9.96it/s] 147it [00:15, 9.94it/s] 148it [00:15, 9.94it/s] 149it [00:15, 9.85it/s] 150it [00:15, 9.70it/s]2025-05-26 05:06:46,733 - INFO - [Epoch 068 | Batch 0150] IWAE-loss 3965.0554 | mean log_px -0.0127 | KL -3208.22 + 151it [00:15, 8.84it/s] 152it [00:15, 8.90it/s] 153it [00:16, 8.97it/s] 154it [00:16, 9.00it/s] 155it [00:16, 9.24it/s] 156it [00:16, 9.42it/s] 157it [00:16, 8.98it/s] 158it [00:16, 9.03it/s] 159it [00:16, 9.07it/s] 160it [00:16, 9.00it/s] 161it [00:16, 9.07it/s] 162it [00:17, 9.21it/s] 164it [00:17, 9.56it/s] 166it [00:17, 9.73it/s] 167it [00:17, 9.78it/s] 168it [00:17, 9.82it/s] 170it [00:17, 9.93it/s] 171it [00:17, 9.93it/s] 172it [00:18, 9.94it/s] 173it [00:18, 9.95it/s] 174it [00:18, 9.92it/s] 176it [00:18, 9.52it/s] 178it [00:18, 9.52it/s] 179it [00:18, 9.46it/s] 180it [00:18, 9.50it/s] 182it [00:19, 9.72it/s] 184it [00:19, 9.81it/s] 186it [00:19, 9.88it/s] 188it [00:19, 9.90it/s] 189it [00:19, 9.90it/s] 190it [00:19, 9.91it/s] 192it [00:20, 9.96it/s] 193it [00:20, 9.52it/s] 195it [00:20, 9.42it/s] 196it [00:20, 9.53it/s] +2025-05-26 05:06:51,546 - INFO - Epoch: 68, Objective: tensor([4401.1167], device='cuda:0', grad_fn=), Loss: 0.016813162714242935, KL/n: 65.4537582397461 + 0it [00:00, ?it/s]2025-05-26 05:06:51,818 - INFO - [Epoch 069 | Batch 0000] IWAE-loss 3877.0161 | mean log_px -0.0104 | KL -3203.73 + 1it [00:00, 4.79it/s] 3it [00:00, 7.87it/s] 5it [00:00, 8.91it/s] 6it [00:00, 9.18it/s] 7it [00:00, 9.20it/s] 8it [00:00, 9.18it/s] 10it [00:01, 9.59it/s] 12it [00:01, 9.79it/s] 14it [00:01, 9.89it/s] 16it [00:01, 9.99it/s] 18it [00:01, 10.05it/s] 20it [00:02, 10.10it/s] 22it [00:02, 9.97it/s] 23it [00:02, 9.60it/s] 25it [00:02, 9.77it/s] 27it [00:02, 9.85it/s] 29it [00:03, 9.94it/s] 31it [00:03, 9.99it/s] 33it [00:03, 10.05it/s] 35it [00:03, 9.73it/s] 37it [00:03, 9.85it/s] 39it [00:04, 9.94it/s] 41it [00:04, 9.99it/s] 43it [00:04, 10.04it/s] 45it [00:04, 10.06it/s] 47it [00:04, 10.09it/s] 49it [00:05, 10.09it/s]2025-05-26 05:06:56,861 - INFO - [Epoch 069 | Batch 0050] IWAE-loss 3863.5151 | mean log_px -0.0112 | KL -3199.91 + 51it [00:05, 9.88it/s] 52it [00:05, 9.66it/s] 54it [00:05, 9.80it/s] 55it [00:05, 9.52it/s] 57it [00:05, 9.73it/s] 59it [00:06, 9.87it/s] 61it [00:06, 9.95it/s] 63it [00:06, 10.02it/s] 65it [00:06, 9.70it/s] 67it [00:06, 9.83it/s] 69it [00:07, 9.92it/s] 71it [00:07, 9.99it/s] 73it [00:07, 10.04it/s] 75it [00:07, 10.06it/s] 77it [00:07, 10.09it/s] 79it [00:08, 10.10it/s] 81it [00:08, 10.11it/s] 83it [00:08, 10.12it/s] 85it [00:08, 9.78it/s] 86it [00:08, 9.82it/s] 88it [00:08, 9.92it/s] 90it [00:09, 9.97it/s] 92it [00:09, 10.02it/s] 94it [00:09, 10.05it/s] 96it [00:09, 10.07it/s] 98it [00:09, 10.09it/s] 100it [00:10, 10.11it/s]2025-05-26 05:07:01,895 - INFO - [Epoch 069 | Batch 0100] IWAE-loss 3742.5066 | mean log_px -0.0079 | KL -3197.15 + 102it [00:10, 9.99it/s] 104it [00:10, 10.02it/s] 106it [00:10, 9.69it/s] 108it [00:10, 9.81it/s] 110it [00:11, 9.90it/s] 112it [00:11, 9.97it/s] 114it [00:11, 10.02it/s] 116it [00:11, 10.06it/s] 118it [00:11, 9.73it/s] 120it [00:12, 9.67it/s] 122it [00:12, 9.80it/s] 124it [00:12, 9.89it/s] 126it [00:12, 9.95it/s] 128it [00:12, 10.00it/s] 130it [00:13, 9.69it/s] 132it [00:13, 9.80it/s] 134it [00:13, 9.88it/s] 136it [00:13, 9.95it/s] 138it [00:14, 10.00it/s] 140it [00:14, 10.04it/s] 142it [00:14, 10.07it/s] 144it [00:14, 9.81it/s] 146it [00:14, 9.92it/s] 148it [00:15, 9.99it/s] 150it [00:15, 10.02it/s]2025-05-26 05:07:06,940 - INFO - [Epoch 069 | Batch 0150] IWAE-loss 4124.4932 | mean log_px -0.0141 | KL -3199.10 + 152it [00:15, 10.05it/s] 154it [00:15, 9.73it/s] 156it [00:15, 9.85it/s] 158it [00:16, 9.94it/s] 160it [00:16, 10.01it/s] 162it [00:16, 10.05it/s] 164it [00:16, 9.73it/s] 166it [00:16, 9.85it/s] 168it [00:17, 9.94it/s] 170it [00:17, 9.97it/s] 172it [00:17, 10.01it/s] 174it [00:17, 10.05it/s] 176it [00:17, 10.08it/s] 178it [00:18, 10.09it/s] 180it [00:18, 10.09it/s] 182it [00:18, 10.10it/s] 184it [00:18, 10.09it/s] 186it [00:18, 10.09it/s] 188it [00:19, 10.10it/s] 190it [00:19, 9.84it/s] 192it [00:19, 9.93it/s] 194it [00:19, 9.72it/s] 195it [00:19, 9.49it/s] 196it [00:19, 9.85it/s] +2025-05-26 05:07:11,581 - INFO - Epoch: 69, Objective: tensor([5429.6377], device='cuda:0', grad_fn=), Loss: 0.039554789662361145, KL/n: 65.18160247802734 + 0it [00:00, ?it/s]2025-05-26 05:07:11,880 - INFO - [Epoch 070 | Batch 0000] IWAE-loss 3927.8982 | mean log_px -0.0122 | KL -3190.02 + 1it [00:00, 4.34it/s] 3it [00:00, 7.03it/s] 4it [00:00, 7.82it/s] 6it [00:00, 8.79it/s] 8it [00:00, 9.28it/s] 10it [00:01, 9.52it/s] 12it [00:01, 9.70it/s] 14it [00:01, 9.81it/s] 16it [00:01, 9.90it/s] 18it [00:01, 9.94it/s] 20it [00:02, 9.97it/s] 22it [00:02, 10.00it/s] 24it [00:02, 10.02it/s] 26it [00:02, 10.03it/s] 28it [00:02, 9.71it/s] 29it [00:03, 9.69it/s] 30it [00:03, 9.71it/s] 32it [00:03, 9.81it/s] 33it [00:03, 9.75it/s] 34it [00:03, 9.78it/s] 36it [00:03, 9.45it/s] 37it [00:03, 9.57it/s] 38it [00:04, 9.65it/s] 39it [00:04, 9.74it/s] 41it [00:04, 9.88it/s] 42it [00:04, 9.90it/s] 44it [00:04, 9.96it/s] 45it [00:04, 9.95it/s] 46it [00:04, 9.96it/s] 48it [00:04, 9.99it/s] 50it [00:05, 10.00it/s]2025-05-26 05:07:16,977 - INFO - [Epoch 070 | Batch 0050] IWAE-loss 4088.9717 | mean log_px -0.0128 | KL -3193.53 + 51it [00:05, 7.21it/s] 53it [00:05, 8.06it/s] 54it [00:05, 8.17it/s] 56it [00:05, 8.79it/s] 58it [00:06, 9.19it/s] 59it [00:06, 8.74it/s] 60it [00:06, 8.75it/s] 61it [00:06, 8.94it/s] 62it [00:06, 9.11it/s] 63it [00:06, 8.93it/s] 64it [00:06, 9.19it/s] 66it [00:07, 9.54it/s] 68it [00:07, 9.71it/s] 69it [00:07, 9.76it/s] 70it [00:07, 9.80it/s] 71it [00:07, 9.39it/s] 72it [00:07, 9.49it/s] 74it [00:07, 9.72it/s] 76it [00:08, 9.86it/s] 78it [00:08, 9.93it/s] 80it [00:08, 9.99it/s] 82it [00:08, 10.01it/s] 84it [00:08, 10.02it/s] 86it [00:09, 10.03it/s] 88it [00:09, 10.03it/s] 90it [00:09, 10.03it/s] 92it [00:09, 10.04it/s] 94it [00:09, 10.05it/s] 96it [00:10, 10.05it/s] 98it [00:10, 10.05it/s] 100it [00:10, 10.03it/s]2025-05-26 05:07:22,261 - INFO - [Epoch 070 | Batch 0100] IWAE-loss 4525.4941 | mean log_px -0.0213 | KL -3186.68 + 102it [00:10, 9.63it/s] 103it [00:10, 9.68it/s] 104it [00:10, 9.74it/s] 105it [00:11, 9.79it/s] 106it [00:11, 9.82it/s] 108it [00:11, 9.92it/s] 109it [00:11, 9.92it/s] 110it [00:11, 9.93it/s] 112it [00:11, 9.98it/s] 114it [00:11, 10.01it/s] 115it [00:12, 10.00it/s] 116it [00:12, 10.00it/s] 118it [00:12, 10.02it/s] 120it [00:12, 10.01it/s] 122it [00:12, 9.63it/s] 124it [00:12, 9.76it/s] 126it [00:13, 9.85it/s] 128it [00:13, 9.92it/s] 129it [00:13, 9.91it/s] 131it [00:13, 9.93it/s] 132it [00:13, 9.93it/s] 133it [00:13, 9.58it/s] 134it [00:13, 9.67it/s] 136it [00:14, 9.82it/s] 138it [00:14, 9.91it/s] 140it [00:14, 9.97it/s] 141it [00:14, 9.97it/s] 142it [00:14, 9.92it/s] 143it [00:14, 9.87it/s] 144it [00:14, 9.88it/s] 146it [00:15, 9.49it/s] 148it [00:15, 9.67it/s] 149it [00:15, 9.46it/s] 150it [00:15, 9.55it/s]2025-05-26 05:07:27,368 - INFO - [Epoch 070 | Batch 0150] IWAE-loss 3830.5117 | mean log_px -0.0118 | KL -3191.07 + 151it [00:15, 9.26it/s] 152it [00:15, 9.44it/s] 153it [00:15, 9.58it/s] 155it [00:16, 9.79it/s] 156it [00:16, 9.84it/s] 158it [00:16, 9.92it/s] 160it [00:16, 9.55it/s] 162it [00:16, 9.71it/s] 164it [00:17, 9.83it/s] 166it [00:17, 9.87it/s] 167it [00:17, 9.88it/s] 169it [00:17, 9.94it/s] 171it [00:17, 9.98it/s] 173it [00:17, 10.01it/s] 175it [00:18, 10.02it/s] 177it [00:18, 10.03it/s] 179it [00:18, 10.04it/s] 181it [00:18, 9.68it/s] 182it [00:18, 9.74it/s] 184it [00:19, 9.84it/s] 186it [00:19, 9.91it/s] 188it [00:19, 9.95it/s] 190it [00:19, 9.98it/s] 192it [00:19, 10.00it/s] 194it [00:20, 10.02it/s] 196it [00:20, 9.83it/s] 196it [00:20, 9.65it/s] +2025-05-26 05:07:32,034 - INFO - Epoch: 70, Objective: tensor([4718.2910], device='cuda:0', grad_fn=), Loss: 0.02613232657313347, KL/n: 64.95722961425781 + 0it [00:00, ?it/s]2025-05-26 05:07:32,302 - INFO - [Epoch 071 | Batch 0000] IWAE-loss 4098.5879 | mean log_px -0.0153 | KL -3181.93 + 1it [00:00, 4.72it/s] 2it [00:00, 6.83it/s] 4it [00:00, 8.54it/s] 5it [00:00, 8.43it/s] 6it [00:00, 8.85it/s] 7it [00:00, 9.15it/s] 8it [00:00, 9.37it/s] 9it [00:01, 8.99it/s] 10it [00:01, 9.27it/s] 12it [00:01, 9.62it/s] 13it [00:01, 9.24it/s] 14it [00:01, 9.41it/s] 16it [00:01, 9.68it/s] 17it [00:01, 9.30it/s] 19it [00:02, 9.61it/s] 20it [00:02, 9.25it/s] 22it [00:02, 9.57it/s] 23it [00:02, 9.25it/s] 25it [00:02, 9.56it/s] 26it [00:02, 9.61it/s] 28it [00:03, 9.39it/s] 30it [00:03, 9.63it/s] 32it [00:03, 9.80it/s] 33it [00:03, 9.44it/s] 35it [00:03, 9.66it/s] 37it [00:03, 9.81it/s] 39it [00:04, 9.91it/s] 41it [00:04, 9.97it/s] 43it [00:04, 10.02it/s] 45it [00:04, 10.04it/s] 47it [00:04, 10.06it/s] 49it [00:05, 10.07it/s]2025-05-26 05:07:37,480 - INFO - [Epoch 071 | Batch 0050] IWAE-loss 3795.4751 | mean log_px -0.0104 | KL -3178.03 + 51it [00:05, 10.05it/s] 53it [00:05, 10.06it/s] 55it [00:05, 10.02it/s] 57it [00:05, 10.05it/s] 59it [00:06, 9.95it/s] 61it [00:06, 10.00it/s] 63it [00:06, 10.04it/s] 65it [00:06, 10.06it/s] 67it [00:06, 10.08it/s] 69it [00:07, 9.76it/s] 71it [00:07, 9.86it/s] 72it [00:07, 9.43it/s] 74it [00:07, 9.64it/s] 76it [00:07, 9.80it/s] 77it [00:08, 9.45it/s] 79it [00:08, 9.66it/s] 81it [00:08, 9.44it/s] 83it [00:08, 9.64it/s] 85it [00:08, 9.78it/s] 87it [00:09, 9.88it/s] 89it [00:09, 9.95it/s] 91it [00:09, 10.01it/s] 92it [00:09, 9.99it/s] 94it [00:09, 10.03it/s] 96it [00:09, 10.06it/s] 98it [00:10, 9.77it/s] 99it [00:10, 9.81it/s] 100it [00:10, 9.38it/s]2025-05-26 05:07:42,584 - INFO - [Epoch 071 | Batch 0100] IWAE-loss 3703.3640 | mean log_px -0.0093 | KL -3174.69 + 101it [00:10, 9.52it/s] 103it [00:10, 9.75it/s] 105it [00:10, 9.87it/s] 106it [00:10, 9.89it/s] 108it [00:11, 9.99it/s] 110it [00:11, 10.01it/s] 112it [00:11, 10.04it/s] 114it [00:11, 10.09it/s] 116it [00:11, 10.11it/s] 118it [00:12, 10.12it/s] 120it [00:12, 9.84it/s] 121it [00:12, 9.86it/s] 122it [00:12, 9.85it/s] 123it [00:12, 9.76it/s] 124it [00:12, 9.33it/s] 125it [00:12, 9.43it/s] 126it [00:12, 9.50it/s] 127it [00:13, 9.59it/s] 129it [00:13, 9.82it/s] 131it [00:13, 9.50it/s] 132it [00:13, 9.59it/s] 134it [00:13, 9.77it/s] 136it [00:14, 9.89it/s] 138it [00:14, 9.93it/s] 139it [00:14, 9.57it/s] 140it [00:14, 9.64it/s] 142it [00:14, 9.81it/s] 143it [00:14, 9.39it/s] 145it [00:14, 9.66it/s] 147it [00:15, 9.81it/s] 149it [00:15, 9.90it/s]2025-05-26 05:07:47,669 - INFO - [Epoch 071 | Batch 0150] IWAE-loss 3954.1804 | mean log_px -0.0154 | KL -3167.20 + 151it [00:15, 9.94it/s] 153it [00:15, 9.64it/s] 155it [00:15, 9.79it/s] 156it [00:16, 9.81it/s] 158it [00:16, 9.92it/s] 160it [00:16, 9.99it/s] 162it [00:16, 10.03it/s] 164it [00:16, 9.71it/s] 166it [00:17, 9.82it/s] 167it [00:17, 9.69it/s] 168it [00:17, 9.59it/s] 169it [00:17, 9.60it/s] 171it [00:17, 9.79it/s] 173it [00:17, 9.90it/s] 175it [00:17, 9.94it/s] 177it [00:18, 9.99it/s] 178it [00:18, 9.98it/s] 179it [00:18, 9.92it/s] 181it [00:18, 9.96it/s] 183it [00:18, 9.86it/s] 184it [00:18, 9.82it/s] 185it [00:19, 9.34it/s] 187it [00:19, 9.63it/s] 189it [00:19, 9.80it/s] 191it [00:19, 9.90it/s] 192it [00:19, 9.52it/s] 194it [00:19, 9.73it/s] 195it [00:20, 9.47it/s] 196it [00:20, 9.18it/s] 196it [00:20, 9.68it/s] +2025-05-26 05:07:52,402 - INFO - Epoch: 71, Objective: tensor([4948.8066], device='cuda:0', grad_fn=), Loss: 0.03435065969824791, KL/n: 64.70899200439453 + 0it [00:00, ?it/s]2025-05-26 05:07:52,676 - INFO - [Epoch 072 | Batch 0000] IWAE-loss 4508.8237 | mean log_px -0.0191 | KL -3173.76 + 1it [00:00, 5.60it/s] 2it [00:00, 7.47it/s] 3it [00:00, 7.77it/s] 4it [00:00, 8.49it/s] 5it [00:00, 8.92it/s] 6it [00:00, 9.14it/s] 8it [00:00, 9.55it/s] 9it [00:01, 9.56it/s] 10it [00:01, 9.65it/s] 12it [00:01, 9.82it/s] 13it [00:01, 9.85it/s] 14it [00:01, 9.38it/s] 15it [00:01, 6.45it/s] 16it [00:01, 7.11it/s] 17it [00:02, 7.39it/s] 18it [00:02, 7.95it/s] 19it [00:02, 8.44it/s] 20it [00:02, 8.83it/s] 22it [00:02, 9.34it/s] 23it [00:02, 9.05it/s] 24it [00:02, 9.20it/s] 26it [00:02, 9.52it/s] 27it [00:03, 9.11it/s] 28it [00:03, 9.31it/s] 29it [00:03, 9.45it/s] 30it [00:03, 8.98it/s] 31it [00:03, 9.23it/s] 32it [00:03, 9.38it/s] 34it [00:03, 9.63it/s] 35it [00:03, 9.70it/s] 36it [00:04, 9.76it/s] 37it [00:04, 9.72it/s] 38it [00:04, 9.28it/s] 39it [00:04, 9.43it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.65it/s] 42it [00:04, 9.70it/s] 43it [00:04, 9.73it/s] 45it [00:04, 9.84it/s] 46it [00:05, 9.88it/s] 47it [00:05, 9.88it/s] 49it [00:05, 9.92it/s] 50it [00:05, 9.92it/s]2025-05-26 05:07:58,076 - INFO - [Epoch 072 | Batch 0050] IWAE-loss 4654.4067 | mean log_px -0.0212 | KL -3164.67 + 51it [00:05, 9.88it/s] 52it [00:05, 9.85it/s] 53it [00:05, 9.87it/s] 54it [00:05, 9.87it/s] 56it [00:06, 9.93it/s] 57it [00:06, 9.87it/s] 58it [00:06, 9.84it/s] 59it [00:06, 9.84it/s] 60it [00:06, 9.85it/s] 61it [00:06, 9.87it/s] 62it [00:06, 9.87it/s] 63it [00:06, 9.91it/s] 64it [00:06, 9.88it/s] 65it [00:06, 9.86it/s] 66it [00:07, 9.85it/s] 67it [00:07, 9.87it/s] 68it [00:07, 9.85it/s] 69it [00:07, 9.86it/s] 70it [00:07, 9.83it/s] 71it [00:07, 9.77it/s] 72it [00:07, 9.82it/s] 73it [00:07, 9.80it/s] 74it [00:07, 9.81it/s] 75it [00:08, 9.85it/s] 76it [00:08, 9.83it/s] 77it [00:08, 9.81it/s] 79it [00:08, 9.88it/s] 80it [00:08, 9.85it/s] 81it [00:08, 9.84it/s] 82it [00:08, 9.82it/s] 83it [00:08, 9.80it/s] 85it [00:09, 9.85it/s] 86it [00:09, 9.85it/s] 87it [00:09, 9.87it/s] 88it [00:09, 9.84it/s] 89it [00:09, 9.83it/s] 90it [00:09, 9.86it/s] 91it [00:09, 9.87it/s] 92it [00:09, 9.89it/s] 93it [00:09, 9.87it/s] 94it [00:09, 9.83it/s] 95it [00:10, 9.82it/s] 96it [00:10, 9.74it/s] 97it [00:10, 9.76it/s] 98it [00:10, 9.79it/s] 99it [00:10, 9.80it/s] 100it [00:10, 9.79it/s]2025-05-26 05:08:03,159 - INFO - [Epoch 072 | Batch 0100] IWAE-loss 5721.9814 | mean log_px -0.0405 | KL -3163.68 + 101it [00:10, 9.75it/s] 102it [00:10, 9.75it/s] 103it [00:10, 9.81it/s] 104it [00:10, 9.86it/s] 105it [00:11, 9.89it/s] 106it [00:11, 9.86it/s] 107it [00:11, 9.89it/s] 109it [00:11, 9.96it/s] 110it [00:11, 9.92it/s] 111it [00:11, 9.93it/s] 112it [00:11, 9.85it/s] 113it [00:11, 9.85it/s] 114it [00:11, 9.85it/s] 115it [00:12, 9.80it/s] 116it [00:12, 9.17it/s] 117it [00:12, 9.39it/s] 118it [00:12, 9.54it/s] 119it [00:12, 9.65it/s] 120it [00:12, 9.11it/s] 121it [00:12, 9.34it/s] 122it [00:12, 9.49it/s] 123it [00:12, 9.62it/s] 124it [00:13, 9.69it/s] 125it [00:13, 9.74it/s] 126it [00:13, 9.76it/s] 127it [00:13, 9.80it/s] 128it [00:13, 9.22it/s] 129it [00:13, 9.41it/s] 130it [00:13, 9.54it/s] 131it [00:13, 9.63it/s] 132it [00:13, 9.08it/s] 133it [00:13, 9.33it/s] 134it [00:14, 9.48it/s] 135it [00:14, 9.62it/s] 136it [00:14, 9.72it/s] 137it [00:14, 9.78it/s] 138it [00:14, 9.81it/s] 139it [00:14, 9.83it/s] 140it [00:14, 9.85it/s] 141it [00:14, 9.88it/s] 142it [00:14, 9.88it/s] 143it [00:15, 9.27it/s] 144it [00:15, 9.42it/s] 145it [00:15, 9.57it/s] 146it [00:15, 9.68it/s] 147it [00:15, 9.77it/s] 148it [00:15, 9.83it/s] 149it [00:15, 9.88it/s] 150it [00:15, 9.84it/s]2025-05-26 05:08:08,331 - INFO - [Epoch 072 | Batch 0150] IWAE-loss 4235.5010 | mean log_px -0.0156 | KL -3162.35 + 151it [00:15, 9.36it/s] 152it [00:15, 9.53it/s] 153it [00:16, 9.66it/s] 154it [00:16, 9.76it/s] 155it [00:16, 9.82it/s] 156it [00:16, 9.84it/s] 157it [00:16, 9.87it/s] 158it [00:16, 9.87it/s] 159it [00:16, 9.90it/s] 161it [00:16, 9.96it/s] 162it [00:16, 9.93it/s] 164it [00:17, 9.97it/s] 166it [00:17, 9.98it/s] 167it [00:17, 9.98it/s] 168it [00:17, 9.97it/s] 169it [00:17, 9.95it/s] 170it [00:17, 9.37it/s] 171it [00:17, 9.52it/s] 172it [00:17, 9.63it/s] 173it [00:18, 9.70it/s] 174it [00:18, 9.78it/s] 176it [00:18, 9.89it/s] 177it [00:18, 9.86it/s] 178it [00:18, 9.88it/s] 179it [00:18, 9.90it/s] 180it [00:18, 9.89it/s] 181it [00:18, 9.90it/s] 182it [00:18, 9.90it/s] 183it [00:19, 9.89it/s] 185it [00:19, 9.95it/s] 186it [00:19, 9.40it/s] 187it [00:19, 9.54it/s] 188it [00:19, 9.63it/s] 189it [00:19, 9.65it/s] 190it [00:19, 9.72it/s] 191it [00:19, 9.21it/s] 192it [00:20, 9.40it/s] 193it [00:20, 9.53it/s] 194it [00:20, 9.57it/s] 195it [00:20, 9.23it/s] 196it [00:20, 9.55it/s] +2025-05-26 05:08:13,067 - INFO - Epoch: 72, Objective: tensor([3779.6716], device='cuda:0', grad_fn=), Loss: 0.01213796902447939, KL/n: 64.47173309326172 + 0it [00:00, ?it/s]2025-05-26 05:08:13,365 - INFO - [Epoch 073 | Batch 0000] IWAE-loss 4182.9614 | mean log_px -0.0191 | KL -3160.06 + 1it [00:00, 4.22it/s] 2it [00:00, 6.30it/s] 3it [00:00, 7.57it/s] 4it [00:00, 8.34it/s] 5it [00:00, 8.85it/s] 6it [00:00, 9.11it/s] 8it [00:00, 9.53it/s] 9it [00:01, 9.22it/s] 10it [00:01, 9.39it/s] 12it [00:01, 9.63it/s] 13it [00:01, 9.69it/s] 14it [00:01, 9.74it/s] 15it [00:01, 9.79it/s] 17it [00:01, 9.89it/s] 18it [00:01, 9.91it/s] 19it [00:02, 9.92it/s] 20it [00:02, 9.92it/s] 21it [00:02, 9.90it/s] 22it [00:02, 9.40it/s] 23it [00:02, 9.52it/s] 24it [00:02, 9.65it/s] 26it [00:02, 9.78it/s] 27it [00:02, 9.80it/s] 28it [00:02, 9.84it/s] 30it [00:03, 9.93it/s] 31it [00:03, 9.53it/s] 32it [00:03, 9.62it/s] 33it [00:03, 9.64it/s] 34it [00:03, 9.23it/s] 35it [00:03, 9.39it/s] 36it [00:03, 9.51it/s] 37it [00:03, 9.62it/s] 38it [00:04, 9.72it/s] 39it [00:04, 9.77it/s] 40it [00:04, 9.33it/s] 41it [00:04, 9.48it/s] 42it [00:04, 9.60it/s] 43it [00:04, 9.70it/s] 44it [00:04, 9.76it/s] 45it [00:04, 9.80it/s] 46it [00:04, 9.84it/s] 47it [00:04, 9.32it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.58it/s] 50it [00:05, 9.68it/s]2025-05-26 05:08:18,554 - INFO - [Epoch 073 | Batch 0050] IWAE-loss 4043.1121 | mean log_px -0.0134 | KL -3153.70 + 51it [00:05, 9.08it/s] 52it [00:05, 9.31it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.60it/s] 55it [00:05, 9.70it/s] 56it [00:05, 9.28it/s] 57it [00:06, 9.47it/s] 58it [00:06, 9.51it/s] 59it [00:06, 9.54it/s] 60it [00:06, 9.14it/s] 61it [00:06, 9.38it/s] 62it [00:06, 9.56it/s] 63it [00:06, 9.68it/s] 64it [00:06, 9.21it/s] 65it [00:06, 9.39it/s] 66it [00:06, 9.50it/s] 67it [00:07, 8.98it/s] 68it [00:07, 9.24it/s] 69it [00:07, 9.40it/s] 70it [00:07, 9.40it/s] 72it [00:07, 9.53it/s] 73it [00:07, 9.36it/s] 74it [00:07, 9.32it/s] 75it [00:07, 9.31it/s] 76it [00:08, 9.40it/s] 77it [00:08, 9.49it/s] 78it [00:08, 9.54it/s] 79it [00:08, 9.60it/s] 80it [00:08, 9.64it/s] 81it [00:08, 9.68it/s] 82it [00:08, 9.09it/s] 83it [00:08, 9.28it/s] 84it [00:08, 9.37it/s] 85it [00:09, 9.45it/s] 86it [00:09, 9.55it/s] 87it [00:09, 9.03it/s] 88it [00:09, 9.26it/s] 89it [00:09, 9.45it/s] 90it [00:09, 9.11it/s] 91it [00:09, 9.34it/s] 92it [00:09, 9.50it/s] 93it [00:09, 9.63it/s] 94it [00:09, 9.72it/s] 96it [00:10, 9.86it/s] 97it [00:10, 9.89it/s] 98it [00:10, 9.45it/s] 100it [00:10, 9.67it/s]2025-05-26 05:08:23,853 - INFO - [Epoch 073 | Batch 0100] IWAE-loss 4164.0747 | mean log_px -0.0208 | KL -3156.93 + 101it [00:10, 9.23it/s] 102it [00:10, 9.39it/s] 104it [00:11, 9.65it/s] 105it [00:11, 9.23it/s] 106it [00:11, 9.40it/s] 107it [00:11, 9.51it/s] 108it [00:11, 9.64it/s] 109it [00:11, 9.72it/s] 110it [00:11, 9.31it/s] 112it [00:11, 9.63it/s] 114it [00:12, 9.76it/s] 115it [00:12, 9.70it/s] 116it [00:12, 9.75it/s] 117it [00:12, 9.80it/s] 118it [00:12, 9.83it/s] 119it [00:12, 9.84it/s] 120it [00:12, 9.87it/s] 121it [00:12, 9.90it/s] 122it [00:12, 9.25it/s] 123it [00:12, 9.44it/s] 124it [00:13, 9.54it/s] 125it [00:13, 9.65it/s] 126it [00:13, 9.74it/s] 127it [00:13, 9.75it/s] 128it [00:13, 9.21it/s] 129it [00:13, 9.39it/s] 130it [00:13, 9.47it/s] 131it [00:13, 9.61it/s] 132it [00:13, 9.19it/s] 133it [00:14, 9.38it/s] 134it [00:14, 9.54it/s] 136it [00:14, 9.25it/s] 137it [00:14, 9.42it/s] 138it [00:14, 9.54it/s] 140it [00:14, 9.73it/s] 141it [00:14, 9.79it/s] 142it [00:14, 9.82it/s] 143it [00:15, 9.31it/s] 144it [00:15, 9.47it/s] 145it [00:15, 9.60it/s] 146it [00:15, 9.67it/s] 148it [00:15, 9.80it/s] 149it [00:15, 9.41it/s] 150it [00:15, 9.51it/s]2025-05-26 05:08:29,091 - INFO - [Epoch 073 | Batch 0150] IWAE-loss 4541.8203 | mean log_px -0.0273 | KL -3146.10 + 151it [00:15, 9.53it/s] 152it [00:16, 9.62it/s] 153it [00:16, 9.71it/s] 154it [00:16, 9.16it/s] 155it [00:16, 9.19it/s] 156it [00:16, 9.34it/s] 157it [00:16, 9.51it/s] 158it [00:16, 9.14it/s] 159it [00:16, 9.33it/s] 160it [00:16, 9.50it/s] 161it [00:17, 9.03it/s] 162it [00:17, 9.24it/s] 163it [00:17, 9.43it/s] 164it [00:17, 9.55it/s] 165it [00:17, 9.06it/s] 166it [00:17, 9.30it/s] 168it [00:17, 9.59it/s] 169it [00:17, 9.17it/s] 170it [00:17, 9.32it/s] 172it [00:18, 9.61it/s] 173it [00:18, 9.65it/s] 174it [00:18, 9.31it/s] 175it [00:18, 9.48it/s] 176it [00:18, 9.58it/s] 177it [00:18, 9.66it/s] 178it [00:18, 9.72it/s] 179it [00:18, 9.77it/s] 180it [00:19, 9.35it/s] 181it [00:19, 9.44it/s] 182it [00:19, 9.52it/s] 183it [00:19, 9.62it/s] 184it [00:19, 9.65it/s] 185it [00:19, 9.71it/s] 186it [00:19, 9.71it/s] 187it [00:19, 9.25it/s] 188it [00:19, 9.40it/s] 189it [00:19, 9.51it/s] 190it [00:20, 9.61it/s] 191it [00:20, 9.69it/s] 192it [00:20, 9.24it/s] 194it [00:20, 9.59it/s] 195it [00:20, 9.31it/s] 196it [00:20, 9.12it/s] 196it [00:20, 9.44it/s] +2025-05-26 05:08:33,967 - INFO - Epoch: 73, Objective: tensor([3657.3047], device='cuda:0', grad_fn=), Loss: 0.007871869951486588, KL/n: 64.23025512695312 + 0it [00:00, ?it/s]2025-05-26 05:08:34,245 - INFO - [Epoch 074 | Batch 0000] IWAE-loss 4381.4062 | mean log_px -0.0209 | KL -3141.13 + 1it [00:00, 5.41it/s] 2it [00:00, 7.30it/s] 3it [00:00, 7.77it/s] 4it [00:00, 8.50it/s] 5it [00:00, 8.98it/s] 6it [00:00, 9.30it/s] 8it [00:00, 9.67it/s] 10it [00:01, 9.79it/s] 11it [00:01, 9.42it/s] 12it [00:01, 9.53it/s] 13it [00:01, 9.64it/s] 14it [00:01, 9.69it/s] 15it [00:01, 9.29it/s] 16it [00:01, 9.44it/s] 17it [00:01, 9.55it/s] 18it [00:01, 9.12it/s] 19it [00:02, 9.30it/s] 20it [00:02, 9.45it/s] 21it [00:02, 8.93it/s] 22it [00:02, 9.16it/s] 23it [00:02, 9.33it/s] 24it [00:02, 8.88it/s] 25it [00:02, 9.15it/s] 26it [00:02, 9.33it/s] 27it [00:02, 8.91it/s] 28it [00:03, 9.16it/s] 29it [00:03, 9.39it/s] 30it [00:03, 9.55it/s] 31it [00:03, 9.64it/s] 32it [00:03, 9.23it/s] 33it [00:03, 9.42it/s] 34it [00:03, 9.49it/s] 35it [00:03, 9.05it/s] 36it [00:03, 9.25it/s] 37it [00:04, 9.45it/s] 38it [00:04, 9.58it/s] 39it [00:04, 9.69it/s] 40it [00:04, 9.76it/s] 41it [00:04, 9.79it/s] 42it [00:04, 9.34it/s] 43it [00:04, 9.51it/s] 44it [00:04, 9.63it/s] 45it [00:04, 9.25it/s] 46it [00:04, 9.44it/s] 47it [00:05, 9.60it/s] 48it [00:05, 9.69it/s] 49it [00:05, 6.29it/s] 50it [00:05, 6.78it/s]2025-05-26 05:08:39,735 - INFO - [Epoch 074 | Batch 0050] IWAE-loss 4331.8213 | mean log_px -0.0203 | KL -3145.59 + 51it [00:05, 7.47it/s] 52it [00:05, 8.06it/s] 53it [00:05, 8.16it/s] 54it [00:05, 8.57it/s] 55it [00:06, 8.96it/s] 56it [00:06, 9.19it/s] 57it [00:06, 9.39it/s] 58it [00:06, 9.51it/s] 59it [00:06, 9.63it/s] 60it [00:06, 9.71it/s] 61it [00:06, 9.75it/s] 62it [00:06, 9.29it/s] 63it [00:06, 9.49it/s] 64it [00:07, 9.60it/s] 65it [00:07, 9.68it/s] 66it [00:07, 9.29it/s] 67it [00:07, 9.47it/s] 68it [00:07, 9.56it/s] 69it [00:07, 9.65it/s] 70it [00:07, 9.21it/s] 71it [00:07, 9.41it/s] 72it [00:07, 9.54it/s] 73it [00:07, 9.66it/s] 74it [00:08, 9.25it/s] 75it [00:08, 9.34it/s] 76it [00:08, 9.37it/s] 77it [00:08, 9.41it/s] 78it [00:08, 8.90it/s] 79it [00:08, 9.18it/s] 80it [00:08, 9.36it/s] 81it [00:08, 9.51it/s] 82it [00:08, 9.62it/s] 83it [00:09, 9.08it/s] 84it [00:09, 9.29it/s] 85it [00:09, 9.41it/s] 86it [00:09, 9.55it/s] 87it [00:09, 9.67it/s] 88it [00:09, 9.25it/s] 89it [00:09, 9.43it/s] 90it [00:09, 9.54it/s] 91it [00:09, 9.65it/s] 92it [00:10, 9.26it/s] 93it [00:10, 9.42it/s] 94it [00:10, 9.54it/s] 95it [00:10, 9.62it/s] 96it [00:10, 9.67it/s] 97it [00:10, 9.73it/s] 98it [00:10, 9.30it/s] 99it [00:10, 9.46it/s] 100it [00:10, 9.59it/s]2025-05-26 05:08:45,004 - INFO - [Epoch 074 | Batch 0100] IWAE-loss 3966.7395 | mean log_px -0.0130 | KL -3133.57 + 101it [00:10, 9.08it/s] 102it [00:11, 9.32it/s] 103it [00:11, 9.47it/s] 104it [00:11, 9.61it/s] 105it [00:11, 9.68it/s] 106it [00:11, 9.14it/s] 108it [00:11, 9.50it/s] 109it [00:11, 9.19it/s] 110it [00:11, 9.36it/s] 111it [00:12, 9.52it/s] 112it [00:12, 9.63it/s] 113it [00:12, 9.27it/s] 114it [00:12, 9.43it/s] 115it [00:12, 9.59it/s] 116it [00:12, 9.68it/s] 117it [00:12, 9.26it/s] 118it [00:12, 9.44it/s] 119it [00:12, 9.59it/s] 120it [00:12, 9.67it/s] 121it [00:13, 9.75it/s] 122it [00:13, 9.25it/s] 123it [00:13, 9.44it/s] 124it [00:13, 9.57it/s] 125it [00:13, 9.68it/s] 126it [00:13, 9.74it/s] 127it [00:13, 9.30it/s] 128it [00:13, 9.48it/s] 129it [00:13, 9.55it/s] 130it [00:14, 9.61it/s] 131it [00:14, 9.70it/s] 132it [00:14, 9.13it/s] 133it [00:14, 9.34it/s] 134it [00:14, 9.51it/s] 135it [00:14, 9.62it/s] 136it [00:14, 9.68it/s] 137it [00:14, 9.22it/s] 138it [00:14, 9.43it/s] 139it [00:14, 9.56it/s] 140it [00:15, 9.67it/s] 141it [00:15, 9.25it/s] 142it [00:15, 9.41it/s] 143it [00:15, 9.56it/s] 144it [00:15, 9.63it/s] 145it [00:15, 9.71it/s] 146it [00:15, 9.29it/s] 147it [00:15, 9.43it/s] 148it [00:15, 9.58it/s] 149it [00:16, 9.61it/s] 150it [00:16, 9.19it/s]2025-05-26 05:08:50,296 - INFO - [Epoch 074 | Batch 0150] IWAE-loss 3943.3928 | mean log_px -0.0122 | KL -3135.55 + 151it [00:16, 9.33it/s] 152it [00:16, 9.30it/s] 153it [00:16, 8.99it/s] 154it [00:16, 9.20it/s] 155it [00:16, 9.42it/s] 156it [00:16, 9.55it/s] 157it [00:16, 9.67it/s] 158it [00:16, 9.76it/s] 160it [00:17, 9.86it/s] 161it [00:17, 9.46it/s] 162it [00:17, 9.57it/s] 163it [00:17, 9.66it/s] 164it [00:17, 9.75it/s] 165it [00:17, 9.80it/s] 166it [00:17, 9.80it/s] 167it [00:17, 9.36it/s] 168it [00:18, 9.50it/s] 169it [00:18, 9.64it/s] 170it [00:18, 8.94it/s] 171it [00:18, 8.99it/s] 172it [00:18, 9.12it/s] 173it [00:18, 9.30it/s] 174it [00:18, 9.47it/s] 175it [00:18, 9.62it/s] 176it [00:18, 9.72it/s] 177it [00:18, 9.74it/s] 178it [00:19, 9.76it/s] 179it [00:19, 9.76it/s] 180it [00:19, 9.16it/s] 181it [00:19, 9.38it/s] 182it [00:19, 9.49it/s] 183it [00:19, 9.59it/s] 184it [00:19, 9.65it/s] 185it [00:19, 9.73it/s] 186it [00:19, 9.30it/s] 187it [00:20, 9.47it/s] 188it [00:20, 9.61it/s] 189it [00:20, 9.71it/s] 190it [00:20, 9.79it/s] 191it [00:20, 9.81it/s] 192it [00:20, 9.75it/s] 194it [00:20, 9.87it/s] 195it [00:20, 9.52it/s] 196it [00:20, 9.27it/s] 196it [00:21, 9.32it/s] +2025-05-26 05:08:55,127 - INFO - Epoch: 74, Objective: tensor([3946.5691], device='cuda:0', grad_fn=), Loss: 0.01754077710211277, KL/n: 63.97822570800781 + 0it [00:00, ?it/s]2025-05-26 05:08:55,410 - INFO - [Epoch 075 | Batch 0000] IWAE-loss 4051.3987 | mean log_px -0.0158 | KL -3134.45 + 1it [00:00, 5.29it/s] 2it [00:00, 6.58it/s] 4it [00:00, 8.38it/s] 5it [00:00, 8.81it/s] 6it [00:00, 9.13it/s] 8it [00:00, 9.53it/s] 9it [00:01, 9.64it/s] 10it [00:01, 9.67it/s] 11it [00:01, 9.30it/s] 12it [00:01, 9.44it/s] 14it [00:01, 9.67it/s] 15it [00:01, 9.34it/s] 17it [00:01, 9.62it/s] 18it [00:01, 9.22it/s] 19it [00:02, 9.39it/s] 20it [00:02, 9.52it/s] 22it [00:02, 9.72it/s] 23it [00:02, 9.31it/s] 24it [00:02, 9.47it/s] 26it [00:02, 9.71it/s] 27it [00:02, 9.77it/s] 28it [00:03, 9.42it/s] 30it [00:03, 9.67it/s] 32it [00:03, 9.80it/s] 34it [00:03, 9.89it/s] 36it [00:03, 9.94it/s] 37it [00:03, 9.51it/s] 38it [00:04, 9.60it/s] 39it [00:04, 9.57it/s] 41it [00:04, 9.77it/s] 42it [00:04, 9.79it/s] 43it [00:04, 9.33it/s] 44it [00:04, 9.50it/s] 46it [00:04, 9.74it/s] 48it [00:05, 9.85it/s] 49it [00:05, 9.51it/s] 50it [00:05, 9.59it/s]2025-05-26 05:09:00,611 - INFO - [Epoch 075 | Batch 0050] IWAE-loss 3742.8145 | mean log_px -0.0096 | KL -3130.84 + 51it [00:05, 9.67it/s] 52it [00:05, 9.72it/s] 53it [00:05, 9.79it/s] 54it [00:05, 9.83it/s] 55it [00:05, 9.83it/s] 56it [00:05, 9.86it/s] 58it [00:06, 9.94it/s] 59it [00:06, 9.95it/s] 60it [00:06, 9.94it/s] 61it [00:06, 9.37it/s] 62it [00:06, 9.52it/s] 63it [00:06, 9.64it/s] 64it [00:06, 9.69it/s] 66it [00:06, 9.83it/s] 67it [00:07, 9.43it/s] 68it [00:07, 9.56it/s] 69it [00:07, 9.66it/s] 70it [00:07, 9.71it/s] 71it [00:07, 9.78it/s] 72it [00:07, 9.37it/s] 74it [00:07, 9.65it/s] 75it [00:07, 9.73it/s] 76it [00:07, 9.37it/s] 77it [00:08, 9.53it/s] 78it [00:08, 9.65it/s] 79it [00:08, 9.74it/s] 81it [00:08, 9.90it/s] 82it [00:08, 9.90it/s] 83it [00:08, 9.51it/s] 84it [00:08, 9.63it/s] 86it [00:08, 9.80it/s] 87it [00:09, 9.34it/s] 88it [00:09, 9.47it/s] 90it [00:09, 9.69it/s] 91it [00:09, 9.74it/s] 92it [00:09, 9.26it/s] 94it [00:09, 9.57it/s] 95it [00:09, 9.64it/s] 96it [00:10, 9.30it/s] 97it [00:10, 9.46it/s] 99it [00:10, 9.70it/s]2025-05-26 05:09:05,786 - INFO - [Epoch 075 | Batch 0100] IWAE-loss 4642.5938 | mean log_px -0.0251 | KL -3130.53 + 101it [00:10, 9.40it/s] 102it [00:10, 9.51it/s] 103it [00:10, 9.61it/s] 104it [00:10, 9.68it/s] 105it [00:11, 9.19it/s] 106it [00:11, 9.39it/s] 107it [00:11, 9.50it/s] 108it [00:11, 9.63it/s] 109it [00:11, 9.70it/s] 110it [00:11, 9.76it/s] 111it [00:11, 9.83it/s] 112it [00:11, 9.82it/s] 113it [00:11, 9.86it/s] 114it [00:11, 9.59it/s] 115it [00:12, 9.25it/s] 116it [00:12, 9.46it/s] 118it [00:12, 9.72it/s] 120it [00:12, 9.82it/s] 121it [00:12, 9.85it/s] 122it [00:12, 9.88it/s] 124it [00:12, 9.95it/s] 125it [00:13, 9.45it/s] 127it [00:13, 9.67it/s] 128it [00:13, 9.73it/s] 129it [00:13, 9.79it/s] 130it [00:13, 9.27it/s] 131it [00:13, 9.45it/s] 132it [00:13, 9.52it/s] 133it [00:13, 9.63it/s] 134it [00:13, 9.72it/s] 135it [00:14, 9.79it/s] 136it [00:14, 9.82it/s] 138it [00:14, 9.89it/s] 139it [00:14, 9.91it/s] 141it [00:14, 9.98it/s] 142it [00:14, 9.96it/s] 144it [00:15, 9.94it/s] 145it [00:15, 9.41it/s] 146it [00:15, 9.38it/s] 147it [00:15, 9.40it/s] 148it [00:15, 9.49it/s] 149it [00:15, 9.58it/s] 150it [00:15, 9.63it/s]2025-05-26 05:09:10,976 - INFO - [Epoch 075 | Batch 0150] IWAE-loss 4248.3130 | mean log_px -0.0234 | KL -3122.70 + 151it [00:15, 9.09it/s] 152it [00:15, 9.27it/s] 153it [00:15, 9.40it/s] 154it [00:16, 9.50it/s] 155it [00:16, 9.59it/s] 156it [00:16, 9.62it/s] 157it [00:16, 9.64it/s] 158it [00:16, 9.05it/s] 159it [00:16, 9.24it/s] 160it [00:16, 9.42it/s] 162it [00:16, 9.71it/s] 163it [00:17, 9.77it/s] 164it [00:17, 9.82it/s] 166it [00:17, 9.92it/s] 168it [00:17, 9.96it/s] 169it [00:17, 9.97it/s] 170it [00:17, 9.96it/s] 171it [00:17, 9.41it/s] 173it [00:18, 9.67it/s] 174it [00:18, 9.74it/s] 176it [00:18, 9.86it/s] 178it [00:18, 9.53it/s] 179it [00:18, 9.61it/s] 180it [00:18, 9.69it/s] 181it [00:18, 9.75it/s] 182it [00:18, 9.81it/s] 184it [00:19, 9.90it/s] 186it [00:19, 9.94it/s] 187it [00:19, 9.95it/s] 188it [00:19, 9.54it/s] 189it [00:19, 9.64it/s] 190it [00:19, 9.72it/s] 192it [00:19, 9.83it/s] 193it [00:20, 9.87it/s] 194it [00:20, 9.90it/s] 195it [00:20, 9.51it/s] 196it [00:20, 9.16it/s] 196it [00:20, 9.57it/s] +2025-05-26 05:09:15,746 - INFO - Epoch: 75, Objective: tensor([4487.3818], device='cuda:0', grad_fn=), Loss: 0.022050147876143456, KL/n: 63.74296569824219 + 0it [00:00, ?it/s]2025-05-26 05:09:16,041 - INFO - [Epoch 076 | Batch 0000] IWAE-loss 3891.9312 | mean log_px -0.0134 | KL -3123.93 + 1it [00:00, 4.95it/s] 2it [00:00, 6.35it/s] 4it [00:00, 8.27it/s] 5it [00:00, 8.25it/s] 7it [00:00, 9.04it/s] 8it [00:00, 9.24it/s] 9it [00:01, 9.42it/s] 11it [00:01, 9.35it/s] 12it [00:01, 9.49it/s] 14it [00:01, 9.71it/s] 15it [00:01, 9.75it/s] 17it [00:01, 9.55it/s] 18it [00:01, 9.64it/s] 20it [00:02, 9.82it/s] 22it [00:02, 9.93it/s] 24it [00:02, 9.98it/s] 26it [00:02, 10.03it/s] 28it [00:02, 10.05it/s] 30it [00:03, 10.05it/s] 32it [00:03, 9.71it/s] 34it [00:03, 9.83it/s] 35it [00:03, 9.86it/s] 36it [00:03, 9.75it/s] 37it [00:03, 9.76it/s] 38it [00:03, 9.79it/s] 39it [00:04, 9.81it/s] 40it [00:04, 9.82it/s] 41it [00:04, 9.84it/s] 42it [00:04, 6.44it/s] 43it [00:04, 7.17it/s] 44it [00:04, 7.78it/s] 46it [00:04, 8.65it/s] 47it [00:05, 8.93it/s] 48it [00:05, 9.16it/s] 49it [00:05, 9.36it/s] 50it [00:05, 9.48it/s]2025-05-26 05:09:21,340 - INFO - [Epoch 076 | Batch 0050] IWAE-loss 3677.9912 | mean log_px -0.0094 | KL -3120.58 + 51it [00:05, 9.57it/s] 53it [00:05, 9.76it/s] 54it [00:05, 9.78it/s] 55it [00:05, 9.83it/s] 56it [00:06, 9.83it/s] 57it [00:06, 9.85it/s] 58it [00:06, 9.86it/s] 59it [00:06, 9.88it/s] 60it [00:06, 9.86it/s] 61it [00:06, 9.87it/s] 62it [00:06, 9.86it/s] 63it [00:06, 9.89it/s] 64it [00:06, 9.88it/s] 66it [00:07, 9.95it/s] 67it [00:07, 9.94it/s] 68it [00:07, 9.79it/s] 69it [00:07, 9.83it/s] 70it [00:07, 9.82it/s] 72it [00:07, 9.88it/s] 73it [00:07, 9.87it/s] 74it [00:07, 9.82it/s] 75it [00:07, 9.65it/s] 76it [00:08, 9.47it/s] 77it [00:08, 9.61it/s] 78it [00:08, 9.72it/s] 79it [00:08, 9.75it/s] 80it [00:08, 9.76it/s] 81it [00:08, 9.78it/s] 82it [00:08, 9.81it/s] 83it [00:08, 9.82it/s] 84it [00:08, 9.85it/s] 85it [00:08, 9.85it/s] 86it [00:09, 9.80it/s] 87it [00:09, 9.80it/s] 88it [00:09, 9.79it/s] 89it [00:09, 9.85it/s] 90it [00:09, 9.85it/s] 91it [00:09, 9.86it/s] 92it [00:09, 9.86it/s] 93it [00:09, 9.89it/s] 94it [00:09, 9.86it/s] 95it [00:09, 9.87it/s] 96it [00:10, 9.90it/s] 98it [00:10, 9.92it/s] 99it [00:10, 9.91it/s] 100it [00:10, 9.87it/s]2025-05-26 05:09:26,421 - INFO - [Epoch 076 | Batch 0100] IWAE-loss 4684.5400 | mean log_px -0.0297 | KL -3118.37 + 101it [00:10, 9.85it/s] 102it [00:10, 9.84it/s] 103it [00:10, 9.82it/s] 104it [00:10, 9.82it/s] 105it [00:10, 9.85it/s] 106it [00:11, 9.82it/s] 107it [00:11, 9.84it/s] 109it [00:11, 9.89it/s] 110it [00:11, 9.85it/s] 111it [00:11, 9.88it/s] 112it [00:11, 9.86it/s] 113it [00:11, 9.87it/s] 114it [00:11, 9.86it/s] 115it [00:12, 9.87it/s] 116it [00:12, 9.86it/s] 117it [00:12, 9.87it/s] 118it [00:12, 9.86it/s] 119it [00:12, 9.86it/s] 120it [00:12, 9.85it/s] 121it [00:12, 9.85it/s] 122it [00:12, 9.85it/s] 123it [00:12, 9.87it/s] 124it [00:12, 9.90it/s] 125it [00:13, 9.89it/s] 126it [00:13, 9.92it/s] 127it [00:13, 9.91it/s] 128it [00:13, 9.88it/s] 129it [00:13, 9.88it/s] 130it [00:13, 9.86it/s] 131it [00:13, 9.86it/s] 133it [00:13, 9.93it/s] 134it [00:13, 9.90it/s] 135it [00:14, 9.91it/s] 136it [00:14, 9.89it/s] 137it [00:14, 9.89it/s] 138it [00:14, 9.88it/s] 139it [00:14, 9.86it/s] 140it [00:14, 9.87it/s] 141it [00:14, 9.86it/s] 142it [00:14, 9.87it/s] 143it [00:14, 9.85it/s] 144it [00:14, 9.85it/s] 145it [00:15, 9.85it/s] 146it [00:15, 9.85it/s] 148it [00:15, 9.91it/s] 149it [00:15, 9.91it/s] 150it [00:15, 9.90it/s]2025-05-26 05:09:31,486 - INFO - [Epoch 076 | Batch 0150] IWAE-loss 4113.5596 | mean log_px -0.0186 | KL -3107.95 + 151it [00:15, 9.87it/s] 152it [00:15, 9.86it/s] 153it [00:15, 9.87it/s] 154it [00:15, 9.86it/s] 156it [00:16, 9.94it/s] 157it [00:16, 9.92it/s] 158it [00:16, 9.90it/s] 159it [00:16, 9.91it/s] 160it [00:16, 9.88it/s] 162it [00:16, 9.93it/s] 164it [00:16, 9.97it/s] 165it [00:17, 9.96it/s] 167it [00:17, 9.58it/s] 169it [00:17, 9.76it/s] 171it [00:17, 9.88it/s] 173it [00:17, 9.59it/s] 175it [00:18, 9.74it/s] 176it [00:18, 9.47it/s] 178it [00:18, 9.70it/s] 180it [00:18, 9.83it/s] 181it [00:18, 9.78it/s] 182it [00:18, 9.82it/s] 184it [00:19, 9.93it/s] 186it [00:19, 10.00it/s] 188it [00:19, 10.03it/s] 190it [00:19, 10.07it/s] 192it [00:19, 10.07it/s] 194it [00:20, 9.72it/s] 195it [00:20, 9.48it/s] 196it [00:20, 9.65it/s] +2025-05-26 05:09:36,182 - INFO - Epoch: 76, Objective: tensor([3478.5898], device='cuda:0', grad_fn=), Loss: 0.005448373034596443, KL/n: 63.492427825927734 + 0it [00:00, ?it/s]2025-05-26 05:09:36,450 - INFO - [Epoch 077 | Batch 0000] IWAE-loss 3869.8042 | mean log_px -0.0148 | KL -3113.27 + 1it [00:00, 4.88it/s] 2it [00:00, 6.92it/s] 4it [00:00, 8.41it/s] 5it [00:00, 8.84it/s] 7it [00:00, 9.38it/s] 9it [00:01, 9.67it/s] 11it [00:01, 9.83it/s] 12it [00:01, 9.50it/s] 14it [00:01, 9.65it/s] 16it [00:01, 9.81it/s] 18it [00:01, 9.92it/s] 19it [00:02, 9.51it/s] 20it [00:02, 9.60it/s] 22it [00:02, 9.77it/s] 24it [00:02, 9.88it/s] 26it [00:02, 9.94it/s] 28it [00:02, 9.99it/s] 30it [00:03, 10.03it/s] 31it [00:03, 10.00it/s] 32it [00:03, 10.00it/s] 33it [00:03, 9.63it/s] 35it [00:03, 9.80it/s] 36it [00:03, 9.81it/s] 38it [00:03, 9.93it/s] 40it [00:04, 9.99it/s] 42it [00:04, 10.03it/s] 44it [00:04, 9.87it/s] 45it [00:04, 9.60it/s] 47it [00:04, 9.77it/s] 49it [00:05, 9.88it/s]2025-05-26 05:09:41,543 - INFO - [Epoch 077 | Batch 0050] IWAE-loss 4025.5740 | mean log_px -0.0166 | KL -3104.95 + 51it [00:05, 9.93it/s] 53it [00:05, 9.63it/s] 54it [00:05, 9.69it/s] 56it [00:05, 9.83it/s] 58it [00:05, 9.89it/s] 60it [00:06, 9.60it/s] 62it [00:06, 9.75it/s] 64it [00:06, 9.86it/s] 66it [00:06, 9.94it/s] 68it [00:07, 9.99it/s] 70it [00:07, 10.03it/s] 72it [00:07, 10.04it/s] 74it [00:07, 9.72it/s] 76it [00:07, 9.83it/s] 78it [00:08, 9.91it/s] 80it [00:08, 9.64it/s] 81it [00:08, 9.67it/s] 82it [00:08, 9.66it/s] 84it [00:08, 9.82it/s] 85it [00:08, 9.52it/s] 87it [00:08, 9.73it/s] 89it [00:09, 9.86it/s] 91it [00:09, 9.57it/s] 93it [00:09, 9.67it/s] 94it [00:09, 9.66it/s] 96it [00:09, 9.53it/s] 98it [00:10, 9.71it/s] 99it [00:10, 9.38it/s]2025-05-26 05:09:46,687 - INFO - [Epoch 077 | Batch 0100] IWAE-loss 3877.6897 | mean log_px -0.0162 | KL -3102.57 + 101it [00:10, 9.61it/s] 103it [00:10, 9.76it/s] 105it [00:10, 9.87it/s] 106it [00:10, 9.50it/s] 108it [00:11, 9.70it/s] 109it [00:11, 9.34it/s] 110it [00:11, 9.48it/s] 112it [00:11, 9.70it/s] 114it [00:11, 9.84it/s] 115it [00:11, 9.86it/s] 117it [00:12, 9.96it/s] 119it [00:12, 10.01it/s] 121it [00:12, 10.04it/s] 123it [00:12, 9.66it/s] 125it [00:12, 9.80it/s] 127it [00:13, 9.90it/s] 129it [00:13, 9.97it/s] 131it [00:13, 9.68it/s] 133it [00:13, 9.81it/s] 134it [00:13, 9.82it/s] 135it [00:13, 9.75it/s] 137it [00:14, 9.88it/s] 139it [00:14, 9.95it/s] 141it [00:14, 10.00it/s] 143it [00:14, 10.03it/s] 145it [00:14, 10.06it/s] 147it [00:15, 10.07it/s] 149it [00:15, 10.09it/s]2025-05-26 05:09:51,743 - INFO - [Epoch 077 | Batch 0150] IWAE-loss 3844.5071 | mean log_px -0.0126 | KL -3099.34 + 151it [00:15, 9.82it/s] 153it [00:15, 9.91it/s] 155it [00:15, 9.97it/s] 157it [00:16, 10.01it/s] 159it [00:16, 9.70it/s] 161it [00:16, 9.78it/s] 163it [00:16, 9.87it/s] 165it [00:16, 9.95it/s] 167it [00:17, 10.00it/s] 169it [00:17, 10.02it/s] 171it [00:17, 10.05it/s] 173it [00:17, 10.07it/s] 175it [00:17, 10.09it/s] 177it [00:18, 9.75it/s] 179it [00:18, 9.85it/s] 180it [00:18, 9.51it/s] 182it [00:18, 9.71it/s] 184it [00:18, 9.83it/s] 185it [00:18, 9.55it/s] 186it [00:19, 9.51it/s] 187it [00:19, 9.49it/s] 189it [00:19, 9.73it/s] 190it [00:19, 9.34it/s] 192it [00:19, 9.64it/s] 194it [00:19, 9.81it/s] 195it [00:19, 9.54it/s] 196it [00:20, 9.73it/s] +2025-05-26 05:09:56,455 - INFO - Epoch: 77, Objective: tensor([3908.6809], device='cuda:0', grad_fn=), Loss: 0.015703242272138596, KL/n: 63.27415466308594 + 0it [00:00, ?it/s]2025-05-26 05:09:56,719 - INFO - [Epoch 078 | Batch 0000] IWAE-loss 3679.0872 | mean log_px -0.0106 | KL -3098.49 + 1it [00:00, 4.96it/s] 2it [00:00, 6.93it/s] 3it [00:00, 7.58it/s] 4it [00:00, 8.37it/s] 5it [00:00, 8.44it/s] 6it [00:00, 8.72it/s] 7it [00:00, 9.06it/s] 8it [00:00, 8.82it/s] 10it [00:01, 9.35it/s] 11it [00:01, 9.01it/s] 12it [00:01, 9.24it/s] 14it [00:01, 9.56it/s] 15it [00:01, 9.59it/s] 16it [00:01, 9.07it/s] 17it [00:01, 8.90it/s] 18it [00:02, 8.92it/s] 19it [00:02, 8.95it/s] 20it [00:02, 8.97it/s] 21it [00:02, 9.07it/s] 22it [00:02, 9.14it/s] 23it [00:02, 9.20it/s] 24it [00:02, 9.22it/s] 25it [00:02, 8.68it/s] 26it [00:02, 8.82it/s] 27it [00:03, 8.91it/s] 28it [00:03, 9.10it/s] 29it [00:03, 9.21it/s] 30it [00:03, 9.28it/s] 31it [00:03, 9.31it/s] 32it [00:03, 9.32it/s] 33it [00:03, 9.40it/s] 34it [00:03, 9.38it/s] 35it [00:03, 9.41it/s] 36it [00:04, 9.44it/s] 37it [00:04, 9.41it/s] 38it [00:04, 9.37it/s] 39it [00:04, 9.43it/s] 40it [00:04, 9.43it/s] 41it [00:04, 9.44it/s] 42it [00:04, 9.40it/s] 43it [00:04, 9.40it/s] 44it [00:04, 9.42it/s] 45it [00:04, 9.45it/s] 46it [00:05, 9.44it/s] 47it [00:05, 9.46it/s] 48it [00:05, 9.45it/s] 49it [00:05, 6.07it/s] 50it [00:05, 6.79it/s]2025-05-26 05:10:02,335 - INFO - [Epoch 078 | Batch 0050] IWAE-loss 4400.3760 | mean log_px -0.0214 | KL -3091.28 + 51it [00:05, 7.41it/s] 52it [00:05, 7.91it/s] 53it [00:06, 8.30it/s] 54it [00:06, 8.61it/s] 55it [00:06, 8.87it/s] 56it [00:06, 8.83it/s] 57it [00:06, 8.96it/s] 58it [00:06, 9.05it/s] 59it [00:06, 8.64it/s] 60it [00:06, 8.85it/s] 61it [00:06, 9.05it/s] 62it [00:06, 9.14it/s] 63it [00:07, 8.76it/s] 64it [00:07, 8.94it/s] 65it [00:07, 9.07it/s] 66it [00:07, 9.17it/s] 67it [00:07, 9.29it/s] 68it [00:07, 9.34it/s] 69it [00:07, 9.04it/s] 70it [00:07, 9.17it/s] 71it [00:07, 9.27it/s] 72it [00:08, 9.28it/s] 73it [00:08, 9.31it/s] 74it [00:08, 9.34it/s] 75it [00:08, 9.35it/s] 76it [00:08, 9.44it/s] 77it [00:08, 9.43it/s] 78it [00:08, 9.42it/s] 79it [00:08, 9.44it/s] 80it [00:08, 9.43it/s] 81it [00:09, 9.50it/s] 82it [00:09, 9.49it/s] 83it [00:09, 9.47it/s] 84it [00:09, 9.42it/s] 85it [00:09, 9.41it/s] 86it [00:09, 9.07it/s] 87it [00:09, 9.19it/s] 88it [00:09, 9.27it/s] 89it [00:09, 9.36it/s] 90it [00:10, 9.38it/s] 91it [00:10, 9.39it/s] 92it [00:10, 9.46it/s] 93it [00:10, 9.44it/s] 94it [00:10, 9.49it/s] 95it [00:10, 9.45it/s] 96it [00:10, 9.48it/s] 97it [00:10, 9.47it/s] 98it [00:10, 9.46it/s] 99it [00:10, 9.46it/s] 100it [00:11, 9.44it/s]2025-05-26 05:10:07,707 - INFO - [Epoch 078 | Batch 0100] IWAE-loss 4047.0798 | mean log_px -0.0176 | KL -3091.62 + 101it [00:11, 8.93it/s] 102it [00:11, 9.09it/s] 103it [00:11, 9.23it/s] 104it [00:11, 9.34it/s] 105it [00:11, 9.39it/s] 106it [00:11, 9.44it/s] 107it [00:11, 9.42it/s] 108it [00:11, 9.50it/s] 109it [00:12, 9.53it/s] 110it [00:12, 9.47it/s] 111it [00:12, 8.90it/s] 112it [00:12, 9.03it/s] 113it [00:12, 9.15it/s] 114it [00:12, 9.21it/s] 115it [00:12, 9.28it/s] 116it [00:12, 9.32it/s] 117it [00:12, 9.38it/s] 118it [00:13, 9.38it/s] 119it [00:13, 9.41it/s] 120it [00:13, 8.94it/s] 121it [00:13, 9.12it/s] 122it [00:13, 9.28it/s] 123it [00:13, 9.38it/s] 124it [00:13, 9.41it/s] 125it [00:13, 9.43it/s] 126it [00:13, 9.43it/s] 127it [00:13, 9.47it/s] 128it [00:14, 9.47it/s] 129it [00:14, 9.49it/s] 130it [00:14, 9.30it/s] 131it [00:14, 9.00it/s] 132it [00:14, 9.15it/s] 133it [00:14, 9.25it/s] 134it [00:14, 9.36it/s] 135it [00:14, 9.36it/s] 136it [00:14, 9.39it/s] 137it [00:15, 9.41it/s] 138it [00:15, 9.49it/s] 139it [00:15, 9.56it/s] 140it [00:15, 9.58it/s] 141it [00:15, 9.49it/s] 142it [00:15, 9.23it/s] 143it [00:15, 8.84it/s] 144it [00:15, 8.47it/s] 145it [00:15, 8.75it/s] 146it [00:16, 8.92it/s] 147it [00:16, 9.06it/s] 148it [00:16, 9.18it/s] 149it [00:16, 9.25it/s] 150it [00:16, 9.38it/s]2025-05-26 05:10:13,108 - INFO - [Epoch 078 | Batch 0150] IWAE-loss 4209.9824 | mean log_px -0.0231 | KL -3090.24 + 151it [00:16, 9.45it/s] 152it [00:16, 9.42it/s] 153it [00:16, 9.40it/s] 154it [00:16, 9.46it/s] 155it [00:16, 9.41it/s] 156it [00:17, 9.40it/s] 157it [00:17, 8.96it/s] 158it [00:17, 9.11it/s] 159it [00:17, 9.22it/s] 160it [00:17, 9.36it/s] 161it [00:17, 9.42it/s] 162it [00:17, 9.45it/s] 163it [00:17, 9.48it/s] 164it [00:17, 9.01it/s] 165it [00:18, 9.12it/s] 166it [00:18, 9.27it/s] 167it [00:18, 9.35it/s] 168it [00:18, 9.38it/s] 169it [00:18, 9.40it/s] 170it [00:18, 9.45it/s] 171it [00:18, 9.45it/s] 172it [00:18, 9.45it/s] 173it [00:18, 9.22it/s] 174it [00:19, 9.36it/s] 175it [00:19, 9.36it/s] 176it [00:19, 9.39it/s] 177it [00:19, 9.45it/s] 178it [00:19, 9.48it/s] 179it [00:19, 9.48it/s] 180it [00:19, 9.49it/s] 181it [00:19, 9.48it/s] 182it [00:19, 9.48it/s] 183it [00:19, 9.56it/s] 184it [00:20, 9.57it/s] 185it [00:20, 9.61it/s] 186it [00:20, 9.55it/s] 187it [00:20, 9.55it/s] 188it [00:20, 9.53it/s] 189it [00:20, 9.27it/s] 190it [00:20, 8.95it/s] 191it [00:20, 9.08it/s] 192it [00:20, 9.18it/s] 193it [00:21, 8.79it/s] 194it [00:21, 8.95it/s] 195it [00:21, 8.58it/s] 196it [00:21, 8.91it/s] 196it [00:21, 9.13it/s] +2025-05-26 05:10:18,047 - INFO - Epoch: 78, Objective: tensor([4202.6504], device='cuda:0', grad_fn=), Loss: 0.022261351346969604, KL/n: 63.005916595458984 + 0it [00:00, ?it/s]2025-05-26 05:10:18,315 - INFO - [Epoch 079 | Batch 0000] IWAE-loss 3951.9302 | mean log_px -0.0140 | KL -3084.01 + 1it [00:00, 5.30it/s] 2it [00:00, 6.62it/s] 3it [00:00, 7.64it/s] 4it [00:00, 8.25it/s] 5it [00:00, 8.67it/s] 6it [00:00, 8.91it/s] 7it [00:00, 9.08it/s] 8it [00:00, 9.20it/s] 9it [00:01, 9.27it/s] 10it [00:01, 9.38it/s] 11it [00:01, 9.40it/s] 12it [00:01, 9.44it/s] 13it [00:01, 9.50it/s] 14it [00:01, 9.53it/s] 15it [00:01, 8.94it/s] 16it [00:01, 9.09it/s] 17it [00:01, 9.22it/s] 18it [00:02, 9.22it/s] 19it [00:02, 8.81it/s] 20it [00:02, 8.97it/s] 21it [00:02, 9.14it/s] 22it [00:02, 9.24it/s] 23it [00:02, 8.83it/s] 24it [00:02, 9.00it/s] 25it [00:02, 8.69it/s] 26it [00:02, 8.92it/s] 27it [00:03, 9.08it/s] 28it [00:03, 9.21it/s] 29it [00:03, 8.83it/s] 30it [00:03, 8.99it/s] 31it [00:03, 9.10it/s] 32it [00:03, 9.24it/s] 33it [00:03, 9.33it/s] 34it [00:03, 9.37it/s] 35it [00:03, 9.41it/s] 36it [00:04, 9.42it/s] 37it [00:04, 9.44it/s] 38it [00:04, 9.46it/s] 39it [00:04, 9.49it/s] 40it [00:04, 9.47it/s] 41it [00:04, 8.98it/s] 42it [00:04, 9.17it/s] 43it [00:04, 9.24it/s] 44it [00:04, 9.33it/s] 45it [00:04, 9.41it/s] 46it [00:05, 9.41it/s] 47it [00:05, 9.50it/s] 48it [00:05, 9.45it/s] 49it [00:05, 9.44it/s] 50it [00:05, 9.46it/s]2025-05-26 05:10:23,732 - INFO - [Epoch 079 | Batch 0050] IWAE-loss 4607.3691 | mean log_px -0.0238 | KL -3084.28 + 51it [00:05, 8.92it/s] 52it [00:05, 9.05it/s] 53it [00:05, 9.20it/s] 54it [00:05, 9.35it/s] 55it [00:06, 9.39it/s] 56it [00:06, 9.41it/s] 57it [00:06, 9.44it/s] 58it [00:06, 9.44it/s] 59it [00:06, 9.44it/s] 60it [00:06, 9.42it/s] 61it [00:06, 9.52it/s] 62it [00:06, 9.50it/s] 63it [00:06, 9.47it/s] 64it [00:06, 9.48it/s] 65it [00:07, 9.49it/s] 66it [00:07, 9.45it/s] 67it [00:07, 9.41it/s] 68it [00:07, 9.40it/s] 69it [00:07, 9.42it/s] 70it [00:07, 8.88it/s] 71it [00:07, 9.04it/s] 72it [00:07, 9.14it/s] 73it [00:07, 9.30it/s] 74it [00:08, 9.33it/s] 75it [00:08, 9.37it/s] 76it [00:08, 9.40it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.10it/s] 79it [00:08, 8.81it/s] 80it [00:08, 8.96it/s] 81it [00:08, 9.14it/s] 82it [00:08, 9.28it/s] 83it [00:09, 8.89it/s] 84it [00:09, 8.99it/s] 85it [00:09, 9.11it/s] 86it [00:09, 8.68it/s] 87it [00:09, 8.93it/s] 88it [00:09, 9.09it/s] 89it [00:09, 9.18it/s] 90it [00:09, 9.27it/s] 91it [00:09, 9.34it/s] 92it [00:10, 9.44it/s] 93it [00:10, 9.42it/s] 94it [00:10, 9.44it/s] 95it [00:10, 9.46it/s] 96it [00:10, 9.50it/s] 97it [00:10, 9.57it/s] 98it [00:10, 9.51it/s] 99it [00:10, 9.49it/s] 100it [00:10, 9.47it/s]2025-05-26 05:10:29,122 - INFO - [Epoch 079 | Batch 0100] IWAE-loss 4182.2646 | mean log_px -0.0189 | KL -3085.25 + 101it [00:10, 9.40it/s] 102it [00:11, 9.43it/s] 103it [00:11, 9.45it/s] 104it [00:11, 9.45it/s] 105it [00:11, 9.46it/s] 106it [00:11, 9.44it/s] 107it [00:11, 8.92it/s] 108it [00:11, 9.07it/s] 109it [00:11, 9.23it/s] 110it [00:11, 9.33it/s] 111it [00:12, 9.43it/s] 112it [00:12, 9.44it/s] 113it [00:12, 9.46it/s] 114it [00:12, 9.51it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.51it/s] 117it [00:12, 9.52it/s] 118it [00:12, 9.49it/s] 119it [00:12, 9.51it/s] 120it [00:13, 9.48it/s] 121it [00:13, 9.51it/s] 122it [00:13, 9.52it/s] 123it [00:13, 9.40it/s] 124it [00:13, 9.39it/s] 125it [00:13, 9.40it/s] 126it [00:13, 8.89it/s] 127it [00:13, 9.07it/s] 128it [00:13, 9.13it/s] 129it [00:13, 9.27it/s] 130it [00:14, 9.31it/s] 131it [00:14, 9.34it/s] 132it [00:14, 9.39it/s] 133it [00:14, 9.42it/s] 134it [00:14, 9.44it/s] 135it [00:14, 9.48it/s] 136it [00:14, 9.46it/s] 137it [00:14, 9.46it/s] 138it [00:14, 9.49it/s] 139it [00:15, 9.48it/s] 140it [00:15, 9.50it/s] 141it [00:15, 9.47it/s] 142it [00:15, 9.45it/s] 143it [00:15, 9.47it/s] 144it [00:15, 9.43it/s] 145it [00:15, 9.35it/s] 146it [00:15, 9.26it/s] 147it [00:15, 9.29it/s] 148it [00:16, 9.36it/s] 149it [00:16, 9.39it/s] 150it [00:16, 9.43it/s]2025-05-26 05:10:34,449 - INFO - [Epoch 079 | Batch 0150] IWAE-loss 3905.8240 | mean log_px -0.0154 | KL -3072.65 + 151it [00:16, 9.38it/s] 152it [00:16, 9.33it/s] 153it [00:16, 9.40it/s] 154it [00:16, 9.47it/s] 155it [00:16, 9.49it/s] 156it [00:16, 9.43it/s] 157it [00:16, 9.39it/s] 158it [00:17, 9.39it/s] 159it [00:17, 9.42it/s] 160it [00:17, 9.39it/s] 161it [00:17, 9.41it/s] 162it [00:17, 8.91it/s] 163it [00:17, 9.04it/s] 164it [00:17, 9.17it/s] 165it [00:17, 9.27it/s] 166it [00:17, 9.29it/s] 167it [00:18, 9.34it/s] 168it [00:18, 9.32it/s] 169it [00:18, 9.41it/s] 170it [00:18, 9.40it/s] 171it [00:18, 9.44it/s] 172it [00:18, 9.43it/s] 173it [00:18, 9.40it/s] 174it [00:18, 9.41it/s] 175it [00:18, 9.39it/s] 176it [00:18, 9.42it/s] 177it [00:19, 8.91it/s] 178it [00:19, 9.04it/s] 179it [00:19, 9.21it/s] 180it [00:19, 9.27it/s] 181it [00:19, 9.33it/s] 182it [00:19, 9.20it/s] 183it [00:19, 9.28it/s] 184it [00:19, 9.37it/s] 185it [00:19, 8.97it/s] 186it [00:20, 9.08it/s] 187it [00:20, 9.15it/s] 188it [00:20, 9.25it/s] 189it [00:20, 9.32it/s] 190it [00:20, 9.34it/s] 191it [00:20, 9.39it/s] 192it [00:20, 9.42it/s] 193it [00:20, 9.44it/s] 194it [00:20, 9.47it/s] 195it [00:21, 8.87it/s] 196it [00:21, 8.68it/s] 196it [00:21, 9.22it/s] +2025-05-26 05:10:39,422 - INFO - Epoch: 79, Objective: tensor([3949.7637], device='cuda:0', grad_fn=), Loss: 0.015167269855737686, KL/n: 62.748844146728516 + 0it [00:00, ?it/s]2025-05-26 05:10:39,697 - INFO - [Epoch 080 | Batch 0000] IWAE-loss 4421.7627 | mean log_px -0.0238 | KL -3073.79 + 1it [00:00, 5.24it/s] 2it [00:00, 6.43it/s] 3it [00:00, 7.55it/s] 4it [00:00, 8.18it/s] 5it [00:00, 8.61it/s] 6it [00:00, 8.85it/s] 7it [00:00, 9.05it/s] 8it [00:00, 9.22it/s] 9it [00:01, 9.31it/s] 10it [00:01, 9.37it/s] 11it [00:01, 9.40it/s] 12it [00:01, 9.40it/s] 13it [00:01, 9.32it/s] 14it [00:01, 9.42it/s] 15it [00:01, 9.42it/s] 16it [00:01, 9.40it/s] 17it [00:01, 9.42it/s] 18it [00:02, 9.43it/s] 19it [00:02, 9.46it/s] 20it [00:02, 9.46it/s] 21it [00:02, 9.47it/s] 22it [00:02, 9.43it/s] 23it [00:02, 9.44it/s] 24it [00:02, 9.37it/s] 25it [00:02, 9.33it/s] 26it [00:02, 9.37it/s] 27it [00:02, 9.25it/s] 28it [00:03, 9.20it/s] 29it [00:03, 9.28it/s] 30it [00:03, 9.25it/s] 31it [00:03, 9.26it/s] 32it [00:03, 9.27it/s] 33it [00:03, 9.29it/s] 34it [00:03, 8.84it/s] 35it [00:03, 9.02it/s] 36it [00:03, 9.15it/s] 37it [00:04, 9.24it/s] 38it [00:04, 9.31it/s] 39it [00:04, 9.33it/s] 40it [00:04, 9.34it/s] 41it [00:04, 8.96it/s] 42it [00:04, 9.08it/s] 43it [00:04, 9.17it/s] 44it [00:04, 9.26it/s] 45it [00:04, 9.33it/s] 46it [00:05, 8.79it/s] 47it [00:05, 8.94it/s] 48it [00:05, 9.09it/s] 49it [00:05, 9.18it/s] 50it [00:05, 9.24it/s]2025-05-26 05:10:45,099 - INFO - [Epoch 080 | Batch 0050] IWAE-loss 4183.6655 | mean log_px -0.0173 | KL -3067.25 + 51it [00:05, 5.86it/s] 52it [00:05, 6.60it/s] 53it [00:06, 7.22it/s] 54it [00:06, 7.68it/s] 55it [00:06, 7.76it/s] 56it [00:06, 8.20it/s] 57it [00:06, 8.56it/s] 58it [00:06, 8.79it/s] 59it [00:06, 8.92it/s] 60it [00:06, 9.05it/s] 61it [00:06, 8.48it/s] 62it [00:07, 8.63it/s] 63it [00:07, 8.92it/s] 64it [00:07, 8.64it/s] 65it [00:07, 8.92it/s] 66it [00:07, 9.12it/s] 67it [00:07, 9.28it/s] 68it [00:07, 8.86it/s] 69it [00:07, 9.14it/s] 70it [00:07, 9.33it/s] 71it [00:08, 9.46it/s] 72it [00:08, 8.98it/s] 73it [00:08, 9.23it/s] 74it [00:08, 9.40it/s] 75it [00:08, 9.53it/s] 76it [00:08, 9.60it/s] 77it [00:08, 9.20it/s] 78it [00:08, 9.37it/s] 79it [00:08, 9.51it/s] 80it [00:08, 9.60it/s] 81it [00:09, 9.67it/s] 82it [00:09, 9.72it/s] 83it [00:09, 9.75it/s] 84it [00:09, 9.78it/s] 85it [00:09, 9.27it/s] 86it [00:09, 9.43it/s] 87it [00:09, 9.54it/s] 88it [00:09, 9.56it/s] 89it [00:09, 9.64it/s] 90it [00:09, 9.71it/s] 91it [00:10, 9.75it/s] 92it [00:10, 9.75it/s] 93it [00:10, 9.78it/s] 94it [00:10, 9.31it/s] 95it [00:10, 9.47it/s] 96it [00:10, 9.57it/s] 97it [00:10, 9.06it/s] 98it [00:10, 9.26it/s] 99it [00:10, 9.43it/s] 100it [00:11, 9.54it/s]2025-05-26 05:10:50,666 - INFO - [Epoch 080 | Batch 0100] IWAE-loss 3951.3103 | mean log_px -0.0163 | KL -3071.85 + 101it [00:11, 9.60it/s] 102it [00:11, 9.65it/s] 103it [00:11, 9.72it/s] 104it [00:11, 9.76it/s] 105it [00:11, 9.79it/s] 106it [00:11, 9.80it/s] 107it [00:11, 9.82it/s] 108it [00:11, 9.19it/s] 109it [00:11, 9.37it/s] 110it [00:12, 9.49it/s] 111it [00:12, 9.60it/s] 112it [00:12, 9.67it/s] 113it [00:12, 9.67it/s] 114it [00:12, 9.72it/s] 115it [00:12, 9.69it/s] 116it [00:12, 9.72it/s] 117it [00:12, 9.77it/s] 118it [00:12, 9.78it/s] 119it [00:13, 9.79it/s] 120it [00:13, 9.80it/s] 121it [00:13, 9.80it/s] 122it [00:13, 9.79it/s] 123it [00:13, 9.80it/s] 124it [00:13, 9.33it/s] 125it [00:13, 9.47it/s] 126it [00:13, 9.57it/s] 127it [00:13, 9.64it/s] 128it [00:13, 9.23it/s] 129it [00:14, 9.41it/s] 130it [00:14, 9.52it/s] 131it [00:14, 9.62it/s] 132it [00:14, 9.68it/s] 133it [00:14, 9.74it/s] 134it [00:14, 9.77it/s] 135it [00:14, 9.79it/s] 136it [00:14, 9.58it/s] 137it [00:14, 9.65it/s] 138it [00:14, 9.69it/s] 139it [00:15, 9.73it/s] 140it [00:15, 9.75it/s] 141it [00:15, 9.78it/s] 142it [00:15, 9.77it/s] 143it [00:15, 9.29it/s] 144it [00:15, 9.44it/s] 145it [00:15, 9.58it/s] 146it [00:15, 9.65it/s] 147it [00:15, 9.72it/s] 148it [00:16, 9.76it/s] 149it [00:16, 9.19it/s] 150it [00:16, 9.37it/s]2025-05-26 05:10:55,863 - INFO - [Epoch 080 | Batch 0150] IWAE-loss 3631.5173 | mean log_px -0.0095 | KL -3060.06 + 151it [00:16, 9.51it/s] 152it [00:16, 9.60it/s] 153it [00:16, 9.68it/s] 154it [00:16, 9.73it/s] 155it [00:16, 9.77it/s] 156it [00:16, 9.74it/s] 157it [00:16, 9.77it/s] 158it [00:17, 9.77it/s] 159it [00:17, 9.78it/s] 160it [00:17, 9.78it/s] 161it [00:17, 9.25it/s] 162it [00:17, 9.40it/s] 163it [00:17, 9.52it/s] 164it [00:17, 9.08it/s] 165it [00:17, 9.25it/s] 166it [00:17, 9.38it/s] 167it [00:18, 9.51it/s] 168it [00:18, 9.61it/s] 169it [00:18, 9.68it/s] 170it [00:18, 9.72it/s] 171it [00:18, 9.06it/s] 172it [00:18, 9.01it/s] 173it [00:18, 9.06it/s] 174it [00:18, 9.18it/s] 175it [00:18, 9.33it/s] 176it [00:18, 9.42it/s] 177it [00:19, 8.92it/s] 178it [00:19, 9.10it/s] 179it [00:19, 9.26it/s] 180it [00:19, 9.37it/s] 181it [00:19, 9.45it/s] 182it [00:19, 9.50it/s] 183it [00:19, 9.47it/s] 184it [00:19, 8.92it/s] 185it [00:19, 9.13it/s] 186it [00:20, 9.24it/s] 187it [00:20, 9.23it/s] 188it [00:20, 9.36it/s] 189it [00:20, 9.52it/s] 190it [00:20, 9.62it/s] 191it [00:20, 9.69it/s] 192it [00:20, 9.22it/s] 193it [00:20, 9.38it/s] 194it [00:20, 9.47it/s] 195it [00:21, 8.97it/s] 196it [00:21, 9.24it/s] +2025-05-26 05:11:00,765 - INFO - Epoch: 80, Objective: tensor([3925.0637], device='cuda:0', grad_fn=), Loss: 0.012692895717918873, KL/n: 62.49341583251953 + 0it [00:00, ?it/s]2025-05-26 05:11:01,035 - INFO - [Epoch 081 | Batch 0000] IWAE-loss 4076.6638 | mean log_px -0.0189 | KL -3062.57 + 1it [00:00, 5.55it/s] 2it [00:00, 7.36it/s] 3it [00:00, 8.33it/s] 4it [00:00, 8.43it/s] 5it [00:00, 8.88it/s] 6it [00:00, 9.19it/s] 7it [00:00, 9.40it/s] 8it [00:00, 8.94it/s] 9it [00:01, 9.22it/s] 10it [00:01, 9.40it/s] 11it [00:01, 9.52it/s] 12it [00:01, 9.57it/s] 13it [00:01, 9.59it/s] 14it [00:01, 9.61it/s] 15it [00:01, 9.67it/s] 16it [00:01, 9.69it/s] 17it [00:01, 9.74it/s] 18it [00:01, 9.78it/s] 19it [00:02, 9.78it/s] 20it [00:02, 9.79it/s] 21it [00:02, 9.75it/s] 22it [00:02, 9.76it/s] 23it [00:02, 9.81it/s] 24it [00:02, 9.68it/s] 25it [00:02, 9.72it/s] 26it [00:02, 9.75it/s] 27it [00:02, 9.48it/s] 28it [00:02, 9.57it/s] 29it [00:03, 9.65it/s] 30it [00:03, 9.70it/s] 31it [00:03, 9.74it/s] 32it [00:03, 9.77it/s] 33it [00:03, 9.80it/s] 34it [00:03, 9.75it/s] 35it [00:03, 9.72it/s] 36it [00:03, 9.73it/s] 37it [00:03, 9.77it/s] 38it [00:04, 9.76it/s] 39it [00:04, 9.79it/s] 40it [00:04, 9.78it/s] 41it [00:04, 9.79it/s] 42it [00:04, 9.67it/s] 43it [00:04, 9.57it/s] 44it [00:04, 9.54it/s] 45it [00:04, 9.52it/s] 46it [00:04, 9.38it/s] 47it [00:04, 9.46it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.45it/s] 50it [00:05, 9.46it/s]2025-05-26 05:11:06,234 - INFO - [Epoch 081 | Batch 0050] IWAE-loss 3596.1819 | mean log_px -0.0087 | KL -3056.84 + 51it [00:05, 9.39it/s] 52it [00:05, 9.42it/s] 53it [00:05, 9.48it/s] 54it [00:05, 9.44it/s] 55it [00:05, 9.47it/s] 56it [00:05, 9.48it/s] 57it [00:06, 9.49it/s] 58it [00:06, 9.47it/s] 59it [00:06, 9.47it/s] 60it [00:06, 9.48it/s] 61it [00:06, 9.47it/s] 62it [00:06, 9.46it/s] 63it [00:06, 9.46it/s] 64it [00:06, 8.99it/s] 65it [00:06, 9.13it/s] 66it [00:06, 9.23it/s] 67it [00:07, 9.34it/s] 68it [00:07, 9.31it/s] 69it [00:07, 8.89it/s] 70it [00:07, 9.02it/s] 71it [00:07, 9.17it/s] 72it [00:07, 9.24it/s] 73it [00:07, 8.79it/s] 74it [00:07, 8.94it/s] 75it [00:07, 9.09it/s] 76it [00:08, 9.06it/s] 77it [00:08, 9.19it/s] 78it [00:08, 9.26it/s] 79it [00:08, 9.33it/s] 80it [00:08, 9.34it/s] 81it [00:08, 9.43it/s] 82it [00:08, 9.48it/s] 83it [00:08, 9.48it/s] 84it [00:08, 8.99it/s] 85it [00:09, 9.11it/s] 86it [00:09, 9.22it/s] 87it [00:09, 9.28it/s] 88it [00:09, 8.81it/s] 89it [00:09, 8.99it/s] 90it [00:09, 9.11it/s] 91it [00:09, 9.23it/s] 92it [00:09, 8.83it/s] 93it [00:09, 9.02it/s] 94it [00:10, 9.08it/s] 95it [00:10, 9.18it/s] 96it [00:10, 9.24it/s] 97it [00:10, 9.30it/s] 98it [00:10, 9.33it/s] 99it [00:10, 9.34it/s] 100it [00:10, 9.43it/s]2025-05-26 05:11:11,647 - INFO - [Epoch 081 | Batch 0100] IWAE-loss 4514.4556 | mean log_px -0.0243 | KL -3053.01 + 101it [00:10, 9.43it/s] 102it [00:10, 8.95it/s] 103it [00:11, 8.80it/s] 104it [00:11, 8.93it/s] 105it [00:11, 9.02it/s] 106it [00:11, 8.67it/s] 107it [00:11, 8.84it/s] 108it [00:11, 9.02it/s] 109it [00:11, 9.18it/s] 110it [00:11, 8.77it/s] 111it [00:11, 8.94it/s] 112it [00:12, 9.09it/s] 113it [00:12, 9.21it/s] 114it [00:12, 9.31it/s] 115it [00:12, 9.32it/s] 116it [00:12, 9.35it/s] 117it [00:12, 9.39it/s] 118it [00:12, 9.43it/s] 119it [00:12, 9.43it/s] 120it [00:12, 8.96it/s] 121it [00:13, 9.16it/s] 122it [00:13, 9.25it/s] 123it [00:13, 9.29it/s] 124it [00:13, 9.33it/s] 125it [00:13, 9.34it/s] 126it [00:13, 9.36it/s] 127it [00:13, 9.45it/s] 128it [00:13, 9.47it/s] 129it [00:13, 9.39it/s] 130it [00:13, 8.89it/s] 131it [00:14, 9.07it/s] 132it [00:14, 9.18it/s] 133it [00:14, 9.26it/s] 134it [00:14, 8.85it/s] 135it [00:14, 9.02it/s] 136it [00:14, 9.11it/s] 137it [00:14, 9.21it/s] 138it [00:14, 9.18it/s] 139it [00:14, 9.30it/s] 140it [00:15, 8.88it/s] 141it [00:15, 9.05it/s] 142it [00:15, 9.17it/s] 143it [00:15, 9.26it/s] 144it [00:15, 9.31it/s] 145it [00:15, 9.32it/s] 146it [00:15, 9.37it/s] 147it [00:15, 9.45it/s] 148it [00:15, 9.40it/s] 149it [00:16, 9.36it/s] 150it [00:16, 9.40it/s]2025-05-26 05:11:17,093 - INFO - [Epoch 081 | Batch 0150] IWAE-loss 3807.7285 | mean log_px -0.0127 | KL -3054.70 + 151it [00:16, 9.42it/s] 152it [00:16, 8.94it/s] 153it [00:16, 9.08it/s] 154it [00:16, 9.24it/s] 155it [00:16, 8.79it/s] 156it [00:16, 9.00it/s] 157it [00:16, 9.04it/s] 158it [00:17, 9.16it/s] 159it [00:17, 9.21it/s] 160it [00:17, 8.88it/s] 161it [00:17, 9.04it/s] 162it [00:17, 9.16it/s] 163it [00:17, 9.25it/s] 164it [00:17, 9.30it/s] 165it [00:17, 9.32it/s] 166it [00:17, 9.34it/s] 167it [00:17, 9.40it/s] 168it [00:18, 9.43it/s] 169it [00:18, 9.46it/s] 170it [00:18, 9.45it/s] 171it [00:18, 9.44it/s] 172it [00:18, 9.45it/s] 173it [00:18, 9.46it/s] 174it [00:18, 9.47it/s] 175it [00:18, 9.48it/s] 176it [00:18, 9.45it/s] 177it [00:19, 9.49it/s] 178it [00:19, 9.52it/s] 179it [00:19, 9.49it/s] 180it [00:19, 8.94it/s] 181it [00:19, 9.07it/s] 182it [00:19, 9.18it/s] 183it [00:19, 9.26it/s] 184it [00:19, 8.81it/s] 185it [00:19, 8.97it/s] 186it [00:20, 9.05it/s] 187it [00:20, 9.19it/s] 188it [00:20, 8.88it/s] 189it [00:20, 9.08it/s] 190it [00:20, 9.18it/s] 191it [00:20, 9.27it/s] 192it [00:20, 9.30it/s] 193it [00:20, 9.36it/s] 194it [00:20, 9.41it/s] 195it [00:21, 8.34it/s] 196it [00:21, 8.68it/s] 196it [00:21, 9.24it/s] +2025-05-26 05:11:22,115 - INFO - Epoch: 81, Objective: tensor([4405.5898], device='cuda:0', grad_fn=), Loss: 0.024367935955524445, KL/n: 62.24941635131836 + 0it [00:00, ?it/s]2025-05-26 05:11:22,574 - INFO - [Epoch 082 | Batch 0000] IWAE-loss 4408.0596 | mean log_px -0.0199 | KL -3051.39 + 1it [00:00, 5.32it/s] 2it [00:00, 6.67it/s] 3it [00:00, 7.80it/s] 4it [00:00, 8.43it/s] 5it [00:00, 8.78it/s] 6it [00:00, 8.99it/s] 7it [00:00, 9.18it/s] 8it [00:00, 9.27it/s] 9it [00:01, 9.30it/s] 10it [00:01, 9.36it/s] 11it [00:01, 9.40it/s] 12it [00:01, 9.40it/s] 13it [00:01, 9.45it/s] 14it [00:01, 9.42it/s] 15it [00:01, 8.95it/s] 16it [00:01, 9.09it/s] 17it [00:01, 9.06it/s] 18it [00:02, 9.18it/s] 19it [00:02, 9.32it/s] 20it [00:02, 8.66it/s] 21it [00:02, 8.93it/s] 22it [00:02, 9.10it/s] 23it [00:02, 9.18it/s] 24it [00:02, 9.29it/s] 25it [00:02, 9.41it/s] 26it [00:02, 9.41it/s] 27it [00:02, 9.46it/s] 28it [00:03, 9.46it/s] 29it [00:03, 9.50it/s] 30it [00:03, 9.51it/s] 31it [00:03, 9.58it/s] 32it [00:03, 9.52it/s] 33it [00:03, 9.54it/s] 34it [00:03, 9.55it/s] 35it [00:03, 9.00it/s] 36it [00:03, 9.12it/s] 37it [00:04, 9.26it/s] 38it [00:04, 9.34it/s] 39it [00:04, 9.39it/s] 40it [00:04, 9.42it/s] 41it [00:04, 9.07it/s] 42it [00:04, 9.20it/s] 43it [00:04, 9.26it/s] 44it [00:04, 8.79it/s] 45it [00:04, 8.95it/s] 46it [00:05, 9.12it/s] 47it [00:05, 9.17it/s] 48it [00:05, 8.69it/s] 49it [00:05, 8.95it/s] 50it [00:05, 9.04it/s]2025-05-26 05:11:27,992 - INFO - [Epoch 082 | Batch 0050] IWAE-loss 4216.4087 | mean log_px -0.0181 | KL -3045.86 + 51it [00:05, 9.07it/s] 52it [00:05, 9.18it/s] 53it [00:05, 8.79it/s] 54it [00:05, 9.01it/s] 55it [00:06, 9.09it/s] 56it [00:06, 9.22it/s] 57it [00:06, 8.76it/s] 58it [00:06, 8.93it/s] 59it [00:06, 8.96it/s] 60it [00:06, 9.11it/s] 61it [00:06, 8.73it/s] 62it [00:06, 8.94it/s] 63it [00:06, 8.95it/s] 64it [00:07, 8.97it/s] 65it [00:07, 8.36it/s] 66it [00:07, 8.67it/s] 67it [00:07, 8.91it/s] 68it [00:07, 9.04it/s] 69it [00:07, 8.68it/s] 70it [00:07, 8.95it/s] 71it [00:07, 9.16it/s] 72it [00:07, 9.28it/s] 73it [00:08, 8.79it/s] 74it [00:08, 8.91it/s] 75it [00:08, 9.04it/s] 76it [00:08, 8.77it/s] 77it [00:08, 8.99it/s] 78it [00:08, 9.14it/s] 79it [00:08, 8.73it/s] 80it [00:08, 8.96it/s] 81it [00:08, 9.15it/s] 82it [00:09, 9.28it/s] 83it [00:09, 8.80it/s] 84it [00:09, 8.96it/s] 85it [00:09, 9.16it/s] 86it [00:09, 9.25it/s] 87it [00:09, 9.34it/s] 88it [00:09, 9.39it/s] 89it [00:09, 8.89it/s] 90it [00:09, 9.06it/s] 91it [00:10, 9.20it/s] 92it [00:10, 9.26it/s] 93it [00:10, 8.82it/s] 94it [00:10, 9.01it/s] 95it [00:10, 9.20it/s] 96it [00:10, 9.27it/s] 97it [00:10, 9.33it/s] 98it [00:10, 9.36it/s] 99it [00:10, 9.39it/s] 100it [00:11, 9.41it/s]2025-05-26 05:11:33,518 - INFO - [Epoch 082 | Batch 0100] IWAE-loss 4081.9727 | mean log_px -0.0158 | KL -3040.89 + 101it [00:11, 9.40it/s] 102it [00:11, 9.42it/s] 103it [00:11, 9.41it/s] 104it [00:11, 9.45it/s] 105it [00:11, 9.48it/s] 106it [00:11, 9.49it/s] 107it [00:11, 9.46it/s] 108it [00:11, 8.94it/s] 109it [00:11, 9.12it/s] 110it [00:12, 9.21it/s] 111it [00:12, 9.30it/s] 112it [00:12, 8.83it/s] 113it [00:12, 9.04it/s] 114it [00:12, 9.17it/s] 115it [00:12, 9.28it/s] 116it [00:12, 8.80it/s] 117it [00:12, 9.00it/s] 118it [00:12, 9.15it/s] 119it [00:13, 9.27it/s] 120it [00:13, 9.30it/s] 121it [00:13, 9.37it/s] 122it [00:13, 8.77it/s] 123it [00:13, 8.85it/s] 124it [00:13, 9.09it/s] 125it [00:13, 8.73it/s] 126it [00:13, 9.02it/s] 127it [00:13, 9.24it/s] 128it [00:14, 9.39it/s] 129it [00:14, 9.52it/s] 130it [00:14, 9.60it/s] 131it [00:14, 9.52it/s] 132it [00:14, 8.99it/s] 133it [00:14, 9.19it/s] 134it [00:14, 9.34it/s] 135it [00:14, 9.43it/s] 136it [00:14, 8.97it/s] 137it [00:15, 9.19it/s] 138it [00:15, 9.34it/s] 139it [00:15, 9.46it/s] 140it [00:15, 8.97it/s] 141it [00:15, 9.16it/s] 142it [00:15, 9.33it/s] 143it [00:15, 9.46it/s] 144it [00:15, 8.98it/s] 145it [00:15, 9.20it/s] 146it [00:16, 9.36it/s] 147it [00:16, 9.48it/s] 148it [00:16, 9.01it/s] 149it [00:16, 9.22it/s] 150it [00:16, 9.37it/s]2025-05-26 05:11:38,944 - INFO - [Epoch 082 | Batch 0150] IWAE-loss 3857.5825 | mean log_px -0.0146 | KL -3036.50 + 151it [00:16, 9.45it/s] 152it [00:16, 8.98it/s] 153it [00:16, 9.20it/s] 154it [00:16, 9.36it/s] 155it [00:16, 9.47it/s] 156it [00:17, 8.98it/s] 157it [00:17, 9.20it/s] 158it [00:17, 9.34it/s] 159it [00:17, 9.33it/s] 160it [00:17, 8.80it/s] 161it [00:17, 9.03it/s] 162it [00:17, 9.23it/s] 163it [00:17, 9.38it/s] 164it [00:17, 8.94it/s] 165it [00:18, 9.13it/s] 166it [00:18, 9.29it/s] 167it [00:18, 9.40it/s] 168it [00:18, 8.92it/s] 169it [00:18, 9.16it/s] 170it [00:18, 9.32it/s] 171it [00:18, 9.44it/s] 172it [00:18, 8.97it/s] 173it [00:18, 9.19it/s] 174it [00:19, 9.32it/s] 175it [00:19, 9.44it/s] 176it [00:19, 8.92it/s] 177it [00:19, 9.14it/s] 178it [00:19, 9.29it/s] 179it [00:19, 9.43it/s] 180it [00:19, 8.97it/s] 181it [00:19, 9.15it/s] 182it [00:19, 9.30it/s] 183it [00:20, 9.41it/s] 184it [00:20, 8.95it/s] 185it [00:20, 9.15it/s] 186it [00:20, 9.29it/s] 187it [00:20, 9.43it/s] 188it [00:20, 8.97it/s] 189it [00:20, 9.17it/s] 190it [00:20, 9.30it/s] 191it [00:20, 9.43it/s] 192it [00:21, 9.55it/s] 193it [00:21, 9.60it/s] 194it [00:21, 9.67it/s] 195it [00:21, 8.49it/s] 196it [00:21, 8.88it/s] 196it [00:21, 9.10it/s] +2025-05-26 05:11:43,960 - INFO - Epoch: 82, Objective: tensor([3370.0046], device='cuda:0', grad_fn=), Loss: 0.005570830777287483, KL/n: 62.00031280517578 + 0it [00:00, ?it/s]2025-05-26 05:11:44,240 - INFO - [Epoch 083 | Batch 0000] IWAE-loss 4002.6240 | mean log_px -0.0153 | KL -3036.43 + 1it [00:00, 5.39it/s] 2it [00:00, 7.26it/s] 3it [00:00, 8.28it/s] 4it [00:00, 8.84it/s] 5it [00:00, 9.21it/s] 6it [00:00, 9.40it/s] 7it [00:00, 9.49it/s] 8it [00:00, 9.59it/s] 9it [00:01, 9.69it/s] 10it [00:01, 9.72it/s] 11it [00:01, 9.78it/s] 12it [00:01, 9.79it/s] 13it [00:01, 9.83it/s] 14it [00:01, 9.83it/s] 15it [00:01, 9.85it/s] 16it [00:01, 9.85it/s] 17it [00:01, 9.85it/s] 18it [00:01, 9.84it/s] 19it [00:02, 9.85it/s] 20it [00:02, 9.85it/s] 21it [00:02, 9.87it/s] 22it [00:02, 9.84it/s] 23it [00:02, 9.84it/s] 24it [00:02, 9.84it/s] 25it [00:02, 9.84it/s] 26it [00:02, 9.84it/s] 27it [00:02, 9.81it/s] 28it [00:02, 9.81it/s] 29it [00:03, 9.83it/s] 30it [00:03, 9.83it/s] 31it [00:03, 9.84it/s] 32it [00:03, 9.84it/s] 33it [00:03, 9.84it/s] 34it [00:03, 9.85it/s] 35it [00:03, 9.86it/s] 36it [00:03, 9.27it/s] 37it [00:03, 9.45it/s] 38it [00:03, 9.55it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.14it/s] 41it [00:04, 9.33it/s] 42it [00:04, 9.33it/s] 43it [00:04, 9.41it/s] 44it [00:04, 9.44it/s] 45it [00:04, 9.45it/s] 46it [00:04, 9.43it/s] 47it [00:04, 9.49it/s] 48it [00:05, 9.51it/s] 49it [00:05, 9.52it/s] 50it [00:05, 9.50it/s]2025-05-26 05:11:49,399 - INFO - [Epoch 083 | Batch 0050] IWAE-loss 3834.6262 | mean log_px -0.0148 | KL -3028.71 + 51it [00:05, 9.46it/s] 52it [00:05, 9.48it/s] 53it [00:05, 9.49it/s] 54it [00:05, 9.43it/s] 55it [00:05, 9.42it/s] 56it [00:05, 9.46it/s] 57it [00:05, 9.46it/s] 58it [00:06, 9.50it/s] 59it [00:06, 9.49it/s] 60it [00:06, 9.51it/s] 61it [00:06, 9.53it/s] 62it [00:06, 9.51it/s] 63it [00:06, 9.53it/s] 64it [00:06, 9.46it/s] 65it [00:06, 9.49it/s] 66it [00:06, 9.47it/s] 67it [00:07, 9.50it/s] 68it [00:07, 9.47it/s] 69it [00:07, 9.28it/s] 70it [00:07, 9.36it/s] 71it [00:07, 9.39it/s] 72it [00:07, 9.44it/s] 73it [00:07, 9.49it/s] 74it [00:07, 9.49it/s] 75it [00:07, 9.47it/s] 76it [00:07, 9.47it/s] 77it [00:08, 9.52it/s] 78it [00:08, 9.53it/s] 79it [00:08, 9.54it/s] 80it [00:08, 9.55it/s] 81it [00:08, 9.54it/s] 82it [00:08, 9.57it/s] 83it [00:08, 9.61it/s] 84it [00:08, 9.63it/s] 85it [00:08, 9.61it/s] 86it [00:09, 9.63it/s] 87it [00:09, 9.67it/s] 88it [00:09, 9.63it/s] 89it [00:09, 9.60it/s] 90it [00:09, 9.60it/s] 91it [00:09, 9.64it/s] 92it [00:09, 9.62it/s] 93it [00:09, 9.63it/s] 94it [00:09, 9.64it/s] 95it [00:09, 9.62it/s] 96it [00:10, 9.58it/s] 97it [00:10, 9.61it/s] 98it [00:10, 9.61it/s] 99it [00:10, 9.60it/s] 100it [00:10, 9.56it/s]2025-05-26 05:11:54,646 - INFO - [Epoch 083 | Batch 0100] IWAE-loss 4239.6172 | mean log_px -0.0240 | KL -3028.14 + 101it [00:10, 9.59it/s] 102it [00:10, 9.59it/s] 103it [00:10, 9.63it/s] 104it [00:10, 9.63it/s] 105it [00:11, 9.62it/s] 106it [00:11, 9.63it/s] 107it [00:11, 9.63it/s] 108it [00:11, 9.60it/s] 109it [00:11, 9.62it/s] 110it [00:11, 9.33it/s] 111it [00:11, 9.39it/s] 112it [00:11, 9.44it/s] 113it [00:11, 9.45it/s] 114it [00:11, 9.42it/s] 115it [00:12, 9.44it/s] 116it [00:12, 9.46it/s] 117it [00:12, 9.49it/s] 118it [00:12, 9.46it/s] 119it [00:12, 9.39it/s] 120it [00:12, 9.39it/s] 121it [00:12, 9.44it/s] 122it [00:12, 9.24it/s] 123it [00:12, 9.33it/s] 124it [00:13, 9.37it/s] 125it [00:13, 9.38it/s] 126it [00:13, 9.35it/s] 127it [00:13, 9.40it/s] 128it [00:13, 9.43it/s] 129it [00:13, 9.45it/s] 130it [00:13, 9.50it/s] 131it [00:13, 9.48it/s] 132it [00:13, 9.49it/s] 133it [00:13, 9.50it/s] 134it [00:14, 9.48it/s] 135it [00:14, 9.47it/s] 136it [00:14, 9.45it/s] 137it [00:14, 9.43it/s] 138it [00:14, 9.41it/s] 139it [00:14, 9.45it/s] 140it [00:14, 9.45it/s] 141it [00:14, 9.47it/s] 142it [00:14, 9.46it/s] 143it [00:15, 9.27it/s] 144it [00:15, 9.31it/s] 145it [00:15, 9.38it/s] 146it [00:15, 9.41it/s] 147it [00:15, 9.42it/s] 148it [00:15, 9.44it/s] 149it [00:15, 9.43it/s] 150it [00:15, 9.40it/s]2025-05-26 05:11:59,940 - INFO - [Epoch 083 | Batch 0150] IWAE-loss 3907.8083 | mean log_px -0.0154 | KL -3022.59 + 151it [00:15, 9.38it/s] 152it [00:15, 9.42it/s] 153it [00:16, 9.41it/s] 154it [00:16, 9.44it/s] 155it [00:16, 9.49it/s] 156it [00:16, 9.48it/s] 157it [00:16, 9.48it/s] 158it [00:16, 9.22it/s] 159it [00:16, 9.10it/s] 160it [00:16, 9.05it/s] 161it [00:16, 9.22it/s] 162it [00:17, 9.33it/s] 163it [00:17, 9.16it/s] 164it [00:17, 8.82it/s] 165it [00:17, 9.05it/s] 166it [00:17, 9.20it/s] 167it [00:17, 9.32it/s] 168it [00:17, 9.42it/s] 169it [00:17, 9.46it/s] 170it [00:17, 9.48it/s] 171it [00:18, 9.42it/s] 172it [00:18, 9.41it/s] 173it [00:18, 9.32it/s] 174it [00:18, 9.35it/s] 175it [00:18, 9.39it/s] 176it [00:18, 9.30it/s] 177it [00:18, 9.27it/s] 178it [00:18, 9.23it/s] 179it [00:18, 9.31it/s] 180it [00:19, 9.37it/s] 181it [00:19, 9.42it/s] 182it [00:19, 9.44it/s] 183it [00:19, 9.41it/s] 184it [00:19, 8.91it/s] 185it [00:19, 8.97it/s] 186it [00:19, 8.84it/s] 187it [00:19, 8.71it/s] 188it [00:19, 8.94it/s] 189it [00:20, 8.89it/s] 190it [00:20, 8.84it/s] 191it [00:20, 8.95it/s] 192it [00:20, 9.05it/s] 193it [00:20, 9.16it/s] 194it [00:20, 9.23it/s] 195it [00:20, 8.71it/s] 196it [00:20, 8.95it/s] 196it [00:20, 9.40it/s] +2025-05-26 05:12:04,947 - INFO - Epoch: 83, Objective: tensor([3918.3167], device='cuda:0', grad_fn=), Loss: 0.013034864328801632, KL/n: 61.751060485839844 + 0it [00:00, ?it/s]2025-05-26 05:12:05,409 - INFO - [Epoch 084 | Batch 0000] IWAE-loss 3879.0281 | mean log_px -0.0132 | KL -3020.57 + 1it [00:00, 4.68it/s] 2it [00:00, 6.64it/s] 3it [00:00, 7.78it/s] 4it [00:00, 8.37it/s] 5it [00:00, 8.77it/s] 6it [00:00, 9.02it/s] 7it [00:00, 9.24it/s] 8it [00:00, 9.33it/s] 9it [00:01, 8.63it/s] 10it [00:01, 8.92it/s] 11it [00:01, 9.15it/s] 12it [00:01, 9.30it/s] 13it [00:01, 8.89it/s] 14it [00:01, 9.15it/s] 15it [00:01, 9.37it/s] 16it [00:01, 9.50it/s] 17it [00:01, 9.02it/s] 18it [00:02, 9.23it/s] 19it [00:02, 9.38it/s] 20it [00:02, 9.48it/s] 21it [00:02, 8.94it/s] 22it [00:02, 9.19it/s] 23it [00:02, 9.40it/s] 24it [00:02, 9.53it/s] 25it [00:02, 9.03it/s] 26it [00:02, 9.27it/s] 27it [00:03, 9.46it/s] 28it [00:03, 9.55it/s] 29it [00:03, 9.18it/s] 30it [00:03, 9.37it/s] 31it [00:03, 9.52it/s] 32it [00:03, 9.61it/s] 33it [00:03, 9.70it/s] 34it [00:03, 9.73it/s] 35it [00:03, 9.78it/s] 36it [00:03, 9.78it/s] 37it [00:04, 9.80it/s] 38it [00:04, 9.80it/s] 39it [00:04, 9.84it/s] 40it [00:04, 9.77it/s] 41it [00:04, 9.81it/s] 42it [00:04, 9.81it/s] 43it [00:04, 9.81it/s] 44it [00:04, 9.83it/s] 45it [00:04, 9.84it/s] 46it [00:04, 9.82it/s] 47it [00:05, 9.20it/s] 48it [00:05, 9.37it/s] 49it [00:05, 9.53it/s] 50it [00:05, 9.44it/s]2025-05-26 05:12:10,720 - INFO - [Epoch 084 | Batch 0050] IWAE-loss 3803.3413 | mean log_px -0.0113 | KL -3022.37 + 51it [00:05, 9.46it/s] 52it [00:05, 9.48it/s] 53it [00:05, 9.49it/s] 54it [00:05, 9.48it/s] 55it [00:05, 9.49it/s] 56it [00:06, 9.46it/s] 57it [00:06, 9.47it/s] 58it [00:06, 9.45it/s] 59it [00:06, 9.37it/s] 60it [00:06, 9.39it/s] 61it [00:06, 9.43it/s] 62it [00:06, 9.46it/s] 63it [00:06, 9.54it/s] 64it [00:06, 9.51it/s] 65it [00:06, 9.50it/s] 66it [00:07, 8.89it/s] 67it [00:07, 9.09it/s] 68it [00:07, 9.20it/s] 69it [00:07, 9.36it/s] 70it [00:07, 9.50it/s] 71it [00:07, 9.50it/s] 72it [00:07, 9.51it/s] 73it [00:07, 9.57it/s] 74it [00:07, 9.54it/s] 75it [00:08, 9.54it/s] 76it [00:08, 9.51it/s] 77it [00:08, 9.50it/s] 78it [00:08, 9.14it/s] 79it [00:08, 9.23it/s] 80it [00:08, 9.34it/s] 81it [00:08, 9.39it/s] 82it [00:08, 9.44it/s] 83it [00:08, 9.27it/s] 84it [00:09, 9.31it/s] 85it [00:09, 9.36it/s] 86it [00:09, 9.37it/s] 87it [00:09, 9.24it/s] 88it [00:09, 9.34it/s] 89it [00:09, 9.35it/s] 90it [00:09, 9.42it/s] 91it [00:09, 9.46it/s] 92it [00:09, 9.51it/s] 93it [00:09, 9.48it/s] 94it [00:10, 9.45it/s] 95it [00:10, 9.48it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.48it/s] 98it [00:10, 9.48it/s] 99it [00:10, 9.47it/s] 100it [00:10, 9.48it/s]2025-05-26 05:12:16,031 - INFO - [Epoch 084 | Batch 0100] IWAE-loss 6303.6221 | mean log_px -0.0504 | KL -3017.94 + 101it [00:10, 9.47it/s] 102it [00:10, 9.49it/s] 103it [00:11, 9.48it/s] 104it [00:11, 9.49it/s] 105it [00:11, 9.49it/s] 106it [00:11, 9.50it/s] 107it [00:11, 9.51it/s] 108it [00:11, 9.51it/s] 109it [00:11, 9.50it/s] 110it [00:11, 9.48it/s] 111it [00:11, 9.53it/s] 112it [00:11, 9.47it/s] 113it [00:12, 9.50it/s] 114it [00:12, 9.50it/s] 115it [00:12, 9.51it/s] 116it [00:12, 9.50it/s] 117it [00:12, 9.46it/s] 118it [00:12, 9.43it/s] 119it [00:12, 9.42it/s] 120it [00:12, 9.48it/s] 121it [00:12, 9.50it/s] 122it [00:13, 9.47it/s] 123it [00:13, 9.52it/s] 124it [00:13, 9.49it/s] 125it [00:13, 9.44it/s] 126it [00:13, 9.50it/s] 127it [00:13, 9.50it/s] 128it [00:13, 9.48it/s] 129it [00:13, 9.50it/s] 130it [00:13, 9.47it/s] 131it [00:13, 9.47it/s] 132it [00:14, 9.45it/s] 133it [00:14, 9.47it/s] 134it [00:14, 9.47it/s] 135it [00:14, 9.49it/s] 136it [00:14, 9.51it/s] 137it [00:14, 9.62it/s] 138it [00:14, 9.71it/s] 139it [00:14, 9.76it/s] 140it [00:14, 9.78it/s] 141it [00:15, 9.80it/s] 142it [00:15, 9.82it/s] 143it [00:15, 9.86it/s] 144it [00:15, 9.88it/s] 145it [00:15, 9.90it/s] 146it [00:15, 9.89it/s] 147it [00:15, 9.89it/s] 148it [00:15, 9.89it/s] 149it [00:15, 9.90it/s] 150it [00:15, 9.90it/s]2025-05-26 05:12:21,239 - INFO - [Epoch 084 | Batch 0150] IWAE-loss 3802.7544 | mean log_px -0.0130 | KL -3015.59 + 151it [00:16, 9.27it/s] 152it [00:16, 9.45it/s] 153it [00:16, 9.61it/s] 154it [00:16, 9.69it/s] 155it [00:16, 9.78it/s] 156it [00:16, 9.84it/s] 157it [00:16, 9.88it/s] 158it [00:16, 9.89it/s] 159it [00:16, 9.91it/s] 160it [00:16, 9.41it/s] 161it [00:17, 9.54it/s] 162it [00:17, 9.66it/s] 163it [00:17, 9.75it/s] 164it [00:17, 9.79it/s] 165it [00:17, 9.84it/s] 166it [00:17, 9.86it/s] 167it [00:17, 9.89it/s] 168it [00:17, 9.89it/s] 169it [00:17, 9.89it/s] 170it [00:17, 9.90it/s] 171it [00:18, 9.90it/s] 172it [00:18, 9.90it/s] 173it [00:18, 9.90it/s] 174it [00:18, 9.92it/s] 176it [00:18, 9.98it/s] 177it [00:18, 9.98it/s] 178it [00:18, 9.97it/s] 179it [00:18, 9.97it/s] 180it [00:18, 9.97it/s] 181it [00:19, 9.33it/s] 182it [00:19, 9.49it/s] 183it [00:19, 9.63it/s] 184it [00:19, 9.71it/s] 185it [00:19, 9.79it/s] 186it [00:19, 9.83it/s] 187it [00:19, 9.84it/s] 188it [00:19, 9.87it/s] 190it [00:20, 9.93it/s] 191it [00:20, 9.94it/s] 192it [00:20, 9.76it/s] 193it [00:20, 9.80it/s] 194it [00:20, 9.83it/s] 195it [00:20, 9.30it/s] 196it [00:20, 9.47it/s] +2025-05-26 05:12:25,960 - INFO - Epoch: 84, Objective: tensor([4500.4517], device='cuda:0', grad_fn=), Loss: 0.03310453146696091, KL/n: 61.500885009765625 + 0it [00:00, ?it/s]2025-05-26 05:12:26,231 - INFO - [Epoch 085 | Batch 0000] IWAE-loss 3595.1533 | mean log_px -0.0110 | KL -3013.15 + 1it [00:00, 4.85it/s] 3it [00:00, 7.90it/s] 4it [00:00, 7.99it/s] 6it [00:00, 8.92it/s] 8it [00:00, 9.37it/s] 10it [00:01, 9.64it/s] 12it [00:01, 9.80it/s] 13it [00:01, 9.59it/s] 15it [00:01, 9.77it/s] 17it [00:01, 9.90it/s] 19it [00:02, 9.97it/s] 21it [00:02, 9.66it/s] 23it [00:02, 9.79it/s] 25it [00:02, 9.90it/s] 27it [00:02, 9.97it/s] 29it [00:03, 10.02it/s] 31it [00:03, 10.06it/s] 33it [00:03, 10.09it/s] 35it [00:03, 10.10it/s] 37it [00:03, 10.10it/s] 39it [00:04, 10.11it/s] 41it [00:04, 10.10it/s] 43it [00:04, 10.10it/s] 45it [00:04, 10.10it/s] 47it [00:04, 10.13it/s] 49it [00:05, 10.13it/s]2025-05-26 05:12:31,257 - INFO - [Epoch 085 | Batch 0050] IWAE-loss 3756.6094 | mean log_px -0.0141 | KL -3010.08 + 51it [00:05, 10.12it/s] 53it [00:05, 10.12it/s] 55it [00:05, 10.11it/s] 57it [00:05, 10.12it/s] 59it [00:06, 10.07it/s] 61it [00:06, 9.71it/s] 62it [00:06, 9.71it/s] 63it [00:06, 9.73it/s] 64it [00:06, 9.73it/s] 65it [00:06, 9.75it/s] 66it [00:06, 9.75it/s] 67it [00:06, 9.75it/s] 68it [00:06, 9.76it/s] 69it [00:07, 9.76it/s] 70it [00:07, 9.74it/s] 71it [00:07, 9.15it/s] 72it [00:07, 9.38it/s] 74it [00:07, 9.70it/s] 76it [00:07, 9.87it/s] 78it [00:07, 9.97it/s] 80it [00:08, 10.03it/s] 81it [00:08, 9.70it/s] 82it [00:08, 9.76it/s] 83it [00:08, 9.71it/s] 85it [00:08, 9.87it/s] 87it [00:08, 9.96it/s] 89it [00:09, 9.76it/s] 91it [00:09, 9.87it/s] 93it [00:09, 9.94it/s] 94it [00:09, 9.59it/s] 96it [00:09, 9.77it/s] 98it [00:10, 9.57it/s] 99it [00:10, 9.63it/s] 100it [00:10, 9.67it/s]2025-05-26 05:12:36,375 - INFO - [Epoch 085 | Batch 0100] IWAE-loss 3645.5867 | mean log_px -0.0103 | KL -3006.17 + 101it [00:10, 9.73it/s] 103it [00:10, 9.45it/s] 104it [00:10, 9.56it/s] 105it [00:10, 9.59it/s] 107it [00:10, 9.80it/s] 109it [00:11, 9.91it/s] 111it [00:11, 9.98it/s] 113it [00:11, 10.03it/s] 115it [00:11, 10.07it/s] 117it [00:11, 10.09it/s] 119it [00:12, 10.11it/s] 121it [00:12, 9.76it/s] 123it [00:12, 9.88it/s] 125it [00:12, 9.96it/s] 127it [00:12, 10.00it/s] 129it [00:13, 10.04it/s] 131it [00:13, 10.07it/s] 133it [00:13, 10.01it/s] 135it [00:13, 9.71it/s] 136it [00:13, 9.76it/s] 138it [00:14, 9.89it/s] 140it [00:14, 9.97it/s] 142it [00:14, 10.03it/s] 144it [00:14, 10.06it/s] 146it [00:14, 10.04it/s] 148it [00:15, 10.06it/s] 150it [00:15, 10.07it/s]2025-05-26 05:12:41,397 - INFO - [Epoch 085 | Batch 0150] IWAE-loss 4150.4175 | mean log_px -0.0174 | KL -3003.18 + 152it [00:15, 10.07it/s] 154it [00:15, 10.08it/s] 156it [00:15, 10.09it/s] 158it [00:16, 10.08it/s] 160it [00:16, 9.74it/s] 162it [00:16, 9.51it/s] 164it [00:16, 9.68it/s] 166it [00:16, 9.80it/s] 167it [00:16, 9.55it/s] 169it [00:17, 9.71it/s] 171it [00:17, 9.84it/s] 173it [00:17, 9.58it/s] 175it [00:17, 9.74it/s] 177it [00:18, 9.85it/s] 179it [00:18, 9.92it/s] 181it [00:18, 9.98it/s] 183it [00:18, 10.02it/s] 185it [00:18, 10.05it/s] 187it [00:19, 10.06it/s] 189it [00:19, 10.04it/s] 191it [00:19, 10.06it/s] 193it [00:19, 10.08it/s] 195it [00:19, 9.82it/s] 196it [00:19, 9.82it/s] +2025-05-26 05:12:46,054 - INFO - Epoch: 85, Objective: tensor([3568.9839], device='cuda:0', grad_fn=), Loss: 0.01087101548910141, KL/n: 61.26937484741211 + 0it [00:00, ?it/s]2025-05-26 05:12:46,521 - INFO - [Epoch 086 | Batch 0000] IWAE-loss 3738.7234 | mean log_px -0.0156 | KL -3002.08 + 1it [00:00, 4.62it/s] 2it [00:00, 6.76it/s] 4it [00:00, 8.49it/s] 5it [00:00, 8.86it/s] 6it [00:00, 9.16it/s] 7it [00:00, 9.40it/s] 8it [00:00, 9.55it/s] 10it [00:01, 9.77it/s] 12it [00:01, 9.88it/s] 14it [00:01, 9.93it/s] 16it [00:01, 9.96it/s] 18it [00:01, 9.93it/s] 20it [00:02, 9.95it/s] 22it [00:02, 9.97it/s] 24it [00:02, 10.00it/s] 25it [00:02, 9.69it/s] 26it [00:02, 9.74it/s] 27it [00:02, 9.79it/s] 28it [00:02, 9.82it/s] 29it [00:03, 9.32it/s] 30it [00:03, 9.49it/s] 31it [00:03, 9.62it/s] 32it [00:03, 9.69it/s] 33it [00:03, 9.78it/s] 34it [00:03, 9.81it/s] 35it [00:03, 9.87it/s] 36it [00:03, 9.86it/s] 38it [00:03, 9.92it/s] 39it [00:04, 9.94it/s] 40it [00:04, 9.91it/s] 42it [00:04, 9.96it/s] 44it [00:04, 10.00it/s] 46it [00:04, 10.01it/s] 47it [00:04, 10.00it/s] 48it [00:04, 9.98it/s] 49it [00:05, 9.57it/s] 50it [00:05, 9.66it/s]2025-05-26 05:12:51,617 - INFO - [Epoch 086 | Batch 0050] IWAE-loss 3615.4333 | mean log_px -0.0113 | KL -2999.07 + 51it [00:05, 9.73it/s] 52it [00:05, 9.79it/s] 54it [00:05, 9.91it/s] 56it [00:05, 9.95it/s] 57it [00:05, 9.96it/s] 58it [00:05, 9.93it/s] 59it [00:06, 9.94it/s] 60it [00:06, 9.94it/s] 62it [00:06, 9.98it/s] 64it [00:06, 9.93it/s] 65it [00:06, 9.89it/s] 66it [00:06, 9.87it/s] 68it [00:06, 9.94it/s] 70it [00:07, 9.98it/s] 71it [00:07, 9.98it/s] 72it [00:07, 9.97it/s] 73it [00:07, 9.77it/s] 74it [00:07, 9.39it/s] 76it [00:07, 9.64it/s] 78it [00:08, 9.78it/s] 80it [00:08, 9.87it/s] 82it [00:08, 9.92it/s] 84it [00:08, 9.96it/s] 86it [00:08, 9.99it/s] 88it [00:09, 10.00it/s] 90it [00:09, 10.01it/s] 92it [00:09, 10.02it/s] 94it [00:09, 10.03it/s] 96it [00:09, 10.03it/s] 98it [00:10, 10.04it/s] 100it [00:10, 10.03it/s]2025-05-26 05:12:56,644 - INFO - [Epoch 086 | Batch 0100] IWAE-loss 4592.9512 | mean log_px -0.0254 | KL -2993.21 + 102it [00:10, 10.01it/s] 104it [00:10, 10.01it/s] 106it [00:10, 10.01it/s] 108it [00:11, 9.74it/s] 110it [00:11, 9.82it/s] 112it [00:11, 9.89it/s] 113it [00:11, 9.91it/s] 114it [00:11, 9.93it/s] 116it [00:11, 9.97it/s] 117it [00:11, 9.51it/s] 118it [00:12, 9.61it/s] 120it [00:12, 9.77it/s] 122it [00:12, 9.86it/s] 123it [00:12, 9.89it/s] 124it [00:12, 9.91it/s] 126it [00:12, 9.97it/s] 128it [00:13, 10.00it/s] 130it [00:13, 9.92it/s] 131it [00:13, 9.92it/s] 132it [00:13, 9.92it/s] 133it [00:13, 9.94it/s] 134it [00:13, 9.94it/s] 136it [00:13, 9.98it/s] 137it [00:13, 9.56it/s] 138it [00:14, 9.66it/s] 140it [00:14, 9.80it/s] 141it [00:14, 9.82it/s] 142it [00:14, 9.84it/s] 144it [00:14, 9.90it/s] 146it [00:14, 9.95it/s] 147it [00:14, 9.91it/s] 149it [00:15, 9.97it/s]2025-05-26 05:13:01,708 - INFO - [Epoch 086 | Batch 0150] IWAE-loss 3799.1528 | mean log_px -0.0115 | KL -2990.14 + 151it [00:15, 9.98it/s] 153it [00:15, 10.01it/s] 154it [00:15, 9.66it/s] 156it [00:15, 9.79it/s] 157it [00:16, 9.42it/s] 159it [00:16, 9.64it/s] 160it [00:16, 9.69it/s] 162it [00:16, 9.84it/s] 164it [00:16, 9.91it/s] 166it [00:16, 9.97it/s] 167it [00:17, 9.94it/s] 168it [00:17, 9.84it/s] 169it [00:17, 9.30it/s] 170it [00:17, 9.36it/s] 171it [00:17, 9.52it/s] 172it [00:17, 9.63it/s] 173it [00:17, 9.72it/s] 174it [00:17, 9.78it/s] 176it [00:17, 9.38it/s] 178it [00:18, 9.62it/s] 180it [00:18, 9.74it/s] 182it [00:18, 9.54it/s] 183it [00:18, 9.62it/s] 184it [00:18, 9.61it/s] 185it [00:18, 9.68it/s] 187it [00:19, 9.82it/s] 189it [00:19, 9.51it/s] 190it [00:19, 9.60it/s] 192it [00:19, 9.76it/s] 194it [00:19, 9.86it/s] 195it [00:19, 9.13it/s] 196it [00:20, 9.74it/s] +2025-05-26 05:13:06,494 - INFO - Epoch: 86, Objective: tensor([3665.3276], device='cuda:0', grad_fn=), Loss: 0.01617186702787876, KL/n: 61.00396728515625 + 0it [00:00, ?it/s]2025-05-26 05:13:06,762 - INFO - [Epoch 087 | Batch 0000] IWAE-loss 3902.4707 | mean log_px -0.0153 | KL -2986.10 + 1it [00:00, 5.52it/s] 2it [00:00, 7.46it/s] 4it [00:00, 8.34it/s] 6it [00:00, 9.07it/s] 7it [00:00, 9.28it/s] 9it [00:01, 9.60it/s] 11it [00:01, 9.78it/s] 13it [00:01, 9.89it/s] 15it [00:01, 9.96it/s] 16it [00:01, 9.55it/s] 18it [00:01, 9.73it/s] 19it [00:02, 9.78it/s] 20it [00:02, 9.82it/s] 22it [00:02, 9.92it/s] 24it [00:02, 9.96it/s] 26it [00:02, 9.98it/s] 27it [00:02, 9.61it/s] 29it [00:03, 9.78it/s] 31it [00:03, 9.87it/s] 32it [00:03, 9.89it/s] 34it [00:03, 9.95it/s] 35it [00:03, 9.95it/s] 36it [00:03, 9.95it/s] 38it [00:03, 10.00it/s] 40it [00:04, 10.02it/s] 42it [00:04, 9.99it/s] 43it [00:04, 9.95it/s] 44it [00:04, 9.96it/s] 46it [00:04, 9.99it/s] 48it [00:04, 10.01it/s] 50it [00:05, 10.02it/s]2025-05-26 05:13:11,815 - INFO - [Epoch 087 | Batch 0050] IWAE-loss 4207.4248 | mean log_px -0.0193 | KL -2987.37 + 52it [00:05, 9.97it/s] 53it [00:05, 9.66it/s] 54it [00:05, 9.67it/s] 56it [00:05, 9.79it/s] 58it [00:05, 9.88it/s] 59it [00:06, 9.89it/s] 60it [00:06, 9.91it/s] 61it [00:06, 9.92it/s] 62it [00:06, 9.93it/s] 64it [00:06, 9.97it/s] 65it [00:06, 9.59it/s] 67it [00:06, 9.77it/s] 68it [00:06, 9.81it/s] 70it [00:07, 9.91it/s] 72it [00:07, 9.63it/s] 74it [00:07, 9.77it/s] 76it [00:07, 9.87it/s] 78it [00:07, 9.93it/s] 79it [00:08, 9.94it/s] 81it [00:08, 9.98it/s] 82it [00:08, 9.98it/s] 84it [00:08, 10.01it/s] 86it [00:08, 10.02it/s] 88it [00:08, 10.03it/s] 90it [00:09, 10.04it/s] 92it [00:09, 10.05it/s] 94it [00:09, 10.04it/s] 96it [00:09, 9.70it/s] 98it [00:09, 9.79it/s] 100it [00:10, 9.86it/s]2025-05-26 05:13:16,883 - INFO - [Epoch 087 | Batch 0100] IWAE-loss 3976.6338 | mean log_px -0.0192 | KL -2984.05 + 101it [00:10, 9.86it/s] 102it [00:10, 9.45it/s] 103it [00:10, 9.56it/s] 104it [00:10, 9.66it/s] 105it [00:10, 9.74it/s] 106it [00:10, 9.80it/s] 108it [00:11, 9.90it/s] 110it [00:11, 9.96it/s] 112it [00:11, 9.99it/s] 114it [00:11, 10.00it/s] 115it [00:11, 9.57it/s] 116it [00:11, 9.65it/s] 118it [00:12, 9.81it/s] 120it [00:12, 9.85it/s] 121it [00:12, 9.85it/s] 122it [00:12, 9.83it/s] 123it [00:12, 9.84it/s] 124it [00:12, 9.84it/s] 125it [00:12, 9.85it/s] 126it [00:12, 9.83it/s] 127it [00:12, 9.84it/s] 128it [00:13, 9.82it/s] 129it [00:13, 9.84it/s] 130it [00:13, 9.82it/s] 131it [00:13, 9.82it/s] 132it [00:13, 9.81it/s] 133it [00:13, 9.83it/s] 134it [00:13, 9.82it/s] 135it [00:13, 9.84it/s] 136it [00:13, 9.82it/s] 137it [00:13, 9.84it/s] 138it [00:14, 9.81it/s] 139it [00:14, 9.83it/s] 140it [00:14, 9.81it/s] 141it [00:14, 9.82it/s] 142it [00:14, 9.81it/s] 143it [00:14, 9.82it/s] 144it [00:14, 9.82it/s] 145it [00:14, 9.85it/s] 146it [00:14, 9.84it/s] 147it [00:14, 9.85it/s] 148it [00:15, 9.83it/s] 149it [00:15, 9.85it/s] 150it [00:15, 9.83it/s]2025-05-26 05:13:21,981 - INFO - [Epoch 087 | Batch 0150] IWAE-loss 3641.0764 | mean log_px -0.0103 | KL -2975.16 + 151it [00:15, 9.81it/s] 152it [00:15, 9.80it/s] 153it [00:15, 9.81it/s] 154it [00:15, 9.79it/s] 155it [00:15, 9.67it/s] 156it [00:15, 9.68it/s] 157it [00:16, 9.64it/s] 158it [00:16, 9.68it/s] 159it [00:16, 9.72it/s] 160it [00:16, 9.72it/s] 161it [00:16, 9.76it/s] 162it [00:16, 9.76it/s] 163it [00:16, 9.78it/s] 164it [00:16, 9.77it/s] 165it [00:16, 9.78it/s] 166it [00:16, 9.80it/s] 167it [00:17, 9.80it/s] 168it [00:17, 9.80it/s] 169it [00:17, 9.82it/s] 170it [00:17, 9.82it/s] 171it [00:17, 9.82it/s] 172it [00:17, 9.80it/s] 173it [00:17, 9.82it/s] 174it [00:17, 9.81it/s] 175it [00:17, 9.83it/s] 176it [00:17, 9.83it/s] 177it [00:18, 9.86it/s] 178it [00:18, 9.84it/s] 179it [00:18, 9.87it/s] 180it [00:18, 9.86it/s] 181it [00:18, 9.87it/s] 182it [00:18, 9.86it/s] 183it [00:18, 9.87it/s] 184it [00:18, 9.85it/s] 185it [00:18, 9.86it/s] 186it [00:18, 9.85it/s] 187it [00:19, 9.86it/s] 188it [00:19, 9.85it/s] 189it [00:19, 9.85it/s] 190it [00:19, 9.85it/s] 191it [00:19, 9.84it/s] 192it [00:19, 9.85it/s] 193it [00:19, 9.85it/s] 194it [00:19, 9.84it/s] 195it [00:19, 9.38it/s] 196it [00:20, 9.77it/s] +2025-05-26 05:13:26,682 - INFO - Epoch: 87, Objective: tensor([3995.7356], device='cuda:0', grad_fn=), Loss: 0.013150476850569248, KL/n: 60.77505874633789 + 0it [00:00, ?it/s]2025-05-26 05:13:27,137 - INFO - [Epoch 088 | Batch 0000] IWAE-loss 3533.7141 | mean log_px -0.0108 | KL -2978.48 + 1it [00:00, 5.48it/s] 2it [00:00, 7.36it/s] 3it [00:00, 8.32it/s] 4it [00:00, 8.87it/s] 5it [00:00, 9.22it/s] 6it [00:00, 9.43it/s] 7it [00:00, 9.55it/s] 8it [00:00, 9.64it/s] 9it [00:00, 9.67it/s] 10it [00:01, 9.69it/s] 11it [00:01, 9.71it/s] 12it [00:01, 9.70it/s] 13it [00:01, 9.73it/s] 14it [00:01, 9.70it/s] 15it [00:01, 9.73it/s] 16it [00:01, 9.73it/s] 17it [00:01, 9.72it/s] 18it [00:01, 9.69it/s] 19it [00:02, 9.72it/s] 20it [00:02, 9.68it/s] 21it [00:02, 9.72it/s] 22it [00:02, 9.70it/s] 23it [00:02, 9.72it/s] 24it [00:02, 9.71it/s] 25it [00:02, 9.69it/s] 26it [00:02, 9.65it/s] 27it [00:02, 9.66it/s] 28it [00:02, 9.65it/s] 29it [00:03, 9.65it/s] 30it [00:03, 9.52it/s] 31it [00:03, 9.56it/s] 32it [00:03, 9.61it/s] 33it [00:03, 9.65it/s] 34it [00:03, 9.64it/s] 35it [00:03, 9.68it/s] 36it [00:03, 9.67it/s] 37it [00:03, 9.70it/s] 38it [00:03, 9.70it/s] 39it [00:04, 9.72it/s] 40it [00:04, 9.71it/s] 41it [00:04, 9.73it/s] 42it [00:04, 9.73it/s] 43it [00:04, 9.72it/s] 44it [00:04, 9.70it/s] 45it [00:04, 9.76it/s] 46it [00:04, 9.75it/s] 47it [00:04, 9.77it/s] 48it [00:05, 9.76it/s] 49it [00:05, 9.75it/s] 50it [00:05, 9.78it/s]2025-05-26 05:13:32,282 - INFO - [Epoch 088 | Batch 0050] IWAE-loss 4089.7800 | mean log_px -0.0202 | KL -2976.60 + 51it [00:05, 9.74it/s] 52it [00:05, 9.73it/s] 53it [00:05, 9.73it/s] 54it [00:05, 9.70it/s] 55it [00:05, 9.75it/s] 56it [00:05, 9.72it/s] 57it [00:05, 9.73it/s] 58it [00:06, 9.74it/s] 59it [00:06, 9.75it/s] 60it [00:06, 9.73it/s] 61it [00:06, 9.73it/s] 62it [00:06, 9.72it/s] 63it [00:06, 9.71it/s] 64it [00:06, 9.71it/s] 65it [00:06, 9.56it/s] 66it [00:06, 9.61it/s] 67it [00:06, 9.65it/s] 68it [00:07, 9.68it/s] 69it [00:07, 9.72it/s] 70it [00:07, 9.71it/s] 71it [00:07, 9.74it/s] 72it [00:07, 9.73it/s] 73it [00:07, 9.74it/s] 74it [00:07, 9.72it/s] 75it [00:07, 9.65it/s] 76it [00:07, 9.52it/s] 77it [00:08, 9.33it/s] 78it [00:08, 9.42it/s] 79it [00:08, 9.51it/s] 80it [00:08, 9.56it/s] 81it [00:08, 9.63it/s] 82it [00:08, 9.65it/s] 83it [00:08, 9.67it/s] 84it [00:08, 9.68it/s] 85it [00:08, 9.72it/s] 86it [00:08, 9.69it/s] 87it [00:09, 9.58it/s] 88it [00:09, 9.58it/s] 89it [00:09, 9.64it/s] 90it [00:09, 9.65it/s] 91it [00:09, 9.67it/s] 92it [00:09, 9.68it/s] 93it [00:09, 9.70it/s] 94it [00:09, 9.69it/s] 95it [00:09, 9.69it/s] 96it [00:09, 9.69it/s] 97it [00:10, 9.66it/s] 98it [00:10, 9.66it/s] 99it [00:10, 9.67it/s] 100it [00:10, 9.70it/s]2025-05-26 05:13:37,456 - INFO - [Epoch 088 | Batch 0100] IWAE-loss 3568.9946 | mean log_px -0.0101 | KL -2965.73 + 101it [00:10, 9.70it/s] 102it [00:10, 9.71it/s] 103it [00:10, 9.72it/s] 104it [00:10, 9.68it/s] 105it [00:10, 9.70it/s] 106it [00:11, 9.68it/s] 107it [00:11, 9.71it/s] 108it [00:11, 9.71it/s] 109it [00:11, 9.73it/s] 110it [00:11, 9.74it/s] 111it [00:11, 9.73it/s] 112it [00:11, 9.74it/s] 113it [00:11, 9.79it/s] 114it [00:11, 9.77it/s] 115it [00:11, 9.80it/s] 116it [00:12, 9.81it/s] 117it [00:12, 9.82it/s] 118it [00:12, 9.82it/s] 119it [00:12, 9.81it/s] 120it [00:12, 9.78it/s] 121it [00:12, 9.77it/s] 122it [00:12, 9.78it/s] 123it [00:12, 9.81it/s] 124it [00:12, 9.81it/s] 125it [00:12, 9.81it/s] 126it [00:13, 9.82it/s] 127it [00:13, 9.83it/s] 128it [00:13, 9.83it/s] 129it [00:13, 9.84it/s] 130it [00:13, 9.83it/s] 131it [00:13, 9.82it/s] 132it [00:13, 9.80it/s] 133it [00:13, 9.78it/s] 134it [00:13, 9.77it/s] 135it [00:13, 9.76it/s] 136it [00:14, 9.76it/s] 137it [00:14, 9.79it/s] 138it [00:14, 9.78it/s] 139it [00:14, 9.79it/s] 140it [00:14, 9.79it/s] 141it [00:14, 9.82it/s] 142it [00:14, 9.76it/s] 143it [00:14, 9.79it/s] 144it [00:14, 9.80it/s] 145it [00:14, 9.81it/s] 146it [00:15, 9.81it/s] 147it [00:15, 9.83it/s] 148it [00:15, 9.77it/s] 149it [00:15, 9.81it/s] 150it [00:15, 9.82it/s]2025-05-26 05:13:42,566 - INFO - [Epoch 088 | Batch 0150] IWAE-loss 3878.7766 | mean log_px -0.0216 | KL -2965.69 + 151it [00:15, 9.75it/s] 152it [00:15, 9.75it/s] 153it [00:15, 9.79it/s] 154it [00:15, 9.80it/s] 155it [00:16, 9.83it/s] 156it [00:16, 9.83it/s] 157it [00:16, 9.86it/s] 158it [00:16, 9.81it/s] 159it [00:16, 9.83it/s] 160it [00:16, 9.79it/s] 161it [00:16, 9.79it/s] 162it [00:16, 9.76it/s] 163it [00:16, 9.75it/s] 164it [00:16, 9.74it/s] 165it [00:17, 9.75it/s] 166it [00:17, 9.74it/s] 167it [00:17, 9.76it/s] 168it [00:17, 9.76it/s] 169it [00:17, 9.75it/s] 170it [00:17, 9.74it/s] 171it [00:17, 9.75it/s] 172it [00:17, 9.74it/s] 173it [00:17, 9.79it/s] 174it [00:17, 9.79it/s] 175it [00:18, 9.81it/s] 176it [00:18, 9.73it/s] 177it [00:18, 9.66it/s] 178it [00:18, 9.67it/s] 179it [00:18, 9.70it/s] 180it [00:18, 9.71it/s] 181it [00:18, 9.72it/s] 182it [00:18, 9.72it/s] 183it [00:18, 9.73it/s] 184it [00:18, 9.73it/s] 185it [00:19, 9.69it/s] 186it [00:19, 9.69it/s] 187it [00:19, 9.72it/s] 188it [00:19, 9.72it/s] 189it [00:19, 9.74it/s] 190it [00:19, 9.72it/s] 191it [00:19, 9.76it/s] 192it [00:19, 9.73it/s] 193it [00:19, 9.70it/s] 194it [00:20, 9.71it/s] 195it [00:20, 9.28it/s] 196it [00:20, 9.65it/s] +2025-05-26 05:13:47,301 - INFO - Epoch: 88, Objective: tensor([3712.7053], device='cuda:0', grad_fn=), Loss: 0.014657406136393547, KL/n: 60.55072784423828 + 0it [00:00, ?it/s]2025-05-26 05:13:47,577 - INFO - [Epoch 089 | Batch 0000] IWAE-loss 3791.1438 | mean log_px -0.0117 | KL -2966.70 + 1it [00:00, 5.33it/s] 2it [00:00, 7.28it/s] 3it [00:00, 8.27it/s] 4it [00:00, 8.81it/s] 5it [00:00, 9.17it/s] 6it [00:00, 9.37it/s] 7it [00:00, 9.53it/s] 8it [00:00, 9.62it/s] 9it [00:01, 9.70it/s] 10it [00:01, 9.72it/s] 11it [00:01, 9.77it/s] 12it [00:01, 9.78it/s] 13it [00:01, 9.80it/s] 14it [00:01, 9.79it/s] 15it [00:01, 9.80it/s] 16it [00:01, 9.78it/s] 17it [00:01, 9.58it/s] 18it [00:01, 9.25it/s] 19it [00:02, 9.15it/s] 20it [00:02, 8.64it/s] 21it [00:02, 8.96it/s] 22it [00:02, 9.20it/s] 23it [00:02, 9.29it/s] 24it [00:02, 8.97it/s] 25it [00:02, 9.15it/s] 26it [00:02, 9.29it/s] 27it [00:02, 9.37it/s] 28it [00:03, 9.01it/s] 29it [00:03, 9.17it/s] 30it [00:03, 9.31it/s] 31it [00:03, 8.97it/s] 32it [00:03, 9.16it/s] 33it [00:03, 9.32it/s] 34it [00:03, 9.48it/s] 35it [00:03, 9.51it/s] 36it [00:03, 9.53it/s] 37it [00:04, 9.45it/s] 38it [00:04, 9.50it/s] 39it [00:04, 9.37it/s] 40it [00:04, 9.43it/s] 41it [00:04, 9.13it/s] 42it [00:04, 9.29it/s] 43it [00:04, 9.40it/s] 44it [00:04, 9.44it/s] 45it [00:04, 9.46it/s] 46it [00:04, 8.97it/s] 47it [00:05, 8.90it/s] 48it [00:05, 9.03it/s] 49it [00:05, 9.14it/s] 50it [00:05, 9.22it/s]2025-05-26 05:13:52,908 - INFO - [Epoch 089 | Batch 0050] IWAE-loss 3452.4019 | mean log_px -0.0074 | KL -2963.17 + 51it [00:05, 9.28it/s] 52it [00:05, 9.26it/s] 53it [00:05, 9.38it/s] 54it [00:05, 9.40it/s] 55it [00:05, 9.49it/s] 56it [00:06, 9.53it/s] 57it [00:06, 9.54it/s] 58it [00:06, 9.54it/s] 59it [00:06, 9.53it/s] 60it [00:06, 9.51it/s] 61it [00:06, 9.50it/s] 62it [00:06, 9.51it/s] 63it [00:06, 9.51it/s] 64it [00:06, 9.52it/s] 65it [00:06, 9.54it/s] 66it [00:07, 9.53it/s] 67it [00:07, 9.38it/s] 68it [00:07, 9.43it/s] 69it [00:07, 9.41it/s] 70it [00:07, 9.49it/s] 71it [00:07, 8.94it/s] 72it [00:07, 9.09it/s] 73it [00:07, 9.20it/s] 74it [00:07, 9.28it/s] 75it [00:08, 9.33it/s] 76it [00:08, 9.40it/s] 77it [00:08, 9.50it/s] 78it [00:08, 9.49it/s] 79it [00:08, 9.51it/s] 80it [00:08, 9.50it/s] 81it [00:08, 9.50it/s] 82it [00:08, 9.50it/s] 83it [00:08, 8.96it/s] 84it [00:09, 9.09it/s] 85it [00:09, 9.13it/s] 86it [00:09, 9.09it/s] 87it [00:09, 9.21it/s] 88it [00:09, 9.21it/s] 89it [00:09, 8.97it/s] 90it [00:09, 8.60it/s] 91it [00:09, 8.75it/s] 92it [00:09, 8.84it/s] 93it [00:10, 9.09it/s] 94it [00:10, 9.27it/s] 95it [00:10, 9.42it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.59it/s] 98it [00:10, 9.59it/s] 99it [00:10, 9.54it/s] 100it [00:10, 9.47it/s]2025-05-26 05:13:58,259 - INFO - [Epoch 089 | Batch 0100] IWAE-loss 3771.1143 | mean log_px -0.0146 | KL -2961.73 + 101it [00:10, 9.56it/s] 102it [00:10, 9.63it/s] 103it [00:11, 9.60it/s] 104it [00:11, 9.51it/s] 105it [00:11, 9.50it/s] 106it [00:11, 9.64it/s] 108it [00:11, 9.82it/s] 110it [00:11, 9.93it/s] 112it [00:11, 9.98it/s] 114it [00:12, 10.00it/s] 115it [00:12, 9.93it/s] 116it [00:12, 9.45it/s] 118it [00:12, 9.69it/s] 120it [00:12, 9.82it/s] 122it [00:13, 9.91it/s] 124it [00:13, 9.96it/s] 126it [00:13, 10.00it/s] 128it [00:13, 10.01it/s] 130it [00:13, 10.02it/s] 132it [00:14, 10.01it/s] 134it [00:14, 10.03it/s] 136it [00:14, 10.03it/s] 138it [00:14, 10.04it/s] 140it [00:14, 10.04it/s] 142it [00:14, 10.01it/s] 144it [00:15, 9.95it/s] 145it [00:15, 9.93it/s] 146it [00:15, 9.90it/s] 147it [00:15, 9.89it/s] 148it [00:15, 9.86it/s] 149it [00:15, 9.87it/s] 150it [00:15, 9.85it/s]2025-05-26 05:14:03,305 - INFO - [Epoch 089 | Batch 0150] IWAE-loss 3447.8906 | mean log_px -0.0127 | KL -2953.03 + 151it [00:15, 9.84it/s] 152it [00:16, 9.82it/s] 153it [00:16, 9.82it/s] 154it [00:16, 9.79it/s] 155it [00:16, 9.80it/s] 156it [00:16, 9.81it/s] 157it [00:16, 9.82it/s] 158it [00:16, 9.83it/s] 159it [00:16, 9.83it/s] 160it [00:16, 9.82it/s] 161it [00:16, 9.82it/s] 162it [00:17, 9.82it/s] 163it [00:17, 9.83it/s] 164it [00:17, 9.83it/s] 165it [00:17, 9.85it/s] 166it [00:17, 9.84it/s] 167it [00:17, 9.84it/s] 168it [00:17, 9.83it/s] 169it [00:17, 9.85it/s] 170it [00:17, 9.84it/s] 171it [00:17, 9.86it/s] 172it [00:18, 9.86it/s] 173it [00:18, 9.86it/s] 174it [00:18, 9.84it/s] 175it [00:18, 9.85it/s] 176it [00:18, 9.84it/s] 177it [00:18, 9.84it/s] 178it [00:18, 9.75it/s] 179it [00:18, 9.61it/s] 180it [00:18, 9.46it/s] 181it [00:18, 9.36it/s] 182it [00:19, 9.43it/s] 183it [00:19, 9.51it/s] 184it [00:19, 9.56it/s] 185it [00:19, 9.60it/s] 186it [00:19, 9.60it/s] 187it [00:19, 9.63it/s] 188it [00:19, 9.65it/s] 189it [00:19, 9.66it/s] 190it [00:19, 9.65it/s] 191it [00:20, 9.01it/s] 192it [00:20, 9.24it/s] 194it [00:20, 9.60it/s] 195it [00:20, 8.74it/s] 196it [00:20, 8.97it/s] 196it [00:20, 9.49it/s] +2025-05-26 05:14:08,090 - INFO - Epoch: 89, Objective: tensor([3744.3455], device='cuda:0', grad_fn=), Loss: 0.016745569184422493, KL/n: 60.30201721191406 + 0it [00:00, ?it/s]2025-05-26 05:14:08,554 - INFO - [Epoch 090 | Batch 0000] IWAE-loss 4105.8560 | mean log_px -0.0164 | KL -2952.96 + 1it [00:00, 5.30it/s] 3it [00:00, 8.20it/s] 5it [00:00, 9.10it/s] 7it [00:00, 9.53it/s] 9it [00:00, 9.74it/s] 11it [00:01, 9.88it/s] 12it [00:01, 9.33it/s] 13it [00:01, 9.36it/s] 14it [00:01, 9.34it/s] 16it [00:01, 9.63it/s] 18it [00:01, 9.80it/s] 19it [00:02, 9.83it/s] 21it [00:02, 9.93it/s] 22it [00:02, 9.92it/s] 24it [00:02, 9.94it/s] 25it [00:02, 9.46it/s] 26it [00:02, 9.55it/s] 27it [00:02, 9.58it/s] 28it [00:02, 9.60it/s] 30it [00:03, 9.79it/s] 31it [00:03, 9.45it/s] 33it [00:03, 9.69it/s] 35it [00:03, 9.42it/s] 37it [00:03, 9.59it/s] 39it [00:04, 9.75it/s] 40it [00:04, 9.40it/s] 42it [00:04, 9.61it/s] 44it [00:04, 9.77it/s] 46it [00:04, 9.89it/s] 48it [00:05, 9.61it/s] 50it [00:05, 9.76it/s]2025-05-26 05:14:13,690 - INFO - [Epoch 090 | Batch 0050] IWAE-loss 3642.5940 | mean log_px -0.0134 | KL -2952.94 + 51it [00:05, 9.75it/s] 53it [00:05, 9.55it/s] 54it [00:05, 9.60it/s] 55it [00:05, 9.65it/s] 57it [00:05, 9.83it/s] 59it [00:06, 9.93it/s] 60it [00:06, 9.51it/s] 62it [00:06, 9.72it/s] 64it [00:06, 9.85it/s] 65it [00:06, 9.84it/s] 67it [00:06, 9.49it/s] 69it [00:07, 9.70it/s] 70it [00:07, 9.76it/s] 72it [00:07, 9.49it/s] 74it [00:07, 9.68it/s] 76it [00:07, 9.81it/s] 78it [00:08, 9.91it/s] 80it [00:08, 9.61it/s] 82it [00:08, 9.75it/s] 84it [00:08, 9.85it/s] 86it [00:08, 9.93it/s] 88it [00:09, 9.97it/s] 90it [00:09, 10.01it/s] 92it [00:09, 9.76it/s] 94it [00:09, 9.86it/s] 96it [00:09, 9.60it/s] 98it [00:10, 9.75it/s] 100it [00:10, 9.86it/s]2025-05-26 05:14:18,810 - INFO - [Epoch 090 | Batch 0100] IWAE-loss 4252.8389 | mean log_px -0.0252 | KL -2944.33 + 101it [00:10, 9.85it/s] 103it [00:10, 9.95it/s] 104it [00:10, 9.54it/s] 106it [00:10, 9.67it/s] 107it [00:11, 9.68it/s] 108it [00:11, 9.73it/s] 110it [00:11, 9.85it/s] 111it [00:11, 9.81it/s] 113it [00:11, 9.84it/s] 115it [00:11, 9.54it/s] 116it [00:11, 9.62it/s] 118it [00:12, 9.80it/s] 120it [00:12, 9.89it/s] 122it [00:12, 9.96it/s] 124it [00:12, 10.01it/s] 126it [00:12, 10.04it/s] 128it [00:13, 10.06it/s] 130it [00:13, 10.07it/s] 132it [00:13, 9.73it/s] 134it [00:13, 9.61it/s] 135it [00:13, 9.67it/s] 137it [00:14, 9.82it/s] 139it [00:14, 9.91it/s] 141it [00:14, 9.97it/s] 143it [00:14, 10.01it/s] 145it [00:14, 10.04it/s] 147it [00:15, 10.05it/s] 149it [00:15, 10.07it/s]2025-05-26 05:14:23,869 - INFO - [Epoch 090 | Batch 0150] IWAE-loss 3503.3472 | mean log_px -0.0103 | KL -2943.74 + 151it [00:15, 9.74it/s] 153it [00:15, 9.84it/s] 155it [00:15, 9.59it/s] 157it [00:16, 9.74it/s] 159it [00:16, 9.59it/s] 161it [00:16, 9.74it/s] 163it [00:16, 9.84it/s] 165it [00:16, 9.58it/s] 167it [00:17, 9.74it/s] 168it [00:17, 9.43it/s] 170it [00:17, 9.65it/s] 172it [00:17, 9.79it/s] 174it [00:17, 9.54it/s] 176it [00:18, 9.71it/s] 177it [00:18, 9.38it/s] 179it [00:18, 9.63it/s] 181it [00:18, 9.77it/s] 183it [00:18, 9.87it/s] 184it [00:18, 9.85it/s] 185it [00:19, 9.52it/s] 187it [00:19, 9.70it/s] 189it [00:19, 9.84it/s] 190it [00:19, 9.53it/s] 192it [00:19, 9.73it/s] 194it [00:19, 9.84it/s] 195it [00:20, 9.23it/s] 196it [00:20, 9.68it/s] +2025-05-26 05:14:28,663 - INFO - Epoch: 90, Objective: tensor([3948.3491], device='cuda:0', grad_fn=), Loss: 0.02164594642817974, KL/n: 60.072139739990234 + 0it [00:00, ?it/s]2025-05-26 05:14:28,933 - INFO - [Epoch 091 | Batch 0000] IWAE-loss 3966.0691 | mean log_px -0.0175 | KL -2943.96 + 1it [00:00, 5.50it/s] 2it [00:00, 7.44it/s] 4it [00:00, 8.88it/s] 6it [00:00, 9.40it/s] 7it [00:00, 9.49it/s] 8it [00:00, 9.57it/s] 9it [00:00, 9.68it/s] 10it [00:01, 9.76it/s] 12it [00:01, 9.88it/s] 14it [00:01, 9.97it/s] 15it [00:01, 9.96it/s] 17it [00:01, 9.67it/s] 18it [00:01, 9.73it/s] 19it [00:02, 9.73it/s] 20it [00:02, 9.79it/s] 22it [00:02, 9.89it/s] 24it [00:02, 9.93it/s] 26it [00:02, 9.96it/s] 28it [00:02, 10.00it/s] 29it [00:03, 9.98it/s] 30it [00:03, 9.97it/s] 32it [00:03, 9.99it/s] 33it [00:03, 9.80it/s] 34it [00:03, 9.47it/s] 36it [00:03, 9.72it/s] 38it [00:03, 9.84it/s] 39it [00:04, 9.43it/s] 40it [00:04, 9.55it/s] 41it [00:04, 9.65it/s] 43it [00:04, 9.82it/s] 44it [00:04, 9.83it/s] 45it [00:04, 9.86it/s] 46it [00:04, 9.89it/s] 48it [00:04, 9.94it/s] 49it [00:05, 9.95it/s] 50it [00:05, 9.95it/s]2025-05-26 05:14:34,004 - INFO - [Epoch 091 | Batch 0050] IWAE-loss 3997.3748 | mean log_px -0.0152 | KL -2940.93 + 51it [00:05, 9.94it/s] 52it [00:05, 9.93it/s] 54it [00:05, 9.99it/s] 56it [00:05, 10.00it/s] 58it [00:05, 10.02it/s] 60it [00:06, 10.00it/s] 62it [00:06, 10.01it/s] 64it [00:06, 10.03it/s] 66it [00:06, 10.03it/s] 68it [00:06, 10.02it/s] 70it [00:07, 10.02it/s] 72it [00:07, 10.04it/s] 74it [00:07, 9.71it/s] 75it [00:07, 9.76it/s] 76it [00:07, 9.80it/s] 78it [00:07, 9.88it/s] 79it [00:08, 9.48it/s] 80it [00:08, 9.58it/s] 81it [00:08, 9.66it/s] 82it [00:08, 9.74it/s] 83it [00:08, 9.79it/s] 84it [00:08, 9.82it/s] 86it [00:08, 9.80it/s] 87it [00:08, 9.74it/s] 88it [00:09, 9.16it/s] 89it [00:09, 9.16it/s] 90it [00:09, 9.15it/s] 91it [00:09, 9.14it/s] 92it [00:09, 8.93it/s] 93it [00:09, 9.20it/s] 94it [00:09, 9.37it/s] 95it [00:09, 9.49it/s] 96it [00:09, 9.56it/s] 97it [00:09, 9.56it/s] 98it [00:10, 9.02it/s] 99it [00:10, 9.25it/s]2025-05-26 05:14:39,168 - INFO - [Epoch 091 | Batch 0100] IWAE-loss 3747.8899 | mean log_px -0.0144 | KL -2939.49 + 101it [00:10, 9.59it/s] 102it [00:10, 9.68it/s] 104it [00:10, 9.84it/s] 105it [00:10, 9.87it/s] 107it [00:11, 9.94it/s] 108it [00:11, 9.95it/s] 109it [00:11, 9.95it/s] 110it [00:11, 9.93it/s] 112it [00:11, 10.00it/s] 113it [00:11, 9.49it/s] 114it [00:11, 9.59it/s] 116it [00:11, 9.76it/s] 117it [00:12, 9.30it/s] 119it [00:12, 9.58it/s] 120it [00:12, 9.66it/s] 121it [00:12, 9.72it/s] 122it [00:12, 9.78it/s] 123it [00:12, 9.84it/s] 124it [00:12, 9.88it/s] 125it [00:12, 9.88it/s] 127it [00:13, 9.97it/s] 128it [00:13, 9.96it/s] 129it [00:13, 9.96it/s] 130it [00:13, 9.97it/s] 131it [00:13, 9.80it/s] 132it [00:13, 9.16it/s] 133it [00:13, 9.38it/s] 134it [00:13, 9.52it/s] 136it [00:13, 9.74it/s] 137it [00:14, 9.30it/s] 138it [00:14, 9.47it/s] 140it [00:14, 9.70it/s] 141it [00:14, 9.76it/s] 142it [00:14, 9.81it/s] 144it [00:14, 9.90it/s] 145it [00:14, 9.52it/s] 146it [00:15, 9.60it/s] 147it [00:15, 9.65it/s] 148it [00:15, 9.20it/s] 150it [00:15, 9.52it/s]2025-05-26 05:14:44,321 - INFO - [Epoch 091 | Batch 0150] IWAE-loss 4462.9419 | mean log_px -0.0253 | KL -2929.27 + 151it [00:15, 9.09it/s] 152it [00:15, 9.31it/s] 153it [00:15, 9.48it/s] 154it [00:15, 9.33it/s] 155it [00:16, 9.31it/s] 156it [00:16, 9.30it/s] 158it [00:16, 9.62it/s] 160it [00:16, 9.78it/s] 162it [00:16, 9.88it/s] 164it [00:16, 9.57it/s] 165it [00:17, 9.64it/s] 166it [00:17, 9.71it/s] 168it [00:17, 9.84it/s] 170it [00:17, 9.91it/s] 171it [00:17, 9.49it/s] 172it [00:17, 9.57it/s] 174it [00:17, 9.76it/s] 175it [00:18, 9.37it/s] 176it [00:18, 9.50it/s] 178it [00:18, 9.71it/s] 180it [00:18, 9.43it/s] 181it [00:18, 9.52it/s] 182it [00:18, 9.62it/s] 184it [00:19, 9.80it/s] 185it [00:19, 9.83it/s] 187it [00:19, 9.94it/s] 188it [00:19, 9.95it/s] 189it [00:19, 9.96it/s] 190it [00:19, 9.97it/s] 192it [00:19, 9.53it/s] 193it [00:19, 9.63it/s] 194it [00:20, 9.69it/s] 195it [00:20, 8.84it/s] 196it [00:20, 9.64it/s] +2025-05-26 05:14:49,117 - INFO - Epoch: 91, Objective: tensor([3768.4514], device='cuda:0', grad_fn=), Loss: 0.01296775322407484, KL/n: 59.81892013549805 + 0it [00:00, ?it/s]2025-05-26 05:14:49,575 - INFO - [Epoch 092 | Batch 0000] IWAE-loss 3812.1208 | mean log_px -0.0154 | KL -2928.92 + 1it [00:00, 5.48it/s] 2it [00:00, 6.79it/s] 4it [00:00, 8.56it/s] 6it [00:00, 8.80it/s] 8it [00:00, 9.30it/s] 10it [00:01, 9.29it/s] 12it [00:01, 9.57it/s] 14it [00:01, 9.76it/s] 16it [00:01, 9.53it/s] 18it [00:01, 9.71it/s] 20it [00:02, 9.57it/s] 22it [00:02, 9.74it/s] 24it [00:02, 9.86it/s] 26it [00:02, 9.95it/s] 27it [00:02, 9.58it/s] 28it [00:02, 9.66it/s] 30it [00:03, 9.83it/s] 32it [00:03, 9.93it/s] 33it [00:03, 9.63it/s] 35it [00:03, 9.81it/s] 37it [00:03, 9.93it/s] 38it [00:03, 9.62it/s] 39it [00:04, 9.64it/s] 41it [00:04, 9.84it/s] 43it [00:04, 9.94it/s] 45it [00:04, 10.01it/s] 47it [00:04, 9.69it/s] 49it [00:05, 9.83it/s] 50it [00:05, 9.48it/s]2025-05-26 05:14:54,725 - INFO - [Epoch 092 | Batch 0050] IWAE-loss 3494.9722 | mean log_px -0.0081 | KL -2923.38 + 52it [00:05, 9.67it/s] 54it [00:05, 9.83it/s] 56it [00:05, 9.93it/s] 57it [00:05, 9.56it/s] 59it [00:06, 9.76it/s] 60it [00:06, 9.39it/s] 62it [00:06, 9.65it/s] 64it [00:06, 9.82it/s] 66it [00:06, 9.93it/s] 68it [00:07, 10.00it/s] 70it [00:07, 9.76it/s] 72it [00:07, 9.87it/s] 74it [00:07, 9.68it/s] 75it [00:07, 9.59it/s] 76it [00:07, 9.36it/s] 77it [00:08, 9.37it/s] 79it [00:08, 9.64it/s] 81it [00:08, 9.81it/s] 83it [00:08, 9.91it/s] 84it [00:08, 9.93it/s] 85it [00:08, 9.76it/s] 86it [00:08, 9.45it/s] 87it [00:09, 9.49it/s] 89it [00:09, 9.59it/s] 90it [00:09, 9.68it/s] 91it [00:09, 9.26it/s] 93it [00:09, 9.60it/s] 95it [00:09, 9.76it/s] 96it [00:09, 9.37it/s] 98it [00:10, 9.64it/s] 100it [00:10, 9.81it/s]2025-05-26 05:14:59,872 - INFO - [Epoch 092 | Batch 0100] IWAE-loss 3449.9321 | mean log_px -0.0083 | KL -2921.72 + 102it [00:10, 9.89it/s] 104it [00:10, 9.67it/s] 106it [00:10, 9.81it/s] 108it [00:11, 9.90it/s] 110it [00:11, 9.68it/s] 112it [00:11, 9.80it/s] 114it [00:11, 9.57it/s] 116it [00:12, 9.62it/s] 117it [00:12, 9.66it/s] 118it [00:12, 9.59it/s] 120it [00:12, 9.68it/s] 122it [00:12, 9.81it/s] 124it [00:12, 9.51it/s] 125it [00:12, 9.49it/s] 126it [00:13, 9.55it/s] 127it [00:13, 9.61it/s] 128it [00:13, 9.64it/s] 129it [00:13, 9.71it/s] 130it [00:13, 9.74it/s] 131it [00:13, 9.80it/s] 132it [00:13, 9.82it/s] 133it [00:13, 9.86it/s] 134it [00:13, 9.86it/s] 135it [00:14, 9.26it/s] 136it [00:14, 9.43it/s] 137it [00:14, 9.55it/s] 138it [00:14, 9.62it/s] 139it [00:14, 9.70it/s] 140it [00:14, 9.72it/s] 141it [00:14, 9.75it/s] 142it [00:14, 9.78it/s] 143it [00:14, 9.82it/s] 144it [00:14, 9.83it/s] 145it [00:15, 9.86it/s] 146it [00:15, 9.33it/s] 147it [00:15, 9.49it/s] 148it [00:15, 9.58it/s] 149it [00:15, 9.57it/s] 150it [00:15, 9.60it/s]2025-05-26 05:15:05,052 - INFO - [Epoch 092 | Batch 0150] IWAE-loss 3478.1560 | mean log_px -0.0111 | KL -2921.63 + 151it [00:15, 9.62it/s] 152it [00:15, 9.64it/s] 153it [00:15, 9.71it/s] 154it [00:15, 9.73it/s] 155it [00:16, 9.78it/s] 156it [00:16, 9.79it/s] 157it [00:16, 9.81it/s] 158it [00:16, 9.83it/s] 159it [00:16, 9.84it/s] 160it [00:16, 9.85it/s] 161it [00:16, 9.86it/s] 162it [00:16, 9.85it/s] 163it [00:16, 9.84it/s] 164it [00:16, 9.85it/s] 165it [00:17, 9.25it/s] 166it [00:17, 9.40it/s] 167it [00:17, 9.55it/s] 168it [00:17, 9.65it/s] 169it [00:17, 9.73it/s] 170it [00:17, 9.75it/s] 171it [00:17, 9.81it/s] 172it [00:17, 9.78it/s] 173it [00:17, 9.82it/s] 174it [00:18, 9.83it/s] 175it [00:18, 9.80it/s] 176it [00:18, 9.81it/s] 177it [00:18, 9.84it/s] 178it [00:18, 9.80it/s] 179it [00:18, 9.83it/s] 180it [00:18, 9.84it/s] 181it [00:18, 9.22it/s] 182it [00:18, 9.41it/s] 183it [00:18, 9.53it/s] 184it [00:19, 9.58it/s] 185it [00:19, 9.68it/s] 186it [00:19, 9.70it/s] 187it [00:19, 9.73it/s] 188it [00:19, 9.78it/s] 189it [00:19, 9.72it/s] 190it [00:19, 9.16it/s] 191it [00:19, 9.19it/s] 192it [00:19, 9.31it/s] 193it [00:20, 9.39it/s] 194it [00:20, 9.45it/s] 195it [00:20, 9.15it/s] 196it [00:20, 9.61it/s] +2025-05-26 05:15:09,827 - INFO - Epoch: 92, Objective: tensor([3705.5750], device='cuda:0', grad_fn=), Loss: 0.016982443630695343, KL/n: 59.582088470458984 + 0it [00:00, ?it/s]2025-05-26 05:15:10,103 - INFO - [Epoch 093 | Batch 0000] IWAE-loss 4068.8088 | mean log_px -0.0203 | KL -2920.25 + 1it [00:00, 4.68it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.89it/s] 4it [00:00, 8.00it/s] 5it [00:00, 8.61it/s] 6it [00:00, 8.92it/s] 7it [00:00, 8.62it/s] 8it [00:00, 9.00it/s] 10it [00:01, 9.47it/s] 11it [00:01, 9.59it/s] 12it [00:01, 9.66it/s] 14it [00:01, 9.35it/s] 15it [00:01, 9.49it/s] 16it [00:01, 9.60it/s] 18it [00:01, 9.76it/s] 19it [00:02, 9.78it/s] 20it [00:02, 9.82it/s] 21it [00:02, 9.84it/s] 22it [00:02, 9.86it/s] 23it [00:02, 9.89it/s] 24it [00:02, 9.90it/s] 25it [00:02, 9.91it/s] 26it [00:02, 9.93it/s] 28it [00:03, 9.96it/s] 30it [00:03, 10.00it/s] 32it [00:03, 10.00it/s] 34it [00:03, 10.01it/s] 36it [00:03, 9.99it/s] 37it [00:03, 9.99it/s] 38it [00:04, 9.97it/s] 40it [00:04, 10.00it/s] 41it [00:04, 9.99it/s] 42it [00:04, 9.98it/s] 43it [00:04, 9.97it/s] 44it [00:04, 9.97it/s] 45it [00:04, 9.98it/s] 46it [00:04, 9.97it/s] 47it [00:04, 9.97it/s] 48it [00:05, 9.97it/s] 49it [00:05, 9.96it/s] 50it [00:05, 9.97it/s]2025-05-26 05:15:15,222 - INFO - [Epoch 093 | Batch 0050] IWAE-loss 4193.2715 | mean log_px -0.0235 | KL -2915.12 + 51it [00:05, 9.95it/s] 52it [00:05, 9.87it/s] 53it [00:05, 9.90it/s] 55it [00:05, 9.97it/s] 56it [00:05, 9.97it/s] 58it [00:06, 10.02it/s] 59it [00:06, 10.01it/s] 61it [00:06, 10.01it/s] 62it [00:06, 9.93it/s] 64it [00:06, 9.95it/s] 66it [00:06, 9.98it/s] 67it [00:06, 9.51it/s] 68it [00:07, 9.61it/s] 69it [00:07, 9.66it/s] 70it [00:07, 9.19it/s] 72it [00:07, 9.51it/s] 73it [00:07, 9.10it/s] 74it [00:07, 9.28it/s] 76it [00:07, 9.59it/s] 78it [00:08, 9.76it/s] 80it [00:08, 9.85it/s] 82it [00:08, 9.92it/s] 83it [00:08, 9.93it/s] 84it [00:08, 9.93it/s] 86it [00:08, 9.99it/s] 87it [00:09, 9.53it/s] 88it [00:09, 9.63it/s] 90it [00:09, 9.79it/s] 92it [00:09, 9.90it/s] 93it [00:09, 9.91it/s] 94it [00:09, 9.93it/s] 96it [00:09, 9.98it/s] 98it [00:10, 9.99it/s] 99it [00:10, 9.99it/s]2025-05-26 05:15:20,319 - INFO - [Epoch 093 | Batch 0100] IWAE-loss 3753.0735 | mean log_px -0.0142 | KL -2914.49 + 101it [00:10, 9.99it/s] 102it [00:10, 9.51it/s] 104it [00:10, 9.69it/s] 106it [00:10, 9.81it/s] 107it [00:11, 9.84it/s] 108it [00:11, 9.87it/s] 109it [00:11, 9.89it/s] 110it [00:11, 9.89it/s] 111it [00:11, 9.91it/s] 112it [00:11, 9.92it/s] 113it [00:11, 9.94it/s] 114it [00:11, 9.92it/s] 116it [00:11, 9.97it/s] 117it [00:12, 9.98it/s] 118it [00:12, 9.97it/s] 119it [00:12, 9.96it/s] 120it [00:12, 9.94it/s] 122it [00:12, 9.98it/s] 124it [00:12, 9.98it/s] 126it [00:12, 10.00it/s] 127it [00:13, 10.00it/s] 128it [00:13, 9.99it/s] 130it [00:13, 10.01it/s] 131it [00:13, 10.01it/s] 132it [00:13, 10.00it/s] 133it [00:13, 10.00it/s] 134it [00:13, 9.97it/s] 135it [00:13, 9.97it/s] 136it [00:13, 9.96it/s] 138it [00:14, 10.00it/s] 139it [00:14, 9.48it/s] 140it [00:14, 9.60it/s] 142it [00:14, 9.79it/s] 144it [00:14, 9.87it/s] 145it [00:14, 9.89it/s] 146it [00:14, 9.90it/s] 148it [00:15, 9.92it/s] 150it [00:15, 9.96it/s]2025-05-26 05:15:25,371 - INFO - [Epoch 093 | Batch 0150] IWAE-loss 3694.4592 | mean log_px -0.0135 | KL -2910.63 + 152it [00:15, 9.99it/s] 154it [00:15, 9.98it/s] 156it [00:15, 10.00it/s] 157it [00:16, 10.00it/s] 158it [00:16, 9.98it/s] 160it [00:16, 10.02it/s] 162it [00:16, 10.02it/s] 164it [00:16, 10.02it/s] 166it [00:16, 9.65it/s] 167it [00:17, 9.68it/s] 168it [00:17, 9.74it/s] 169it [00:17, 9.29it/s] 171it [00:17, 9.58it/s] 172it [00:17, 9.65it/s] 173it [00:17, 9.72it/s] 174it [00:17, 9.71it/s] 176it [00:18, 9.82it/s] 178it [00:18, 9.88it/s] 179it [00:18, 9.89it/s] 181it [00:18, 9.96it/s] 182it [00:18, 9.97it/s] 183it [00:18, 9.97it/s] 184it [00:18, 9.96it/s] 186it [00:19, 10.00it/s] 188it [00:19, 10.00it/s] 190it [00:19, 10.00it/s] 191it [00:19, 9.99it/s] 192it [00:19, 9.97it/s] 194it [00:19, 10.01it/s] 195it [00:19, 9.67it/s] 196it [00:20, 9.76it/s] +2025-05-26 05:15:30,034 - INFO - Epoch: 93, Objective: tensor([3518.6760], device='cuda:0', grad_fn=), Loss: 0.009369171224534512, KL/n: 59.381324768066406 + 0it [00:00, ?it/s]2025-05-26 05:15:30,469 - INFO - [Epoch 094 | Batch 0000] IWAE-loss 3675.7261 | mean log_px -0.0113 | KL -2903.85 + 1it [00:00, 5.42it/s] 3it [00:00, 8.27it/s] 5it [00:00, 9.15it/s] 7it [00:00, 9.11it/s] 9it [00:00, 9.43it/s] 11it [00:01, 9.67it/s] 13it [00:01, 9.82it/s] 15it [00:01, 9.89it/s] 16it [00:01, 9.60it/s] 18it [00:01, 9.77it/s] 20it [00:02, 9.61it/s] 22it [00:02, 9.76it/s] 24it [00:02, 9.88it/s] 26it [00:02, 9.95it/s] 28it [00:02, 10.01it/s] 30it [00:03, 10.05it/s] 32it [00:03, 10.07it/s] 34it [00:03, 10.09it/s] 36it [00:03, 10.11it/s] 38it [00:03, 10.13it/s] 40it [00:04, 10.13it/s] 42it [00:04, 10.03it/s] 44it [00:04, 10.05it/s] 46it [00:04, 10.08it/s] 48it [00:04, 10.11it/s] 50it [00:05, 10.11it/s]2025-05-26 05:15:35,501 - INFO - [Epoch 094 | Batch 0050] IWAE-loss 4268.3975 | mean log_px -0.0242 | KL -2905.98 + 52it [00:05, 9.84it/s] 54it [00:05, 9.92it/s] 56it [00:05, 9.98it/s] 58it [00:05, 10.03it/s] 60it [00:06, 10.05it/s] 62it [00:06, 10.08it/s] 64it [00:06, 10.02it/s] 66it [00:06, 9.77it/s] 68it [00:06, 9.88it/s] 70it [00:07, 9.94it/s] 72it [00:07, 9.73it/s] 73it [00:07, 9.77it/s] 74it [00:07, 9.80it/s] 75it [00:07, 9.40it/s] 77it [00:07, 9.68it/s] 78it [00:07, 9.31it/s] 80it [00:08, 9.61it/s] 81it [00:08, 9.68it/s] 82it [00:08, 9.28it/s] 84it [00:08, 9.60it/s] 85it [00:08, 9.56it/s] 86it [00:08, 9.65it/s] 88it [00:08, 9.84it/s] 90it [00:09, 9.94it/s] 92it [00:09, 10.00it/s] 94it [00:09, 10.05it/s] 96it [00:09, 10.07it/s] 98it [00:09, 10.08it/s] 100it [00:10, 9.89it/s]2025-05-26 05:15:40,603 - INFO - [Epoch 094 | Batch 0100] IWAE-loss 3504.3542 | mean log_px -0.0100 | KL -2904.47 + 101it [00:10, 9.49it/s] 102it [00:10, 9.58it/s] 104it [00:10, 9.77it/s] 106it [00:10, 9.89it/s] 108it [00:11, 9.97it/s] 110it [00:11, 10.02it/s] 112it [00:11, 10.01it/s] 114it [00:11, 10.04it/s] 116it [00:11, 10.06it/s] 118it [00:12, 9.70it/s] 119it [00:12, 9.73it/s] 120it [00:12, 9.68it/s] 122it [00:12, 9.51it/s] 124it [00:12, 9.72it/s] 126it [00:12, 9.86it/s] 128it [00:13, 9.94it/s] 130it [00:13, 9.72it/s] 132it [00:13, 9.83it/s] 134it [00:13, 9.92it/s] 136it [00:13, 9.98it/s] 138it [00:14, 10.01it/s] 140it [00:14, 10.05it/s] 142it [00:14, 10.08it/s] 144it [00:14, 10.10it/s] 146it [00:14, 10.11it/s] 148it [00:15, 10.12it/s] 150it [00:15, 10.12it/s]2025-05-26 05:15:45,637 - INFO - [Epoch 094 | Batch 0150] IWAE-loss 3472.2581 | mean log_px -0.0113 | KL -2900.82 + 152it [00:15, 10.12it/s] 154it [00:15, 10.12it/s] 156it [00:15, 10.14it/s] 158it [00:16, 10.13it/s] 160it [00:16, 10.13it/s] 162it [00:16, 10.13it/s] 164it [00:16, 10.10it/s] 166it [00:16, 10.09it/s] 168it [00:17, 10.06it/s] 170it [00:17, 10.07it/s] 172it [00:17, 10.08it/s] 174it [00:17, 10.10it/s] 176it [00:17, 10.11it/s] 178it [00:17, 10.12it/s] 180it [00:18, 10.12it/s] 182it [00:18, 10.13it/s] 184it [00:18, 10.11it/s] 186it [00:18, 10.11it/s] 188it [00:18, 10.13it/s] 190it [00:19, 10.14it/s] 192it [00:19, 10.13it/s] 194it [00:19, 9.86it/s] 195it [00:19, 9.60it/s] 196it [00:19, 9.86it/s] +2025-05-26 05:15:50,225 - INFO - Epoch: 94, Objective: tensor([3317.0979], device='cuda:0', grad_fn=), Loss: 0.006679388228803873, KL/n: 59.15084457397461 + 0it [00:00, ?it/s]2025-05-26 05:15:50,495 - INFO - [Epoch 095 | Batch 0000] IWAE-loss 3526.1443 | mean log_px -0.0090 | KL -2896.83 + 1it [00:00, 4.87it/s] 3it [00:00, 7.92it/s] 5it [00:00, 8.93it/s] 7it [00:00, 9.43it/s] 9it [00:00, 9.69it/s] 11it [00:01, 9.86it/s] 13it [00:01, 9.97it/s] 15it [00:01, 10.04it/s] 17it [00:01, 10.08it/s] 19it [00:01, 10.10it/s] 21it [00:02, 10.12it/s] 23it [00:02, 10.14it/s] 25it [00:02, 9.85it/s] 27it [00:02, 9.91it/s] 29it [00:02, 9.99it/s] 31it [00:03, 10.04it/s] 33it [00:03, 10.07it/s] 35it [00:03, 10.10it/s] 37it [00:03, 10.11it/s] 39it [00:03, 10.12it/s] 41it [00:04, 9.61it/s] 42it [00:04, 9.50it/s] 43it [00:04, 9.31it/s] 44it [00:04, 9.44it/s] 46it [00:04, 9.67it/s] 47it [00:04, 9.28it/s] 48it [00:04, 9.44it/s] 50it [00:05, 9.68it/s]2025-05-26 05:15:55,565 - INFO - [Epoch 095 | Batch 0050] IWAE-loss 3349.6074 | mean log_px -0.0067 | KL -2888.48 + 51it [00:05, 9.69it/s] 52it [00:05, 9.26it/s] 54it [00:05, 9.58it/s] 56it [00:05, 9.76it/s] 58it [00:05, 9.87it/s] 60it [00:06, 9.95it/s] 62it [00:06, 9.67it/s] 64it [00:06, 9.80it/s] 65it [00:06, 9.75it/s] 67it [00:06, 9.81it/s] 68it [00:06, 9.84it/s] 69it [00:07, 9.43it/s] 70it [00:07, 9.53it/s] 72it [00:07, 9.73it/s] 74it [00:07, 9.86it/s] 76it [00:07, 9.92it/s] 78it [00:08, 9.97it/s] 80it [00:08, 9.81it/s] 82it [00:08, 9.89it/s] 84it [00:08, 9.94it/s] 86it [00:08, 9.98it/s] 88it [00:09, 10.00it/s] 89it [00:09, 9.69it/s] 90it [00:09, 9.58it/s] 91it [00:09, 9.61it/s] 92it [00:09, 9.66it/s] 94it [00:09, 9.83it/s] 96it [00:09, 9.91it/s] 98it [00:10, 9.96it/s] 100it [00:10, 10.00it/s]2025-05-26 05:16:00,658 - INFO - [Epoch 095 | Batch 0100] IWAE-loss 3535.2415 | mean log_px -0.0105 | KL -2890.72 + 101it [00:10, 9.95it/s] 102it [00:10, 9.94it/s] 104it [00:10, 10.00it/s] 106it [00:10, 10.03it/s] 108it [00:11, 10.06it/s] 110it [00:11, 10.07it/s] 112it [00:11, 10.00it/s] 113it [00:11, 9.87it/s] 114it [00:11, 9.36it/s] 116it [00:11, 9.62it/s] 118it [00:12, 9.78it/s] 120it [00:12, 9.88it/s] 122it [00:12, 9.93it/s] 124it [00:12, 9.97it/s] 126it [00:12, 9.99it/s] 127it [00:12, 9.94it/s] 128it [00:13, 9.48it/s] 130it [00:13, 9.69it/s] 131it [00:13, 9.73it/s] 132it [00:13, 9.77it/s] 133it [00:13, 9.80it/s] 134it [00:13, 9.81it/s] 135it [00:13, 9.38it/s] 136it [00:13, 9.54it/s] 138it [00:14, 9.68it/s] 139it [00:14, 9.34it/s] 140it [00:14, 9.48it/s] 141it [00:14, 9.61it/s] 142it [00:14, 9.71it/s] 144it [00:14, 9.86it/s] 145it [00:14, 9.49it/s] 146it [00:14, 9.59it/s] 148it [00:15, 9.79it/s] 150it [00:15, 9.90it/s]2025-05-26 05:16:05,771 - INFO - [Epoch 095 | Batch 0150] IWAE-loss 4350.0732 | mean log_px -0.0231 | KL -2887.25 + 151it [00:15, 9.87it/s] 152it [00:15, 9.89it/s] 154it [00:15, 9.96it/s] 155it [00:15, 9.58it/s] 156it [00:15, 9.64it/s] 157it [00:16, 9.73it/s] 158it [00:16, 9.24it/s] 159it [00:16, 9.34it/s] 160it [00:16, 9.33it/s] 161it [00:16, 9.46it/s] 162it [00:16, 9.14it/s] 164it [00:16, 9.54it/s] 165it [00:16, 9.16it/s] 166it [00:17, 9.37it/s] 168it [00:17, 9.67it/s] 170it [00:17, 9.83it/s] 172it [00:17, 9.90it/s] 174it [00:17, 9.97it/s] 176it [00:18, 10.00it/s] 177it [00:18, 9.61it/s] 179it [00:18, 9.72it/s] 180it [00:18, 9.77it/s] 181it [00:18, 9.37it/s] 182it [00:18, 9.48it/s] 183it [00:18, 9.60it/s] 184it [00:18, 9.69it/s] 185it [00:19, 9.20it/s] 186it [00:19, 9.41it/s] 188it [00:19, 9.71it/s] 190it [00:19, 9.85it/s] 192it [00:19, 9.95it/s] 194it [00:19, 10.00it/s] 195it [00:20, 9.68it/s] 196it [00:20, 9.71it/s] +2025-05-26 05:16:10,537 - INFO - Epoch: 95, Objective: tensor([3332.1047], device='cuda:0', grad_fn=), Loss: 0.008258700370788574, KL/n: 58.8862190246582 + 0it [00:00, ?it/s]2025-05-26 05:16:10,992 - INFO - [Epoch 096 | Batch 0000] IWAE-loss 4336.8301 | mean log_px -0.0305 | KL -2885.20 + 1it [00:00, 4.81it/s] 3it [00:00, 7.87it/s] 5it [00:00, 8.45it/s] 7it [00:00, 9.04it/s] 9it [00:01, 9.40it/s] 10it [00:01, 9.02it/s] 11it [00:01, 9.00it/s] 12it [00:01, 9.12it/s] 13it [00:01, 9.28it/s] 14it [00:01, 9.44it/s] 15it [00:01, 9.14it/s] 16it [00:01, 9.33it/s] 17it [00:01, 9.50it/s] 18it [00:01, 9.61it/s] 19it [00:02, 9.13it/s] 20it [00:02, 9.34it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.58it/s] 24it [00:02, 9.81it/s] 25it [00:02, 9.79it/s] 26it [00:02, 9.76it/s] 27it [00:02, 9.81it/s] 29it [00:03, 9.95it/s] 31it [00:03, 10.03it/s] 33it [00:03, 10.07it/s] 35it [00:03, 10.09it/s] 37it [00:03, 10.09it/s] 39it [00:04, 10.09it/s] 41it [00:04, 10.10it/s] 43it [00:04, 10.11it/s] 45it [00:04, 10.11it/s] 47it [00:04, 10.11it/s] 49it [00:05, 10.11it/s]2025-05-26 05:16:16,112 - INFO - [Epoch 096 | Batch 0050] IWAE-loss 3660.0618 | mean log_px -0.0111 | KL -2883.02 + 51it [00:05, 10.09it/s] 53it [00:05, 10.09it/s] 55it [00:05, 10.10it/s] 57it [00:05, 10.10it/s] 59it [00:06, 10.09it/s] 61it [00:06, 10.09it/s] 63it [00:06, 10.08it/s] 65it [00:06, 10.08it/s] 67it [00:06, 10.09it/s] 69it [00:07, 10.09it/s] 71it [00:07, 10.10it/s] 73it [00:07, 10.11it/s] 75it [00:07, 10.11it/s] 77it [00:07, 10.12it/s] 79it [00:08, 9.85it/s] 81it [00:08, 9.93it/s] 82it [00:08, 9.89it/s] 84it [00:08, 9.96it/s] 86it [00:08, 10.01it/s] 88it [00:08, 10.04it/s] 90it [00:09, 10.07it/s] 92it [00:09, 9.73it/s] 94it [00:09, 9.85it/s] 96it [00:09, 9.94it/s] 98it [00:09, 10.00it/s] 100it [00:10, 10.04it/s]2025-05-26 05:16:21,103 - INFO - [Epoch 096 | Batch 0100] IWAE-loss 3525.8738 | mean log_px -0.0101 | KL -2880.33 + 102it [00:10, 10.04it/s] 104it [00:10, 10.07it/s] 106it [00:10, 10.09it/s] 108it [00:10, 10.09it/s] 110it [00:11, 10.09it/s] 112it [00:11, 10.10it/s] 114it [00:11, 10.11it/s] 116it [00:11, 10.12it/s] 118it [00:11, 10.13it/s] 120it [00:12, 9.97it/s] 121it [00:12, 9.69it/s] 123it [00:12, 9.83it/s] 125it [00:12, 9.93it/s] 127it [00:12, 9.99it/s] 129it [00:13, 10.04it/s] 131it [00:13, 10.06it/s] 133it [00:13, 10.08it/s] 135it [00:13, 10.10it/s] 137it [00:13, 9.68it/s] 138it [00:14, 9.72it/s] 139it [00:14, 9.66it/s] 140it [00:14, 9.72it/s] 142it [00:14, 9.87it/s] 144it [00:14, 9.97it/s] 146it [00:14, 10.02it/s] 148it [00:15, 10.07it/s] 150it [00:15, 10.09it/s]2025-05-26 05:16:26,109 - INFO - [Epoch 096 | Batch 0150] IWAE-loss 3406.4150 | mean log_px -0.0099 | KL -2879.07 + 152it [00:15, 10.08it/s] 154it [00:15, 9.99it/s] 156it [00:15, 10.00it/s] 158it [00:15, 10.04it/s] 160it [00:16, 10.05it/s] 162it [00:16, 10.05it/s] 164it [00:16, 9.69it/s] 166it [00:16, 9.80it/s] 168it [00:17, 9.90it/s] 170it [00:17, 9.96it/s] 171it [00:17, 9.59it/s] 173it [00:17, 9.76it/s] 175it [00:17, 9.87it/s] 177it [00:17, 9.95it/s] 179it [00:18, 10.00it/s] 181it [00:18, 10.03it/s] 183it [00:18, 10.06it/s] 185it [00:18, 10.09it/s] 187it [00:18, 10.11it/s] 189it [00:19, 10.12it/s] 191it [00:19, 10.12it/s] 193it [00:19, 10.12it/s] 195it [00:19, 9.86it/s] 196it [00:19, 9.86it/s] +2025-05-26 05:16:30,737 - INFO - Epoch: 96, Objective: tensor([3542.8840], device='cuda:0', grad_fn=), Loss: 0.012501702643930912, KL/n: 58.68415069580078 + 0it [00:00, ?it/s]2025-05-26 05:16:31,014 - INFO - [Epoch 097 | Batch 0000] IWAE-loss 4043.2427 | mean log_px -0.0168 | KL -2875.78 + 1it [00:00, 4.66it/s] 2it [00:00, 6.75it/s] 4it [00:00, 8.54it/s] 6it [00:00, 9.24it/s] 8it [00:00, 9.59it/s] 10it [00:01, 9.78it/s] 12it [00:01, 9.91it/s] 14it [00:01, 9.95it/s] 15it [00:01, 9.56it/s] 17it [00:01, 9.75it/s] 19it [00:02, 9.87it/s] 21it [00:02, 9.96it/s] 23it [00:02, 10.01it/s] 25it [00:02, 10.05it/s] 27it [00:02, 10.07it/s] 29it [00:03, 10.08it/s] 31it [00:03, 10.09it/s] 33it [00:03, 10.09it/s] 35it [00:03, 10.09it/s] 37it [00:03, 10.09it/s] 39it [00:03, 10.10it/s] 41it [00:04, 10.11it/s] 43it [00:04, 10.09it/s] 45it [00:04, 10.09it/s] 47it [00:04, 10.09it/s] 49it [00:04, 10.10it/s]2025-05-26 05:16:36,012 - INFO - [Epoch 097 | Batch 0050] IWAE-loss 3348.9727 | mean log_px -0.0105 | KL -2877.25 + 51it [00:05, 10.06it/s] 53it [00:05, 9.98it/s] 54it [00:05, 9.97it/s] 56it [00:05, 10.02it/s] 58it [00:05, 10.05it/s] 60it [00:06, 10.05it/s] 62it [00:06, 10.04it/s] 64it [00:06, 9.69it/s] 66it [00:06, 9.80it/s] 67it [00:06, 9.54it/s] 68it [00:06, 9.63it/s] 70it [00:07, 9.80it/s] 72it [00:07, 9.89it/s] 73it [00:07, 9.49it/s] 75it [00:07, 9.70it/s] 77it [00:07, 9.84it/s] 78it [00:07, 9.87it/s] 80it [00:08, 9.95it/s] 82it [00:08, 10.00it/s] 84it [00:08, 10.03it/s] 86it [00:08, 10.05it/s] 88it [00:08, 10.05it/s] 90it [00:09, 10.07it/s] 92it [00:09, 10.05it/s] 94it [00:09, 9.78it/s] 96it [00:09, 9.87it/s] 97it [00:09, 9.52it/s] 98it [00:09, 9.60it/s] 99it [00:10, 9.64it/s]2025-05-26 05:16:41,095 - INFO - [Epoch 097 | Batch 0100] IWAE-loss 3721.4724 | mean log_px -0.0175 | KL -2865.73 + 101it [00:10, 9.78it/s] 103it [00:10, 9.88it/s] 105it [00:10, 9.96it/s] 106it [00:10, 9.94it/s] 108it [00:10, 9.99it/s] 110it [00:11, 10.01it/s] 112it [00:11, 10.04it/s] 114it [00:11, 9.75it/s] 116it [00:11, 9.83it/s] 118it [00:11, 9.90it/s] 120it [00:12, 9.95it/s] 122it [00:12, 9.99it/s] 123it [00:12, 9.54it/s] 124it [00:12, 9.40it/s] 125it [00:12, 9.45it/s] 126it [00:12, 9.57it/s] 128it [00:13, 9.76it/s] 130it [00:13, 9.88it/s] 132it [00:13, 9.96it/s] 134it [00:13, 10.00it/s] 135it [00:13, 9.98it/s] 136it [00:13, 9.98it/s] 138it [00:14, 10.02it/s] 140it [00:14, 10.04it/s] 142it [00:14, 10.06it/s] 144it [00:14, 10.07it/s] 146it [00:14, 10.08it/s] 148it [00:15, 10.10it/s] 150it [00:15, 10.09it/s]2025-05-26 05:16:46,128 - INFO - [Epoch 097 | Batch 0150] IWAE-loss 3712.6641 | mean log_px -0.0218 | KL -2866.04 + 152it [00:15, 9.73it/s] 153it [00:15, 9.72it/s] 154it [00:15, 9.72it/s] 155it [00:15, 9.75it/s] 156it [00:15, 9.71it/s] 157it [00:15, 9.67it/s] 158it [00:16, 9.65it/s] 159it [00:16, 9.40it/s] 161it [00:16, 9.69it/s] 163it [00:16, 9.84it/s] 164it [00:16, 9.50it/s] 165it [00:16, 9.58it/s] 167it [00:16, 9.78it/s] 169it [00:17, 9.89it/s] 171it [00:17, 9.96it/s] 173it [00:17, 10.00it/s] 175it [00:17, 10.03it/s] 177it [00:17, 10.04it/s] 179it [00:18, 10.05it/s] 181it [00:18, 10.07it/s] 183it [00:18, 10.07it/s] 185it [00:18, 9.97it/s] 187it [00:18, 10.01it/s] 189it [00:19, 10.03it/s] 191it [00:19, 10.04it/s] 193it [00:19, 10.06it/s] 195it [00:19, 9.80it/s] 196it [00:19, 9.57it/s] 196it [00:19, 9.83it/s] +2025-05-26 05:16:50,812 - INFO - Epoch: 97, Objective: tensor([3453.2244], device='cuda:0', grad_fn=), Loss: 0.01020082551985979, KL/n: 58.48168182373047 + 0it [00:00, ?it/s]2025-05-26 05:16:51,277 - INFO - [Epoch 098 | Batch 0000] IWAE-loss 3513.9075 | mean log_px -0.0093 | KL -2864.63 + 1it [00:00, 5.27it/s] 2it [00:00, 6.76it/s] 3it [00:00, 7.93it/s] 4it [00:00, 8.61it/s] 5it [00:00, 9.06it/s] 6it [00:00, 9.34it/s] 7it [00:00, 9.53it/s] 8it [00:00, 9.66it/s] 10it [00:01, 9.82it/s] 12it [00:01, 9.89it/s] 14it [00:01, 9.91it/s] 16it [00:01, 9.94it/s] 18it [00:01, 9.97it/s] 19it [00:02, 9.57it/s] 20it [00:02, 9.65it/s] 22it [00:02, 9.79it/s] 24it [00:02, 9.87it/s] 25it [00:02, 9.89it/s] 26it [00:02, 9.90it/s] 28it [00:02, 9.94it/s] 29it [00:03, 9.95it/s] 30it [00:03, 9.94it/s] 31it [00:03, 9.93it/s] 32it [00:03, 9.94it/s] 34it [00:03, 9.97it/s] 36it [00:03, 9.98it/s] 37it [00:03, 9.97it/s] 38it [00:03, 9.96it/s] 40it [00:04, 9.97it/s] 42it [00:04, 9.99it/s] 43it [00:04, 9.99it/s] 44it [00:04, 9.96it/s] 45it [00:04, 9.97it/s] 46it [00:04, 9.98it/s] 48it [00:04, 10.00it/s] 50it [00:05, 10.02it/s]2025-05-26 05:16:56,328 - INFO - [Epoch 098 | Batch 0050] IWAE-loss 4490.0361 | mean log_px -0.0283 | KL -2859.88 + 52it [00:05, 9.61it/s] 54it [00:05, 9.71it/s] 55it [00:05, 9.76it/s] 56it [00:05, 9.78it/s] 57it [00:05, 9.80it/s] 58it [00:05, 9.40it/s] 59it [00:06, 9.55it/s] 60it [00:06, 9.62it/s] 61it [00:06, 9.16it/s] 62it [00:06, 9.37it/s] 63it [00:06, 9.54it/s] 64it [00:06, 9.66it/s] 66it [00:06, 9.84it/s] 68it [00:07, 9.92it/s] 70it [00:07, 9.94it/s] 71it [00:07, 9.94it/s] 72it [00:07, 9.95it/s] 73it [00:07, 9.96it/s] 74it [00:07, 9.97it/s] 75it [00:07, 9.98it/s] 76it [00:07, 9.89it/s] 77it [00:07, 9.75it/s] 78it [00:08, 9.75it/s] 79it [00:08, 9.81it/s] 80it [00:08, 9.83it/s] 81it [00:08, 9.84it/s] 82it [00:08, 9.87it/s] 83it [00:08, 9.25it/s] 84it [00:08, 9.44it/s] 86it [00:08, 9.69it/s] 87it [00:08, 9.75it/s] 88it [00:09, 9.80it/s] 89it [00:09, 9.85it/s] 90it [00:09, 9.88it/s] 91it [00:09, 9.89it/s] 92it [00:09, 9.88it/s] 93it [00:09, 9.90it/s] 94it [00:09, 9.86it/s] 95it [00:09, 9.88it/s] 96it [00:09, 9.89it/s] 97it [00:09, 9.91it/s] 98it [00:10, 9.90it/s] 99it [00:10, 9.51it/s] 100it [00:10, 9.63it/s]2025-05-26 05:17:01,468 - INFO - [Epoch 098 | Batch 0100] IWAE-loss 3895.4548 | mean log_px -0.0165 | KL -2864.15 + 101it [00:10, 9.67it/s] 102it [00:10, 9.75it/s] 103it [00:10, 9.82it/s] 104it [00:10, 9.84it/s] 105it [00:10, 9.88it/s] 106it [00:10, 9.86it/s] 107it [00:10, 9.89it/s] 108it [00:11, 9.89it/s] 109it [00:11, 9.91it/s] 110it [00:11, 9.92it/s] 112it [00:11, 9.94it/s] 114it [00:11, 9.97it/s] 115it [00:11, 9.97it/s] 116it [00:11, 9.96it/s] 118it [00:12, 9.98it/s] 119it [00:12, 9.98it/s] 120it [00:12, 9.97it/s] 121it [00:12, 9.98it/s] 122it [00:12, 9.98it/s] 124it [00:12, 10.00it/s] 126it [00:12, 10.00it/s] 127it [00:12, 10.00it/s] 128it [00:13, 9.99it/s] 129it [00:13, 9.96it/s] 130it [00:13, 9.94it/s] 131it [00:13, 9.96it/s] 132it [00:13, 9.95it/s] 133it [00:13, 9.95it/s] 135it [00:13, 9.97it/s] 136it [00:13, 9.97it/s] 138it [00:14, 9.99it/s] 139it [00:14, 9.99it/s] 141it [00:14, 10.00it/s] 142it [00:14, 10.00it/s] 144it [00:14, 10.01it/s] 145it [00:14, 10.00it/s] 146it [00:14, 9.99it/s] 148it [00:15, 10.00it/s] 150it [00:15, 9.62it/s]2025-05-26 05:17:06,504 - INFO - [Epoch 098 | Batch 0150] IWAE-loss 3752.1211 | mean log_px -0.0133 | KL -2858.67 + 151it [00:15, 9.67it/s] 152it [00:15, 9.74it/s] 154it [00:15, 9.86it/s] 155it [00:15, 9.88it/s] 156it [00:15, 9.39it/s] 157it [00:16, 9.47it/s] 158it [00:16, 9.58it/s] 160it [00:16, 9.29it/s] 162it [00:16, 9.56it/s] 164it [00:16, 9.72it/s] 166it [00:16, 9.52it/s] 167it [00:17, 9.60it/s] 168it [00:17, 9.66it/s] 169it [00:17, 9.74it/s] 171it [00:17, 9.86it/s] 172it [00:17, 9.48it/s] 173it [00:17, 9.55it/s] 174it [00:17, 9.57it/s] 175it [00:17, 9.11it/s] 176it [00:18, 9.30it/s] 177it [00:18, 9.47it/s] 178it [00:18, 9.61it/s] 179it [00:18, 9.72it/s] 180it [00:18, 9.19it/s] 181it [00:18, 9.41it/s] 182it [00:18, 9.57it/s] 183it [00:18, 9.69it/s] 184it [00:18, 9.27it/s] 186it [00:19, 9.51it/s] 187it [00:19, 9.58it/s] 188it [00:19, 9.13it/s] 189it [00:19, 9.35it/s] 190it [00:19, 9.45it/s] 191it [00:19, 9.52it/s] 192it [00:19, 9.61it/s] 194it [00:19, 9.78it/s] 195it [00:20, 9.44it/s] 196it [00:20, 9.70it/s] +2025-05-26 05:17:11,326 - INFO - Epoch: 98, Objective: tensor([3792.0647], device='cuda:0', grad_fn=), Loss: 0.014100815169513226, KL/n: 58.269466400146484 + 0it [00:00, ?it/s]2025-05-26 05:17:11,596 - INFO - [Epoch 099 | Batch 0000] IWAE-loss 3312.5208 | mean log_px -0.0071 | KL -2853.84 + 1it [00:00, 4.77it/s] 3it [00:00, 7.86it/s] 5it [00:00, 8.84it/s] 7it [00:00, 9.06it/s] 8it [00:00, 9.26it/s] 10it [00:01, 9.59it/s] 12it [00:01, 9.77it/s] 14it [00:01, 9.89it/s] 16it [00:01, 9.96it/s] 17it [00:01, 9.69it/s] 19it [00:02, 9.86it/s] 21it [00:02, 9.94it/s] 23it [00:02, 9.99it/s] 25it [00:02, 10.04it/s] 27it [00:02, 9.79it/s] 29it [00:03, 9.89it/s] 31it [00:03, 9.85it/s] 32it [00:03, 9.78it/s] 33it [00:03, 9.73it/s] 34it [00:03, 9.25it/s] 35it [00:03, 9.20it/s] 36it [00:03, 9.19it/s] 37it [00:03, 9.35it/s] 38it [00:03, 9.49it/s] 39it [00:04, 9.62it/s] 40it [00:04, 9.68it/s] 41it [00:04, 9.73it/s] 42it [00:04, 9.72it/s] 43it [00:04, 9.77it/s] 44it [00:04, 9.80it/s] 45it [00:04, 9.82it/s] 46it [00:04, 9.75it/s] 47it [00:04, 9.72it/s] 48it [00:05, 9.74it/s] 50it [00:05, 9.88it/s]2025-05-26 05:17:16,726 - INFO - [Epoch 099 | Batch 0050] IWAE-loss 3289.7585 | mean log_px -0.0074 | KL -2854.63 + 51it [00:05, 9.86it/s] 52it [00:05, 9.87it/s] 53it [00:05, 9.88it/s] 54it [00:05, 9.85it/s] 55it [00:05, 9.86it/s] 56it [00:05, 9.86it/s] 57it [00:05, 9.89it/s] 58it [00:06, 9.88it/s] 59it [00:06, 9.88it/s] 60it [00:06, 9.87it/s] 61it [00:06, 9.87it/s] 62it [00:06, 9.87it/s] 63it [00:06, 9.89it/s] 64it [00:06, 9.85it/s] 65it [00:06, 9.87it/s] 66it [00:06, 9.87it/s] 67it [00:06, 9.89it/s] 68it [00:07, 9.87it/s] 69it [00:07, 9.88it/s] 70it [00:07, 9.88it/s] 71it [00:07, 9.90it/s] 72it [00:07, 9.89it/s] 73it [00:07, 9.90it/s] 74it [00:07, 9.89it/s] 75it [00:07, 9.91it/s] 76it [00:07, 9.90it/s] 77it [00:07, 9.90it/s] 78it [00:08, 9.88it/s] 79it [00:08, 9.89it/s] 80it [00:08, 9.89it/s] 81it [00:08, 9.90it/s] 82it [00:08, 9.91it/s] 83it [00:08, 9.90it/s] 84it [00:08, 9.89it/s] 85it [00:08, 9.90it/s] 86it [00:08, 9.89it/s] 87it [00:08, 9.91it/s] 88it [00:09, 9.89it/s] 89it [00:09, 9.91it/s] 90it [00:09, 9.89it/s] 91it [00:09, 9.89it/s] 92it [00:09, 9.89it/s] 93it [00:09, 9.90it/s] 94it [00:09, 9.90it/s] 95it [00:09, 9.90it/s] 96it [00:09, 9.89it/s] 97it [00:09, 9.90it/s] 98it [00:10, 9.89it/s] 99it [00:10, 9.89it/s] 100it [00:10, 9.88it/s]2025-05-26 05:17:21,783 - INFO - [Epoch 099 | Batch 0100] IWAE-loss 3397.9956 | mean log_px -0.0134 | KL -2848.25 + 101it [00:10, 9.87it/s] 102it [00:10, 9.87it/s] 103it [00:10, 9.71it/s] 104it [00:10, 9.73it/s] 105it [00:10, 9.77it/s] 106it [00:10, 9.80it/s] 107it [00:10, 9.83it/s] 108it [00:11, 9.84it/s] 109it [00:11, 9.84it/s] 110it [00:11, 9.84it/s] 111it [00:11, 9.86it/s] 112it [00:11, 9.87it/s] 113it [00:11, 9.88it/s] 114it [00:11, 9.88it/s] 115it [00:11, 9.82it/s] 116it [00:11, 9.84it/s] 117it [00:11, 9.87it/s] 118it [00:12, 9.87it/s] 119it [00:12, 9.89it/s] 120it [00:12, 9.87it/s] 121it [00:12, 9.89it/s] 122it [00:12, 9.88it/s] 123it [00:12, 9.88it/s] 124it [00:12, 9.87it/s] 126it [00:12, 9.93it/s] 127it [00:13, 9.93it/s] 128it [00:13, 9.90it/s] 129it [00:13, 9.90it/s] 130it [00:13, 9.88it/s] 131it [00:13, 9.89it/s] 132it [00:13, 9.87it/s] 133it [00:13, 9.85it/s] 134it [00:13, 9.86it/s] 135it [00:13, 9.88it/s] 136it [00:13, 9.87it/s] 137it [00:14, 9.88it/s] 138it [00:14, 9.88it/s] 139it [00:14, 9.88it/s] 140it [00:14, 9.88it/s] 141it [00:14, 9.68it/s] 142it [00:14, 9.73it/s] 143it [00:14, 9.78it/s] 144it [00:14, 9.80it/s] 145it [00:14, 9.59it/s] 146it [00:14, 9.39it/s] 147it [00:15, 9.01it/s] 148it [00:15, 9.00it/s] 149it [00:15, 8.69it/s]2025-05-26 05:17:26,930 - INFO - [Epoch 099 | Batch 0150] IWAE-loss 3503.2078 | mean log_px -0.0094 | KL -2843.22 + 151it [00:15, 9.28it/s] 152it [00:15, 9.44it/s] 154it [00:15, 9.72it/s] 155it [00:15, 9.32it/s] 157it [00:16, 9.62it/s] 158it [00:16, 9.26it/s] 160it [00:16, 9.58it/s] 162it [00:16, 9.77it/s] 164it [00:16, 9.89it/s] 166it [00:17, 9.97it/s] 168it [00:17, 10.03it/s] 170it [00:17, 9.97it/s] 172it [00:17, 10.02it/s] 174it [00:17, 10.05it/s] 176it [00:18, 10.05it/s] 178it [00:18, 10.07it/s] 180it [00:18, 10.09it/s] 182it [00:18, 10.11it/s] 184it [00:18, 10.12it/s] 186it [00:19, 10.01it/s] 188it [00:19, 9.94it/s] 189it [00:19, 9.93it/s] 190it [00:19, 9.92it/s] 191it [00:19, 9.92it/s] 192it [00:19, 9.91it/s] 193it [00:19, 9.92it/s] 194it [00:19, 9.91it/s] 195it [00:19, 9.44it/s] 196it [00:20, 9.74it/s] +2025-05-26 05:17:31,574 - INFO - Epoch: 99, Objective: tensor([3379.9856], device='cuda:0', grad_fn=), Loss: 0.00989951379597187, KL/n: 58.04240417480469 +2025-05-26 05:17:31,578 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 2it [00:00, 16.53it/s] 5it [00:00, 23.15it/s] 8it [00:00, 26.08it/s] 11it [00:00, 27.45it/s] 14it [00:00, 28.34it/s] 17it [00:00, 28.72it/s] 20it [00:00, 29.09it/s] 23it [00:00, 29.01it/s] 26it [00:00, 29.16it/s] 29it [00:01, 29.28it/s] 32it [00:01, 29.37it/s] 35it [00:01, 29.40it/s] 38it [00:01, 29.48it/s] 41it [00:01, 29.18it/s] 44it [00:01, 29.33it/s] 47it [00:01, 29.51it/s] 50it [00:01, 29.59it/s] 53it [00:01, 29.59it/s] 56it [00:01, 29.66it/s] 59it [00:02, 29.69it/s] 62it [00:02, 29.77it/s] 65it [00:02, 29.66it/s] 68it [00:02, 29.64it/s] 72it [00:02, 29.85it/s] 75it [00:02, 29.80it/s] 78it [00:02, 29.85it/s] 81it [00:02, 29.70it/s] 84it [00:02, 29.65it/s] 87it [00:02, 29.73it/s] 90it [00:03, 29.78it/s] 93it [00:03, 29.82it/s] 96it [00:03, 29.85it/s] 99it [00:03, 29.83it/s] 102it [00:03, 29.86it/s] 105it [00:03, 29.78it/s] 108it [00:03, 29.82it/s] 111it [00:03, 29.78it/s] 114it [00:03, 29.67it/s] 117it [00:04, 29.59it/s] 121it [00:04, 29.74it/s] 124it [00:04, 29.70it/s] 128it [00:04, 29.84it/s] 131it [00:04, 29.84it/s] 135it [00:04, 29.91it/s] 139it [00:04, 29.79it/s] 142it [00:04, 29.84it/s] 145it [00:04, 29.75it/s] 148it [00:05, 29.58it/s] 151it [00:05, 29.61it/s] 154it [00:05, 29.54it/s] 157it [00:05, 29.61it/s] 160it [00:05, 29.66it/s] 163it [00:05, 29.74it/s] 166it [00:05, 29.73it/s] 169it [00:05, 29.50it/s] 172it [00:05, 29.62it/s] 175it [00:05, 29.53it/s] 179it [00:06, 29.75it/s] 182it [00:06, 29.76it/s] 186it [00:06, 29.90it/s] 190it [00:06, 29.80it/s] 193it [00:06, 29.75it/s] 196it [00:06, 29.81it/s] 199it [00:06, 29.83it/s] 202it [00:06, 29.79it/s] 205it [00:06, 29.69it/s] 208it [00:07, 29.66it/s] 211it [00:07, 29.69it/s] 214it [00:07, 29.53it/s] 217it [00:07, 29.65it/s] 220it [00:07, 29.73it/s] 223it [00:07, 29.63it/s] 226it [00:07, 29.32it/s] 229it [00:07, 29.23it/s] 232it [00:07, 29.18it/s] 236it [00:08, 29.54it/s] 239it [00:08, 29.65it/s] 242it [00:08, 29.65it/s] 245it [00:08, 29.51it/s] 248it [00:08, 29.33it/s] 251it [00:08, 29.52it/s] 254it [00:08, 29.58it/s] 257it [00:08, 29.52it/s] 261it [00:08, 29.73it/s] 264it [00:08, 29.67it/s] 267it [00:09, 29.49it/s] 270it [00:09, 29.57it/s] 273it [00:09, 29.68it/s] 277it [00:09, 29.63it/s] 280it [00:09, 28.43it/s] 280it [00:09, 29.22it/s] +2025-05-26 05:17:41,492 - INFO - Epoch: 0, Objective: 0.030164141207933426, Loss: 0.02757582627236843, KL/n: 0.002588314935564995 + 0%| | 0/84 [00:00), Loss: 0.46993568539619446, KL/n: 68.613525390625 + 0it [00:00, ?it/s]2025-05-26 05:19:57,834 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 41328.6367 | mean log_px -0.5423 | KL -3364.53 + 2it [00:00, 15.00it/s] 6it [00:00, 24.39it/s] 9it [00:00, 25.79it/s] 13it [00:00, 28.11it/s] 17it [00:00, 29.01it/s] 20it [00:00, 29.26it/s] 24it [00:00, 29.92it/s] 28it [00:00, 30.19it/s] 32it [00:01, 30.71it/s] 36it [00:01, 30.72it/s] 40it [00:01, 30.43it/s] 44it [00:01, 30.52it/s] 48it [00:01, 30.95it/s]2025-05-26 05:19:59,473 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 22804.9512 | mean log_px -0.2774 | KL -3389.26 + 52it [00:01, 30.82it/s] 56it [00:01, 30.42it/s] 60it [00:02, 30.49it/s] 64it [00:02, 30.89it/s] 68it [00:02, 30.55it/s] 72it [00:02, 30.60it/s] 76it [00:02, 30.97it/s] 80it [00:02, 30.44it/s] 84it [00:02, 30.81it/s] 88it [00:02, 30.81it/s] 92it [00:03, 30.68it/s] 96it [00:03, 30.96it/s] 100it [00:03, 30.99it/s]2025-05-26 05:20:01,098 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 29099.3145 | mean log_px -0.3671 | KL -3402.68 + 104it [00:03, 30.54it/s] 108it [00:03, 30.97it/s] 112it [00:03, 30.39it/s] 116it [00:03, 30.30it/s] 120it [00:04, 29.29it/s] 123it [00:04, 29.13it/s] 127it [00:04, 29.47it/s] 131it [00:04, 30.28it/s] 135it [00:04, 30.49it/s] 139it [00:04, 30.44it/s] 143it [00:04, 29.03it/s] 147it [00:04, 29.46it/s]2025-05-26 05:20:02,779 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 33030.3203 | mean log_px -0.4231 | KL -3416.42 + 151it [00:05, 29.63it/s] 154it [00:05, 29.36it/s] 158it [00:05, 30.38it/s] 162it [00:05, 30.18it/s] 166it [00:05, 30.46it/s] 170it [00:05, 30.05it/s] 174it [00:05, 30.75it/s] 178it [00:05, 30.83it/s] 182it [00:06, 30.75it/s] 186it [00:06, 30.28it/s] 190it [00:06, 30.57it/s] 194it [00:06, 30.89it/s] 196it [00:06, 29.82it/s] +2025-05-26 05:20:04,323 - INFO - Epoch: 1, Objective: tensor([27755.5234], device='cuda:0', grad_fn=), Loss: 0.343679279088974, KL/n: 69.91226196289062 + 0it [00:00, ?it/s]2025-05-26 05:20:04,524 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 24771.7012 | mean log_px -0.3049 | KL -3425.47 + 2it [00:00, 16.07it/s] 5it [00:00, 22.26it/s] 9it [00:00, 26.30it/s] 13it [00:00, 28.23it/s] 16it [00:00, 27.91it/s] 20it [00:00, 28.83it/s] 23it [00:00, 28.98it/s] 27it [00:00, 29.52it/s] 30it [00:01, 28.89it/s] 33it [00:01, 28.61it/s] 36it [00:01, 28.95it/s] 40it [00:01, 28.75it/s] 43it [00:01, 28.58it/s] 47it [00:01, 28.96it/s] 50it [00:01, 28.43it/s]2025-05-26 05:20:06,236 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 23962.0957 | mean log_px -0.2933 | KL -3431.02 + 53it [00:01, 28.82it/s] 57it [00:02, 29.35it/s] 60it [00:02, 29.04it/s] 63it [00:02, 29.17it/s] 66it [00:02, 29.16it/s] 69it [00:02, 29.11it/s] 73it [00:02, 29.60it/s] 76it [00:02, 28.89it/s] 80it [00:02, 29.31it/s] 83it [00:02, 29.12it/s] 86it [00:03, 29.14it/s] 90it [00:03, 29.49it/s] 93it [00:03, 29.03it/s] 96it [00:03, 29.04it/s] 99it [00:03, 29.09it/s]2025-05-26 05:20:07,953 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 18612.4961 | mean log_px -0.2168 | KL -3439.96 + 102it [00:03, 28.88it/s] 105it [00:03, 28.37it/s] 109it [00:03, 29.11it/s] 112it [00:03, 29.22it/s] 115it [00:04, 29.43it/s] 119it [00:04, 29.71it/s] 123it [00:04, 29.97it/s] 126it [00:04, 29.52it/s] 129it [00:04, 29.40it/s] 132it [00:04, 29.01it/s] 136it [00:04, 29.21it/s] 139it [00:04, 28.79it/s] 143it [00:04, 28.90it/s] 147it [00:05, 29.42it/s] 150it [00:05, 29.28it/s]2025-05-26 05:20:09,677 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 20737.0684 | mean log_px -0.2470 | KL -3445.83 + 153it [00:05, 28.40it/s] 156it [00:05, 28.02it/s] 159it [00:05, 28.19it/s] 163it [00:05, 29.04it/s] 166it [00:05, 28.46it/s] 169it [00:05, 28.59it/s] 172it [00:05, 28.38it/s] 175it [00:06, 28.77it/s] 178it [00:06, 28.56it/s] 182it [00:06, 28.77it/s] 185it [00:06, 28.41it/s] 188it [00:06, 28.66it/s] 192it [00:06, 29.08it/s] 195it [00:06, 27.57it/s] 196it [00:06, 28.53it/s] +2025-05-26 05:20:11,310 - INFO - Epoch: 2, Objective: tensor([19413.9609], device='cuda:0', grad_fn=), Loss: 0.23482824862003326, KL/n: 70.47401428222656 + 0it [00:00, ?it/s]2025-05-26 05:20:11,685 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 26469.2031 | mean log_px -0.3288 | KL -3451.09 + 2it [00:00, 15.20it/s] 5it [00:00, 22.29it/s] 9it [00:00, 26.44it/s] 13it [00:00, 28.17it/s] 17it [00:00, 29.11it/s] 21it [00:00, 29.55it/s] 25it [00:00, 29.94it/s] 29it [00:01, 30.18it/s] 33it [00:01, 30.25it/s] 37it [00:01, 30.64it/s] 41it [00:01, 29.53it/s] 45it [00:01, 29.82it/s] 49it [00:01, 30.05it/s]2025-05-26 05:20:13,335 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 18213.8281 | mean log_px -0.2108 | KL -3458.14 + 53it [00:01, 30.15it/s] 57it [00:01, 30.29it/s] 61it [00:02, 30.42it/s] 65it [00:02, 30.46it/s] 69it [00:02, 30.48it/s] 73it [00:02, 30.55it/s] 77it [00:02, 30.90it/s] 81it [00:02, 30.49it/s] 85it [00:02, 30.47it/s] 89it [00:02, 30.49it/s] 93it [00:03, 30.57it/s] 97it [00:03, 30.60it/s]2025-05-26 05:20:14,972 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 20620.9824 | mean log_px -0.2452 | KL -3458.33 + 101it [00:03, 30.59it/s] 105it [00:03, 30.64it/s] 109it [00:03, 30.63it/s] 113it [00:03, 30.60it/s] 117it [00:03, 30.51it/s] 121it [00:04, 30.62it/s] 125it [00:04, 30.45it/s] 129it [00:04, 31.06it/s] 133it [00:04, 30.80it/s] 137it [00:04, 30.84it/s] 141it [00:04, 30.18it/s] 145it [00:04, 30.86it/s] 149it [00:04, 30.44it/s]2025-05-26 05:20:16,607 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 22469.4336 | mean log_px -0.2715 | KL -3466.90 + 153it [00:05, 30.44it/s] 157it [00:05, 30.73it/s] 161it [00:05, 30.16it/s] 165it [00:05, 30.71it/s] 169it [00:05, 30.73it/s] 173it [00:05, 30.04it/s] 177it [00:05, 30.59it/s] 181it [00:06, 29.99it/s] 185it [00:06, 30.00it/s] 189it [00:06, 30.50it/s] 193it [00:06, 30.24it/s] 196it [00:06, 29.83it/s] +2025-05-26 05:20:18,172 - INFO - Epoch: 3, Objective: tensor([16944.2090], device='cuda:0', grad_fn=), Loss: 0.19525867700576782, KL/n: 70.87026977539062 + 0it [00:00, ?it/s]2025-05-26 05:20:18,385 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 22920.8672 | mean log_px -0.2778 | KL -3472.81 + 1it [00:00, 9.47it/s] 5it [00:00, 23.01it/s] 8it [00:00, 25.60it/s] 12it [00:00, 28.06it/s] 15it [00:00, 27.98it/s] 19it [00:00, 29.21it/s] 22it [00:00, 28.73it/s] 25it [00:00, 28.84it/s] 28it [00:01, 28.95it/s] 32it [00:01, 29.92it/s] 35it [00:01, 29.85it/s] 38it [00:01, 29.02it/s] 42it [00:01, 29.51it/s] 45it [00:01, 28.85it/s] 49it [00:01, 29.57it/s]2025-05-26 05:20:20,083 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 19934.9766 | mean log_px -0.2351 | KL -3476.23 + 52it [00:01, 28.93it/s] 55it [00:01, 29.15it/s] 59it [00:02, 29.74it/s] 62it [00:02, 29.04it/s] 65it [00:02, 29.30it/s] 69it [00:02, 29.64it/s] 72it [00:02, 29.12it/s] 75it [00:02, 28.98it/s] 79it [00:02, 29.41it/s] 83it [00:02, 29.78it/s] 86it [00:02, 29.06it/s] 90it [00:03, 29.32it/s] 94it [00:03, 29.33it/s] 98it [00:03, 29.36it/s]2025-05-26 05:20:21,779 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 21755.9512 | mean log_px -0.2611 | KL -3480.36 + 102it [00:03, 29.27it/s] 106it [00:03, 29.58it/s] 109it [00:03, 29.02it/s] 113it [00:03, 29.64it/s] 116it [00:04, 29.60it/s] 119it [00:04, 28.93it/s] 122it [00:04, 29.06it/s] 126it [00:04, 29.20it/s] 130it [00:04, 29.24it/s] 134it [00:04, 29.30it/s] 137it [00:04, 29.43it/s] 140it [00:04, 29.55it/s] 143it [00:04, 29.03it/s] 146it [00:05, 28.88it/s] 149it [00:05, 28.52it/s]2025-05-26 05:20:23,504 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 18605.0137 | mean log_px -0.2160 | KL -3484.41 + 152it [00:05, 28.50it/s] 155it [00:05, 28.90it/s] 159it [00:05, 29.01it/s] 163it [00:05, 29.15it/s] 166it [00:05, 29.01it/s] 170it [00:05, 28.97it/s] 174it [00:06, 29.34it/s] 178it [00:06, 29.49it/s] 181it [00:06, 28.92it/s] 185it [00:06, 29.53it/s] 188it [00:06, 29.21it/s] 191it [00:06, 28.81it/s] 195it [00:06, 27.83it/s] 196it [00:06, 28.72it/s] +2025-05-26 05:20:25,119 - INFO - Epoch: 4, Objective: tensor([16574.2109], device='cuda:0', grad_fn=), Loss: 0.19108611345291138, KL/n: 71.17504119873047 + 0it [00:00, ?it/s]2025-05-26 05:20:25,492 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 16495.5020 | mean log_px -0.1858 | KL -3489.05 + 2it [00:00, 15.57it/s] 5it [00:00, 21.99it/s] 9it [00:00, 25.62it/s] 13it [00:00, 28.15it/s] 17it [00:00, 28.84it/s] 20it [00:00, 28.67it/s] 23it [00:00, 28.99it/s] 26it [00:00, 29.14it/s] 30it [00:01, 29.54it/s] 34it [00:01, 29.71it/s] 38it [00:01, 30.22it/s] 42it [00:01, 30.06it/s] 46it [00:01, 30.00it/s] 49it [00:01, 29.49it/s]2025-05-26 05:20:27,175 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 17186.3125 | mean log_px -0.1956 | KL -3491.69 + 53it [00:01, 30.02it/s] 56it [00:01, 29.38it/s] 60it [00:02, 29.43it/s] 64it [00:02, 29.75it/s] 68it [00:02, 30.09it/s] 72it [00:02, 29.95it/s] 75it [00:02, 29.39it/s] 79it [00:02, 29.73it/s] 83it [00:02, 29.97it/s] 86it [00:02, 29.33it/s] 90it [00:03, 29.57it/s] 94it [00:03, 30.28it/s] 98it [00:03, 30.22it/s]2025-05-26 05:20:28,849 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 19680.8086 | mean log_px -0.2312 | KL -3495.88 + 102it [00:03, 29.79it/s] 105it [00:03, 29.63it/s] 108it [00:03, 29.59it/s] 112it [00:03, 29.93it/s] 116it [00:03, 30.25it/s] 120it [00:04, 29.85it/s] 123it [00:04, 29.50it/s] 127it [00:04, 29.78it/s] 130it [00:04, 29.66it/s] 134it [00:04, 29.93it/s] 137it [00:04, 29.86it/s] 141it [00:04, 30.32it/s] 145it [00:04, 30.13it/s] 149it [00:05, 30.15it/s]2025-05-26 05:20:30,523 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 20225.8477 | mean log_px -0.2390 | KL -3498.40 + 153it [00:05, 29.44it/s] 157it [00:05, 29.78it/s] 160it [00:05, 29.67it/s] 164it [00:05, 29.74it/s] 168it [00:05, 30.32it/s] 172it [00:05, 29.53it/s] 176it [00:05, 29.54it/s] 180it [00:06, 30.16it/s] 184it [00:06, 29.60it/s] 188it [00:06, 29.76it/s] 192it [00:06, 30.07it/s] 196it [00:06, 30.05it/s] 196it [00:06, 29.27it/s] +2025-05-26 05:20:32,106 - INFO - Epoch: 5, Objective: tensor([15888.0312], device='cuda:0', grad_fn=), Loss: 0.17937389016151428, KL/n: 71.46297454833984 + 0it [00:00, ?it/s]2025-05-26 05:20:32,323 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 20044.2480 | mean log_px -0.2363 | KL -3503.08 + 1it [00:00, 9.86it/s] 4it [00:00, 21.19it/s] 8it [00:00, 26.50it/s] 11it [00:00, 27.08it/s] 15it [00:00, 28.65it/s] 19it [00:00, 29.49it/s] 23it [00:00, 29.57it/s] 26it [00:00, 29.25it/s] 30it [00:01, 30.13it/s] 33it [00:01, 29.53it/s] 37it [00:01, 30.22it/s] 41it [00:01, 30.16it/s] 45it [00:01, 30.24it/s] 49it [00:01, 30.20it/s]2025-05-26 05:20:33,989 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 18991.9668 | mean log_px -0.2213 | KL -3502.69 + 53it [00:01, 30.25it/s] 57it [00:01, 29.85it/s] 60it [00:02, 29.81it/s] 64it [00:02, 30.12it/s] 68it [00:02, 29.27it/s] 72it [00:02, 30.13it/s] 76it [00:02, 30.03it/s] 80it [00:02, 30.27it/s] 84it [00:02, 29.89it/s] 88it [00:02, 29.84it/s] 91it [00:03, 29.76it/s] 94it [00:03, 29.09it/s] 97it [00:03, 29.15it/s]2025-05-26 05:20:35,670 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 16707.7285 | mean log_px -0.1886 | KL -3505.21 + 101it [00:03, 29.15it/s] 105it [00:03, 29.07it/s] 109it [00:03, 29.75it/s] 112it [00:03, 29.13it/s] 116it [00:03, 29.25it/s] 119it [00:04, 29.18it/s] 123it [00:04, 29.48it/s] 127it [00:04, 29.50it/s] 130it [00:04, 29.35it/s] 133it [00:04, 29.40it/s] 136it [00:04, 29.21it/s] 140it [00:04, 29.22it/s] 144it [00:04, 29.47it/s] 147it [00:05, 29.36it/s] 150it [00:05, 29.11it/s]2025-05-26 05:20:37,377 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 15213.6631 | mean log_px -0.1672 | KL -3512.55 + 154it [00:05, 29.54it/s] 158it [00:05, 29.93it/s] 161it [00:05, 29.50it/s] 164it [00:05, 29.39it/s] 167it [00:05, 29.28it/s] 171it [00:05, 29.24it/s] 175it [00:05, 29.74it/s] 178it [00:06, 29.54it/s] 181it [00:06, 28.80it/s] 185it [00:06, 29.12it/s] 188it [00:06, 29.07it/s] 192it [00:06, 29.23it/s] 195it [00:06, 27.33it/s] 196it [00:06, 29.01it/s] +2025-05-26 05:20:38,992 - INFO - Epoch: 6, Objective: tensor([13226.5508], device='cuda:0', grad_fn=), Loss: 0.14230650663375854, KL/n: 71.71227264404297 + 0it [00:00, ?it/s]2025-05-26 05:20:39,376 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 19194.7715 | mean log_px -0.2240 | KL -3517.77 + 1it [00:00, 10.00it/s] 4it [00:00, 20.22it/s] 8it [00:00, 25.78it/s] 11it [00:00, 26.51it/s] 14it [00:00, 27.36it/s] 18it [00:00, 28.11it/s] 22it [00:00, 29.02it/s] 25it [00:00, 29.16it/s] 28it [00:01, 29.15it/s] 32it [00:01, 29.88it/s] 35it [00:01, 29.06it/s] 39it [00:01, 29.97it/s] 42it [00:01, 29.12it/s] 46it [00:01, 29.15it/s] 50it [00:01, 29.40it/s]2025-05-26 05:20:41,081 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 14441.4629 | mean log_px -0.1561 | KL -3514.82 + 53it [00:01, 29.45it/s] 57it [00:02, 29.56it/s] 60it [00:02, 29.38it/s] 64it [00:02, 29.52it/s] 68it [00:02, 29.94it/s] 71it [00:02, 29.61it/s] 75it [00:02, 29.96it/s] 78it [00:02, 29.69it/s] 82it [00:02, 29.63it/s] 86it [00:02, 30.29it/s] 90it [00:03, 30.05it/s] 94it [00:03, 30.08it/s] 98it [00:03, 30.13it/s]2025-05-26 05:20:42,757 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 14698.3955 | mean log_px -0.1597 | KL -3518.26 + 102it [00:03, 30.11it/s] 106it [00:03, 29.39it/s] 110it [00:03, 30.09it/s] 114it [00:03, 29.96it/s] 118it [00:04, 29.66it/s] 122it [00:04, 30.25it/s] 126it [00:04, 30.14it/s] 130it [00:04, 29.71it/s] 133it [00:04, 29.48it/s] 136it [00:04, 28.81it/s] 139it [00:04, 27.77it/s] 143it [00:04, 28.23it/s] 147it [00:05, 29.20it/s] 150it [00:05, 28.86it/s]2025-05-26 05:20:44,457 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 13650.4648 | mean log_px -0.1447 | KL -3523.06 + 154it [00:05, 29.27it/s] 157it [00:05, 29.18it/s] 160it [00:05, 29.12it/s] 164it [00:05, 29.62it/s] 167it [00:05, 28.93it/s] 171it [00:05, 29.60it/s] 174it [00:05, 29.13it/s] 177it [00:06, 29.29it/s] 181it [00:06, 29.47it/s] 184it [00:06, 28.79it/s] 188it [00:06, 29.61it/s] 191it [00:06, 28.71it/s] 194it [00:06, 28.78it/s] 196it [00:06, 28.82it/s] +2025-05-26 05:20:46,090 - INFO - Epoch: 7, Objective: tensor([14926.7266], device='cuda:0', grad_fn=), Loss: 0.16049005091190338, KL/n: 71.94602966308594 + 0it [00:00, ?it/s]2025-05-26 05:20:46,295 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 10372.6602 | mean log_px -0.0978 | KL -3525.98 + 2it [00:00, 15.77it/s] 5it [00:00, 22.34it/s] 9it [00:00, 26.16it/s] 13it [00:00, 28.72it/s] 16it [00:00, 28.59it/s] 20it [00:00, 29.97it/s] 23it [00:00, 29.54it/s] 27it [00:00, 29.93it/s] 30it [00:01, 29.86it/s] 34it [00:01, 30.38it/s] 38it [00:01, 30.21it/s] 42it [00:01, 30.40it/s] 46it [00:01, 30.29it/s] 50it [00:01, 30.99it/s]2025-05-26 05:20:47,939 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 15945.5898 | mean log_px -0.1774 | KL -3529.62 + 54it [00:01, 30.87it/s] 58it [00:01, 30.46it/s] 62it [00:02, 30.47it/s] 66it [00:02, 30.51it/s] 70it [00:02, 30.72it/s] 74it [00:02, 30.71it/s] 78it [00:02, 30.33it/s] 82it [00:02, 30.34it/s] 86it [00:02, 30.46it/s] 90it [00:03, 29.91it/s] 94it [00:03, 30.36it/s] 98it [00:03, 30.71it/s]2025-05-26 05:20:49,590 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 10654.3936 | mean log_px -0.1018 | KL -3525.81 + 102it [00:03, 30.10it/s] 106it [00:03, 29.71it/s] 110it [00:03, 29.88it/s] 114it [00:03, 30.07it/s] 118it [00:03, 30.45it/s] 122it [00:04, 30.47it/s] 126it [00:04, 30.09it/s] 130it [00:04, 30.36it/s] 134it [00:04, 30.16it/s] 138it [00:04, 30.20it/s] 142it [00:04, 30.28it/s] 146it [00:04, 30.37it/s] 150it [00:05, 30.04it/s]2025-05-26 05:20:51,234 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 13537.7305 | mean log_px -0.1430 | KL -3530.51 + 154it [00:05, 30.68it/s] 158it [00:05, 30.62it/s] 162it [00:05, 30.07it/s] 166it [00:05, 30.73it/s] 170it [00:05, 30.71it/s] 174it [00:05, 30.40it/s] 178it [00:05, 30.47it/s] 182it [00:06, 30.76it/s] 186it [00:06, 30.76it/s] 190it [00:06, 30.39it/s] 194it [00:06, 30.35it/s] 196it [00:06, 29.80it/s] +2025-05-26 05:20:52,788 - INFO - Epoch: 8, Objective: tensor([13541.4258], device='cuda:0', grad_fn=), Loss: 0.1426759660243988, KL/n: 72.14434051513672 + 0it [00:00, ?it/s]2025-05-26 05:20:53,173 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 14324.3496 | mean log_px -0.1541 | KL -3536.14 + 1it [00:00, 9.85it/s] 4it [00:00, 20.41it/s] 8it [00:00, 25.89it/s] 11it [00:00, 27.33it/s] 14it [00:00, 27.20it/s] 18it [00:00, 28.75it/s] 22it [00:00, 29.13it/s] 25it [00:00, 28.52it/s] 29it [00:01, 29.46it/s] 32it [00:01, 29.50it/s] 35it [00:01, 28.65it/s] 39it [00:01, 29.20it/s] 42it [00:01, 28.90it/s] 45it [00:01, 28.50it/s] 48it [00:01, 28.53it/s]2025-05-26 05:20:54,901 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 11184.5459 | mean log_px -0.1092 | KL -3537.98 + 51it [00:01, 27.96it/s] 55it [00:01, 29.06it/s] 58it [00:02, 28.45it/s] 61it [00:02, 28.67it/s] 64it [00:02, 29.01it/s] 67it [00:02, 28.55it/s] 71it [00:02, 28.74it/s] 75it [00:02, 28.63it/s] 79it [00:02, 29.20it/s] 83it [00:02, 29.59it/s] 87it [00:03, 29.99it/s] 90it [00:03, 29.35it/s] 94it [00:03, 30.12it/s] 98it [00:03, 30.23it/s]2025-05-26 05:20:56,598 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 16544.4180 | mean log_px -0.1858 | KL -3535.94 + 102it [00:03, 30.11it/s] 106it [00:03, 29.93it/s] 109it [00:03, 29.17it/s] 113it [00:03, 29.93it/s] 116it [00:04, 29.37it/s] 120it [00:04, 29.79it/s] 124it [00:04, 30.06it/s] 127it [00:04, 29.98it/s] 130it [00:04, 29.41it/s] 134it [00:04, 29.71it/s] 137it [00:04, 29.12it/s] 141it [00:04, 29.60it/s] 145it [00:04, 30.15it/s] 149it [00:05, 29.46it/s]2025-05-26 05:20:58,277 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 18082.6641 | mean log_px -0.2078 | KL -3539.67 + 152it [00:05, 29.23it/s] 156it [00:05, 29.61it/s] 160it [00:05, 29.93it/s] 163it [00:05, 29.74it/s] 166it [00:05, 28.86it/s] 169it [00:05, 29.11it/s] 173it [00:05, 29.65it/s] 176it [00:06, 28.99it/s] 180it [00:06, 29.18it/s] 184it [00:06, 29.84it/s] 187it [00:06, 29.06it/s] 190it [00:06, 28.41it/s] 194it [00:06, 29.01it/s] 196it [00:06, 28.75it/s] +2025-05-26 05:20:59,903 - INFO - Epoch: 9, Objective: tensor([12314.6270], device='cuda:0', grad_fn=), Loss: 0.12443278729915619, KL/n: 72.30850982666016 + 0it [00:00, ?it/s]2025-05-26 05:21:00,114 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 15676.4102 | mean log_px -0.1735 | KL -3534.72 + 1it [00:00, 9.83it/s] 5it [00:00, 23.47it/s] 8it [00:00, 25.86it/s] 12it [00:00, 28.15it/s] 15it [00:00, 28.66it/s] 19it [00:00, 29.57it/s] 23it [00:00, 29.83it/s] 27it [00:00, 30.15it/s] 31it [00:01, 30.24it/s] 35it [00:01, 30.74it/s] 39it [00:01, 30.37it/s] 43it [00:01, 30.56it/s] 47it [00:01, 30.34it/s]2025-05-26 05:21:01,755 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 14031.0078 | mean log_px -0.1498 | KL -3547.17 + 51it [00:01, 30.22it/s] 55it [00:01, 30.90it/s] 59it [00:02, 30.43it/s] 63it [00:02, 30.51it/s] 67it [00:02, 30.90it/s] 71it [00:02, 30.79it/s] 75it [00:02, 30.45it/s] 79it [00:02, 30.48it/s] 83it [00:02, 30.51it/s] 87it [00:02, 30.56it/s] 91it [00:03, 30.89it/s] 95it [00:03, 30.46it/s] 99it [00:03, 30.47it/s]2025-05-26 05:21:03,402 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 12550.3027 | mean log_px -0.1287 | KL -3541.58 + 103it [00:03, 29.80it/s] 106it [00:03, 28.85it/s] 109it [00:03, 28.12it/s] 112it [00:03, 27.73it/s] 116it [00:03, 28.45it/s] 120it [00:04, 28.95it/s] 123it [00:04, 28.76it/s] 126it [00:04, 29.07it/s] 130it [00:04, 29.60it/s] 133it [00:04, 29.02it/s] 137it [00:04, 29.67it/s] 140it [00:04, 29.71it/s] 143it [00:04, 29.06it/s] 146it [00:04, 29.03it/s] 149it [00:05, 29.08it/s]2025-05-26 05:21:05,126 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 12438.1709 | mean log_px -0.1271 | KL -3543.86 + 153it [00:05, 29.10it/s] 156it [00:05, 29.30it/s] 160it [00:05, 29.58it/s] 163it [00:05, 28.88it/s] 167it [00:05, 29.26it/s] 171it [00:05, 29.32it/s] 175it [00:05, 29.86it/s] 178it [00:06, 29.31it/s] 182it [00:06, 30.02it/s] 185it [00:06, 29.34it/s] 189it [00:06, 29.61it/s] 192it [00:06, 29.46it/s] 195it [00:06, 27.88it/s] 196it [00:06, 29.24it/s] +2025-05-26 05:21:06,733 - INFO - Epoch: 10, Objective: tensor([11702.4199], device='cuda:0', grad_fn=), Loss: 0.11607591807842255, KL/n: 72.46379852294922 + 0it [00:00, ?it/s]2025-05-26 05:21:07,118 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 12625.6602 | mean log_px -0.1297 | KL -3548.19 + 2it [00:00, 14.05it/s] 6it [00:00, 23.23it/s] 10it [00:00, 27.25it/s] 13it [00:00, 27.34it/s] 17it [00:00, 28.49it/s] 21it [00:00, 29.04it/s] 25it [00:00, 29.55it/s] 28it [00:01, 29.39it/s] 32it [00:01, 30.01it/s] 35it [00:01, 29.37it/s] 39it [00:01, 30.01it/s] 42it [00:01, 29.87it/s] 46it [00:01, 30.03it/s] 50it [00:01, 29.81it/s]2025-05-26 05:21:08,798 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 12040.0361 | mean log_px -0.1212 | KL -3556.24 + 54it [00:01, 29.98it/s] 57it [00:01, 29.59it/s] 61it [00:02, 30.06it/s] 65it [00:02, 30.44it/s] 69it [00:02, 30.28it/s] 73it [00:02, 30.32it/s] 77it [00:02, 30.02it/s] 81it [00:02, 30.44it/s] 85it [00:02, 30.35it/s] 89it [00:03, 29.70it/s] 93it [00:03, 29.64it/s] 96it [00:03, 29.50it/s] 100it [00:03, 29.90it/s]2025-05-26 05:21:10,458 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 13540.5400 | mean log_px -0.1426 | KL -3556.50 + 103it [00:03, 29.79it/s] 106it [00:03, 29.80it/s] 110it [00:03, 30.53it/s] 114it [00:03, 30.22it/s] 118it [00:03, 30.26it/s] 122it [00:04, 30.65it/s] 126it [00:04, 30.56it/s] 130it [00:04, 30.63it/s] 134it [00:04, 30.18it/s] 138it [00:04, 30.41it/s] 142it [00:04, 30.04it/s] 146it [00:04, 30.17it/s] 150it [00:05, 30.39it/s]2025-05-26 05:21:12,106 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 14201.5371 | mean log_px -0.1521 | KL -3554.20 + 154it [00:05, 30.03it/s] 158it [00:05, 30.28it/s] 162it [00:05, 30.00it/s] 166it [00:05, 30.43it/s] 170it [00:05, 30.05it/s] 174it [00:05, 30.32it/s] 178it [00:05, 30.05it/s] 182it [00:06, 30.12it/s] 186it [00:06, 30.14it/s] 190it [00:06, 30.26it/s] 194it [00:06, 30.30it/s] 196it [00:06, 29.49it/s] +2025-05-26 05:21:13,681 - INFO - Epoch: 11, Objective: tensor([14391.9463], device='cuda:0', grad_fn=), Loss: 0.15944251418113708, KL/n: 72.59249877929688 + 0it [00:00, ?it/s]2025-05-26 05:21:13,894 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 14934.0508 | mean log_px -0.1626 | KL -3552.75 + 1it [00:00, 9.54it/s] 4it [00:00, 20.62it/s] 8it [00:00, 26.45it/s] 12it [00:00, 28.26it/s] 16it [00:00, 29.12it/s] 19it [00:00, 28.78it/s] 23it [00:00, 29.50it/s] 27it [00:00, 30.38it/s] 31it [00:01, 30.55it/s] 35it [00:01, 30.57it/s] 39it [00:01, 30.21it/s] 43it [00:01, 30.63it/s] 47it [00:01, 30.66it/s]2025-05-26 05:21:15,537 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 10078.7207 | mean log_px -0.0931 | KL -3562.00 + 51it [00:01, 30.04it/s] 55it [00:01, 30.77it/s] 59it [00:02, 30.38it/s] 63it [00:02, 30.84it/s] 67it [00:02, 30.74it/s] 71it [00:02, 30.38it/s] 75it [00:02, 30.75it/s] 79it [00:02, 30.37it/s] 83it [00:02, 30.74it/s] 87it [00:02, 30.34it/s] 91it [00:03, 30.49it/s] 95it [00:03, 30.78it/s] 99it [00:03, 30.80it/s]2025-05-26 05:21:17,172 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 14258.9668 | mean log_px -0.1529 | KL -3557.95 + 103it [00:03, 30.67it/s] 107it [00:03, 30.42it/s] 111it [00:03, 30.45it/s] 115it [00:03, 30.50it/s] 119it [00:03, 30.84it/s] 123it [00:04, 30.81it/s] 127it [00:04, 30.46it/s] 131it [00:04, 30.80it/s] 135it [00:04, 30.14it/s] 139it [00:04, 30.55it/s] 143it [00:04, 30.87it/s] 147it [00:04, 30.80it/s]2025-05-26 05:21:18,807 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 15773.4404 | mean log_px -0.1745 | KL -3559.86 + 151it [00:05, 30.20it/s] 155it [00:05, 30.85it/s] 159it [00:05, 30.76it/s] 163it [00:05, 30.41it/s] 167it [00:05, 30.48it/s] 171it [00:05, 30.51it/s] 175it [00:05, 30.54it/s] 179it [00:05, 30.54it/s] 183it [00:06, 30.82it/s] 187it [00:06, 30.69it/s] 191it [00:06, 30.39it/s] 195it [00:06, 29.23it/s] 196it [00:06, 29.95it/s] +2025-05-26 05:21:20,348 - INFO - Epoch: 12, Objective: tensor([11574.0742], device='cuda:0', grad_fn=), Loss: 0.11686700582504272, KL/n: 72.71397399902344 + 0it [00:00, ?it/s]2025-05-26 05:21:20,728 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 9369.8613 | mean log_px -0.0830 | KL -3562.15 + 2it [00:00, 15.45it/s] 5it [00:00, 22.95it/s] 8it [00:00, 25.07it/s] 12it [00:00, 28.00it/s] 15it [00:00, 28.08it/s] 18it [00:00, 28.49it/s] 22it [00:00, 29.24it/s] 25it [00:00, 29.29it/s] 29it [00:01, 29.98it/s] 32it [00:01, 29.69it/s] 35it [00:01, 29.05it/s] 39it [00:01, 29.93it/s] 42it [00:01, 29.31it/s] 46it [00:01, 29.49it/s] 50it [00:01, 29.89it/s]2025-05-26 05:21:22,406 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 12209.3398 | mean log_px -0.1235 | KL -3565.70 + 54it [00:01, 29.96it/s] 58it [00:02, 30.37it/s] 62it [00:02, 30.07it/s] 66it [00:02, 30.12it/s] 70it [00:02, 30.11it/s] 74it [00:02, 29.29it/s] 77it [00:02, 29.45it/s] 80it [00:02, 29.41it/s] 84it [00:02, 29.57it/s] 88it [00:03, 30.33it/s] 92it [00:03, 30.13it/s] 96it [00:03, 29.46it/s] 100it [00:03, 29.61it/s]2025-05-26 05:21:24,078 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 9832.3418 | mean log_px -0.0895 | KL -3564.59 + 104it [00:03, 29.67it/s] 108it [00:03, 30.19it/s] 112it [00:03, 30.17it/s] 116it [00:03, 29.79it/s] 119it [00:04, 28.82it/s] 123it [00:04, 29.14it/s] 127it [00:04, 29.66it/s] 130it [00:04, 29.04it/s] 134it [00:04, 29.42it/s] 138it [00:04, 30.13it/s] 142it [00:04, 30.00it/s] 145it [00:04, 29.38it/s] 149it [00:05, 29.79it/s]2025-05-26 05:21:25,778 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 14124.4805 | mean log_px -0.1508 | KL -3565.40 + 152it [00:05, 29.69it/s] 155it [00:05, 28.05it/s] 159it [00:05, 28.42it/s] 163it [00:05, 29.39it/s] 166it [00:05, 28.99it/s] 169it [00:05, 29.12it/s] 172it [00:05, 28.83it/s] 175it [00:05, 28.98it/s] 179it [00:06, 29.79it/s] 182it [00:06, 29.02it/s] 186it [00:06, 29.20it/s] 190it [00:06, 29.60it/s] 193it [00:06, 29.06it/s] 196it [00:06, 29.00it/s] +2025-05-26 05:21:27,401 - INFO - Epoch: 13, Objective: tensor([10300.4492], device='cuda:0', grad_fn=), Loss: 0.09235146641731262, KL/n: 72.79515838623047 + 0it [00:00, ?it/s]2025-05-26 05:21:27,611 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 11991.5596 | mean log_px -0.1204 | KL -3566.11 + 1it [00:00, 9.95it/s] 4it [00:00, 20.81it/s] 8it [00:00, 26.84it/s] 11it [00:00, 27.38it/s] 15it [00:00, 29.45it/s] 18it [00:00, 29.36it/s] 22it [00:00, 29.80it/s] 26it [00:00, 30.46it/s] 30it [00:01, 30.54it/s] 34it [00:01, 29.89it/s] 38it [00:01, 30.65it/s] 42it [00:01, 30.68it/s] 46it [00:01, 30.68it/s] 50it [00:01, 30.28it/s]2025-05-26 05:21:29,251 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 8737.1328 | mean log_px -0.0739 | KL -3566.85 + 54it [00:01, 30.34it/s] 58it [00:01, 30.44it/s] 62it [00:02, 30.85it/s] 66it [00:02, 30.80it/s] 70it [00:02, 30.46it/s] 74it [00:02, 30.73it/s] 78it [00:02, 30.72it/s] 82it [00:02, 30.77it/s] 86it [00:02, 30.48it/s] 90it [00:03, 30.79it/s] 94it [00:03, 30.77it/s] 98it [00:03, 30.34it/s]2025-05-26 05:21:30,883 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 10533.0479 | mean log_px -0.0995 | KL -3565.07 + 102it [00:03, 30.43it/s] 106it [00:03, 30.45it/s] 110it [00:03, 30.47it/s] 114it [00:03, 30.49it/s] 118it [00:03, 30.60it/s] 122it [00:04, 30.89it/s] 126it [00:04, 30.71it/s] 130it [00:04, 30.79it/s] 134it [00:04, 30.40it/s] 138it [00:04, 30.81it/s] 142it [00:04, 30.70it/s] 146it [00:04, 30.80it/s] 150it [00:04, 30.45it/s]2025-05-26 05:21:32,518 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 13362.9570 | mean log_px -0.1399 | KL -3566.50 + 154it [00:05, 30.50it/s] 158it [00:05, 30.81it/s] 162it [00:05, 30.77it/s] 166it [00:05, 30.34it/s] 170it [00:05, 30.29it/s] 174it [00:05, 30.09it/s] 178it [00:05, 29.35it/s] 182it [00:06, 30.05it/s] 186it [00:06, 30.43it/s] 190it [00:06, 30.59it/s] 194it [00:06, 30.24it/s] 196it [00:06, 29.92it/s] +2025-05-26 05:21:34,075 - INFO - Epoch: 14, Objective: tensor([8674.3564], device='cuda:0', grad_fn=), Loss: 0.07409722357988358, KL/n: 72.8468017578125 + 0it [00:00, ?it/s]2025-05-26 05:21:34,459 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 8316.8721 | mean log_px -0.0679 | KL -3566.54 + 2it [00:00, 15.30it/s] 5it [00:00, 22.90it/s] 8it [00:00, 24.64it/s] 12it [00:00, 28.06it/s] 15it [00:00, 28.57it/s] 18it [00:00, 28.80it/s] 22it [00:00, 29.30it/s] 25it [00:00, 28.83it/s] 29it [00:01, 28.74it/s] 33it [00:01, 29.75it/s] 36it [00:01, 29.60it/s] 40it [00:01, 29.95it/s] 44it [00:01, 30.27it/s] 48it [00:01, 29.68it/s]2025-05-26 05:21:36,135 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 8884.7939 | mean log_px -0.0760 | KL -3568.22 + 52it [00:01, 29.91it/s] 55it [00:01, 29.73it/s] 59it [00:02, 29.98it/s] 62it [00:02, 29.78it/s] 66it [00:02, 30.03it/s] 70it [00:02, 30.28it/s] 74it [00:02, 30.19it/s] 78it [00:02, 30.15it/s] 82it [00:02, 29.74it/s] 85it [00:02, 29.73it/s] 88it [00:03, 29.62it/s] 92it [00:03, 29.72it/s] 96it [00:03, 30.01it/s] 100it [00:03, 30.04it/s]2025-05-26 05:21:37,804 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 7275.8506 | mean log_px -0.0530 | KL -3565.84 + 104it [00:03, 29.93it/s] 107it [00:03, 29.79it/s] 111it [00:03, 29.84it/s] 115it [00:03, 29.88it/s] 119it [00:04, 30.50it/s] 123it [00:04, 30.20it/s] 127it [00:04, 30.23it/s] 131it [00:04, 30.18it/s] 135it [00:04, 30.11it/s] 139it [00:04, 29.76it/s] 142it [00:04, 29.66it/s] 146it [00:04, 30.03it/s] 150it [00:05, 30.15it/s]2025-05-26 05:21:39,471 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 9055.9580 | mean log_px -0.0784 | KL -3570.80 + 154it [00:05, 29.51it/s] 158it [00:05, 29.34it/s] 162it [00:05, 30.39it/s] 166it [00:05, 30.39it/s] 170it [00:05, 30.32it/s] 174it [00:05, 30.29it/s] 178it [00:06, 29.82it/s] 181it [00:06, 29.66it/s] 184it [00:06, 29.74it/s] 188it [00:06, 30.36it/s] 192it [00:06, 29.69it/s] 195it [00:06, 28.93it/s] 196it [00:06, 29.35it/s] +2025-05-26 05:21:41,051 - INFO - Epoch: 15, Objective: tensor([9224.1475], device='cuda:0', grad_fn=), Loss: 0.08432125300168991, KL/n: 72.91032409667969 + 0it [00:00, ?it/s]2025-05-26 05:21:41,274 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 8985.7246 | mean log_px -0.0773 | KL -3571.36 + 1it [00:00, 9.14it/s] 5it [00:00, 23.95it/s] 8it [00:00, 25.73it/s] 12it [00:00, 27.83it/s] 16it [00:00, 28.99it/s] 20it [00:00, 29.91it/s] 23it [00:00, 29.35it/s] 27it [00:00, 29.87it/s] 30it [00:01, 29.78it/s] 34it [00:01, 29.92it/s] 38it [00:01, 30.05it/s] 42it [00:01, 30.72it/s] 46it [00:01, 30.29it/s] 50it [00:01, 30.70it/s]2025-05-26 05:21:42,919 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 10308.2246 | mean log_px -0.0963 | KL -3570.48 + 54it [00:01, 30.22it/s] 58it [00:01, 30.27it/s] 62it [00:02, 30.31it/s] 66it [00:02, 30.29it/s] 70it [00:02, 30.70it/s] 74it [00:02, 30.23it/s] 78it [00:02, 30.66it/s] 82it [00:02, 30.52it/s] 86it [00:02, 30.50it/s] 90it [00:03, 30.08it/s] 94it [00:03, 30.37it/s] 98it [00:03, 30.09it/s]2025-05-26 05:21:44,576 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 13002.2568 | mean log_px -0.1347 | KL -3571.31 + 102it [00:03, 30.15it/s] 106it [00:03, 30.21it/s] 110it [00:03, 30.23it/s] 114it [00:03, 30.28it/s] 118it [00:03, 29.79it/s] 122it [00:04, 30.16it/s] 126it [00:04, 30.28it/s] 130it [00:04, 30.07it/s] 134it [00:04, 30.72it/s] 138it [00:04, 30.60it/s] 142it [00:04, 30.57it/s] 146it [00:04, 30.24it/s] 150it [00:05, 30.56it/s]2025-05-26 05:21:46,214 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 9578.2891 | mean log_px -0.0859 | KL -3567.10 + 154it [00:05, 30.06it/s] 158it [00:05, 30.41it/s] 162it [00:05, 30.74it/s] 166it [00:05, 30.70it/s] 170it [00:05, 30.24it/s] 174it [00:05, 30.30it/s] 178it [00:05, 30.44it/s] 182it [00:06, 30.62it/s] 186it [00:06, 30.02it/s] 190it [00:06, 30.15it/s] 194it [00:06, 30.20it/s] 196it [00:06, 29.73it/s] +2025-05-26 05:21:47,776 - INFO - Epoch: 16, Objective: tensor([10074.4824], device='cuda:0', grad_fn=), Loss: 0.0899372398853302, KL/n: 72.9590072631836 + 0it [00:00, ?it/s]2025-05-26 05:21:48,137 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 13186.9502 | mean log_px -0.1373 | KL -3574.98 + 2it [00:00, 16.13it/s] 5it [00:00, 22.71it/s] 9it [00:00, 26.48it/s] 13it [00:00, 28.79it/s] 16it [00:00, 28.85it/s] 20it [00:00, 29.37it/s] 24it [00:00, 29.81it/s] 28it [00:00, 30.00it/s] 32it [00:01, 30.14it/s] 36it [00:01, 30.28it/s] 40it [00:01, 30.57it/s] 44it [00:01, 30.52it/s] 48it [00:01, 30.13it/s]2025-05-26 05:21:49,803 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 8914.1670 | mean log_px -0.0762 | KL -3577.15 + 52it [00:01, 29.68it/s] 55it [00:01, 29.34it/s] 59it [00:02, 29.69it/s] 62it [00:02, 28.79it/s] 65it [00:02, 28.76it/s] 69it [00:02, 28.95it/s] 72it [00:02, 28.72it/s] 76it [00:02, 28.99it/s] 80it [00:02, 29.22it/s] 83it [00:02, 28.72it/s] 86it [00:02, 28.38it/s] 90it [00:03, 28.84it/s] 93it [00:03, 28.54it/s] 96it [00:03, 28.80it/s] 99it [00:03, 28.63it/s]2025-05-26 05:21:51,537 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 8901.1836 | mean log_px -0.0761 | KL -3573.32 + 103it [00:03, 28.84it/s] 107it [00:03, 29.44it/s] 110it [00:03, 28.56it/s] 114it [00:03, 28.93it/s] 117it [00:04, 29.17it/s] 120it [00:04, 28.47it/s] 124it [00:04, 29.26it/s] 127it [00:04, 28.45it/s] 130it [00:04, 28.75it/s] 133it [00:04, 28.55it/s] 137it [00:04, 29.85it/s] 140it [00:04, 28.96it/s] 143it [00:04, 29.20it/s] 146it [00:05, 28.78it/s] 149it [00:05, 29.06it/s]2025-05-26 05:21:53,271 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 9242.2207 | mean log_px -0.0810 | KL -3571.41 + 152it [00:05, 29.01it/s] 155it [00:05, 29.05it/s] 158it [00:05, 28.58it/s] 161it [00:05, 28.96it/s] 164it [00:05, 28.66it/s] 168it [00:05, 28.92it/s] 172it [00:05, 29.20it/s] 175it [00:06, 28.51it/s] 179it [00:06, 29.09it/s] 182it [00:06, 28.31it/s] 186it [00:06, 28.99it/s] 189it [00:06, 28.27it/s] 193it [00:06, 29.26it/s] 196it [00:06, 28.21it/s] 196it [00:06, 28.62it/s] +2025-05-26 05:21:54,916 - INFO - Epoch: 17, Objective: tensor([13480.9648], device='cuda:0', grad_fn=), Loss: 0.13737212121486664, KL/n: 72.98963165283203 + 0it [00:00, ?it/s]2025-05-26 05:21:55,140 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 9429.3545 | mean log_px -0.0836 | KL -3574.62 + 1it [00:00, 9.54it/s] 4it [00:00, 20.46it/s] 8it [00:00, 26.08it/s] 11it [00:00, 26.64it/s] 15it [00:00, 28.51it/s] 18it [00:00, 27.68it/s] 22it [00:00, 28.14it/s] 26it [00:00, 29.48it/s] 29it [00:01, 29.46it/s] 32it [00:01, 29.15it/s] 35it [00:01, 29.08it/s] 39it [00:01, 29.45it/s] 43it [00:01, 29.27it/s] 46it [00:01, 28.95it/s] 50it [00:01, 29.22it/s]2025-05-26 05:21:56,849 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 10995.4219 | mean log_px -0.1061 | KL -3571.84 + 54it [00:01, 29.53it/s] 57it [00:02, 29.27it/s] 60it [00:02, 28.54it/s] 63it [00:02, 28.70it/s] 66it [00:02, 28.76it/s] 69it [00:02, 28.33it/s] 72it [00:02, 28.50it/s] 76it [00:02, 28.72it/s] 79it [00:02, 28.61it/s] 82it [00:02, 28.64it/s] 86it [00:03, 28.75it/s] 90it [00:03, 29.11it/s] 93it [00:03, 28.36it/s] 97it [00:03, 29.14it/s] 100it [00:03, 28.73it/s]2025-05-26 05:21:58,589 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 7979.1572 | mean log_px -0.0629 | KL -3573.94 + 104it [00:03, 29.19it/s] 107it [00:03, 28.31it/s] 111it [00:03, 28.55it/s] 115it [00:04, 29.25it/s] 118it [00:04, 29.27it/s] 121it [00:04, 28.68it/s] 125it [00:04, 29.62it/s] 128it [00:04, 29.03it/s] 132it [00:04, 28.91it/s] 136it [00:04, 29.72it/s] 139it [00:04, 29.65it/s] 142it [00:04, 28.98it/s] 146it [00:05, 29.04it/s] 150it [00:05, 29.51it/s]2025-05-26 05:22:00,305 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 11832.6465 | mean log_px -0.1180 | KL -3573.99 + 153it [00:05, 29.43it/s] 156it [00:05, 29.12it/s] 160it [00:05, 29.69it/s] 163it [00:05, 29.07it/s] 166it [00:05, 28.94it/s] 170it [00:05, 29.00it/s] 174it [00:06, 29.15it/s] 178it [00:06, 29.86it/s] 181it [00:06, 29.27it/s] 184it [00:06, 29.30it/s] 188it [00:06, 29.77it/s] 191it [00:06, 29.15it/s] 195it [00:06, 27.93it/s] 196it [00:06, 28.62it/s] +2025-05-26 05:22:01,899 - INFO - Epoch: 18, Objective: tensor([9690.2705], device='cuda:0', grad_fn=), Loss: 0.08383181691169739, KL/n: 72.97569274902344 + 0it [00:00, ?it/s]2025-05-26 05:22:02,403 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 10563.0986 | mean log_px -0.0999 | KL -3569.75 + 1it [00:00, 4.38it/s] 4it [00:00, 13.81it/s] 8it [00:00, 20.13it/s] 12it [00:00, 24.15it/s] 15it [00:00, 25.80it/s] 18it [00:00, 26.35it/s] 22it [00:00, 27.81it/s] 25it [00:01, 27.62it/s] 29it [00:01, 28.62it/s] 33it [00:01, 29.43it/s] 36it [00:01, 28.92it/s] 39it [00:01, 28.79it/s] 43it [00:01, 28.88it/s] 47it [00:01, 29.74it/s] 50it [00:01, 29.73it/s]2025-05-26 05:22:04,103 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 11524.1367 | mean log_px -0.1136 | KL -3574.29 + 53it [00:02, 28.85it/s] 57it [00:02, 29.32it/s] 61it [00:02, 29.75it/s] 64it [00:02, 28.75it/s] 68it [00:02, 29.45it/s] 71it [00:02, 29.14it/s] 74it [00:02, 29.14it/s] 77it [00:02, 29.01it/s] 81it [00:02, 29.18it/s] 85it [00:03, 29.90it/s] 88it [00:03, 29.20it/s] 92it [00:03, 29.63it/s] 96it [00:03, 30.11it/s] 100it [00:03, 29.71it/s]2025-05-26 05:22:05,808 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 10648.2744 | mean log_px -0.1011 | KL -3572.12 + 103it [00:03, 29.26it/s] 106it [00:03, 29.31it/s] 110it [00:03, 29.30it/s] 114it [00:04, 30.00it/s] 117it [00:04, 29.04it/s] 121it [00:04, 29.56it/s] 124it [00:04, 29.41it/s] 127it [00:04, 29.15it/s] 131it [00:04, 29.60it/s] 135it [00:04, 30.12it/s] 139it [00:04, 30.02it/s] 142it [00:05, 29.66it/s] 145it [00:05, 29.15it/s] 149it [00:05, 29.06it/s]2025-05-26 05:22:07,496 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 7303.5244 | mean log_px -0.0534 | KL -3568.66 + 153it [00:05, 29.29it/s] 157it [00:05, 29.55it/s] 161it [00:05, 30.05it/s] 165it [00:05, 29.35it/s] 168it [00:05, 29.32it/s] 172it [00:06, 30.12it/s] 176it [00:06, 29.66it/s] 179it [00:06, 29.45it/s] 183it [00:06, 29.53it/s] 186it [00:06, 29.25it/s] 190it [00:06, 29.24it/s] 194it [00:06, 29.60it/s] 196it [00:06, 28.32it/s] +2025-05-26 05:22:09,110 - INFO - Epoch: 19, Objective: tensor([9041.3672], device='cuda:0', grad_fn=), Loss: 0.0738806203007698, KL/n: 72.98346710205078 + 0it [00:00, ?it/s]2025-05-26 05:22:09,504 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 6978.5659 | mean log_px -0.0486 | KL -3573.67 + 1it [00:00, 9.92it/s] 4it [00:00, 20.50it/s] 8it [00:00, 25.39it/s] 11it [00:00, 26.76it/s] 14it [00:00, 27.41it/s] 18it [00:00, 28.18it/s] 22it [00:00, 29.10it/s] 25it [00:00, 29.04it/s] 29it [00:01, 29.14it/s] 33it [00:01, 29.91it/s] 36it [00:01, 29.13it/s] 40it [00:01, 29.34it/s] 44it [00:01, 29.96it/s] 47it [00:01, 29.32it/s]2025-05-26 05:22:11,204 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 11295.7881 | mean log_px -0.1103 | KL -3573.83 + 51it [00:01, 29.37it/s] 55it [00:01, 29.67it/s] 59it [00:02, 30.00it/s] 62it [00:02, 29.23it/s] 66it [00:02, 29.48it/s] 70it [00:02, 30.08it/s] 74it [00:02, 30.01it/s] 77it [00:02, 29.43it/s] 81it [00:02, 30.04it/s] 84it [00:02, 29.27it/s] 87it [00:03, 29.45it/s] 91it [00:03, 29.87it/s] 94it [00:03, 29.33it/s] 98it [00:03, 29.47it/s]2025-05-26 05:22:12,885 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 8173.0259 | mean log_px -0.0657 | KL -3575.26 + 102it [00:03, 30.00it/s] 105it [00:03, 29.27it/s] 108it [00:03, 29.30it/s] 112it [00:03, 30.03it/s] 115it [00:03, 28.88it/s] 119it [00:04, 29.83it/s] 122it [00:04, 29.11it/s] 126it [00:04, 29.17it/s] 130it [00:04, 29.98it/s] 133it [00:04, 29.82it/s] 136it [00:04, 29.38it/s] 139it [00:04, 29.16it/s] 143it [00:04, 29.20it/s] 147it [00:05, 29.98it/s] 150it [00:05, 29.45it/s]2025-05-26 05:22:14,581 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 8517.9102 | mean log_px -0.0706 | KL -3574.60 + 153it [00:05, 29.47it/s] 156it [00:05, 28.66it/s] 160it [00:05, 29.21it/s] 163it [00:05, 29.21it/s] 166it [00:05, 29.03it/s] 169it [00:05, 29.28it/s] 172it [00:05, 29.07it/s] 176it [00:06, 29.03it/s] 180it [00:06, 30.02it/s] 183it [00:06, 29.20it/s] 187it [00:06, 29.45it/s] 191it [00:06, 30.13it/s] 195it [00:06, 28.36it/s] 196it [00:06, 28.91it/s] +2025-05-26 05:22:16,197 - INFO - Epoch: 20, Objective: tensor([7768.5664], device='cuda:0', grad_fn=), Loss: 0.05292247608304024, KL/n: 72.9926986694336 + 0it [00:00, ?it/s]2025-05-26 05:22:16,407 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 8910.8350 | mean log_px -0.0763 | KL -3572.10 + 2it [00:00, 15.59it/s] 6it [00:00, 24.39it/s] 9it [00:00, 25.86it/s] 13it [00:00, 27.82it/s] 17it [00:00, 28.82it/s] 21it [00:00, 29.23it/s] 25it [00:00, 29.57it/s] 29it [00:01, 29.87it/s] 33it [00:01, 30.10it/s] 37it [00:01, 30.25it/s] 41it [00:01, 30.35it/s] 45it [00:01, 30.35it/s] 49it [00:01, 30.45it/s]2025-05-26 05:22:18,055 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 10398.9912 | mean log_px -0.0975 | KL -3575.78 + 53it [00:01, 30.44it/s] 57it [00:01, 30.46it/s] 61it [00:02, 30.86it/s] 65it [00:02, 29.51it/s] 69it [00:02, 30.48it/s] 73it [00:02, 30.49it/s] 77it [00:02, 30.47it/s] 81it [00:02, 29.92it/s] 85it [00:02, 30.54it/s] 89it [00:03, 30.23it/s] 93it [00:03, 30.27it/s] 97it [00:03, 30.73it/s]2025-05-26 05:22:19,705 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 7123.5420 | mean log_px -0.0507 | KL -3574.84 + 101it [00:03, 30.12it/s] 105it [00:03, 30.31it/s] 109it [00:03, 30.46it/s] 113it [00:03, 30.21it/s] 117it [00:03, 30.30it/s] 121it [00:04, 30.73it/s] 125it [00:04, 30.55it/s] 129it [00:04, 29.94it/s] 133it [00:04, 30.03it/s] 137it [00:04, 30.17it/s] 141it [00:04, 30.77it/s] 145it [00:04, 30.71it/s] 149it [00:04, 30.10it/s]2025-05-26 05:22:21,350 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 14440.6475 | mean log_px -0.1552 | KL -3579.55 + 153it [00:05, 30.73it/s] 157it [00:05, 30.65it/s] 161it [00:05, 30.63it/s] 165it [00:05, 30.17it/s] 169it [00:05, 30.27it/s] 173it [00:05, 30.29it/s] 177it [00:05, 30.39it/s] 181it [00:06, 30.77it/s] 185it [00:06, 30.30it/s] 189it [00:06, 30.72it/s] 193it [00:06, 30.34it/s] 196it [00:06, 29.80it/s] +2025-05-26 05:22:22,900 - INFO - Epoch: 21, Objective: tensor([9626.5059], device='cuda:0', grad_fn=), Loss: 0.08952867239713669, KL/n: 72.98113250732422 + 0it [00:00, ?it/s]2025-05-26 05:22:23,109 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 7838.6660 | mean log_px -0.0609 | KL -3574.87 + 1it [00:00, 9.97it/s] 4it [00:00, 20.63it/s] 8it [00:00, 25.74it/s] 11it [00:00, 26.67it/s] 15it [00:00, 27.87it/s] 19it [00:00, 29.22it/s] 22it [00:00, 28.76it/s] 26it [00:00, 29.19it/s] 30it [00:01, 30.26it/s] 34it [00:01, 29.99it/s] 37it [00:01, 29.44it/s] 41it [00:01, 29.47it/s] 45it [00:01, 30.15it/s] 49it [00:01, 30.04it/s]2025-05-26 05:22:24,793 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 7246.2695 | mean log_px -0.0524 | KL -3575.72 + 53it [00:01, 29.27it/s] 57it [00:01, 29.34it/s] 61it [00:02, 30.10it/s] 65it [00:02, 30.01it/s] 69it [00:02, 29.43it/s] 73it [00:02, 29.38it/s] 77it [00:02, 30.10it/s] 81it [00:02, 30.06it/s] 85it [00:02, 29.33it/s] 89it [00:03, 29.49it/s] 93it [00:03, 30.06it/s] 97it [00:03, 30.01it/s]2025-05-26 05:22:26,479 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 8993.8701 | mean log_px -0.0775 | KL -3572.26 + 101it [00:03, 29.26it/s] 105it [00:03, 29.53it/s] 108it [00:03, 29.50it/s] 112it [00:03, 29.54it/s] 116it [00:03, 29.70it/s] 119it [00:04, 29.53it/s] 123it [00:04, 29.43it/s] 127it [00:04, 30.20it/s] 131it [00:04, 29.30it/s] 135it [00:04, 29.46it/s] 139it [00:04, 30.17it/s] 143it [00:04, 29.64it/s] 147it [00:05, 29.87it/s]2025-05-26 05:22:28,155 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 6235.6240 | mean log_px -0.0381 | KL -3571.26 + 151it [00:05, 30.21it/s] 155it [00:05, 29.88it/s] 158it [00:05, 29.29it/s] 162it [00:05, 29.39it/s] 165it [00:05, 29.41it/s] 168it [00:05, 28.22it/s] 172it [00:05, 28.62it/s] 176it [00:06, 28.94it/s] 180it [00:06, 29.50it/s] 183it [00:06, 28.94it/s] 187it [00:06, 29.27it/s] 191it [00:06, 29.84it/s] 194it [00:06, 29.30it/s] 196it [00:06, 29.03it/s] +2025-05-26 05:22:29,774 - INFO - Epoch: 22, Objective: tensor([8061.6055], device='cuda:0', grad_fn=), Loss: 0.06979813426733017, KL/n: 72.94580078125 + 0it [00:00, ?it/s]2025-05-26 05:22:30,163 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 10925.1533 | mean log_px -0.1051 | KL -3570.03 + 1it [00:00, 9.78it/s] 4it [00:00, 20.17it/s] 8it [00:00, 25.26it/s] 12it [00:00, 27.83it/s] 16it [00:00, 28.77it/s] 19it [00:00, 28.53it/s] 23it [00:00, 29.78it/s] 26it [00:00, 29.14it/s] 30it [00:01, 30.08it/s] 33it [00:01, 29.46it/s] 37it [00:01, 29.84it/s] 40it [00:01, 29.64it/s] 44it [00:01, 29.98it/s] 47it [00:01, 29.78it/s]2025-05-26 05:22:31,833 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 9461.2891 | mean log_px -0.0842 | KL -3569.74 + 51it [00:01, 30.37it/s] 55it [00:01, 30.42it/s] 59it [00:02, 29.55it/s] 63it [00:02, 29.70it/s] 67it [00:02, 30.51it/s] 71it [00:02, 28.97it/s] 75it [00:02, 28.88it/s] 79it [00:02, 29.23it/s] 82it [00:02, 28.99it/s] 86it [00:02, 29.20it/s] 90it [00:03, 29.61it/s] 93it [00:03, 29.07it/s] 97it [00:03, 29.38it/s] 100it [00:03, 29.40it/s]2025-05-26 05:22:33,536 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 9782.1748 | mean log_px -0.0887 | KL -3575.02 + 103it [00:03, 29.06it/s] 107it [00:03, 28.94it/s] 111it [00:03, 29.79it/s] 114it [00:03, 29.00it/s] 118it [00:04, 29.43it/s] 122it [00:04, 29.75it/s] 125it [00:04, 29.64it/s] 128it [00:04, 28.92it/s] 132it [00:04, 29.33it/s] 135it [00:04, 29.20it/s] 138it [00:04, 29.34it/s] 142it [00:04, 29.65it/s] 145it [00:04, 28.78it/s] 149it [00:05, 29.31it/s]2025-05-26 05:22:35,251 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 11103.0645 | mean log_px -0.1076 | KL -3574.47 + 153it [00:05, 29.55it/s] 156it [00:05, 29.43it/s] 159it [00:05, 29.11it/s] 163it [00:05, 29.14it/s] 167it [00:05, 29.48it/s] 170it [00:05, 29.04it/s] 174it [00:05, 29.64it/s] 177it [00:06, 29.14it/s] 181it [00:06, 29.70it/s] 184it [00:06, 29.71it/s] 187it [00:06, 29.11it/s] 191it [00:06, 29.71it/s] 194it [00:06, 29.09it/s] 196it [00:06, 28.89it/s] +2025-05-26 05:22:36,860 - INFO - Epoch: 23, Objective: tensor([9953.3223], device='cuda:0', grad_fn=), Loss: 0.08732958883047104, KL/n: 72.91426086425781 + 0it [00:00, ?it/s]2025-05-26 05:22:37,075 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 8175.0044 | mean log_px -0.0658 | KL -3570.66 + 1it [00:00, 9.59it/s] 4it [00:00, 20.45it/s] 7it [00:00, 24.56it/s] 11it [00:00, 27.58it/s] 14it [00:00, 27.73it/s] 18it [00:00, 29.02it/s] 21it [00:00, 29.22it/s] 25it [00:00, 29.77it/s] 29it [00:01, 30.28it/s] 33it [00:01, 30.35it/s] 37it [00:01, 30.07it/s] 41it [00:01, 30.20it/s] 45it [00:01, 29.99it/s] 49it [00:01, 30.42it/s]2025-05-26 05:22:38,736 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 11058.1162 | mean log_px -0.1070 | KL -3567.84 + 53it [00:01, 30.78it/s] 57it [00:01, 30.33it/s] 61it [00:02, 30.10it/s] 65it [00:02, 30.47it/s] 69it [00:02, 30.49it/s] 73it [00:02, 30.47it/s] 77it [00:02, 30.04it/s] 81it [00:02, 30.16it/s] 85it [00:02, 30.55it/s] 89it [00:03, 30.50it/s] 93it [00:03, 30.19it/s] 97it [00:03, 30.22it/s]2025-05-26 05:22:40,379 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 5432.0298 | mean log_px -0.0266 | KL -3571.93 + 101it [00:03, 30.55it/s] 105it [00:03, 30.62it/s] 109it [00:03, 30.55it/s] 113it [00:03, 30.07it/s] 117it [00:03, 30.30it/s] 121it [00:04, 30.54it/s] 125it [00:04, 30.61it/s] 129it [00:04, 30.28it/s] 133it [00:04, 30.34it/s] 137it [00:04, 29.68it/s] 141it [00:04, 30.58it/s] 145it [00:04, 30.59it/s] 149it [00:04, 30.60it/s]2025-05-26 05:22:42,027 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 8827.2461 | mean log_px -0.0751 | KL -3569.95 + 153it [00:05, 29.97it/s] 157it [00:05, 30.46it/s] 161it [00:05, 30.74it/s] 165it [00:05, 30.43it/s] 169it [00:05, 30.49it/s] 173it [00:05, 30.82it/s] 177it [00:05, 30.77it/s] 181it [00:06, 29.86it/s] 185it [00:06, 30.00it/s] 189it [00:06, 30.78it/s] 193it [00:06, 30.43it/s] 196it [00:06, 29.72it/s] +2025-05-26 05:22:43,580 - INFO - Epoch: 24, Objective: tensor([10218.4648], device='cuda:0', grad_fn=), Loss: 0.10296904295682907, KL/n: 72.86886596679688 + 0it [00:00, ?it/s]2025-05-26 05:22:44,099 - INFO - [Epoch 025 | Batch 0000] IWAE-loss 8398.8350 | mean log_px -0.0690 | KL -3568.20 + 1it [00:00, 4.14it/s] 5it [00:00, 16.00it/s] 8it [00:00, 19.67it/s] 12it [00:00, 24.07it/s] 15it [00:00, 24.97it/s] 19it [00:00, 27.26it/s] 22it [00:00, 27.91it/s] 25it [00:01, 27.84it/s] 29it [00:01, 29.10it/s] 32it [00:01, 28.52it/s] 36it [00:01, 29.55it/s] 39it [00:01, 28.92it/s] 43it [00:01, 29.19it/s] 47it [00:01, 29.66it/s]2025-05-26 05:22:45,783 - INFO - [Epoch 025 | Batch 0050] IWAE-loss 6368.2944 | mean log_px -0.0399 | KL -3571.85 + 51it [00:01, 30.02it/s] 54it [00:02, 29.29it/s] 58it [00:02, 29.75it/s] 61it [00:02, 29.58it/s] 64it [00:02, 29.64it/s] 68it [00:02, 29.67it/s] 72it [00:02, 29.88it/s] 75it [00:02, 29.52it/s] 79it [00:02, 29.66it/s] 83it [00:03, 29.90it/s] 86it [00:03, 29.72it/s] 90it [00:03, 29.85it/s] 94it [00:03, 30.02it/s] 97it [00:03, 29.29it/s]2025-05-26 05:22:47,469 - INFO - [Epoch 025 | Batch 0100] IWAE-loss 10121.3945 | mean log_px -0.0936 | KL -3566.01 + 101it [00:03, 29.73it/s] 105it [00:03, 30.06it/s] 108it [00:03, 29.36it/s] 111it [00:03, 29.35it/s] 115it [00:04, 29.78it/s] 119it [00:04, 30.07it/s] 122it [00:04, 29.35it/s] 126it [00:04, 29.73it/s] 129it [00:04, 29.52it/s] 133it [00:04, 29.53it/s] 137it [00:04, 30.24it/s] 141it [00:04, 30.01it/s] 144it [00:05, 29.36it/s] 148it [00:05, 29.82it/s]2025-05-26 05:22:49,154 - INFO - [Epoch 025 | Batch 0150] IWAE-loss 9109.3369 | mean log_px -0.0792 | KL -3567.35 + 151it [00:05, 29.60it/s] 155it [00:05, 29.84it/s] 158it [00:05, 29.56it/s] 162it [00:05, 29.62it/s] 166it [00:05, 30.14it/s] 170it [00:05, 29.98it/s] 173it [00:06, 29.78it/s] 176it [00:06, 29.71it/s] 179it [00:06, 29.70it/s] 182it [00:06, 29.14it/s] 186it [00:06, 29.38it/s] 189it [00:06, 29.17it/s] 192it [00:06, 28.58it/s] 195it [00:06, 27.54it/s] 196it [00:06, 28.45it/s] +2025-05-26 05:22:50,764 - INFO - Epoch: 25, Objective: tensor([8103.9946], device='cuda:0', grad_fn=), Loss: 0.06816604733467102, KL/n: 72.83800506591797 + 0it [00:00, ?it/s]2025-05-26 05:22:51,157 - INFO - [Epoch 026 | Batch 0000] IWAE-loss 6542.1104 | mean log_px -0.0426 | KL -3563.56 + 1it [00:00, 9.83it/s] 4it [00:00, 20.53it/s] 8it [00:00, 25.67it/s] 12it [00:00, 27.79it/s] 15it [00:00, 27.87it/s] 18it [00:00, 28.41it/s] 21it [00:00, 28.85it/s] 24it [00:00, 28.97it/s] 27it [00:00, 29.21it/s] 30it [00:01, 29.11it/s] 33it [00:01, 29.23it/s] 37it [00:01, 29.61it/s] 41it [00:01, 30.00it/s] 44it [00:01, 29.03it/s] 48it [00:01, 29.27it/s]2025-05-26 05:22:52,850 - INFO - [Epoch 026 | Batch 0050] IWAE-loss 7561.0938 | mean log_px -0.0570 | KL -3568.94 + 52it [00:01, 29.84it/s] 55it [00:01, 28.93it/s] 58it [00:02, 28.96it/s] 61it [00:02, 28.92it/s] 65it [00:02, 29.49it/s] 68it [00:02, 28.94it/s] 72it [00:02, 28.92it/s] 76it [00:02, 29.67it/s] 79it [00:02, 29.08it/s] 83it [00:02, 29.04it/s] 87it [00:03, 29.71it/s] 90it [00:03, 28.99it/s] 93it [00:03, 29.12it/s] 97it [00:03, 29.85it/s] 100it [00:03, 28.93it/s]2025-05-26 05:22:54,570 - INFO - [Epoch 026 | Batch 0100] IWAE-loss 6994.7637 | mean log_px -0.0489 | KL -3571.84 + 104it [00:03, 29.43it/s] 108it [00:03, 29.73it/s] 111it [00:03, 28.96it/s] 115it [00:03, 29.29it/s] 119it [00:04, 29.46it/s] 123it [00:04, 29.84it/s] 126it [00:04, 29.24it/s] 130it [00:04, 29.65it/s] 133it [00:04, 29.69it/s] 136it [00:04, 29.70it/s] 139it [00:04, 29.39it/s] 143it [00:04, 29.47it/s] 147it [00:05, 30.13it/s]2025-05-26 05:22:56,259 - INFO - [Epoch 026 | Batch 0150] IWAE-loss 6899.2134 | mean log_px -0.0476 | KL -3564.08 + 151it [00:05, 29.46it/s] 155it [00:05, 29.35it/s] 159it [00:05, 29.98it/s] 163it [00:05, 29.22it/s] 167it [00:05, 29.23it/s] 171it [00:05, 29.79it/s] 174it [00:05, 29.17it/s] 178it [00:06, 29.74it/s] 181it [00:06, 29.04it/s] 185it [00:06, 29.39it/s] 188it [00:06, 29.16it/s] 192it [00:06, 29.81it/s] 195it [00:06, 27.85it/s] 196it [00:06, 28.81it/s] +2025-05-26 05:22:57,872 - INFO - Epoch: 26, Objective: tensor([9639.1465], device='cuda:0', grad_fn=), Loss: 0.0952192023396492, KL/n: 72.77848052978516 + 0it [00:00, ?it/s]2025-05-26 05:22:58,077 - INFO - [Epoch 027 | Batch 0000] IWAE-loss 6978.8984 | mean log_px -0.0489 | KL -3558.69 + 2it [00:00, 15.95it/s] 5it [00:00, 22.21it/s] 8it [00:00, 25.34it/s] 12it [00:00, 28.15it/s] 15it [00:00, 27.84it/s] 19it [00:00, 28.75it/s] 23it [00:00, 29.51it/s] 26it [00:00, 28.77it/s] 30it [00:01, 29.76it/s] 34it [00:01, 29.79it/s] 37it [00:01, 29.15it/s] 41it [00:01, 29.35it/s] 45it [00:01, 30.10it/s] 49it [00:01, 30.01it/s]2025-05-26 05:22:59,766 - INFO - [Epoch 027 | Batch 0050] IWAE-loss 8259.9668 | mean log_px -0.0671 | KL -3560.43 + 52it [00:01, 29.23it/s] 55it [00:01, 28.97it/s] 59it [00:02, 29.17it/s] 62it [00:02, 28.31it/s] 66it [00:02, 28.70it/s] 70it [00:02, 29.10it/s] 73it [00:02, 28.43it/s] 77it [00:02, 28.69it/s] 80it [00:02, 29.01it/s] 83it [00:02, 28.76it/s] 87it [00:03, 28.87it/s] 91it [00:03, 29.32it/s] 94it [00:03, 28.67it/s] 98it [00:03, 29.52it/s]2025-05-26 05:23:01,502 - INFO - [Epoch 027 | Batch 0100] IWAE-loss 6988.8232 | mean log_px -0.0489 | KL -3563.29 + 101it [00:03, 28.80it/s] 104it [00:03, 28.99it/s] 107it [00:03, 28.95it/s] 110it [00:03, 28.80it/s] 114it [00:03, 29.30it/s] 118it [00:04, 29.62it/s] 122it [00:04, 29.89it/s] 125it [00:04, 29.10it/s] 129it [00:04, 29.95it/s] 132it [00:04, 29.17it/s] 136it [00:04, 29.66it/s] 139it [00:04, 29.55it/s] 143it [00:04, 29.52it/s] 147it [00:05, 30.23it/s]2025-05-26 05:23:03,187 - INFO - [Epoch 027 | Batch 0150] IWAE-loss 8031.2412 | mean log_px -0.0639 | KL -3560.13 + 151it [00:05, 29.94it/s] 154it [00:05, 29.40it/s] 158it [00:05, 29.72it/s] 161it [00:05, 29.34it/s] 164it [00:05, 29.50it/s] 168it [00:05, 30.18it/s] 172it [00:05, 29.96it/s] 175it [00:06, 29.58it/s] 178it [00:06, 29.30it/s] 182it [00:06, 29.36it/s] 186it [00:06, 29.31it/s] 189it [00:06, 29.40it/s] 192it [00:06, 29.48it/s] 195it [00:06, 28.16it/s] 196it [00:06, 28.86it/s] +2025-05-26 05:23:04,787 - INFO - Epoch: 27, Objective: tensor([9165.4453], device='cuda:0', grad_fn=), Loss: 0.07511217892169952, KL/n: 72.7235107421875 + 0it [00:00, ?it/s]2025-05-26 05:23:05,172 - INFO - [Epoch 028 | Batch 0000] IWAE-loss 6043.2148 | mean log_px -0.0354 | KL -3563.28 + 2it [00:00, 15.57it/s] 5it [00:00, 21.80it/s] 8it [00:00, 25.02it/s] 12it [00:00, 27.70it/s] 15it [00:00, 27.72it/s] 18it [00:00, 28.40it/s] 22it [00:00, 29.07it/s] 25it [00:00, 29.20it/s] 28it [00:01, 29.30it/s] 32it [00:01, 29.87it/s] 35it [00:01, 29.20it/s] 39it [00:01, 29.53it/s] 43it [00:01, 29.67it/s] 47it [00:01, 29.98it/s] 50it [00:01, 29.29it/s]2025-05-26 05:23:06,863 - INFO - [Epoch 028 | Batch 0050] IWAE-loss 6714.2021 | mean log_px -0.0451 | KL -3560.29 + 54it [00:01, 29.72it/s] 58it [00:02, 30.08it/s] 61it [00:02, 29.38it/s] 65it [00:02, 29.47it/s] 69it [00:02, 30.11it/s] 73it [00:02, 30.05it/s] 77it [00:02, 30.07it/s] 81it [00:02, 30.00it/s] 84it [00:02, 29.43it/s] 88it [00:03, 29.42it/s] 92it [00:03, 30.12it/s] 96it [00:03, 29.98it/s] 99it [00:03, 29.22it/s]2025-05-26 05:23:08,539 - INFO - [Epoch 028 | Batch 0100] IWAE-loss 6817.0000 | mean log_px -0.0465 | KL -3562.40 + 103it [00:03, 29.42it/s] 107it [00:03, 29.99it/s] 110it [00:03, 29.27it/s] 113it [00:03, 29.15it/s] 116it [00:03, 29.19it/s] 120it [00:04, 29.98it/s] 123it [00:04, 29.19it/s] 127it [00:04, 29.28it/s] 131it [00:04, 30.09it/s] 135it [00:04, 29.97it/s] 138it [00:04, 29.25it/s] 142it [00:04, 29.80it/s] 145it [00:04, 29.14it/s] 149it [00:05, 29.10it/s]2025-05-26 05:23:10,244 - INFO - [Epoch 028 | Batch 0150] IWAE-loss 9232.8408 | mean log_px -0.0810 | KL -3562.66 + 153it [00:05, 29.81it/s] 156it [00:05, 29.08it/s] 159it [00:05, 29.27it/s] 163it [00:05, 29.99it/s] 166it [00:05, 29.05it/s] 170it [00:05, 29.82it/s] 173it [00:05, 29.51it/s] 176it [00:06, 29.31it/s] 179it [00:06, 29.24it/s] 183it [00:06, 29.48it/s] 186it [00:06, 29.43it/s] 189it [00:06, 29.06it/s] 193it [00:06, 29.74it/s] 196it [00:06, 28.77it/s] 196it [00:06, 28.97it/s] +2025-05-26 05:23:11,855 - INFO - Epoch: 28, Objective: tensor([8603.9277], device='cuda:0', grad_fn=), Loss: 0.063666932284832, KL/n: 72.64057922363281 + 0it [00:00, ?it/s]2025-05-26 05:23:12,050 - INFO - [Epoch 029 | Batch 0000] IWAE-loss 7211.1953 | mean log_px -0.0522 | KL -3558.82 + 2it [00:00, 18.23it/s] 5it [00:00, 23.52it/s] 9it [00:00, 26.70it/s] 13it [00:00, 27.96it/s] 16it [00:00, 28.16it/s] 20it [00:00, 29.32it/s] 23it [00:00, 28.70it/s] 27it [00:00, 28.86it/s] 31it [00:01, 29.73it/s] 34it [00:01, 28.93it/s] 38it [00:01, 29.53it/s] 41it [00:01, 29.34it/s] 45it [00:01, 29.43it/s] 49it [00:01, 30.25it/s]2025-05-26 05:23:13,749 - INFO - [Epoch 029 | Batch 0050] IWAE-loss 5091.2432 | mean log_px -0.0219 | KL -3558.65 + 53it [00:01, 29.96it/s] 56it [00:01, 29.47it/s] 59it [00:02, 29.34it/s] 63it [00:02, 29.31it/s] 67it [00:02, 29.50it/s] 70it [00:02, 29.27it/s] 74it [00:02, 29.23it/s] 78it [00:02, 29.77it/s] 81it [00:02, 28.88it/s] 85it [00:02, 29.45it/s] 88it [00:03, 29.43it/s] 91it [00:03, 29.50it/s] 94it [00:03, 29.22it/s] 98it [00:03, 29.54it/s]2025-05-26 05:23:15,449 - INFO - [Epoch 029 | Batch 0100] IWAE-loss 7676.5796 | mean log_px -0.0588 | KL -3559.20 + 101it [00:03, 29.27it/s] 104it [00:03, 29.45it/s] 107it [00:03, 29.60it/s] 110it [00:03, 29.48it/s] 113it [00:03, 29.41it/s] 116it [00:03, 28.87it/s] 120it [00:04, 28.85it/s] 124it [00:04, 29.40it/s] 127it [00:04, 29.24it/s] 131it [00:04, 29.45it/s] 134it [00:04, 29.09it/s] 138it [00:04, 28.95it/s] 142it [00:04, 29.65it/s] 145it [00:04, 29.02it/s] 149it [00:05, 29.24it/s]2025-05-26 05:23:17,152 - INFO - [Epoch 029 | Batch 0150] IWAE-loss 5939.1680 | mean log_px -0.0340 | KL -3558.05 + 153it [00:05, 29.39it/s] 157it [00:05, 29.91it/s] 160it [00:05, 29.15it/s] 164it [00:05, 29.93it/s] 167it [00:05, 29.15it/s] 171it [00:05, 29.18it/s] 175it [00:05, 29.91it/s] 178it [00:06, 29.07it/s] 181it [00:06, 29.26it/s] 184it [00:06, 29.06it/s] 188it [00:06, 29.07it/s] 192it [00:06, 29.92it/s] 195it [00:06, 28.06it/s] 196it [00:06, 28.93it/s] +2025-05-26 05:23:18,759 - INFO - Epoch: 29, Objective: tensor([6309.2192], device='cuda:0', grad_fn=), Loss: 0.038903918117284775, KL/n: 72.57882690429688 + 0it [00:00, ?it/s]2025-05-26 05:23:18,968 - INFO - [Epoch 030 | Batch 0000] IWAE-loss 6291.7471 | mean log_px -0.0391 | KL -3552.61 + 1it [00:00, 9.74it/s] 5it [00:00, 23.14it/s] 9it [00:00, 27.04it/s] 12it [00:00, 27.53it/s] 16it [00:00, 28.82it/s] 19it [00:00, 28.85it/s] 23it [00:00, 29.81it/s] 26it [00:00, 29.37it/s] 30it [00:01, 29.52it/s] 34it [00:01, 30.16it/s] 38it [00:01, 30.15it/s] 42it [00:01, 30.20it/s] 46it [00:01, 29.74it/s] 50it [00:01, 29.81it/s]2025-05-26 05:23:20,634 - INFO - [Epoch 030 | Batch 0050] IWAE-loss 6106.9326 | mean log_px -0.0365 | KL -3550.81 + 54it [00:01, 29.87it/s] 57it [00:01, 29.55it/s] 61it [00:02, 29.91it/s] 64it [00:02, 29.73it/s] 68it [00:02, 30.05it/s] 71it [00:02, 29.82it/s] 75it [00:02, 30.05it/s] 78it [00:02, 29.88it/s] 82it [00:02, 30.19it/s] 86it [00:02, 30.42it/s] 90it [00:03, 30.41it/s] 94it [00:03, 29.93it/s] 98it [00:03, 30.25it/s]2025-05-26 05:23:22,299 - INFO - [Epoch 030 | Batch 0100] IWAE-loss 10561.5107 | mean log_px -0.1001 | KL -3555.25 + 102it [00:03, 29.91it/s] 106it [00:03, 30.18it/s] 110it [00:03, 29.98it/s] 113it [00:03, 29.79it/s] 117it [00:03, 29.79it/s] 121it [00:04, 30.13it/s] 125it [00:04, 30.44it/s] 129it [00:04, 30.34it/s] 133it [00:04, 30.19it/s] 137it [00:04, 30.09it/s] 141it [00:04, 30.09it/s] 145it [00:04, 30.10it/s] 149it [00:05, 30.09it/s]2025-05-26 05:23:23,967 - INFO - [Epoch 030 | Batch 0150] IWAE-loss 6769.3467 | mean log_px -0.0459 | KL -3553.85 + 153it [00:05, 30.09it/s] 157it [00:05, 30.09it/s] 161it [00:05, 29.72it/s] 165it [00:05, 29.88it/s] 168it [00:05, 29.71it/s] 172it [00:05, 30.33it/s] 176it [00:05, 29.83it/s] 179it [00:06, 29.85it/s] 182it [00:06, 29.69it/s] 186it [00:06, 30.31it/s] 190it [00:06, 30.31it/s] 194it [00:06, 29.62it/s] 196it [00:06, 29.48it/s] +2025-05-26 05:23:25,530 - INFO - Epoch: 30, Objective: tensor([6983.6377], device='cuda:0', grad_fn=), Loss: 0.042701512575149536, KL/n: 72.48271179199219 + 0it [00:00, ?it/s]2025-05-26 05:23:25,911 - INFO - [Epoch 031 | Batch 0000] IWAE-loss 10247.2090 | mean log_px -0.0957 | KL -3547.84 + 2it [00:00, 14.88it/s] 6it [00:00, 24.11it/s] 9it [00:00, 25.51it/s] 13it [00:00, 27.57it/s] 17it [00:00, 28.13it/s] 21it [00:00, 29.49it/s] 24it [00:00, 28.92it/s] 28it [00:00, 30.01it/s] 32it [00:01, 30.09it/s] 36it [00:01, 29.87it/s] 39it [00:01, 28.95it/s] 43it [00:01, 29.31it/s] 47it [00:01, 29.95it/s] 50it [00:01, 29.25it/s]2025-05-26 05:23:27,590 - INFO - [Epoch 031 | Batch 0050] IWAE-loss 11413.5059 | mean log_px -0.1124 | KL -3548.01 + 54it [00:01, 29.37it/s] 58it [00:02, 29.50it/s] 62it [00:02, 30.10it/s] 66it [00:02, 29.88it/s] 69it [00:02, 29.30it/s] 73it [00:02, 29.51it/s] 77it [00:02, 29.75it/s] 80it [00:02, 29.52it/s] 84it [00:02, 30.14it/s] 88it [00:03, 29.91it/s] 91it [00:03, 29.41it/s] 95it [00:03, 30.04it/s] 98it [00:03, 29.21it/s]2025-05-26 05:23:29,276 - INFO - [Epoch 031 | Batch 0100] IWAE-loss 6530.1104 | mean log_px -0.0426 | KL -3546.93 + 102it [00:03, 29.98it/s] 105it [00:03, 29.65it/s] 109it [00:03, 29.90it/s] 112it [00:03, 29.09it/s] 116it [00:03, 29.93it/s] 119it [00:04, 29.19it/s] 123it [00:04, 29.71it/s] 126it [00:04, 29.59it/s] 130it [00:04, 29.52it/s] 134it [00:04, 30.22it/s] 138it [00:04, 29.58it/s] 142it [00:04, 29.64it/s] 146it [00:04, 30.25it/s] 150it [00:05, 29.79it/s]2025-05-26 05:23:30,965 - INFO - [Epoch 031 | Batch 0150] IWAE-loss 9386.1055 | mean log_px -0.0835 | KL -3543.27 + 154it [00:05, 30.00it/s] 158it [00:05, 29.89it/s] 161it [00:05, 28.96it/s] 164it [00:05, 28.06it/s] 167it [00:05, 28.03it/s] 171it [00:05, 28.63it/s] 175it [00:05, 29.45it/s] 178it [00:06, 29.02it/s] 181it [00:06, 29.27it/s] 185it [00:06, 29.70it/s] 188it [00:06, 29.48it/s] 192it [00:06, 29.67it/s] 195it [00:06, 28.86it/s] 196it [00:06, 29.03it/s] +2025-05-26 05:23:32,578 - INFO - Epoch: 31, Objective: tensor([7436.5786], device='cuda:0', grad_fn=), Loss: 0.05694768950343132, KL/n: 72.4092025756836 + 0it [00:00, ?it/s]2025-05-26 05:23:32,775 - INFO - [Epoch 032 | Batch 0000] IWAE-loss 9081.5723 | mean log_px -0.0791 | KL -3543.87 + 2it [00:00, 19.00it/s] 5it [00:00, 24.51it/s] 9it [00:00, 27.61it/s] 12it [00:00, 27.79it/s] 16it [00:00, 29.12it/s] 19it [00:00, 29.17it/s] 23it [00:00, 30.16it/s] 27it [00:00, 30.21it/s] 31it [00:01, 29.86it/s] 35it [00:01, 29.94it/s] 38it [00:01, 29.84it/s] 42it [00:01, 30.14it/s] 46it [00:01, 30.56it/s] 50it [00:01, 29.96it/s]2025-05-26 05:23:34,430 - INFO - [Epoch 032 | Batch 0050] IWAE-loss 6334.4434 | mean log_px -0.0399 | KL -3544.42 + 53it [00:01, 29.87it/s] 57it [00:01, 30.33it/s] 61it [00:02, 30.18it/s] 65it [00:02, 30.34it/s] 69it [00:02, 30.31it/s] 73it [00:02, 30.13it/s] 77it [00:02, 30.18it/s] 81it [00:02, 30.09it/s] 85it [00:02, 30.09it/s] 89it [00:02, 30.15it/s] 93it [00:03, 30.25it/s] 97it [00:03, 30.22it/s]2025-05-26 05:23:36,092 - INFO - [Epoch 032 | Batch 0100] IWAE-loss 6394.1895 | mean log_px -0.0407 | KL -3547.70 + 101it [00:03, 30.12it/s] 105it [00:03, 29.57it/s] 109it [00:03, 30.36it/s] 113it [00:03, 30.27it/s] 117it [00:03, 29.96it/s] 121it [00:04, 30.04it/s] 125it [00:04, 30.37it/s] 129it [00:04, 30.28it/s] 133it [00:04, 29.92it/s] 136it [00:04, 29.86it/s] 139it [00:04, 29.72it/s] 142it [00:04, 28.97it/s] 145it [00:04, 28.49it/s] 149it [00:05, 28.86it/s]2025-05-26 05:23:37,773 - INFO - [Epoch 032 | Batch 0150] IWAE-loss 6953.6719 | mean log_px -0.0487 | KL -3543.11 + 153it [00:05, 29.66it/s] 157it [00:05, 30.17it/s] 161it [00:05, 30.18it/s] 165it [00:05, 30.16it/s] 169it [00:05, 30.07it/s] 173it [00:05, 30.09it/s] 177it [00:05, 30.03it/s] 181it [00:06, 29.71it/s] 184it [00:06, 29.15it/s] 188it [00:06, 29.68it/s] 192it [00:06, 29.87it/s] 195it [00:06, 28.39it/s] 196it [00:06, 29.50it/s] +2025-05-26 05:23:39,357 - INFO - Epoch: 32, Objective: tensor([9009.5889], device='cuda:0', grad_fn=), Loss: 0.07728097587823868, KL/n: 72.33047485351562 + 0it [00:00, ?it/s]2025-05-26 05:23:39,749 - INFO - [Epoch 033 | Batch 0000] IWAE-loss 6895.7715 | mean log_px -0.0478 | KL -3546.37 + 1it [00:00, 9.83it/s] 4it [00:00, 20.84it/s] 8it [00:00, 25.43it/s] 12it [00:00, 27.31it/s] 16it [00:00, 28.89it/s] 19it [00:00, 29.17it/s] 22it [00:00, 28.70it/s] 26it [00:00, 29.63it/s] 29it [00:01, 29.19it/s] 32it [00:01, 29.36it/s] 35it [00:01, 29.47it/s] 38it [00:01, 29.41it/s] 42it [00:01, 29.84it/s] 46it [00:01, 30.14it/s] 50it [00:01, 30.22it/s]2025-05-26 05:23:41,425 - INFO - [Epoch 033 | Batch 0050] IWAE-loss 6350.1094 | mean log_px -0.0401 | KL -3541.31 + 54it [00:01, 29.53it/s] 58it [00:02, 29.98it/s] 62it [00:02, 30.27it/s] 66it [00:02, 30.16it/s] 70it [00:02, 29.72it/s] 74it [00:02, 30.21it/s] 78it [00:02, 30.01it/s] 82it [00:02, 30.18it/s] 86it [00:02, 30.16it/s] 90it [00:03, 30.07it/s] 94it [00:03, 29.65it/s] 97it [00:03, 29.54it/s]2025-05-26 05:23:43,100 - INFO - [Epoch 033 | Batch 0100] IWAE-loss 8828.9014 | mean log_px -0.0755 | KL -3543.89 + 101it [00:03, 29.54it/s] 105it [00:03, 29.79it/s] 109it [00:03, 30.40it/s] 113it [00:03, 29.95it/s] 116it [00:03, 29.73it/s] 120it [00:04, 30.37it/s] 124it [00:04, 30.29it/s] 128it [00:04, 29.86it/s] 131it [00:04, 29.66it/s] 135it [00:04, 30.30it/s] 139it [00:04, 30.35it/s] 143it [00:04, 29.92it/s] 146it [00:04, 29.73it/s] 150it [00:05, 30.33it/s]2025-05-26 05:23:44,764 - INFO - [Epoch 033 | Batch 0150] IWAE-loss 6439.4922 | mean log_px -0.0414 | KL -3543.21 + 154it [00:05, 30.22it/s] 158it [00:05, 29.76it/s] 161it [00:05, 29.62it/s] 165it [00:05, 29.94it/s] 168it [00:05, 29.50it/s] 171it [00:05, 29.33it/s] 175it [00:05, 30.11it/s] 179it [00:06, 29.93it/s] 182it [00:06, 29.32it/s] 186it [00:06, 29.73it/s] 189it [00:06, 29.55it/s] 193it [00:06, 29.65it/s] 196it [00:06, 29.30it/s] +2025-05-26 05:23:46,351 - INFO - Epoch: 33, Objective: tensor([7173.4717], device='cuda:0', grad_fn=), Loss: 0.04623902589082718, KL/n: 72.23444366455078 + 0it [00:00, ?it/s]2025-05-26 05:23:46,577 - INFO - [Epoch 034 | Batch 0000] IWAE-loss 6226.3438 | mean log_px -0.0384 | KL -3540.74 + 1it [00:00, 9.55it/s] 4it [00:00, 20.71it/s] 8it [00:00, 25.72it/s] 11it [00:00, 27.04it/s] 15it [00:00, 28.53it/s] 18it [00:00, 28.26it/s] 22it [00:00, 29.52it/s] 25it [00:00, 29.03it/s] 29it [00:01, 29.55it/s] 32it [00:01, 29.34it/s] 36it [00:01, 29.74it/s] 40it [00:01, 30.15it/s] 44it [00:01, 29.93it/s] 47it [00:01, 29.44it/s]2025-05-26 05:23:48,259 - INFO - [Epoch 034 | Batch 0050] IWAE-loss 7785.6523 | mean log_px -0.0607 | KL -3535.19 + 51it [00:01, 29.52it/s] 55it [00:01, 30.27it/s] 59it [00:02, 30.09it/s] 63it [00:02, 29.98it/s] 66it [00:02, 29.57it/s] 70it [00:02, 29.94it/s] 73it [00:02, 29.26it/s] 77it [00:02, 29.76it/s] 80it [00:02, 29.57it/s] 84it [00:02, 29.88it/s] 87it [00:02, 29.68it/s] 91it [00:03, 29.74it/s] 95it [00:03, 30.07it/s] 99it [00:03, 30.25it/s]2025-05-26 05:23:49,934 - INFO - [Epoch 034 | Batch 0100] IWAE-loss 9424.0605 | mean log_px -0.0841 | KL -3535.94 + 103it [00:03, 30.15it/s] 107it [00:03, 30.03it/s] 111it [00:03, 29.33it/s] 114it [00:03, 29.47it/s] 117it [00:04, 28.90it/s] 121it [00:04, 29.29it/s] 125it [00:04, 29.69it/s] 128it [00:04, 29.14it/s] 132it [00:04, 29.65it/s] 136it [00:04, 29.90it/s] 139it [00:04, 29.31it/s] 143it [00:04, 30.16it/s] 147it [00:05, 30.05it/s] 150it [00:05, 29.30it/s]2025-05-26 05:23:51,620 - INFO - [Epoch 034 | Batch 0150] IWAE-loss 8369.6523 | mean log_px -0.0690 | KL -3539.58 + 154it [00:05, 29.67it/s] 158it [00:05, 30.03it/s] 161it [00:05, 29.44it/s] 165it [00:05, 29.14it/s] 169it [00:05, 30.31it/s] 173it [00:05, 30.17it/s] 177it [00:06, 29.71it/s] 181it [00:06, 29.95it/s] 184it [00:06, 29.36it/s] 188it [00:06, 29.62it/s] 191it [00:06, 29.64it/s] 194it [00:06, 29.71it/s] 196it [00:06, 29.16it/s] +2025-05-26 05:23:53,208 - INFO - Epoch: 34, Objective: tensor([5730.3848], device='cuda:0', grad_fn=), Loss: 0.035519614815711975, KL/n: 72.12670135498047 + 0it [00:00, ?it/s]2025-05-26 05:23:53,724 - INFO - [Epoch 035 | Batch 0000] IWAE-loss 6048.6689 | mean log_px -0.0359 | KL -3534.05 + 1it [00:00, 4.25it/s] 4it [00:00, 13.67it/s] 8it [00:00, 21.24it/s] 11it [00:00, 23.73it/s] 15it [00:00, 26.23it/s] 19it [00:00, 27.71it/s] 23it [00:00, 28.64it/s] 27it [00:01, 29.31it/s] 31it [00:01, 29.57it/s] 34it [00:01, 29.44it/s] 38it [00:01, 29.80it/s] 42it [00:01, 30.06it/s] 46it [00:01, 30.52it/s] 50it [00:01, 30.54it/s]2025-05-26 05:23:55,367 - INFO - [Epoch 035 | Batch 0050] IWAE-loss 7547.8418 | mean log_px -0.0574 | KL -3532.06 + 54it [00:01, 30.05it/s] 58it [00:02, 30.37it/s] 62it [00:02, 30.79it/s] 66it [00:02, 30.74it/s] 70it [00:02, 30.31it/s] 74it [00:02, 30.77it/s] 78it [00:02, 30.21it/s] 82it [00:02, 30.46it/s] 86it [00:03, 30.47it/s] 90it [00:03, 30.51it/s] 94it [00:03, 30.45it/s] 98it [00:03, 30.49it/s]2025-05-26 05:23:57,007 - INFO - [Epoch 035 | Batch 0100] IWAE-loss 6467.4780 | mean log_px -0.0420 | KL -3526.05 + 102it [00:03, 30.50it/s] 106it [00:03, 30.51it/s] 110it [00:03, 30.55it/s] 114it [00:03, 30.87it/s] 118it [00:04, 30.81it/s] 122it [00:04, 30.32it/s] 126it [00:04, 30.68it/s] 130it [00:04, 30.37it/s] 134it [00:04, 30.45it/s] 138it [00:04, 30.47it/s] 142it [00:04, 30.46it/s] 146it [00:04, 30.46it/s] 150it [00:05, 30.84it/s]2025-05-26 05:23:58,642 - INFO - [Epoch 035 | Batch 0150] IWAE-loss 4948.4082 | mean log_px -0.0203 | KL -3529.26 + 154it [00:05, 30.75it/s] 158it [00:05, 30.41it/s] 162it [00:05, 30.24it/s] 166it [00:05, 30.72it/s] 170it [00:05, 30.31it/s] 174it [00:05, 30.38it/s] 178it [00:06, 30.43it/s] 182it [00:06, 30.44it/s] 186it [00:06, 30.46it/s] 190it [00:06, 30.76it/s] 194it [00:06, 30.38it/s] 196it [00:06, 29.26it/s] +2025-05-26 05:24:00,202 - INFO - Epoch: 35, Objective: tensor([7949.3398], device='cuda:0', grad_fn=), Loss: 0.07318438589572906, KL/n: 72.0306396484375 + 0it [00:00, ?it/s]2025-05-26 05:24:00,591 - INFO - [Epoch 036 | Batch 0000] IWAE-loss 9333.0117 | mean log_px -0.0829 | KL -3532.75 + 1it [00:00, 9.86it/s] 4it [00:00, 20.61it/s] 8it [00:00, 26.44it/s] 11it [00:00, 27.18it/s] 15it [00:00, 28.76it/s] 18it [00:00, 28.45it/s] 22it [00:00, 29.58it/s] 25it [00:00, 29.31it/s] 28it [00:01, 29.30it/s] 32it [00:01, 30.11it/s] 35it [00:01, 28.84it/s] 38it [00:01, 28.95it/s] 42it [00:01, 29.85it/s] 45it [00:01, 29.40it/s] 48it [00:01, 29.52it/s]2025-05-26 05:24:02,274 - INFO - [Epoch 036 | Batch 0050] IWAE-loss 6635.5688 | mean log_px -0.0444 | KL -3526.99 + 52it [00:01, 29.55it/s] 56it [00:01, 30.34it/s] 60it [00:02, 30.23it/s] 64it [00:02, 29.29it/s] 67it [00:02, 28.88it/s] 70it [00:02, 27.82it/s] 73it [00:02, 27.98it/s] 77it [00:02, 28.75it/s] 80it [00:02, 28.88it/s] 84it [00:02, 29.84it/s] 87it [00:03, 29.48it/s] 90it [00:03, 29.48it/s] 94it [00:03, 30.19it/s] 98it [00:03, 30.05it/s]2025-05-26 05:24:03,984 - INFO - [Epoch 036 | Batch 0100] IWAE-loss 5391.4517 | mean log_px -0.0267 | KL -3524.87 + 101it [00:03, 29.23it/s] 105it [00:03, 29.44it/s] 109it [00:03, 29.72it/s] 112it [00:03, 29.72it/s] 115it [00:03, 29.19it/s] 119it [00:04, 29.93it/s] 122it [00:04, 29.46it/s] 126it [00:04, 29.90it/s] 129it [00:04, 29.59it/s] 132it [00:04, 29.56it/s] 136it [00:04, 29.88it/s] 139it [00:04, 29.66it/s] 143it [00:04, 29.90it/s] 146it [00:05, 29.61it/s] 149it [00:05, 29.69it/s]2025-05-26 05:24:05,659 - INFO - [Epoch 036 | Batch 0150] IWAE-loss 5428.3071 | mean log_px -0.0272 | KL -3524.24 + 153it [00:05, 29.66it/s] 157it [00:05, 30.15it/s] 161it [00:05, 30.49it/s] 165it [00:05, 29.97it/s] 169it [00:05, 30.33it/s] 173it [00:05, 30.27it/s] 177it [00:06, 30.15it/s] 181it [00:06, 29.94it/s] 184it [00:06, 29.37it/s] 188it [00:06, 30.25it/s] 192it [00:06, 30.08it/s] 196it [00:06, 29.42it/s] 196it [00:06, 29.06it/s] +2025-05-26 05:24:07,247 - INFO - Epoch: 36, Objective: tensor([5121.7222], device='cuda:0', grad_fn=), Loss: 0.02851932868361473, KL/n: 71.93126678466797 + 0it [00:00, ?it/s]2025-05-26 05:24:07,458 - INFO - [Epoch 037 | Batch 0000] IWAE-loss 6818.0244 | mean log_px -0.0470 | KL -3525.74 + 2it [00:00, 15.85it/s] 5it [00:00, 22.33it/s] 9it [00:00, 26.45it/s] 13it [00:00, 28.26it/s] 16it [00:00, 28.26it/s] 19it [00:00, 28.52it/s] 23it [00:00, 29.17it/s] 26it [00:00, 29.14it/s] 30it [00:01, 29.45it/s] 33it [00:01, 29.32it/s] 37it [00:01, 29.64it/s] 40it [00:01, 29.43it/s] 43it [00:01, 29.20it/s] 47it [00:01, 29.25it/s]2025-05-26 05:24:09,145 - INFO - [Epoch 037 | Batch 0050] IWAE-loss 6119.6309 | mean log_px -0.0371 | KL -3523.91 + 51it [00:01, 29.83it/s] 54it [00:01, 29.36it/s] 57it [00:01, 29.32it/s] 60it [00:02, 29.33it/s] 64it [00:02, 30.02it/s] 68it [00:02, 30.01it/s] 71it [00:02, 29.28it/s] 75it [00:02, 29.80it/s] 79it [00:02, 29.63it/s] 83it [00:02, 29.97it/s] 86it [00:02, 29.35it/s] 90it [00:03, 29.66it/s] 94it [00:03, 29.96it/s] 97it [00:03, 29.97it/s] 100it [00:03, 29.46it/s]2025-05-26 05:24:10,836 - INFO - [Epoch 037 | Batch 0100] IWAE-loss 6096.8174 | mean log_px -0.0368 | KL -3523.27 + 104it [00:03, 29.85it/s] 107it [00:03, 29.20it/s] 111it [00:03, 29.63it/s] 114it [00:03, 29.43it/s] 118it [00:04, 29.77it/s] 122it [00:04, 29.96it/s] 126it [00:04, 29.97it/s] 129it [00:04, 29.52it/s] 132it [00:04, 29.35it/s] 136it [00:04, 29.72it/s] 140it [00:04, 30.03it/s] 143it [00:04, 29.34it/s] 147it [00:05, 29.97it/s] 150it [00:05, 29.32it/s]2025-05-26 05:24:12,514 - INFO - [Epoch 037 | Batch 0150] IWAE-loss 5858.8037 | mean log_px -0.0333 | KL -3524.98 + 154it [00:05, 29.68it/s] 158it [00:05, 29.99it/s] 161it [00:05, 29.83it/s] 164it [00:05, 29.49it/s] 167it [00:05, 28.79it/s] 170it [00:05, 28.36it/s] 174it [00:05, 28.87it/s] 177it [00:06, 28.85it/s] 181it [00:06, 29.09it/s] 185it [00:06, 29.27it/s] 189it [00:06, 29.57it/s] 192it [00:06, 29.36it/s] 195it [00:06, 28.26it/s] 196it [00:06, 29.03it/s] +2025-05-26 05:24:14,128 - INFO - Epoch: 37, Objective: tensor([8412.7549], device='cuda:0', grad_fn=), Loss: 0.0734751895070076, KL/n: 71.82179260253906 + 0it [00:00, ?it/s]2025-05-26 05:24:14,340 - INFO - [Epoch 038 | Batch 0000] IWAE-loss 7314.7837 | mean log_px -0.0542 | KL -3518.82 + 2it [00:00, 15.67it/s] 5it [00:00, 23.11it/s] 8it [00:00, 25.10it/s] 12it [00:00, 26.67it/s] 16it [00:00, 28.96it/s] 20it [00:00, 29.35it/s] 23it [00:00, 28.80it/s] 27it [00:00, 29.83it/s] 30it [00:01, 29.03it/s] 34it [00:01, 29.55it/s] 38it [00:01, 30.00it/s] 41it [00:01, 29.19it/s] 45it [00:01, 29.74it/s] 48it [00:01, 29.53it/s]2025-05-26 05:24:16,018 - INFO - [Epoch 038 | Batch 0050] IWAE-loss 8369.5879 | mean log_px -0.0693 | KL -3520.88 + 52it [00:01, 30.12it/s] 56it [00:01, 30.06it/s] 59it [00:02, 29.57it/s] 62it [00:02, 29.46it/s] 66it [00:02, 30.02it/s] 69it [00:02, 29.39it/s] 73it [00:02, 29.24it/s] 77it [00:02, 29.99it/s] 80it [00:02, 29.41it/s] 84it [00:02, 30.08it/s] 87it [00:02, 29.39it/s] 91it [00:03, 29.57it/s] 95it [00:03, 30.13it/s] 99it [00:03, 30.14it/s]2025-05-26 05:24:17,706 - INFO - [Epoch 038 | Batch 0100] IWAE-loss 7469.8418 | mean log_px -0.0565 | KL -3516.50 + 103it [00:03, 29.98it/s] 106it [00:03, 29.31it/s] 110it [00:03, 29.64it/s] 113it [00:03, 29.44it/s] 117it [00:03, 29.83it/s] 121it [00:04, 30.05it/s] 124it [00:04, 29.33it/s] 128it [00:04, 30.16it/s] 132it [00:04, 29.46it/s] 136it [00:04, 30.06it/s] 140it [00:04, 29.46it/s] 144it [00:04, 29.79it/s] 148it [00:05, 29.96it/s]2025-05-26 05:24:19,386 - INFO - [Epoch 038 | Batch 0150] IWAE-loss 8205.4229 | mean log_px -0.0670 | KL -3514.02 + 151it [00:05, 29.40it/s] 155it [00:05, 29.96it/s] 158it [00:05, 29.14it/s] 162it [00:05, 29.06it/s] 166it [00:05, 29.28it/s] 170it [00:05, 29.47it/s] 173it [00:05, 28.82it/s] 177it [00:06, 28.88it/s] 180it [00:06, 29.06it/s] 183it [00:06, 28.84it/s] 186it [00:06, 28.79it/s] 189it [00:06, 28.98it/s] 192it [00:06, 28.76it/s] 195it [00:06, 27.64it/s] 196it [00:06, 29.01it/s] +2025-05-26 05:24:21,013 - INFO - Epoch: 38, Objective: tensor([6188.0107], device='cuda:0', grad_fn=), Loss: 0.039483845233917236, KL/n: 71.70988464355469 + 0it [00:00, ?it/s]2025-05-26 05:24:21,367 - INFO - [Epoch 039 | Batch 0000] IWAE-loss 5897.3501 | mean log_px -0.0341 | KL -3512.35 + 2it [00:00, 16.81it/s] 5it [00:00, 23.19it/s] 8it [00:00, 25.71it/s] 12it [00:00, 28.01it/s] 16it [00:00, 29.05it/s] 19it [00:00, 28.52it/s] 23it [00:00, 29.54it/s] 27it [00:00, 29.80it/s] 30it [00:01, 29.09it/s] 34it [00:01, 29.35it/s] 38it [00:01, 29.98it/s] 41it [00:01, 29.26it/s] 44it [00:01, 29.24it/s] 48it [00:01, 29.55it/s]2025-05-26 05:24:23,069 - INFO - [Epoch 039 | Batch 0050] IWAE-loss 7713.8794 | mean log_px -0.0600 | KL -3513.57 + 51it [00:01, 29.34it/s] 55it [00:01, 29.45it/s] 59it [00:02, 30.26it/s] 63it [00:02, 30.04it/s] 67it [00:02, 30.14it/s] 71it [00:02, 30.00it/s] 74it [00:02, 29.39it/s] 78it [00:02, 29.84it/s] 81it [00:02, 29.71it/s] 85it [00:02, 29.99it/s] 89it [00:03, 29.78it/s] 92it [00:03, 29.83it/s] 95it [00:03, 29.50it/s] 98it [00:03, 29.49it/s]2025-05-26 05:24:24,744 - INFO - [Epoch 039 | Batch 0100] IWAE-loss 8730.6738 | mean log_px -0.0745 | KL -3515.56 + 102it [00:03, 29.74it/s] 105it [00:03, 29.59it/s] 109it [00:03, 29.91it/s] 112it [00:03, 29.72it/s] 116it [00:03, 29.96it/s] 120it [00:04, 30.31it/s] 124it [00:04, 30.27it/s] 128it [00:04, 29.77it/s] 131it [00:04, 29.63it/s] 135it [00:04, 29.61it/s] 139it [00:04, 29.67it/s] 143it [00:04, 30.35it/s] 147it [00:04, 30.21it/s]2025-05-26 05:24:26,413 - INFO - [Epoch 039 | Batch 0150] IWAE-loss 6161.3574 | mean log_px -0.0379 | KL -3506.34 + 151it [00:05, 30.04it/s] 155it [00:05, 30.05it/s] 159it [00:05, 29.98it/s] 162it [00:05, 29.58it/s] 165it [00:05, 29.37it/s] 169it [00:05, 29.44it/s] 173it [00:05, 30.24it/s] 177it [00:05, 30.07it/s] 181it [00:06, 29.93it/s] 185it [00:06, 30.00it/s] 188it [00:06, 29.93it/s] 192it [00:06, 29.94it/s] 195it [00:06, 28.21it/s] 196it [00:06, 29.25it/s] +2025-05-26 05:24:28,005 - INFO - Epoch: 39, Objective: tensor([8232.8359], device='cuda:0', grad_fn=), Loss: 0.06686270982027054, KL/n: 71.5858154296875 + 0it [00:00, ?it/s]2025-05-26 05:24:28,224 - INFO - [Epoch 040 | Batch 0000] IWAE-loss 7030.0107 | mean log_px -0.0504 | KL -3502.05 + 1it [00:00, 8.75it/s] 5it [00:00, 22.72it/s] 8it [00:00, 25.03it/s] 11it [00:00, 26.29it/s] 15it [00:00, 27.81it/s] 18it [00:00, 28.01it/s] 22it [00:00, 28.41it/s] 26it [00:00, 29.30it/s] 29it [00:01, 28.64it/s] 32it [00:01, 28.98it/s] 35it [00:01, 28.65it/s] 38it [00:01, 28.69it/s] 41it [00:01, 28.63it/s] 44it [00:01, 28.72it/s] 47it [00:01, 28.63it/s] 50it [00:01, 28.60it/s]2025-05-26 05:24:29,953 - INFO - [Epoch 040 | Batch 0050] IWAE-loss 5363.6777 | mean log_px -0.0266 | KL -3504.19 + 53it [00:01, 28.55it/s] 56it [00:02, 28.51it/s] 59it [00:02, 28.66it/s] 62it [00:02, 28.53it/s] 65it [00:02, 28.43it/s] 68it [00:02, 28.81it/s] 71it [00:02, 29.15it/s] 74it [00:02, 29.33it/s] 77it [00:02, 29.07it/s] 80it [00:02, 29.01it/s] 83it [00:02, 28.98it/s] 86it [00:03, 28.83it/s] 89it [00:03, 28.87it/s] 92it [00:03, 28.98it/s] 95it [00:03, 28.86it/s] 98it [00:03, 28.79it/s]2025-05-26 05:24:31,684 - INFO - [Epoch 040 | Batch 0100] IWAE-loss 7653.5737 | mean log_px -0.0592 | KL -3508.40 + 101it [00:03, 28.73it/s] 104it [00:03, 28.60it/s] 107it [00:03, 28.42it/s] 110it [00:03, 28.72it/s] 113it [00:03, 28.43it/s] 116it [00:04, 28.71it/s] 119it [00:04, 28.81it/s] 122it [00:04, 28.87it/s] 125it [00:04, 28.87it/s] 128it [00:04, 29.08it/s] 131it [00:04, 29.16it/s] 134it [00:04, 29.03it/s] 137it [00:04, 29.11it/s] 140it [00:04, 29.07it/s] 143it [00:05, 28.94it/s] 146it [00:05, 29.11it/s] 149it [00:05, 28.96it/s]2025-05-26 05:24:33,414 - INFO - [Epoch 040 | Batch 0150] IWAE-loss 5078.6626 | mean log_px -0.0225 | KL -3500.41 + 152it [00:05, 29.10it/s] 155it [00:05, 28.96it/s] 158it [00:05, 29.11it/s] 161it [00:05, 28.36it/s] 165it [00:05, 29.48it/s] 168it [00:05, 28.70it/s] 172it [00:06, 28.98it/s] 175it [00:06, 28.16it/s] 178it [00:06, 28.06it/s] 182it [00:06, 28.82it/s] 186it [00:06, 29.37it/s] 189it [00:06, 28.52it/s] 193it [00:06, 28.73it/s] 196it [00:06, 28.71it/s] 196it [00:06, 28.31it/s] +2025-05-26 05:24:35,051 - INFO - Epoch: 40, Objective: tensor([5183.1216], device='cuda:0', grad_fn=), Loss: 0.023475281894207, KL/n: 71.48657989501953 + 0it [00:00, ?it/s]2025-05-26 05:24:35,432 - INFO - [Epoch 041 | Batch 0000] IWAE-loss 4403.5732 | mean log_px -0.0129 | KL -3502.67 + 1it [00:00, 9.72it/s] 4it [00:00, 20.12it/s] 8it [00:00, 25.83it/s] 11it [00:00, 17.75it/s] 15it [00:00, 21.91it/s] 18it [00:00, 23.20it/s] 22it [00:00, 25.78it/s] 25it [00:01, 26.13it/s] 29it [00:01, 27.09it/s] 33it [00:01, 28.22it/s] 36it [00:01, 28.43it/s] 40it [00:01, 28.63it/s] 44it [00:01, 29.71it/s] 47it [00:01, 28.70it/s]2025-05-26 05:24:37,276 - INFO - [Epoch 041 | Batch 0050] IWAE-loss 6013.5820 | mean log_px -0.0359 | KL -3499.60 + 51it [00:01, 29.28it/s] 54it [00:02, 29.15it/s] 58it [00:02, 29.62it/s] 61it [00:02, 29.63it/s] 65it [00:02, 29.45it/s] 69it [00:02, 30.27it/s] 73it [00:02, 29.99it/s] 77it [00:02, 30.31it/s] 81it [00:02, 29.42it/s] 85it [00:03, 29.58it/s] 89it [00:03, 29.80it/s] 92it [00:03, 29.06it/s] 95it [00:03, 29.25it/s] 99it [00:03, 29.89it/s]2025-05-26 05:24:38,966 - INFO - [Epoch 041 | Batch 0100] IWAE-loss 6300.6230 | mean log_px -0.0401 | KL -3497.01 + 102it [00:03, 28.83it/s] 105it [00:03, 28.89it/s] 109it [00:03, 29.11it/s] 112it [00:04, 28.56it/s] 115it [00:04, 28.71it/s] 118it [00:04, 28.24it/s] 121it [00:04, 28.39it/s] 124it [00:04, 28.58it/s] 127it [00:04, 28.02it/s] 131it [00:04, 28.67it/s] 134it [00:04, 28.52it/s] 138it [00:04, 29.00it/s] 141it [00:05, 28.14it/s] 144it [00:05, 27.88it/s] 147it [00:05, 27.30it/s] 150it [00:05, 26.05it/s]2025-05-26 05:24:40,769 - INFO - [Epoch 041 | Batch 0150] IWAE-loss 6032.0469 | mean log_px -0.0362 | KL -3499.16 + 153it [00:05, 26.81it/s] 156it [00:05, 27.61it/s] 159it [00:05, 27.83it/s] 163it [00:05, 28.69it/s] 167it [00:05, 29.23it/s] 170it [00:06, 29.17it/s] 174it [00:06, 29.59it/s] 178it [00:06, 29.80it/s] 182it [00:06, 29.68it/s] 186it [00:06, 30.83it/s] 190it [00:06, 30.58it/s] 194it [00:06, 30.50it/s] 196it [00:06, 28.01it/s] +2025-05-26 05:24:42,342 - INFO - Epoch: 41, Objective: tensor([6269.4609], device='cuda:0', grad_fn=), Loss: 0.0442596971988678, KL/n: 71.36074829101562 + 0it [00:00, ?it/s]2025-05-26 05:24:42,727 - INFO - [Epoch 042 | Batch 0000] IWAE-loss 7053.6738 | mean log_px -0.0508 | KL -3497.69 + 1it [00:00, 9.90it/s] 4it [00:00, 21.45it/s] 8it [00:00, 26.08it/s] 12it [00:00, 27.92it/s] 16it [00:00, 28.88it/s] 20it [00:00, 29.41it/s] 23it [00:00, 29.43it/s] 27it [00:00, 30.44it/s] 31it [00:01, 30.09it/s] 35it [00:01, 30.18it/s] 39it [00:01, 30.61it/s] 43it [00:01, 30.28it/s] 47it [00:01, 30.32it/s]2025-05-26 05:24:44,373 - INFO - [Epoch 042 | Batch 0050] IWAE-loss 8332.7178 | mean log_px -0.0690 | KL -3501.67 + 51it [00:01, 30.36it/s] 55it [00:01, 30.22it/s] 59it [00:02, 28.83it/s] 63it [00:02, 29.66it/s] 66it [00:02, 29.68it/s] 70it [00:02, 30.34it/s] 74it [00:02, 30.37it/s] 78it [00:02, 29.85it/s] 82it [00:02, 30.57it/s] 86it [00:02, 30.58it/s] 90it [00:03, 30.43it/s] 94it [00:03, 30.14it/s] 98it [00:03, 30.55it/s]2025-05-26 05:24:46,036 - INFO - [Epoch 042 | Batch 0100] IWAE-loss 4538.4160 | mean log_px -0.0149 | KL -3494.88 + 102it [00:03, 29.98it/s] 106it [00:03, 30.41it/s] 110it [00:03, 30.75it/s] 114it [00:03, 30.37it/s] 118it [00:03, 30.40it/s] 122it [00:04, 30.68it/s] 126it [00:04, 30.34it/s] 130it [00:04, 30.41it/s] 134it [00:04, 30.42it/s] 138it [00:04, 30.41it/s] 142it [00:04, 30.03it/s] 146it [00:04, 30.18it/s] 150it [00:05, 30.29it/s]2025-05-26 05:24:47,682 - INFO - [Epoch 042 | Batch 0150] IWAE-loss 6466.3130 | mean log_px -0.0425 | KL -3488.45 + 154it [00:05, 30.58it/s] 158it [00:05, 30.60it/s] 162it [00:05, 30.58it/s] 166it [00:05, 30.29it/s] 170it [00:05, 30.62it/s] 174it [00:05, 30.12it/s] 178it [00:05, 30.78it/s] 182it [00:06, 30.90it/s] 186it [00:06, 30.53it/s] 190it [00:06, 30.24it/s] 194it [00:06, 30.30it/s] 196it [00:06, 29.71it/s] +2025-05-26 05:24:49,237 - INFO - Epoch: 42, Objective: tensor([5149.8975], device='cuda:0', grad_fn=), Loss: 0.02193181775510311, KL/n: 71.23329162597656 + 0it [00:00, ?it/s]2025-05-26 05:24:49,445 - INFO - [Epoch 043 | Batch 0000] IWAE-loss 5306.7441 | mean log_px -0.0260 | KL -3489.69 + 2it [00:00, 15.45it/s] 6it [00:00, 24.36it/s] 9it [00:00, 25.87it/s] 13it [00:00, 27.90it/s] 16it [00:00, 28.24it/s] 20it [00:00, 28.79it/s] 24it [00:00, 29.92it/s] 27it [00:00, 29.27it/s] 31it [00:01, 29.99it/s] 34it [00:01, 29.45it/s] 38it [00:01, 30.38it/s] 42it [00:01, 30.43it/s] 46it [00:01, 30.49it/s] 50it [00:01, 30.23it/s]2025-05-26 05:24:51,102 - INFO - [Epoch 043 | Batch 0050] IWAE-loss 5717.6758 | mean log_px -0.0318 | KL -3488.62 + 54it [00:01, 30.25it/s] 58it [00:01, 30.31it/s] 62it [00:02, 30.78it/s] 66it [00:02, 30.14it/s] 70it [00:02, 30.90it/s] 74it [00:02, 30.80it/s] 78it [00:02, 30.36it/s] 82it [00:02, 30.45it/s] 86it [00:02, 30.63it/s] 90it [00:03, 30.32it/s] 94it [00:03, 30.62it/s] 98it [00:03, 30.64it/s]2025-05-26 05:24:52,741 - INFO - [Epoch 043 | Batch 0100] IWAE-loss 5621.8511 | mean log_px -0.0305 | KL -3485.84 + 102it [00:03, 30.26it/s] 106it [00:03, 30.51it/s] 110it [00:03, 30.12it/s] 114it [00:03, 30.23it/s] 118it [00:03, 29.99it/s] 122it [00:04, 30.37it/s] 126it [00:04, 30.12it/s] 130it [00:04, 30.52it/s] 134it [00:04, 30.19it/s] 138it [00:04, 30.50it/s] 142it [00:04, 30.54it/s] 146it [00:04, 30.02it/s] 150it [00:05, 30.57it/s]2025-05-26 05:24:54,395 - INFO - [Epoch 043 | Batch 0150] IWAE-loss 5314.7900 | mean log_px -0.0262 | KL -3484.09 + 154it [00:05, 30.57it/s] 158it [00:05, 30.50it/s] 162it [00:05, 30.18it/s] 166it [00:05, 30.58it/s] 170it [00:05, 30.21it/s] 174it [00:05, 30.59it/s] 178it [00:05, 30.26it/s] 182it [00:06, 30.26it/s] 186it [00:06, 30.33it/s] 190it [00:06, 30.62it/s] 194it [00:06, 30.24it/s] 196it [00:06, 29.76it/s] +2025-05-26 05:24:55,945 - INFO - Epoch: 43, Objective: tensor([6478.5850], device='cuda:0', grad_fn=), Loss: 0.04169122129678726, KL/n: 71.10687255859375 + 0it [00:00, ?it/s]2025-05-26 05:24:56,331 - INFO - [Epoch 044 | Batch 0000] IWAE-loss 5201.7139 | mean log_px -0.0246 | KL -3480.78 + 2it [00:00, 15.06it/s] 6it [00:00, 24.80it/s] 9it [00:00, 26.67it/s] 13it [00:00, 28.32it/s] 17it [00:00, 29.12it/s] 21it [00:00, 29.61it/s] 25it [00:00, 29.94it/s] 29it [00:01, 30.09it/s] 33it [00:01, 30.20it/s] 37it [00:01, 30.30it/s] 41it [00:01, 30.72it/s] 45it [00:01, 30.33it/s] 49it [00:01, 30.69it/s]2025-05-26 05:24:57,974 - INFO - [Epoch 044 | Batch 0050] IWAE-loss 6047.9131 | mean log_px -0.0366 | KL -3483.48 + 53it [00:01, 30.29it/s] 57it [00:01, 30.30it/s] 61it [00:02, 30.18it/s] 65it [00:02, 30.81it/s] 69it [00:02, 30.67it/s] 73it [00:02, 30.70it/s] 77it [00:02, 30.20it/s] 81it [00:02, 30.38it/s] 85it [00:02, 29.95it/s] 89it [00:02, 30.67it/s] 93it [00:03, 30.64it/s] 97it [00:03, 30.59it/s]2025-05-26 05:24:59,616 - INFO - [Epoch 044 | Batch 0100] IWAE-loss 5646.8691 | mean log_px -0.0309 | KL -3480.42 + 101it [00:03, 30.24it/s] 105it [00:03, 30.08it/s] 109it [00:03, 30.82it/s] 113it [00:03, 30.73it/s] 117it [00:03, 30.30it/s] 121it [00:04, 30.33it/s] 125it [00:04, 30.43it/s] 129it [00:04, 30.42it/s] 133it [00:04, 30.76it/s] 137it [00:04, 30.40it/s] 141it [00:04, 30.45it/s] 145it [00:04, 30.43it/s] 149it [00:04, 30.50it/s]2025-05-26 05:25:01,258 - INFO - [Epoch 044 | Batch 0150] IWAE-loss 4621.8511 | mean log_px -0.0163 | KL -3483.07 + 153it [00:05, 30.83it/s] 157it [00:05, 30.76it/s] 161it [00:05, 30.69it/s] 165it [00:05, 29.49it/s] 169it [00:05, 29.43it/s] 173it [00:05, 30.02it/s] 177it [00:05, 30.08it/s] 181it [00:06, 29.73it/s] 185it [00:06, 29.95it/s] 189it [00:06, 30.44it/s] 193it [00:06, 29.59it/s] 196it [00:06, 28.83it/s] 196it [00:06, 29.68it/s] +2025-05-26 05:25:02,854 - INFO - Epoch: 44, Objective: tensor([5385.1914], device='cuda:0', grad_fn=), Loss: 0.021883929148316383, KL/n: 70.9792251586914 + 0it [00:00, ?it/s]2025-05-26 05:25:03,070 - INFO - [Epoch 045 | Batch 0000] IWAE-loss 6117.1133 | mean log_px -0.0377 | KL -3478.24 + 2it [00:00, 15.19it/s] 6it [00:00, 24.04it/s] 9it [00:00, 25.73it/s] 13it [00:00, 27.41it/s] 17it [00:00, 29.06it/s] 20it [00:00, 28.74it/s] 24it [00:00, 29.84it/s] 27it [00:00, 29.24it/s] 31it [00:01, 29.55it/s] 35it [00:01, 30.31it/s] 39it [00:01, 30.35it/s] 43it [00:01, 29.89it/s] 46it [00:01, 29.71it/s] 50it [00:01, 30.12it/s]2025-05-26 05:25:04,736 - INFO - [Epoch 045 | Batch 0050] IWAE-loss 5906.2021 | mean log_px -0.0348 | KL -3469.90 + 54it [00:01, 29.60it/s] 57it [00:01, 29.67it/s] 60it [00:02, 29.51it/s] 64it [00:02, 29.66it/s] 68it [00:02, 30.01it/s] 72it [00:02, 30.26it/s] 76it [00:02, 29.62it/s] 79it [00:02, 29.15it/s] 82it [00:02, 28.81it/s] 85it [00:02, 28.64it/s] 88it [00:03, 28.69it/s] 92it [00:03, 29.30it/s] 96it [00:03, 29.53it/s] 99it [00:03, 29.43it/s]2025-05-26 05:25:06,433 - INFO - [Epoch 045 | Batch 0100] IWAE-loss 5693.9888 | mean log_px -0.0318 | KL -3467.85 + 102it [00:03, 29.48it/s] 106it [00:03, 29.88it/s] 110it [00:03, 30.25it/s] 114it [00:03, 29.43it/s] 118it [00:04, 29.80it/s] 122it [00:04, 30.11it/s] 126it [00:04, 30.13it/s] 130it [00:04, 30.04it/s] 134it [00:04, 29.47it/s] 138it [00:04, 29.59it/s] 142it [00:04, 30.10it/s] 146it [00:04, 30.22it/s] 150it [00:05, 29.83it/s]2025-05-26 05:25:08,109 - INFO - [Epoch 045 | Batch 0150] IWAE-loss 5339.2231 | mean log_px -0.0267 | KL -3473.57 + 153it [00:05, 29.83it/s] 157it [00:05, 30.10it/s] 161it [00:05, 30.09it/s] 165it [00:05, 29.67it/s] 168it [00:05, 29.55it/s] 172it [00:05, 30.03it/s] 176it [00:05, 30.14it/s] 180it [00:06, 29.46it/s] 184it [00:06, 29.51it/s] 188it [00:06, 30.10it/s] 192it [00:06, 30.08it/s] 196it [00:06, 29.41it/s] 196it [00:06, 29.21it/s] +2025-05-26 05:25:09,695 - INFO - Epoch: 45, Objective: tensor([7572.7393], device='cuda:0', grad_fn=), Loss: 0.04932942986488342, KL/n: 70.83316040039062 + 0it [00:00, ?it/s]2025-05-26 05:25:09,884 - INFO - [Epoch 046 | Batch 0000] IWAE-loss 5142.1602 | mean log_px -0.0239 | KL -3469.32 + 2it [00:00, 19.15it/s] 5it [00:00, 24.54it/s] 8it [00:00, 26.30it/s] 12it [00:00, 28.68it/s] 15it [00:00, 28.16it/s] 19it [00:00, 29.02it/s] 23it [00:00, 30.19it/s] 27it [00:00, 30.49it/s] 31it [00:01, 30.11it/s] 35it [00:01, 30.11it/s] 39it [00:01, 30.44it/s] 43it [00:01, 30.63it/s] 47it [00:01, 30.12it/s]2025-05-26 05:25:11,536 - INFO - [Epoch 046 | Batch 0050] IWAE-loss 7154.9971 | mean log_px -0.0526 | KL -3472.54 + 51it [00:01, 30.19it/s] 55it [00:01, 30.27it/s] 59it [00:01, 30.77it/s] 63it [00:02, 30.71it/s] 67it [00:02, 30.28it/s] 71it [00:02, 30.66it/s] 75it [00:02, 30.59it/s] 79it [00:02, 30.60it/s] 83it [00:02, 30.25it/s] 87it [00:02, 30.61it/s] 91it [00:03, 30.44it/s] 95it [00:03, 30.02it/s] 99it [00:03, 30.06it/s]2025-05-26 05:25:13,190 - INFO - [Epoch 046 | Batch 0100] IWAE-loss 5667.2842 | mean log_px -0.0315 | KL -3463.64 + 103it [00:03, 30.07it/s] 107it [00:03, 30.13it/s] 111it [00:03, 29.67it/s] 115it [00:03, 29.99it/s] 119it [00:03, 30.36it/s] 123it [00:04, 30.42it/s] 127it [00:04, 29.82it/s] 131it [00:04, 30.40it/s] 135it [00:04, 30.12it/s] 139it [00:04, 30.49it/s] 143it [00:04, 30.41it/s] 147it [00:04, 29.83it/s] 150it [00:05, 29.82it/s]2025-05-26 05:25:14,844 - INFO - [Epoch 046 | Batch 0150] IWAE-loss 5167.2905 | mean log_px -0.0243 | KL -3464.16 + 154it [00:05, 30.21it/s] 158it [00:05, 30.19it/s] 162it [00:05, 30.40it/s] 166it [00:05, 30.44it/s] 170it [00:05, 30.38it/s] 174it [00:05, 30.29it/s] 178it [00:05, 29.79it/s] 182it [00:06, 30.24it/s] 186it [00:06, 30.16it/s] 190it [00:06, 30.29it/s] 194it [00:06, 30.24it/s] 196it [00:06, 29.74it/s] +2025-05-26 05:25:16,409 - INFO - Epoch: 46, Objective: tensor([4936.7476], device='cuda:0', grad_fn=), Loss: 0.02368679828941822, KL/n: 70.708251953125 + 0it [00:00, ?it/s]2025-05-26 05:25:16,795 - INFO - [Epoch 047 | Batch 0000] IWAE-loss 7143.2705 | mean log_px -0.0526 | KL -3463.51 + 1it [00:00, 9.67it/s] 4it [00:00, 21.27it/s] 7it [00:00, 25.20it/s] 11it [00:00, 27.49it/s] 15it [00:00, 28.94it/s] 18it [00:00, 28.93it/s] 22it [00:00, 29.37it/s] 26it [00:00, 29.68it/s] 30it [00:01, 30.13it/s] 34it [00:01, 30.30it/s] 38it [00:01, 30.03it/s] 42it [00:01, 30.15it/s] 46it [00:01, 30.26it/s] 50it [00:01, 30.54it/s]2025-05-26 05:25:18,453 - INFO - [Epoch 047 | Batch 0050] IWAE-loss 5606.2593 | mean log_px -0.0306 | KL -3463.97 + 54it [00:01, 30.43it/s] 58it [00:01, 30.46it/s] 62it [00:02, 30.02it/s] 66it [00:02, 30.19it/s] 70it [00:02, 30.21it/s] 74it [00:02, 30.21it/s] 78it [00:02, 30.20it/s] 82it [00:02, 30.19it/s] 86it [00:02, 30.23it/s] 90it [00:03, 30.32it/s] 94it [00:03, 30.45it/s] 98it [00:03, 30.11it/s]2025-05-26 05:25:20,107 - INFO - [Epoch 047 | Batch 0100] IWAE-loss 5999.4395 | mean log_px -0.0363 | KL -3458.10 + 102it [00:03, 30.41it/s] 106it [00:03, 30.11it/s] 110it [00:03, 30.10it/s] 114it [00:03, 30.15it/s] 118it [00:03, 30.17it/s] 122it [00:04, 30.50it/s] 126it [00:04, 30.38it/s] 130it [00:04, 30.03it/s] 134it [00:04, 30.09it/s] 138it [00:04, 30.48it/s] 142it [00:04, 30.01it/s] 146it [00:04, 30.00it/s] 150it [00:05, 29.55it/s]2025-05-26 05:25:21,771 - INFO - [Epoch 047 | Batch 0150] IWAE-loss 6495.0508 | mean log_px -0.0434 | KL -3456.37 + 153it [00:05, 28.87it/s] 157it [00:05, 29.69it/s] 160it [00:05, 29.65it/s] 164it [00:05, 30.01it/s] 167it [00:05, 29.66it/s] 171it [00:05, 30.02it/s] 174it [00:05, 29.84it/s] 178it [00:05, 30.47it/s] 182it [00:06, 30.32it/s] 186it [00:06, 30.37it/s] 190it [00:06, 29.90it/s] 194it [00:06, 30.21it/s] 196it [00:06, 29.48it/s] +2025-05-26 05:25:23,354 - INFO - Epoch: 47, Objective: tensor([4586.9888], device='cuda:0', grad_fn=), Loss: 0.015991654247045517, KL/n: 70.57218933105469 + 0it [00:00, ?it/s]2025-05-26 05:25:23,569 - INFO - [Epoch 048 | Batch 0000] IWAE-loss 6657.1094 | mean log_px -0.0458 | KL -3454.53 + 1it [00:00, 9.25it/s] 5it [00:00, 22.92it/s] 8it [00:00, 25.35it/s] 11it [00:00, 26.77it/s] 15it [00:00, 27.83it/s] 19it [00:00, 28.97it/s] 22it [00:00, 28.60it/s] 26it [00:00, 29.06it/s] 30it [00:01, 30.20it/s] 34it [00:01, 29.58it/s] 38it [00:01, 30.06it/s] 42it [00:01, 30.45it/s] 46it [00:01, 30.52it/s] 50it [00:01, 29.91it/s]2025-05-26 05:25:25,231 - INFO - [Epoch 048 | Batch 0050] IWAE-loss 5901.9629 | mean log_px -0.0350 | KL -3453.03 + 54it [00:01, 30.04it/s] 58it [00:02, 30.43it/s] 62it [00:02, 30.69it/s] 66it [00:02, 30.48it/s] 70it [00:02, 30.59it/s] 74it [00:02, 30.22it/s] 78it [00:02, 30.67it/s] 82it [00:02, 30.07it/s] 86it [00:02, 30.12it/s] 90it [00:03, 30.79it/s] 94it [00:03, 30.60it/s] 98it [00:03, 30.78it/s]2025-05-26 05:25:26,880 - INFO - [Epoch 048 | Batch 0100] IWAE-loss 4750.5303 | mean log_px -0.0185 | KL -3452.55 + 102it [00:03, 30.04it/s] 106it [00:03, 30.67it/s] 110it [00:03, 30.72it/s] 114it [00:03, 30.66it/s] 118it [00:03, 30.05it/s] 122it [00:04, 30.61it/s] 126it [00:04, 30.75it/s] 130it [00:04, 30.07it/s] 134it [00:04, 30.21it/s] 138it [00:04, 30.83it/s] 142it [00:04, 30.76it/s] 146it [00:04, 30.35it/s] 150it [00:05, 30.76it/s]2025-05-26 05:25:28,513 - INFO - [Epoch 048 | Batch 0150] IWAE-loss 5010.0283 | mean log_px -0.0223 | KL -3451.66 + 154it [00:05, 30.03it/s] 158it [00:05, 30.77it/s] 162it [00:05, 30.56it/s] 166it [00:05, 30.68it/s] 170it [00:05, 30.23it/s] 174it [00:05, 30.31it/s] 178it [00:05, 30.37it/s] 182it [00:06, 30.51it/s] 186it [00:06, 30.23it/s] 190it [00:06, 30.33it/s] 194it [00:06, 30.72it/s] 196it [00:06, 29.75it/s] +2025-05-26 05:25:30,065 - INFO - Epoch: 48, Objective: tensor([6825.6470], device='cuda:0', grad_fn=), Loss: 0.048502352088689804, KL/n: 70.43475341796875 + 0it [00:00, ?it/s]2025-05-26 05:25:30,447 - INFO - [Epoch 049 | Batch 0000] IWAE-loss 5120.0049 | mean log_px -0.0239 | KL -3449.82 + 2it [00:00, 15.86it/s] 5it [00:00, 22.73it/s] 9it [00:00, 26.66it/s] 13it [00:00, 28.27it/s] 17it [00:00, 29.09it/s] 21it [00:00, 29.56it/s] 25it [00:00, 29.86it/s] 29it [00:01, 30.11it/s] 33it [00:01, 30.21it/s] 37it [00:01, 30.26it/s] 41it [00:01, 30.36it/s] 45it [00:01, 30.41it/s] 49it [00:01, 30.44it/s]2025-05-26 05:25:32,089 - INFO - [Epoch 049 | Batch 0050] IWAE-loss 5172.5244 | mean log_px -0.0247 | KL -3442.14 + 53it [00:01, 30.81it/s] 57it [00:01, 30.66it/s] 61it [00:02, 30.23it/s] 65it [00:02, 30.30it/s] 69it [00:02, 30.78it/s] 73it [00:02, 30.65it/s] 77it [00:02, 30.54it/s] 81it [00:02, 30.54it/s] 85it [00:02, 29.59it/s] 89it [00:02, 29.81it/s] 93it [00:03, 29.91it/s] 97it [00:03, 30.44it/s]2025-05-26 05:25:33,742 - INFO - [Epoch 049 | Batch 0100] IWAE-loss 6331.5757 | mean log_px -0.0412 | KL -3445.90 + 101it [00:03, 30.04it/s] 105it [00:03, 30.25it/s] 109it [00:03, 30.74it/s] 113it [00:03, 30.68it/s] 117it [00:03, 30.08it/s] 121it [00:04, 30.26it/s] 125it [00:04, 30.77it/s] 129it [00:04, 29.59it/s] 133it [00:04, 30.22it/s] 137it [00:04, 29.30it/s] 140it [00:04, 28.25it/s] 143it [00:04, 28.23it/s] 146it [00:04, 27.82it/s] 149it [00:05, 28.27it/s]2025-05-26 05:25:35,454 - INFO - [Epoch 049 | Batch 0150] IWAE-loss 7797.5391 | mean log_px -0.0622 | KL -3442.13 + 152it [00:05, 28.41it/s] 155it [00:05, 28.76it/s] 159it [00:05, 29.21it/s] 162it [00:05, 28.52it/s] 165it [00:05, 28.68it/s] 169it [00:05, 29.49it/s] 172it [00:05, 29.42it/s] 175it [00:05, 28.65it/s] 179it [00:06, 29.50it/s] 182it [00:06, 28.82it/s] 186it [00:06, 29.07it/s] 189it [00:06, 29.07it/s] 192it [00:06, 28.83it/s] 195it [00:06, 27.79it/s] 196it [00:06, 29.21it/s] +2025-05-26 05:25:37,076 - INFO - Epoch: 49, Objective: tensor([5318.8335], device='cuda:0', grad_fn=), Loss: 0.02061973512172699, KL/n: 70.28175354003906 + 0it [00:00, ?it/s]2025-05-26 05:25:37,294 - INFO - [Epoch 050 | Batch 0000] IWAE-loss 4784.5928 | mean log_px -0.0192 | KL -3439.95 + 2it [00:00, 15.60it/s] 5it [00:00, 21.63it/s] 9it [00:00, 25.39it/s] 12it [00:00, 26.84it/s] 15it [00:00, 27.04it/s] 18it [00:00, 27.91it/s] 21it [00:00, 27.75it/s] 24it [00:00, 27.99it/s] 27it [00:01, 28.21it/s] 30it [00:01, 28.40it/s] 33it [00:01, 27.70it/s] 36it [00:01, 28.00it/s] 39it [00:01, 27.65it/s] 43it [00:01, 28.43it/s] 46it [00:01, 28.43it/s] 49it [00:01, 28.72it/s]2025-05-26 05:25:39,054 - INFO - [Epoch 050 | Batch 0050] IWAE-loss 5931.2510 | mean log_px -0.0356 | KL -3441.72 + 52it [00:01, 28.80it/s] 55it [00:01, 28.83it/s] 59it [00:02, 29.28it/s] 62it [00:02, 29.05it/s] 65it [00:02, 29.06it/s] 68it [00:02, 28.70it/s] 71it [00:02, 28.89it/s] 74it [00:02, 29.13it/s] 77it [00:02, 28.12it/s] 80it [00:02, 28.17it/s] 84it [00:03, 28.14it/s] 87it [00:03, 28.06it/s] 90it [00:03, 27.81it/s] 94it [00:03, 28.52it/s] 97it [00:03, 28.41it/s] 100it [00:03, 28.57it/s]2025-05-26 05:25:40,804 - INFO - [Epoch 050 | Batch 0100] IWAE-loss 4650.6270 | mean log_px -0.0173 | KL -3437.96 + 103it [00:03, 28.65it/s] 106it [00:03, 28.82it/s] 110it [00:03, 28.61it/s] 114it [00:04, 29.29it/s] 117it [00:04, 29.41it/s] 120it [00:04, 29.37it/s] 123it [00:04, 28.83it/s] 127it [00:04, 29.84it/s] 130it [00:04, 29.79it/s] 133it [00:04, 28.89it/s] 137it [00:04, 29.15it/s] 141it [00:04, 29.80it/s] 144it [00:05, 29.14it/s] 148it [00:05, 29.48it/s]2025-05-26 05:25:42,508 - INFO - [Epoch 050 | Batch 0150] IWAE-loss 5496.5239 | mean log_px -0.0294 | KL -3436.08 + 151it [00:05, 29.14it/s] 155it [00:05, 29.46it/s] 158it [00:05, 29.27it/s] 161it [00:05, 28.98it/s] 165it [00:05, 29.47it/s] 168it [00:05, 29.48it/s] 171it [00:05, 28.77it/s] 175it [00:06, 28.75it/s] 178it [00:06, 29.04it/s] 182it [00:06, 29.33it/s] 185it [00:06, 28.59it/s] 189it [00:06, 29.41it/s] 192it [00:06, 28.80it/s] 195it [00:06, 27.27it/s] 196it [00:06, 28.30it/s] +2025-05-26 05:25:44,138 - INFO - Epoch: 50, Objective: tensor([6304.8389], device='cuda:0', grad_fn=), Loss: 0.04366378113627434, KL/n: 70.13224029541016 + 0it [00:00, ?it/s]2025-05-26 05:25:44,538 - INFO - [Epoch 051 | Batch 0000] IWAE-loss 6203.6821 | mean log_px -0.0396 | KL -3429.19 + 1it [00:00, 9.54it/s] 4it [00:00, 19.88it/s] 8it [00:00, 25.13it/s] 11it [00:00, 17.76it/s] 14it [00:00, 20.80it/s] 18it [00:00, 23.62it/s] 22it [00:00, 25.93it/s] 25it [00:01, 26.52it/s] 29it [00:01, 27.25it/s] 33it [00:01, 28.50it/s] 36it [00:01, 28.32it/s] 40it [00:01, 29.12it/s] 44it [00:01, 29.37it/s] 47it [00:01, 29.29it/s]2025-05-26 05:25:46,372 - INFO - [Epoch 051 | Batch 0050] IWAE-loss 5237.4727 | mean log_px -0.0257 | KL -3436.74 + 51it [00:01, 29.64it/s] 54it [00:02, 29.49it/s] 58it [00:02, 29.52it/s] 62it [00:02, 30.13it/s] 66it [00:02, 29.95it/s] 69it [00:02, 28.59it/s] 72it [00:02, 28.20it/s] 76it [00:02, 28.81it/s] 80it [00:02, 29.31it/s] 83it [00:03, 29.22it/s] 87it [00:03, 29.57it/s] 90it [00:03, 29.53it/s] 94it [00:03, 30.04it/s] 98it [00:03, 30.39it/s]2025-05-26 05:25:48,064 - INFO - [Epoch 051 | Batch 0100] IWAE-loss 4859.2930 | mean log_px -0.0203 | KL -3435.31 + 102it [00:03, 30.13it/s] 106it [00:03, 30.20it/s] 110it [00:03, 30.54it/s] 114it [00:04, 30.07it/s] 118it [00:04, 30.17it/s] 122it [00:04, 30.43it/s] 126it [00:04, 30.45it/s] 130it [00:04, 29.55it/s] 134it [00:04, 29.58it/s] 137it [00:04, 29.16it/s] 140it [00:04, 29.29it/s] 143it [00:05, 28.86it/s] 147it [00:05, 28.75it/s]2025-05-26 05:25:49,754 - INFO - [Epoch 051 | Batch 0150] IWAE-loss 4083.5815 | mean log_px -0.0093 | KL -3432.44 + 151it [00:05, 29.17it/s] 154it [00:05, 28.87it/s] 158it [00:05, 29.40it/s] 161it [00:05, 28.64it/s] 165it [00:05, 29.27it/s] 168it [00:05, 28.90it/s] 171it [00:06, 28.96it/s] 175it [00:06, 29.25it/s] 178it [00:06, 28.86it/s] 181it [00:06, 29.01it/s] 184it [00:06, 28.74it/s] 187it [00:06, 29.01it/s] 190it [00:06, 28.62it/s] 193it [00:06, 28.95it/s] 196it [00:06, 28.13it/s] 196it [00:06, 28.20it/s] +2025-05-26 05:25:51,399 - INFO - Epoch: 51, Objective: tensor([4970.8354], device='cuda:0', grad_fn=), Loss: 0.019495848566293716, KL/n: 69.98006439208984 + 0it [00:00, ?it/s]2025-05-26 05:25:51,788 - INFO - [Epoch 052 | Batch 0000] IWAE-loss 6093.7998 | mean log_px -0.0381 | KL -3425.07 + 2it [00:00, 15.67it/s] 5it [00:00, 22.30it/s] 9it [00:00, 26.25it/s] 13it [00:00, 27.99it/s] 17it [00:00, 28.59it/s] 21it [00:00, 29.94it/s] 25it [00:00, 30.18it/s] 29it [00:01, 30.31it/s] 33it [00:01, 30.50it/s] 37it [00:01, 30.25it/s] 41it [00:01, 30.54it/s] 45it [00:01, 30.27it/s] 49it [00:01, 30.68it/s]2025-05-26 05:25:53,437 - INFO - [Epoch 052 | Batch 0050] IWAE-loss 4860.5889 | mean log_px -0.0204 | KL -3430.13 + 53it [00:01, 30.72it/s] 57it [00:01, 30.64it/s] 61it [00:02, 30.74it/s] 65it [00:02, 30.41it/s] 69it [00:02, 30.49it/s] 73it [00:02, 30.74it/s] 77it [00:02, 30.85it/s] 81it [00:02, 30.82it/s] 85it [00:02, 30.48it/s] 89it [00:02, 30.55it/s] 93it [00:03, 30.81it/s] 97it [00:03, 30.77it/s]2025-05-26 05:25:55,060 - INFO - [Epoch 052 | Batch 0100] IWAE-loss 5270.4360 | mean log_px -0.0264 | KL -3425.16 + 101it [00:03, 30.72it/s] 105it [00:03, 30.40it/s] 109it [00:03, 30.75it/s] 113it [00:03, 30.68it/s] 117it [00:03, 30.29it/s] 121it [00:04, 29.98it/s] 125it [00:04, 30.83it/s] 129it [00:04, 30.58it/s] 133it [00:04, 30.10it/s] 137it [00:04, 29.72it/s] 141it [00:04, 30.16it/s] 145it [00:04, 29.99it/s] 149it [00:04, 29.23it/s]2025-05-26 05:25:56,723 - INFO - [Epoch 052 | Batch 0150] IWAE-loss 5292.9219 | mean log_px -0.0267 | KL -3426.06 + 153it [00:05, 29.53it/s] 157it [00:05, 30.01it/s] 161it [00:05, 30.22it/s] 165it [00:05, 30.03it/s] 169it [00:05, 30.16it/s] 173it [00:05, 30.54it/s] 177it [00:05, 30.61it/s] 181it [00:06, 30.28it/s] 185it [00:06, 29.82it/s] 188it [00:06, 29.82it/s] 192it [00:06, 30.52it/s] 196it [00:06, 29.51it/s] 196it [00:06, 29.73it/s] +2025-05-26 05:25:58,300 - INFO - Epoch: 52, Objective: tensor([4767.4678], device='cuda:0', grad_fn=), Loss: 0.018897708505392075, KL/n: 69.84442901611328 + 0it [00:00, ?it/s]2025-05-26 05:25:58,517 - INFO - [Epoch 053 | Batch 0000] IWAE-loss 4266.5762 | mean log_px -0.0121 | KL -3420.67 + 1it [00:00, 9.88it/s] 4it [00:00, 20.60it/s] 8it [00:00, 25.52it/s] 11it [00:00, 26.42it/s] 15it [00:00, 28.02it/s] 19it [00:00, 28.84it/s] 23it [00:00, 29.12it/s] 27it [00:00, 30.21it/s] 31it [00:01, 30.32it/s] 35it [00:01, 30.25it/s] 39it [00:01, 29.94it/s] 42it [00:01, 29.55it/s] 45it [00:01, 29.60it/s] 49it [00:01, 29.88it/s]2025-05-26 05:26:00,183 - INFO - [Epoch 053 | Batch 0050] IWAE-loss 5618.6821 | mean log_px -0.0314 | KL -3420.66 + 53it [00:01, 30.68it/s] 57it [00:01, 30.72it/s] 61it [00:02, 30.68it/s] 65it [00:02, 30.15it/s] 69it [00:02, 30.30it/s] 73it [00:02, 30.39it/s] 77it [00:02, 30.41it/s] 81it [00:02, 30.42it/s] 85it [00:02, 30.80it/s] 89it [00:03, 30.43it/s] 93it [00:03, 30.77it/s] 97it [00:03, 30.68it/s]2025-05-26 05:26:01,826 - INFO - [Epoch 053 | Batch 0100] IWAE-loss 4908.2837 | mean log_px -0.0213 | KL -3416.47 + 101it [00:03, 30.29it/s] 105it [00:03, 30.42it/s] 109it [00:03, 30.43it/s] 113it [00:03, 30.16it/s] 117it [00:03, 30.29it/s] 121it [00:04, 30.62it/s] 125it [00:04, 30.66it/s] 129it [00:04, 30.57it/s] 133it [00:04, 30.28it/s] 137it [00:04, 30.36it/s] 141it [00:04, 30.41it/s] 145it [00:04, 30.75it/s] 149it [00:04, 30.70it/s]2025-05-26 05:26:03,467 - INFO - [Epoch 053 | Batch 0150] IWAE-loss 5012.7490 | mean log_px -0.0229 | KL -3413.13 + 153it [00:05, 30.37it/s] 157it [00:05, 30.72it/s] 161it [00:05, 30.37it/s] 165it [00:05, 30.45it/s] 169it [00:05, 30.72it/s] 173it [00:05, 30.67it/s] 177it [00:05, 30.37it/s] 181it [00:06, 30.77it/s] 185it [00:06, 30.42it/s] 189it [00:06, 30.69it/s] 193it [00:06, 30.59it/s] 196it [00:06, 29.73it/s] +2025-05-26 05:26:05,022 - INFO - Epoch: 53, Objective: tensor([4726.3228], device='cuda:0', grad_fn=), Loss: 0.020918160676956177, KL/n: 69.6919937133789 + 0it [00:00, ?it/s]2025-05-26 05:26:05,229 - INFO - [Epoch 054 | Batch 0000] IWAE-loss 4591.0273 | mean log_px -0.0169 | KL -3411.38 + 2it [00:00, 15.83it/s] 5it [00:00, 22.30it/s] 8it [00:00, 25.51it/s] 11it [00:00, 26.74it/s] 15it [00:00, 27.76it/s] 19it [00:00, 28.79it/s] 23it [00:00, 29.26it/s] 27it [00:00, 29.54it/s] 31it [00:01, 29.82it/s] 35it [00:01, 29.94it/s] 38it [00:01, 29.85it/s] 42it [00:01, 29.81it/s] 46it [00:01, 30.08it/s] 50it [00:01, 30.23it/s]2025-05-26 05:26:06,903 - INFO - [Epoch 054 | Batch 0050] IWAE-loss 4861.4932 | mean log_px -0.0208 | KL -3407.42 + 54it [00:01, 30.52it/s] 58it [00:01, 30.46it/s] 62it [00:02, 29.88it/s] 65it [00:02, 29.38it/s] 69it [00:02, 29.76it/s] 72it [00:02, 29.62it/s] 76it [00:02, 30.19it/s] 80it [00:02, 30.15it/s] 84it [00:02, 30.10it/s] 88it [00:03, 29.54it/s] 92it [00:03, 29.98it/s] 96it [00:03, 30.16it/s] 100it [00:03, 29.12it/s]2025-05-26 05:26:08,592 - INFO - [Epoch 054 | Batch 0100] IWAE-loss 4739.4404 | mean log_px -0.0189 | KL -3413.11 + 103it [00:03, 29.00it/s] 106it [00:03, 28.48it/s] 110it [00:03, 29.68it/s] 113it [00:03, 29.21it/s] 117it [00:03, 29.66it/s] 121it [00:04, 29.78it/s] 124it [00:04, 29.76it/s] 128it [00:04, 29.87it/s] 131it [00:04, 29.53it/s] 135it [00:04, 29.75it/s] 139it [00:04, 30.07it/s] 143it [00:04, 30.20it/s] 147it [00:05, 29.62it/s]2025-05-26 05:26:10,263 - INFO - [Epoch 054 | Batch 0150] IWAE-loss 5010.0913 | mean log_px -0.0229 | KL -3407.54 + 151it [00:05, 29.92it/s] 155it [00:05, 30.29it/s] 159it [00:05, 30.38it/s] 163it [00:05, 30.02it/s] 167it [00:05, 30.38it/s] 171it [00:05, 30.36it/s] 175it [00:05, 30.21it/s] 179it [00:06, 29.70it/s] 183it [00:06, 30.39it/s] 187it [00:06, 30.38it/s] 191it [00:06, 30.36it/s] 195it [00:06, 28.48it/s] 196it [00:06, 29.31it/s] +2025-05-26 05:26:11,833 - INFO - Epoch: 54, Objective: tensor([5164.9370], device='cuda:0', grad_fn=), Loss: 0.027251476421952248, KL/n: 69.54241943359375 + 0it [00:00, ?it/s]2025-05-26 05:26:12,218 - INFO - [Epoch 055 | Batch 0000] IWAE-loss 4403.5381 | mean log_px -0.0143 | KL -3404.93 + 1it [00:00, 9.70it/s] 4it [00:00, 20.39it/s] 8it [00:00, 25.33it/s] 11it [00:00, 25.87it/s] 15it [00:00, 28.27it/s] 18it [00:00, 28.58it/s] 22it [00:00, 29.44it/s] 25it [00:00, 29.50it/s] 29it [00:01, 30.19it/s] 33it [00:01, 29.97it/s] 37it [00:01, 30.45it/s] 41it [00:01, 30.60it/s] 45it [00:01, 30.09it/s] 49it [00:01, 30.34it/s]2025-05-26 05:26:13,878 - INFO - [Epoch 055 | Batch 0050] IWAE-loss 4678.7397 | mean log_px -0.0181 | KL -3411.08 + 53it [00:01, 30.00it/s] 57it [00:01, 30.98it/s] 61it [00:02, 30.53it/s] 65it [00:02, 30.80it/s] 69it [00:02, 30.88it/s] 73it [00:02, 30.43it/s] 77it [00:02, 30.51it/s] 81it [00:02, 30.88it/s] 85it [00:02, 30.79it/s] 89it [00:03, 30.77it/s] 93it [00:03, 30.76it/s] 97it [00:03, 30.19it/s]2025-05-26 05:26:15,512 - INFO - [Epoch 055 | Batch 0100] IWAE-loss 4574.0552 | mean log_px -0.0168 | KL -3401.24 + 101it [00:03, 30.65it/s] 105it [00:03, 30.42it/s] 109it [00:03, 30.58it/s] 113it [00:03, 30.44it/s] 117it [00:03, 29.85it/s] 121it [00:04, 29.90it/s] 125it [00:04, 30.44it/s] 129it [00:04, 30.48it/s] 133it [00:04, 30.07it/s] 137it [00:04, 30.28it/s] 141it [00:04, 30.24it/s] 145it [00:04, 30.18it/s] 149it [00:04, 30.13it/s]2025-05-26 05:26:17,175 - INFO - [Epoch 055 | Batch 0150] IWAE-loss 4609.8857 | mean log_px -0.0173 | KL -3401.01 + 153it [00:05, 29.52it/s] 157it [00:05, 29.68it/s] 161it [00:05, 30.29it/s] 165it [00:05, 29.88it/s] 169it [00:05, 30.10it/s] 173it [00:05, 30.20it/s] 177it [00:05, 30.19it/s] 181it [00:06, 30.10it/s] 185it [00:06, 29.58it/s] 189it [00:06, 30.01it/s] 193it [00:06, 30.35it/s] 196it [00:06, 29.53it/s] +2025-05-26 05:26:18,768 - INFO - Epoch: 55, Objective: tensor([5018.3228], device='cuda:0', grad_fn=), Loss: 0.019467515870928764, KL/n: 69.36923217773438 + 0it [00:00, ?it/s]2025-05-26 05:26:18,985 - INFO - [Epoch 056 | Batch 0000] IWAE-loss 5319.4849 | mean log_px -0.0275 | KL -3396.40 + 1it [00:00, 9.94it/s] 4it [00:00, 20.07it/s] 8it [00:00, 24.79it/s] 12it [00:00, 26.90it/s] 15it [00:00, 27.80it/s] 18it [00:00, 28.00it/s] 21it [00:00, 27.98it/s] 24it [00:00, 28.47it/s] 28it [00:01, 29.21it/s] 31it [00:01, 29.30it/s] 34it [00:01, 29.31it/s] 38it [00:01, 30.16it/s] 42it [00:01, 30.27it/s] 46it [00:01, 29.54it/s] 49it [00:01, 29.65it/s]2025-05-26 05:26:20,679 - INFO - [Epoch 056 | Batch 0050] IWAE-loss 5900.0195 | mean log_px -0.0358 | KL -3395.66 + 53it [00:01, 29.72it/s] 57it [00:01, 30.10it/s] 61it [00:02, 30.47it/s] 65it [00:02, 29.77it/s] 69it [00:02, 29.84it/s] 73it [00:02, 30.19it/s] 77it [00:02, 30.18it/s] 81it [00:02, 30.47it/s] 85it [00:02, 29.93it/s] 88it [00:03, 29.72it/s] 92it [00:03, 29.97it/s] 95it [00:03, 29.76it/s] 99it [00:03, 29.71it/s]2025-05-26 05:26:22,346 - INFO - [Epoch 056 | Batch 0100] IWAE-loss 4808.5669 | mean log_px -0.0202 | KL -3396.12 + 102it [00:03, 29.69it/s] 106it [00:03, 29.82it/s] 110it [00:03, 30.19it/s] 114it [00:03, 30.28it/s] 118it [00:04, 30.29it/s] 122it [00:04, 29.58it/s] 126it [00:04, 30.18it/s] 130it [00:04, 29.90it/s] 133it [00:04, 29.64it/s] 137it [00:04, 30.05it/s] 141it [00:04, 30.38it/s] 145it [00:04, 30.30it/s] 149it [00:05, 30.20it/s]2025-05-26 05:26:24,021 - INFO - [Epoch 056 | Batch 0150] IWAE-loss 4848.2808 | mean log_px -0.0208 | KL -3392.14 + 153it [00:05, 30.05it/s] 157it [00:05, 30.00it/s] 160it [00:05, 29.34it/s] 164it [00:05, 29.39it/s] 168it [00:05, 29.20it/s] 172it [00:05, 29.97it/s] 175it [00:05, 29.53it/s] 178it [00:06, 29.35it/s] 182it [00:06, 29.84it/s] 186it [00:06, 29.98it/s] 190it [00:06, 30.00it/s] 193it [00:06, 29.41it/s] 196it [00:06, 28.92it/s] 196it [00:06, 29.17it/s] +2025-05-26 05:26:25,617 - INFO - Epoch: 56, Objective: tensor([5214.8564], device='cuda:0', grad_fn=), Loss: 0.023822709918022156, KL/n: 69.22828674316406 + 0it [00:00, ?it/s]2025-05-26 05:26:25,997 - INFO - [Epoch 057 | Batch 0000] IWAE-loss 5053.6621 | mean log_px -0.0237 | KL -3393.37 + 1it [00:00, 9.88it/s] 4it [00:00, 20.45it/s] 8it [00:00, 25.04it/s] 12it [00:00, 27.75it/s] 15it [00:00, 27.41it/s] 19it [00:00, 28.94it/s] 22it [00:00, 28.39it/s] 26it [00:00, 28.74it/s] 30it [00:01, 29.62it/s] 33it [00:01, 28.83it/s] 37it [00:01, 29.20it/s] 41it [00:01, 29.74it/s] 44it [00:01, 29.14it/s] 48it [00:01, 29.52it/s]2025-05-26 05:26:27,697 - INFO - [Epoch 057 | Batch 0050] IWAE-loss 4763.9077 | mean log_px -0.0197 | KL -3386.74 + 52it [00:01, 29.89it/s] 55it [00:01, 29.24it/s] 58it [00:02, 29.28it/s] 62it [00:02, 22.25it/s] 65it [00:02, 23.87it/s] 68it [00:02, 25.24it/s] 71it [00:02, 26.37it/s] 74it [00:02, 26.94it/s] 77it [00:02, 27.45it/s] 81it [00:02, 28.68it/s] 84it [00:03, 28.26it/s] 88it [00:03, 28.59it/s] 92it [00:03, 29.44it/s] 95it [00:03, 28.76it/s] 99it [00:03, 29.11it/s]2025-05-26 05:26:29,534 - INFO - [Epoch 057 | Batch 0100] IWAE-loss 4860.6079 | mean log_px -0.0211 | KL -3386.66 + 102it [00:03, 29.09it/s] 106it [00:03, 29.17it/s] 110it [00:03, 29.53it/s] 113it [00:04, 29.24it/s] 117it [00:04, 29.69it/s] 120it [00:04, 29.73it/s] 123it [00:04, 29.04it/s] 126it [00:04, 29.30it/s] 130it [00:04, 29.80it/s] 133it [00:04, 28.68it/s] 136it [00:04, 28.76it/s] 139it [00:04, 27.39it/s] 143it [00:05, 28.17it/s] 146it [00:05, 27.99it/s] 150it [00:05, 28.54it/s]2025-05-26 05:26:31,266 - INFO - [Epoch 057 | Batch 0150] IWAE-loss 4931.0508 | mean log_px -0.0221 | KL -3385.35 + 153it [00:05, 28.66it/s] 156it [00:05, 28.99it/s] 159it [00:05, 29.01it/s] 162it [00:05, 28.61it/s] 165it [00:05, 28.32it/s] 169it [00:05, 28.52it/s] 173it [00:06, 29.09it/s] 176it [00:06, 28.56it/s] 179it [00:06, 28.71it/s] 183it [00:06, 28.93it/s] 187it [00:06, 29.03it/s] 191it [00:06, 29.31it/s] 195it [00:06, 28.28it/s] 196it [00:06, 28.06it/s] +2025-05-26 05:26:32,895 - INFO - Epoch: 57, Objective: tensor([5121.4829], device='cuda:0', grad_fn=), Loss: 0.024134118109941483, KL/n: 69.05847930908203 + 0it [00:00, ?it/s]2025-05-26 05:26:33,294 - INFO - [Epoch 058 | Batch 0000] IWAE-loss 4614.4980 | mean log_px -0.0176 | KL -3379.13 + 1it [00:00, 9.91it/s] 4it [00:00, 20.88it/s] 8it [00:00, 26.67it/s] 11it [00:00, 27.45it/s] 15it [00:00, 28.98it/s] 19it [00:00, 30.12it/s] 22it [00:00, 29.54it/s] 26it [00:00, 30.52it/s] 30it [00:01, 30.67it/s] 34it [00:01, 30.69it/s] 38it [00:01, 30.04it/s] 42it [00:01, 30.38it/s] 46it [00:01, 30.88it/s] 50it [00:01, 30.10it/s]2025-05-26 05:26:34,929 - INFO - [Epoch 058 | Batch 0050] IWAE-loss 4743.3682 | mean log_px -0.0195 | KL -3380.50 + 54it [00:01, 30.76it/s] 58it [00:01, 30.33it/s] 62it [00:02, 30.40it/s] 66it [00:02, 30.87it/s] 70it [00:02, 30.14it/s] 74it [00:02, 30.67it/s] 78it [00:02, 30.66it/s] 82it [00:02, 30.76it/s] 86it [00:02, 30.05it/s] 90it [00:03, 30.42it/s] 94it [00:03, 30.52it/s] 98it [00:03, 30.92it/s]2025-05-26 05:26:36,572 - INFO - [Epoch 058 | Batch 0100] IWAE-loss 4392.2617 | mean log_px -0.0145 | KL -3380.00 + 102it [00:03, 30.81it/s] 106it [00:03, 30.13it/s] 110it [00:03, 30.80it/s] 114it [00:03, 30.69it/s] 118it [00:03, 30.29it/s] 122it [00:04, 30.77it/s] 126it [00:04, 30.21it/s] 130it [00:04, 30.47it/s] 134it [00:04, 30.53it/s] 138it [00:04, 30.94it/s] 142it [00:04, 30.32it/s] 146it [00:04, 30.29it/s] 150it [00:04, 30.66it/s]2025-05-26 05:26:38,207 - INFO - [Epoch 058 | Batch 0150] IWAE-loss 4639.5186 | mean log_px -0.0180 | KL -3378.82 + 154it [00:05, 30.58it/s] 158it [00:05, 30.62it/s] 162it [00:05, 30.91it/s] 166it [00:05, 30.94it/s] 170it [00:05, 30.25it/s] 174it [00:05, 30.53it/s] 178it [00:05, 30.93it/s] 182it [00:06, 30.47it/s] 186it [00:06, 30.81it/s] 190it [00:06, 30.27it/s] 194it [00:06, 30.54it/s] 196it [00:06, 29.94it/s] +2025-05-26 05:26:39,752 - INFO - Epoch: 58, Objective: tensor([5821.3262], device='cuda:0', grad_fn=), Loss: 0.025807034224271774, KL/n: 68.87557983398438 + 0it [00:00, ?it/s]2025-05-26 05:26:39,949 - INFO - [Epoch 059 | Batch 0000] IWAE-loss 4289.1025 | mean log_px -0.0130 | KL -3378.00 + 2it [00:00, 17.74it/s] 5it [00:00, 23.87it/s] 9it [00:00, 26.43it/s] 12it [00:00, 27.39it/s] 16it [00:00, 28.58it/s] 20it [00:00, 29.22it/s] 23it [00:00, 29.20it/s] 27it [00:00, 29.55it/s] 30it [00:01, 29.52it/s] 33it [00:01, 29.63it/s] 37it [00:01, 30.06it/s] 40it [00:01, 29.25it/s] 44it [00:01, 30.14it/s] 48it [00:01, 29.70it/s]2025-05-26 05:26:41,630 - INFO - [Epoch 059 | Batch 0050] IWAE-loss 4696.3696 | mean log_px -0.0189 | KL -3372.04 + 52it [00:01, 29.75it/s] 55it [00:01, 29.54it/s] 58it [00:02, 29.18it/s] 61it [00:02, 29.19it/s] 65it [00:02, 29.96it/s] 69it [00:02, 30.22it/s] 73it [00:02, 29.86it/s] 76it [00:02, 29.83it/s] 80it [00:02, 30.57it/s] 84it [00:02, 30.49it/s] 88it [00:02, 30.31it/s] 92it [00:03, 29.85it/s] 96it [00:03, 29.99it/s] 100it [00:03, 30.25it/s]2025-05-26 05:26:43,301 - INFO - [Epoch 059 | Batch 0100] IWAE-loss 5113.4785 | mean log_px -0.0249 | KL -3368.78 + 104it [00:03, 29.62it/s] 108it [00:03, 30.45it/s] 112it [00:03, 30.43it/s] 116it [00:03, 30.03it/s] 120it [00:04, 29.64it/s] 123it [00:04, 29.00it/s] 126it [00:04, 29.15it/s] 129it [00:04, 28.67it/s] 133it [00:04, 28.94it/s] 137it [00:04, 29.23it/s] 140it [00:04, 28.61it/s] 144it [00:04, 28.94it/s] 147it [00:05, 28.69it/s] 150it [00:05, 28.89it/s]2025-05-26 05:26:45,020 - INFO - [Epoch 059 | Batch 0150] IWAE-loss 4628.6143 | mean log_px -0.0181 | KL -3363.96 + 154it [00:05, 29.08it/s] 157it [00:05, 29.21it/s] 160it [00:05, 28.62it/s] 164it [00:05, 29.29it/s] 168it [00:05, 29.08it/s] 172it [00:05, 29.86it/s] 175it [00:05, 29.33it/s] 179it [00:06, 29.68it/s] 183it [00:06, 29.88it/s] 187it [00:06, 30.59it/s] 191it [00:06, 30.13it/s] 195it [00:06, 29.30it/s] 196it [00:06, 29.22it/s] +2025-05-26 05:26:46,589 - INFO - Epoch: 59, Objective: tensor([4434.2725], device='cuda:0', grad_fn=), Loss: 0.016963569447398186, KL/n: 68.69198608398438 + 0it [00:00, ?it/s]2025-05-26 05:26:46,797 - INFO - [Epoch 060 | Batch 0000] IWAE-loss 5351.4604 | mean log_px -0.0284 | KL -3363.75 + 2it [00:00, 15.07it/s] 6it [00:00, 24.22it/s] 9it [00:00, 26.22it/s] 13it [00:00, 28.09it/s] 16it [00:00, 28.55it/s] 20it [00:00, 29.11it/s] 23it [00:00, 29.04it/s] 27it [00:00, 29.28it/s] 31it [00:01, 30.08it/s] 35it [00:01, 30.20it/s] 39it [00:01, 29.44it/s] 43it [00:01, 30.11it/s] 47it [00:01, 29.59it/s]2025-05-26 05:26:48,465 - INFO - [Epoch 060 | Batch 0050] IWAE-loss 6476.6641 | mean log_px -0.0445 | KL -3362.14 + 51it [00:01, 30.24it/s] 55it [00:01, 30.22it/s] 59it [00:02, 30.32it/s] 63it [00:02, 30.20it/s] 67it [00:02, 29.80it/s] 70it [00:02, 29.66it/s] 74it [00:02, 30.23it/s] 78it [00:02, 30.35it/s] 82it [00:02, 29.57it/s] 85it [00:02, 29.34it/s] 89it [00:03, 29.72it/s] 93it [00:03, 30.00it/s] 96it [00:03, 29.38it/s] 100it [00:03, 29.65it/s]2025-05-26 05:26:50,142 - INFO - [Epoch 060 | Batch 0100] IWAE-loss 4837.9287 | mean log_px -0.0211 | KL -3359.56 + 104it [00:03, 30.46it/s] 108it [00:03, 29.82it/s] 112it [00:03, 29.97it/s] 116it [00:03, 30.00it/s] 120it [00:04, 30.04it/s] 124it [00:04, 30.44it/s] 128it [00:04, 30.34it/s] 132it [00:04, 29.63it/s] 136it [00:04, 30.17it/s] 140it [00:04, 30.13it/s] 144it [00:04, 29.88it/s] 147it [00:04, 29.75it/s]2025-05-26 05:26:51,800 - INFO - [Epoch 060 | Batch 0150] IWAE-loss 4506.9629 | mean log_px -0.0164 | KL -3356.25 + 151it [00:05, 30.28it/s] 155it [00:05, 30.48it/s] 159it [00:05, 29.68it/s] 163it [00:05, 29.82it/s] 167it [00:05, 30.32it/s] 171it [00:05, 29.70it/s] 175it [00:05, 30.27it/s] 179it [00:06, 30.30it/s] 183it [00:06, 30.09it/s] 187it [00:06, 30.01it/s] 191it [00:06, 30.04it/s] 195it [00:06, 28.50it/s] 196it [00:06, 29.42it/s] +2025-05-26 05:26:53,379 - INFO - Epoch: 60, Objective: tensor([5288.2446], device='cuda:0', grad_fn=), Loss: 0.02729859948158264, KL/n: 68.52053833007812 + 0it [00:00, ?it/s]2025-05-26 05:26:53,902 - INFO - [Epoch 061 | Batch 0000] IWAE-loss 4701.5654 | mean log_px -0.0193 | KL -3353.15 + 1it [00:00, 4.27it/s] 4it [00:00, 13.54it/s] 8it [00:00, 20.24it/s] 12it [00:00, 24.23it/s] 15it [00:00, 25.13it/s] 19it [00:00, 26.48it/s] 23it [00:00, 27.62it/s] 27it [00:01, 28.32it/s] 31it [00:01, 29.25it/s] 34it [00:01, 28.63it/s] 37it [00:01, 28.84it/s] 41it [00:01, 29.80it/s] 44it [00:01, 29.00it/s] 48it [00:01, 29.19it/s]2025-05-26 05:26:55,597 - INFO - [Epoch 061 | Batch 0050] IWAE-loss 4651.4004 | mean log_px -0.0185 | KL -3355.76 + 52it [00:01, 29.62it/s] 55it [00:02, 29.19it/s] 59it [00:02, 29.26it/s] 63it [00:02, 29.91it/s] 66it [00:02, 29.19it/s] 70it [00:02, 29.54it/s] 73it [00:02, 29.33it/s] 77it [00:02, 29.42it/s] 81it [00:02, 29.87it/s] 85it [00:03, 30.28it/s] 89it [00:03, 29.58it/s] 93it [00:03, 29.62it/s] 97it [00:03, 29.89it/s] 100it [00:03, 29.71it/s]2025-05-26 05:26:57,281 - INFO - [Epoch 061 | Batch 0100] IWAE-loss 7465.7324 | mean log_px -0.0588 | KL -3352.10 + 103it [00:03, 29.55it/s] 107it [00:03, 30.32it/s] 111it [00:03, 30.13it/s] 115it [00:04, 30.05it/s] 119it [00:04, 29.21it/s] 123it [00:04, 29.39it/s] 127it [00:04, 29.49it/s] 131it [00:04, 30.12it/s] 135it [00:04, 30.04it/s] 139it [00:04, 29.34it/s] 143it [00:05, 29.45it/s] 147it [00:05, 30.04it/s]2025-05-26 05:26:58,974 - INFO - [Epoch 061 | Batch 0150] IWAE-loss 4236.6489 | mean log_px -0.0127 | KL -3349.10 + 151it [00:05, 29.33it/s] 154it [00:05, 29.28it/s] 158it [00:05, 29.71it/s] 161it [00:05, 29.05it/s] 165it [00:05, 29.29it/s] 169it [00:05, 29.38it/s] 173it [00:06, 29.41it/s] 177it [00:06, 29.79it/s] 181it [00:06, 30.02it/s] 184it [00:06, 29.16it/s] 187it [00:06, 29.23it/s] 191it [00:06, 29.99it/s] 194it [00:06, 29.26it/s] 196it [00:06, 28.43it/s] +2025-05-26 05:27:00,576 - INFO - Epoch: 61, Objective: tensor([5131.7832], device='cuda:0', grad_fn=), Loss: 0.025880202651023865, KL/n: 68.3313217163086 + 0it [00:00, ?it/s]2025-05-26 05:27:00,963 - INFO - [Epoch 062 | Batch 0000] IWAE-loss 4730.7261 | mean log_px -0.0198 | KL -3347.98 + 2it [00:00, 15.57it/s] 5it [00:00, 22.22it/s] 9it [00:00, 26.94it/s] 12it [00:00, 27.58it/s] 15it [00:00, 28.25it/s] 19it [00:00, 29.36it/s] 22it [00:00, 29.05it/s] 26it [00:00, 29.74it/s] 30it [00:01, 29.32it/s] 34it [00:01, 29.75it/s] 38it [00:01, 29.67it/s] 42it [00:01, 30.41it/s] 46it [00:01, 30.01it/s] 50it [00:01, 29.88it/s]2025-05-26 05:27:02,625 - INFO - [Epoch 062 | Batch 0050] IWAE-loss 4250.7446 | mean log_px -0.0129 | KL -3345.10 + 53it [00:01, 29.86it/s] 57it [00:01, 30.00it/s] 61it [00:02, 30.11it/s] 65it [00:02, 30.71it/s] 69it [00:02, 29.81it/s] 73it [00:02, 30.19it/s] 77it [00:02, 30.69it/s] 81it [00:02, 30.14it/s] 85it [00:02, 30.58it/s] 89it [00:03, 30.56it/s] 93it [00:03, 30.10it/s] 97it [00:03, 30.60it/s]2025-05-26 05:27:04,278 - INFO - [Epoch 062 | Batch 0100] IWAE-loss 4104.8604 | mean log_px -0.0109 | KL -3345.21 + 101it [00:03, 30.34it/s] 105it [00:03, 30.16it/s] 109it [00:03, 30.65it/s] 113it [00:03, 29.71it/s] 116it [00:03, 29.26it/s] 120it [00:04, 30.36it/s] 124it [00:04, 30.31it/s] 128it [00:04, 30.20it/s] 132it [00:04, 29.83it/s] 136it [00:04, 29.90it/s] 140it [00:04, 30.30it/s] 144it [00:04, 30.12it/s] 148it [00:04, 30.10it/s]2025-05-26 05:27:05,950 - INFO - [Epoch 062 | Batch 0150] IWAE-loss 3983.5308 | mean log_px -0.0092 | KL -3338.70 + 152it [00:05, 30.16it/s] 156it [00:05, 30.19it/s] 160it [00:05, 30.10it/s] 164it [00:05, 29.55it/s] 168it [00:05, 30.13it/s] 172it [00:05, 29.94it/s] 175it [00:05, 29.33it/s] 178it [00:05, 29.09it/s] 182it [00:06, 29.70it/s] 186it [00:06, 29.84it/s] 190it [00:06, 29.72it/s] 194it [00:06, 29.90it/s] 196it [00:06, 29.41it/s] +2025-05-26 05:27:07,542 - INFO - Epoch: 62, Objective: tensor([5111.1948], device='cuda:0', grad_fn=), Loss: 0.021965859457850456, KL/n: 68.15470886230469 + 0it [00:00, ?it/s]2025-05-26 05:27:07,753 - INFO - [Epoch 063 | Batch 0000] IWAE-loss 4222.7715 | mean log_px -0.0126 | KL -3340.34 + 1it [00:00, 9.82it/s] 4it [00:00, 20.97it/s] 8it [00:00, 26.68it/s] 11it [00:00, 27.29it/s] 15it [00:00, 28.65it/s] 19it [00:00, 29.51it/s] 22it [00:00, 28.80it/s] 26it [00:00, 29.68it/s] 29it [00:01, 29.63it/s] 33it [00:01, 29.76it/s] 36it [00:01, 29.67it/s] 40it [00:01, 30.49it/s] 44it [00:01, 30.34it/s] 48it [00:01, 30.44it/s]2025-05-26 05:27:09,418 - INFO - [Epoch 063 | Batch 0050] IWAE-loss 5249.9072 | mean log_px -0.0273 | KL -3337.54 + 52it [00:01, 29.82it/s] 56it [00:01, 29.95it/s] 60it [00:02, 30.04it/s] 64it [00:02, 30.60it/s] 68it [00:02, 30.58it/s] 72it [00:02, 30.11it/s] 76it [00:02, 30.28it/s] 80it [00:02, 30.24it/s] 84it [00:02, 30.00it/s] 88it [00:02, 30.65it/s] 92it [00:03, 30.58it/s] 96it [00:03, 30.19it/s] 100it [00:03, 30.35it/s]2025-05-26 05:27:11,073 - INFO - [Epoch 063 | Batch 0100] IWAE-loss 4134.0146 | mean log_px -0.0115 | KL -3329.93 + 104it [00:03, 29.64it/s] 107it [00:03, 28.88it/s] 110it [00:03, 28.35it/s] 114it [00:03, 28.78it/s] 117it [00:03, 28.68it/s] 121it [00:04, 28.80it/s] 125it [00:04, 29.26it/s] 129it [00:04, 29.89it/s] 132it [00:04, 29.63it/s] 136it [00:04, 29.77it/s] 140it [00:04, 30.09it/s] 144it [00:04, 30.13it/s] 148it [00:05, 30.23it/s]2025-05-26 05:27:12,768 - INFO - [Epoch 063 | Batch 0150] IWAE-loss 5663.5557 | mean log_px -0.0333 | KL -3329.52 + 152it [00:05, 29.61it/s] 156it [00:05, 30.34it/s] 160it [00:05, 29.90it/s] 164it [00:05, 30.00it/s] 168it [00:05, 30.08it/s] 172it [00:05, 30.73it/s] 176it [00:05, 30.62it/s] 180it [00:06, 30.59it/s] 184it [00:06, 30.51it/s] 188it [00:06, 30.47it/s] 192it [00:06, 29.88it/s] 195it [00:06, 28.94it/s] 196it [00:06, 29.44it/s] +2025-05-26 05:27:14,325 - INFO - Epoch: 63, Objective: tensor([3992.4661], device='cuda:0', grad_fn=), Loss: 0.00966509897261858, KL/n: 67.97527313232422 + 0it [00:00, ?it/s]2025-05-26 05:27:14,720 - INFO - [Epoch 064 | Batch 0000] IWAE-loss 4626.7886 | mean log_px -0.0185 | KL -3331.43 + 2it [00:00, 15.58it/s] 5it [00:00, 22.64it/s] 9it [00:00, 26.46it/s] 13it [00:00, 27.99it/s] 16it [00:00, 28.11it/s] 20it [00:00, 29.48it/s] 23it [00:00, 29.17it/s] 27it [00:00, 30.24it/s] 31it [00:01, 29.97it/s] 35it [00:01, 30.14it/s] 39it [00:01, 30.25it/s] 43it [00:01, 29.96it/s] 46it [00:01, 29.74it/s] 49it [00:01, 29.53it/s]2025-05-26 05:27:16,380 - INFO - [Epoch 064 | Batch 0050] IWAE-loss 4621.3721 | mean log_px -0.0185 | KL -3327.45 + 53it [00:01, 29.85it/s] 57it [00:01, 30.73it/s] 61it [00:02, 30.21it/s] 65it [00:02, 30.00it/s] 69it [00:02, 30.83it/s] 73it [00:02, 30.26it/s] 77it [00:02, 30.15it/s] 81it [00:02, 30.87it/s] 85it [00:02, 30.17it/s] 89it [00:03, 30.79it/s] 93it [00:03, 30.16it/s] 97it [00:03, 30.13it/s]2025-05-26 05:27:18,022 - INFO - [Epoch 064 | Batch 0100] IWAE-loss 5079.6343 | mean log_px -0.0250 | KL -3326.46 + 101it [00:03, 30.74it/s] 105it [00:03, 30.30it/s] 109it [00:03, 30.27it/s] 113it [00:03, 30.77it/s] 117it [00:03, 30.24it/s] 121it [00:04, 30.17it/s] 125it [00:04, 30.79it/s] 129it [00:04, 30.16it/s] 133it [00:04, 30.30it/s] 137it [00:04, 30.13it/s] 141it [00:04, 30.84it/s] 145it [00:04, 30.24it/s] 149it [00:04, 30.23it/s]2025-05-26 05:27:19,671 - INFO - [Epoch 064 | Batch 0150] IWAE-loss 5125.8848 | mean log_px -0.0258 | KL -3318.95 + 153it [00:05, 30.74it/s] 157it [00:05, 30.17it/s] 161it [00:05, 30.07it/s] 165it [00:05, 30.81it/s] 169it [00:05, 30.11it/s] 173it [00:05, 30.10it/s] 177it [00:05, 30.62it/s] 181it [00:06, 29.85it/s] 185it [00:06, 30.73it/s] 189it [00:06, 30.06it/s] 193it [00:06, 30.05it/s] 196it [00:06, 29.73it/s] +2025-05-26 05:27:21,229 - INFO - Epoch: 64, Objective: tensor([5511.2998], device='cuda:0', grad_fn=), Loss: 0.03269851952791214, KL/n: 67.779052734375 + 0it [00:00, ?it/s]2025-05-26 05:27:21,438 - INFO - [Epoch 065 | Batch 0000] IWAE-loss 4226.9961 | mean log_px -0.0130 | KL -3318.64 + 2it [00:00, 15.41it/s] 6it [00:00, 24.35it/s] 9it [00:00, 25.62it/s] 13it [00:00, 27.44it/s] 17it [00:00, 28.46it/s] 21it [00:00, 29.13it/s] 25it [00:00, 29.42it/s] 28it [00:01, 29.40it/s] 31it [00:01, 29.51it/s] 35it [00:01, 29.81it/s] 38it [00:01, 29.64it/s] 42it [00:01, 29.65it/s] 46it [00:01, 30.16it/s] 50it [00:01, 29.61it/s]2025-05-26 05:27:23,113 - INFO - [Epoch 065 | Batch 0050] IWAE-loss 5085.6377 | mean log_px -0.0252 | KL -3321.68 + 53it [00:01, 29.54it/s] 57it [00:01, 30.05it/s] 61it [00:02, 30.03it/s] 65it [00:02, 29.98it/s] 68it [00:02, 29.27it/s] 72it [00:02, 29.99it/s] 76it [00:02, 30.00it/s] 79it [00:02, 29.31it/s] 83it [00:02, 29.57it/s] 87it [00:02, 30.09it/s] 91it [00:03, 30.12it/s] 95it [00:03, 29.47it/s] 98it [00:03, 29.39it/s]2025-05-26 05:27:24,797 - INFO - [Epoch 065 | Batch 0100] IWAE-loss 4229.5815 | mean log_px -0.0130 | KL -3316.18 + 102it [00:03, 29.70it/s] 105it [00:03, 29.49it/s] 109it [00:03, 29.52it/s] 113it [00:03, 29.61it/s] 117it [00:03, 29.65it/s] 120it [00:04, 29.67it/s] 123it [00:04, 29.66it/s] 126it [00:04, 29.59it/s] 130it [00:04, 29.74it/s] 133it [00:04, 29.77it/s] 136it [00:04, 29.80it/s] 139it [00:04, 29.77it/s] 142it [00:04, 29.78it/s] 145it [00:04, 29.78it/s] 148it [00:05, 29.82it/s]2025-05-26 05:27:26,483 - INFO - [Epoch 065 | Batch 0150] IWAE-loss 4635.0166 | mean log_px -0.0189 | KL -3313.80 + 151it [00:05, 29.77it/s] 154it [00:05, 29.73it/s] 157it [00:05, 29.68it/s] 161it [00:05, 29.81it/s] 165it [00:05, 29.80it/s] 168it [00:05, 29.84it/s] 171it [00:05, 29.39it/s] 175it [00:05, 29.96it/s] 178it [00:06, 28.98it/s] 181it [00:06, 28.98it/s] 184it [00:06, 29.25it/s] 187it [00:06, 29.38it/s] 190it [00:06, 29.46it/s] 194it [00:06, 30.35it/s] 196it [00:06, 29.15it/s] +2025-05-26 05:27:28,080 - INFO - Epoch: 65, Objective: tensor([5383.5820], device='cuda:0', grad_fn=), Loss: 0.028728904202580452, KL/n: 67.57471466064453 + 0it [00:00, ?it/s]2025-05-26 05:27:28,294 - INFO - [Epoch 066 | Batch 0000] IWAE-loss 4755.5146 | mean log_px -0.0206 | KL -3310.46 + 1it [00:00, 9.59it/s] 4it [00:00, 20.85it/s] 8it [00:00, 25.49it/s] 11it [00:00, 27.09it/s] 15it [00:00, 28.45it/s] 19it [00:00, 29.21it/s] 22it [00:00, 28.84it/s] 26it [00:00, 29.30it/s] 30it [00:01, 29.54it/s] 34it [00:01, 29.86it/s] 37it [00:01, 29.69it/s] 41it [00:01, 29.94it/s] 45it [00:01, 30.31it/s] 49it [00:01, 30.39it/s]2025-05-26 05:27:29,968 - INFO - [Epoch 066 | Batch 0050] IWAE-loss 4560.9541 | mean log_px -0.0180 | KL -3303.38 + 53it [00:01, 30.23it/s] 57it [00:01, 30.15it/s] 61it [00:02, 29.82it/s] 64it [00:02, 29.58it/s] 68it [00:02, 29.87it/s] 72it [00:02, 29.92it/s] 75it [00:02, 29.76it/s] 79it [00:02, 29.80it/s] 83it [00:02, 29.80it/s] 87it [00:02, 30.08it/s] 91it [00:03, 30.49it/s] 95it [00:03, 30.22it/s] 99it [00:03, 30.02it/s]2025-05-26 05:27:31,634 - INFO - [Epoch 066 | Batch 0100] IWAE-loss 4922.7832 | mean log_px -0.0231 | KL -3308.38 + 103it [00:03, 30.43it/s] 107it [00:03, 29.67it/s] 111it [00:03, 29.76it/s] 115it [00:03, 29.81it/s] 119it [00:04, 29.85it/s] 123it [00:04, 30.05it/s] 127it [00:04, 30.53it/s] 131it [00:04, 30.35it/s] 135it [00:04, 30.22it/s] 139it [00:04, 29.57it/s] 143it [00:04, 29.61it/s] 147it [00:04, 29.89it/s]2025-05-26 05:27:33,299 - INFO - [Epoch 066 | Batch 0150] IWAE-loss 4404.7422 | mean log_px -0.0157 | KL -3303.61 + 151it [00:05, 29.97it/s] 154it [00:05, 29.68it/s] 158it [00:05, 29.90it/s] 162it [00:05, 30.34it/s] 166it [00:05, 30.20it/s] 170it [00:05, 29.61it/s] 173it [00:05, 29.58it/s] 177it [00:05, 29.92it/s] 181it [00:06, 29.89it/s] 184it [00:06, 29.72it/s] 188it [00:06, 29.83it/s] 192it [00:06, 30.26it/s] 196it [00:06, 29.47it/s] 196it [00:06, 29.35it/s] +2025-05-26 05:27:34,883 - INFO - Epoch: 66, Objective: tensor([4174.8047], device='cuda:0', grad_fn=), Loss: 0.010129961185157299, KL/n: 67.4141845703125 + 0it [00:00, ?it/s]2025-05-26 05:27:35,279 - INFO - [Epoch 067 | Batch 0000] IWAE-loss 4738.0557 | mean log_px -0.0205 | KL -3303.20 + 1it [00:00, 9.46it/s] 4it [00:00, 20.56it/s] 8it [00:00, 26.14it/s] 11it [00:00, 26.75it/s] 15it [00:00, 28.35it/s] 19it [00:00, 29.30it/s] 22it [00:00, 29.02it/s] 26it [00:00, 29.32it/s] 29it [00:01, 29.44it/s] 32it [00:01, 29.53it/s] 36it [00:01, 29.79it/s] 40it [00:01, 30.17it/s] 44it [00:01, 29.57it/s] 48it [00:01, 29.82it/s]2025-05-26 05:27:36,956 - INFO - [Epoch 067 | Batch 0050] IWAE-loss 4515.2500 | mean log_px -0.0174 | KL -3294.87 + 51it [00:01, 29.65it/s] 55it [00:01, 29.67it/s] 59it [00:02, 30.42it/s] 63it [00:02, 30.28it/s] 67it [00:02, 30.23it/s] 71it [00:02, 29.65it/s] 75it [00:02, 30.16it/s] 79it [00:02, 30.23it/s] 83it [00:02, 30.08it/s] 87it [00:02, 29.49it/s] 91it [00:03, 29.87it/s] 95it [00:03, 30.26it/s] 99it [00:03, 30.21it/s]2025-05-26 05:27:38,624 - INFO - [Epoch 067 | Batch 0100] IWAE-loss 4279.1245 | mean log_px -0.0140 | KL -3296.57 + 103it [00:03, 30.05it/s] 107it [00:03, 28.98it/s] 111it [00:03, 29.23it/s] 115it [00:03, 29.89it/s] 118it [00:04, 29.36it/s] 122it [00:04, 30.17it/s] 126it [00:04, 29.82it/s] 129it [00:04, 29.70it/s] 132it [00:04, 29.48it/s] 135it [00:04, 29.58it/s] 138it [00:04, 29.41it/s] 142it [00:04, 30.01it/s] 146it [00:04, 29.97it/s] 149it [00:05, 29.44it/s]2025-05-26 05:27:40,303 - INFO - [Epoch 067 | Batch 0150] IWAE-loss 4792.4834 | mean log_px -0.0214 | KL -3292.12 + 153it [00:05, 30.07it/s] 156it [00:05, 29.52it/s] 160it [00:05, 30.35it/s] 164it [00:05, 29.87it/s] 167it [00:05, 29.38it/s] 171it [00:05, 29.53it/s] 175it [00:05, 29.84it/s] 179it [00:06, 29.98it/s] 182it [00:06, 29.27it/s] 186it [00:06, 29.51it/s] 190it [00:06, 30.11it/s] 194it [00:06, 30.22it/s] 196it [00:06, 29.22it/s] +2025-05-26 05:27:41,893 - INFO - Epoch: 67, Objective: tensor([5069.5425], device='cuda:0', grad_fn=), Loss: 0.02400057576596737, KL/n: 67.20359802246094 + 0it [00:00, ?it/s]2025-05-26 05:27:42,103 - INFO - [Epoch 068 | Batch 0000] IWAE-loss 4748.5825 | mean log_px -0.0208 | KL -3294.28 + 2it [00:00, 15.59it/s] 5it [00:00, 23.05it/s] 8it [00:00, 24.91it/s] 11it [00:00, 26.40it/s] 14it [00:00, 26.97it/s] 17it [00:00, 26.96it/s] 20it [00:00, 27.18it/s] 24it [00:00, 28.22it/s] 28it [00:01, 29.19it/s] 31it [00:01, 28.70it/s] 35it [00:01, 28.93it/s] 39it [00:01, 29.23it/s] 43it [00:01, 29.88it/s] 46it [00:01, 29.14it/s] 50it [00:01, 29.29it/s]2025-05-26 05:27:43,826 - INFO - [Epoch 068 | Batch 0050] IWAE-loss 4425.6670 | mean log_px -0.0162 | KL -3294.61 + 54it [00:01, 29.84it/s] 57it [00:02, 29.04it/s] 61it [00:02, 29.19it/s] 65it [00:02, 29.97it/s] 68it [00:02, 29.20it/s] 72it [00:02, 29.56it/s] 76it [00:02, 30.02it/s] 79it [00:02, 29.20it/s] 83it [00:02, 29.50it/s] 87it [00:03, 29.76it/s] 90it [00:03, 29.38it/s] 94it [00:03, 29.36it/s] 98it [00:03, 30.11it/s]2025-05-26 05:27:45,516 - INFO - [Epoch 068 | Batch 0100] IWAE-loss 3964.5161 | mean log_px -0.0097 | KL -3286.60 + 102it [00:03, 29.96it/s] 105it [00:03, 29.23it/s] 109it [00:03, 29.53it/s] 112it [00:03, 28.92it/s] 116it [00:04, 28.99it/s] 120it [00:04, 29.68it/s] 123it [00:04, 28.77it/s] 127it [00:04, 29.28it/s] 131it [00:04, 29.74it/s] 134it [00:04, 29.29it/s] 137it [00:04, 29.17it/s] 141it [00:04, 29.54it/s] 145it [00:05, 29.88it/s] 148it [00:05, 28.99it/s]2025-05-26 05:27:47,220 - INFO - [Epoch 068 | Batch 0150] IWAE-loss 4732.7954 | mean log_px -0.0206 | KL -3287.31 + 152it [00:05, 29.22it/s] 156it [00:05, 29.56it/s] 159it [00:05, 29.54it/s] 162it [00:05, 28.93it/s] 166it [00:05, 29.44it/s] 169it [00:05, 29.14it/s] 173it [00:05, 29.40it/s] 176it [00:06, 29.22it/s] 180it [00:06, 29.48it/s] 184it [00:06, 29.81it/s] 187it [00:06, 29.04it/s] 191it [00:06, 29.26it/s] 195it [00:06, 28.68it/s] 196it [00:06, 28.82it/s] +2025-05-26 05:27:48,821 - INFO - Epoch: 68, Objective: tensor([5776.5640], device='cuda:0', grad_fn=), Loss: 0.03412821888923645, KL/n: 67.01081848144531 + 0it [00:00, ?it/s]2025-05-26 05:27:49,215 - INFO - [Epoch 069 | Batch 0000] IWAE-loss 5160.4429 | mean log_px -0.0268 | KL -3282.19 + 1it [00:00, 9.80it/s] 4it [00:00, 20.24it/s] 8it [00:00, 25.11it/s] 12it [00:00, 27.28it/s] 16it [00:00, 28.97it/s] 19it [00:00, 28.50it/s] 22it [00:00, 28.63it/s] 26it [00:00, 29.71it/s] 29it [00:01, 29.26it/s] 32it [00:01, 28.73it/s] 35it [00:01, 28.80it/s] 38it [00:01, 28.27it/s] 42it [00:01, 28.78it/s] 46it [00:01, 29.67it/s] 49it [00:01, 28.58it/s]2025-05-26 05:27:50,927 - INFO - [Epoch 069 | Batch 0050] IWAE-loss 4836.0820 | mean log_px -0.0222 | KL -3279.22 + 53it [00:01, 28.67it/s] 57it [00:02, 29.58it/s] 60it [00:02, 29.35it/s] 63it [00:02, 29.51it/s] 66it [00:02, 29.22it/s] 70it [00:02, 29.37it/s] 74it [00:02, 30.08it/s] 78it [00:02, 29.39it/s] 82it [00:02, 29.40it/s] 86it [00:02, 29.76it/s] 90it [00:03, 30.20it/s] 94it [00:03, 29.38it/s] 98it [00:03, 29.55it/s]2025-05-26 05:27:52,611 - INFO - [Epoch 069 | Batch 0100] IWAE-loss 4195.8569 | mean log_px -0.0132 | KL -3273.90 + 102it [00:03, 30.14it/s] 106it [00:03, 29.99it/s] 110it [00:03, 29.34it/s] 113it [00:03, 29.42it/s] 117it [00:04, 29.43it/s] 121it [00:04, 29.77it/s] 124it [00:04, 29.41it/s] 128it [00:04, 29.75it/s] 132it [00:04, 30.07it/s] 136it [00:04, 30.01it/s] 139it [00:04, 29.35it/s] 143it [00:04, 29.51it/s] 147it [00:05, 30.15it/s]2025-05-26 05:27:54,296 - INFO - [Epoch 069 | Batch 0150] IWAE-loss 3853.5173 | mean log_px -0.0083 | KL -3273.98 + 151it [00:05, 29.90it/s] 154it [00:05, 29.12it/s] 158it [00:05, 29.90it/s] 161it [00:05, 29.18it/s] 165it [00:05, 29.39it/s] 169it [00:05, 29.59it/s] 173it [00:05, 29.77it/s] 177it [00:06, 30.16it/s] 181it [00:06, 30.01it/s] 184it [00:06, 29.25it/s] 188it [00:06, 29.76it/s] 191it [00:06, 29.55it/s] 195it [00:06, 28.65it/s] 196it [00:06, 28.96it/s] +2025-05-26 05:27:55,895 - INFO - Epoch: 69, Objective: tensor([5158.5811], device='cuda:0', grad_fn=), Loss: 0.02521890588104725, KL/n: 66.81456756591797 + 0it [00:00, ?it/s]2025-05-26 05:27:56,103 - INFO - [Epoch 070 | Batch 0000] IWAE-loss 6289.8228 | mean log_px -0.0431 | KL -3273.46 + 2it [00:00, 15.41it/s] 5it [00:00, 21.79it/s] 9it [00:00, 25.48it/s] 13it [00:00, 27.86it/s] 16it [00:00, 27.74it/s] 20it [00:00, 28.32it/s] 24it [00:00, 29.35it/s] 27it [00:00, 28.47it/s] 31it [00:01, 28.96it/s] 35it [00:01, 29.62it/s] 38it [00:01, 28.99it/s] 42it [00:01, 29.07it/s] 46it [00:01, 29.57it/s] 50it [00:01, 29.97it/s]2025-05-26 05:27:57,801 - INFO - [Epoch 070 | Batch 0050] IWAE-loss 4238.9434 | mean log_px -0.0138 | KL -3270.52 + 53it [00:01, 29.23it/s] 57it [00:02, 29.27it/s] 61it [00:02, 29.98it/s] 64it [00:02, 29.27it/s] 68it [00:02, 29.60it/s] 71it [00:02, 29.64it/s] 74it [00:02, 29.53it/s] 78it [00:02, 29.57it/s] 82it [00:02, 29.66it/s] 86it [00:02, 30.37it/s] 90it [00:03, 30.09it/s] 94it [00:03, 29.57it/s] 97it [00:03, 29.54it/s] 100it [00:03, 29.35it/s]2025-05-26 05:27:59,486 - INFO - [Epoch 070 | Batch 0100] IWAE-loss 4667.5620 | mean log_px -0.0200 | KL -3267.44 + 104it [00:03, 29.76it/s] 108it [00:03, 29.65it/s] 111it [00:03, 29.37it/s] 115it [00:03, 29.51it/s] 119it [00:04, 30.13it/s] 123it [00:04, 30.02it/s] 126it [00:04, 29.13it/s] 129it [00:04, 29.30it/s] 133it [00:04, 29.56it/s] 137it [00:04, 29.96it/s] 140it [00:04, 29.20it/s] 144it [00:04, 29.32it/s] 148it [00:05, 29.84it/s]2025-05-26 05:28:01,186 - INFO - [Epoch 070 | Batch 0150] IWAE-loss 5052.1294 | mean log_px -0.0255 | KL -3266.45 + 151it [00:05, 29.05it/s] 155it [00:05, 29.21it/s] 159it [00:05, 30.03it/s] 162it [00:05, 28.93it/s] 166it [00:05, 28.82it/s] 170it [00:05, 29.09it/s] 174it [00:05, 29.43it/s] 177it [00:06, 29.38it/s] 180it [00:06, 28.64it/s] 184it [00:06, 29.40it/s] 188it [00:06, 29.98it/s] 191it [00:06, 29.72it/s] 195it [00:06, 28.37it/s] 196it [00:06, 28.97it/s] +2025-05-26 05:28:02,784 - INFO - Epoch: 70, Objective: tensor([4617.2183], device='cuda:0', grad_fn=), Loss: 0.020552074536681175, KL/n: 66.61614990234375 + 0it [00:00, ?it/s]2025-05-26 05:28:03,167 - INFO - [Epoch 071 | Batch 0000] IWAE-loss 4164.6030 | mean log_px -0.0128 | KL -3268.67 + 1it [00:00, 9.74it/s] 4it [00:00, 20.78it/s] 8it [00:00, 26.52it/s] 11it [00:00, 27.15it/s] 15it [00:00, 29.07it/s] 18it [00:00, 29.16it/s] 22it [00:00, 29.84it/s] 25it [00:00, 29.88it/s] 28it [00:01, 29.23it/s] 32it [00:01, 29.80it/s] 35it [00:01, 29.64it/s] 39it [00:01, 29.73it/s] 43it [00:01, 29.80it/s] 46it [00:01, 29.60it/s] 49it [00:01, 29.34it/s]2025-05-26 05:28:04,837 - INFO - [Epoch 071 | Batch 0050] IWAE-loss 4600.4023 | mean log_px -0.0191 | KL -3261.73 + 53it [00:01, 29.42it/s] 57it [00:01, 30.27it/s] 61it [00:02, 30.10it/s] 65it [00:02, 29.20it/s] 69it [00:02, 29.58it/s] 73it [00:02, 30.10it/s] 77it [00:02, 29.74it/s] 80it [00:02, 29.69it/s] 83it [00:02, 29.61it/s] 87it [00:02, 30.43it/s] 91it [00:03, 30.33it/s] 95it [00:03, 29.63it/s] 99it [00:03, 30.37it/s]2025-05-26 05:28:06,514 - INFO - [Epoch 071 | Batch 0100] IWAE-loss 4752.2539 | mean log_px -0.0214 | KL -3253.72 + 103it [00:03, 29.75it/s] 106it [00:03, 29.81it/s] 109it [00:03, 29.80it/s] 113it [00:03, 29.83it/s] 117it [00:03, 30.52it/s] 121it [00:04, 30.43it/s] 125it [00:04, 29.90it/s] 128it [00:04, 29.84it/s] 132it [00:04, 30.10it/s] 136it [00:04, 30.45it/s] 140it [00:04, 29.76it/s] 144it [00:04, 29.94it/s] 147it [00:04, 29.86it/s]2025-05-26 05:28:08,174 - INFO - [Epoch 071 | Batch 0150] IWAE-loss 5054.4976 | mean log_px -0.0257 | KL -3258.69 + 151it [00:05, 30.07it/s] 155it [00:05, 30.43it/s] 159it [00:05, 30.35it/s] 163it [00:05, 29.63it/s] 167it [00:05, 30.29it/s] 171it [00:05, 30.25it/s] 175it [00:05, 29.65it/s] 179it [00:06, 29.27it/s] 183it [00:06, 29.49it/s] 187it [00:06, 30.24it/s] 191it [00:06, 29.94it/s] 195it [00:06, 28.85it/s] 196it [00:06, 29.35it/s] +2025-05-26 05:28:09,755 - INFO - Epoch: 71, Objective: tensor([5410.8906], device='cuda:0', grad_fn=), Loss: 0.031669292598962784, KL/n: 66.40533447265625 + 0it [00:00, ?it/s]2025-05-26 05:28:09,975 - INFO - [Epoch 072 | Batch 0000] IWAE-loss 3863.3535 | mean log_px -0.0087 | KL -3252.36 + 1it [00:00, 8.89it/s] 5it [00:00, 23.93it/s] 8it [00:00, 25.38it/s] 11it [00:00, 26.79it/s] 15it [00:00, 28.08it/s] 18it [00:00, 28.25it/s] 22it [00:00, 29.14it/s] 25it [00:00, 29.11it/s] 29it [00:01, 29.43it/s] 32it [00:01, 29.34it/s] 36it [00:01, 29.61it/s] 39it [00:01, 29.00it/s] 42it [00:01, 29.07it/s] 46it [00:01, 30.07it/s] 49it [00:01, 28.88it/s]2025-05-26 05:28:11,662 - INFO - [Epoch 072 | Batch 0050] IWAE-loss 4189.3794 | mean log_px -0.0134 | KL -3250.63 + 53it [00:01, 29.58it/s] 57it [00:01, 30.10it/s] 61it [00:02, 29.21it/s] 64it [00:02, 29.40it/s] 67it [00:02, 29.43it/s] 71it [00:02, 29.72it/s] 74it [00:02, 29.54it/s] 78it [00:02, 30.33it/s] 82it [00:02, 29.44it/s] 85it [00:02, 29.10it/s] 89it [00:03, 29.84it/s] 92it [00:03, 29.10it/s] 95it [00:03, 29.25it/s] 98it [00:03, 28.58it/s]2025-05-26 05:28:13,367 - INFO - [Epoch 072 | Batch 0100] IWAE-loss 4139.4766 | mean log_px -0.0127 | KL -3248.74 + 102it [00:03, 28.73it/s] 106it [00:03, 29.42it/s] 109it [00:03, 29.35it/s] 113it [00:03, 28.75it/s] 117it [00:04, 28.60it/s] 120it [00:04, 28.16it/s] 123it [00:04, 28.04it/s] 127it [00:04, 28.34it/s] 131it [00:04, 29.22it/s] 134it [00:04, 29.25it/s] 137it [00:04, 28.85it/s] 140it [00:04, 28.63it/s] 144it [00:04, 29.19it/s] 148it [00:05, 29.60it/s]2025-05-26 05:28:15,103 - INFO - [Epoch 072 | Batch 0150] IWAE-loss 4509.6626 | mean log_px -0.0181 | KL -3241.52 + 151it [00:05, 28.66it/s] 155it [00:05, 28.97it/s] 159it [00:05, 29.27it/s] 163it [00:05, 29.54it/s] 166it [00:05, 29.03it/s] 170it [00:05, 29.12it/s] 174it [00:06, 29.55it/s] 177it [00:06, 29.03it/s] 180it [00:06, 28.92it/s] 184it [00:06, 29.48it/s] 187it [00:06, 29.40it/s] 190it [00:06, 29.04it/s] 193it [00:06, 28.87it/s] 196it [00:06, 28.83it/s] 196it [00:06, 28.68it/s] +2025-05-26 05:28:16,716 - INFO - Epoch: 72, Objective: tensor([4276.2158], device='cuda:0', grad_fn=), Loss: 0.014400888234376907, KL/n: 66.18006134033203 + 0it [00:00, ?it/s]2025-05-26 05:28:17,095 - INFO - [Epoch 073 | Batch 0000] IWAE-loss 3887.7847 | mean log_px -0.0093 | KL -3239.48 + 2it [00:00, 16.38it/s] 5it [00:00, 22.57it/s] 9it [00:00, 26.32it/s] 13it [00:00, 27.61it/s] 16it [00:00, 27.01it/s] 19it [00:00, 27.10it/s] 22it [00:00, 27.11it/s] 25it [00:00, 27.65it/s] 28it [00:01, 27.62it/s] 32it [00:01, 29.41it/s] 36it [00:01, 28.87it/s] 40it [00:01, 29.81it/s] 44it [00:01, 30.18it/s] 48it [00:01, 30.34it/s]2025-05-26 05:28:18,811 - INFO - [Epoch 073 | Batch 0050] IWAE-loss 3862.1946 | mean log_px -0.0089 | KL -3237.66 + 52it [00:01, 30.38it/s] 56it [00:01, 30.16it/s] 60it [00:02, 30.22it/s] 64it [00:02, 30.26it/s] 68it [00:02, 30.63it/s] 72it [00:02, 30.50it/s] 76it [00:02, 29.99it/s] 80it [00:02, 30.55it/s] 84it [00:02, 30.31it/s] 88it [00:03, 30.27it/s] 92it [00:03, 29.95it/s] 96it [00:03, 30.37it/s] 100it [00:03, 30.26it/s]2025-05-26 05:28:20,462 - INFO - [Epoch 073 | Batch 0100] IWAE-loss 4765.9736 | mean log_px -0.0219 | KL -3234.63 + 104it [00:03, 30.31it/s] 108it [00:03, 30.33it/s] 112it [00:03, 30.11it/s] 116it [00:03, 29.75it/s] 120it [00:04, 30.08it/s] 124it [00:04, 30.61it/s] 128it [00:04, 30.25it/s] 132it [00:04, 30.11it/s] 136it [00:04, 30.10it/s] 140it [00:04, 29.85it/s] 144it [00:04, 30.38it/s] 148it [00:05, 30.34it/s]2025-05-26 05:28:22,119 - INFO - [Epoch 073 | Batch 0150] IWAE-loss 4515.1055 | mean log_px -0.0183 | KL -3233.31 + 152it [00:05, 30.47it/s] 156it [00:05, 30.38it/s] 160it [00:05, 29.56it/s] 164it [00:05, 30.36it/s] 168it [00:05, 30.33it/s] 172it [00:05, 30.33it/s] 176it [00:05, 29.62it/s] 180it [00:06, 29.94it/s] 183it [00:06, 29.51it/s] 187it [00:06, 29.74it/s] 191it [00:06, 29.98it/s] 195it [00:06, 28.96it/s] 196it [00:06, 29.41it/s] +2025-05-26 05:28:23,683 - INFO - Epoch: 73, Objective: tensor([4461.6387], device='cuda:0', grad_fn=), Loss: 0.017936188727617264, KL/n: 65.97233581542969 + 0it [00:00, ?it/s]2025-05-26 05:28:23,890 - INFO - [Epoch 074 | Batch 0000] IWAE-loss 5131.6729 | mean log_px -0.0272 | KL -3230.27 + 2it [00:00, 15.45it/s] 5it [00:00, 22.87it/s] 8it [00:00, 24.92it/s] 12it [00:00, 26.83it/s] 15it [00:00, 27.39it/s] 19it [00:00, 28.32it/s] 22it [00:00, 28.26it/s] 26it [00:00, 28.65it/s] 30it [00:01, 29.14it/s] 33it [00:01, 28.56it/s] 37it [00:01, 29.17it/s] 41it [00:01, 29.53it/s] 44it [00:01, 29.17it/s] 47it [00:01, 29.20it/s] 50it [00:01, 29.33it/s]2025-05-26 05:28:25,597 - INFO - [Epoch 074 | Batch 0050] IWAE-loss 4212.5435 | mean log_px -0.0140 | KL -3230.62 + 53it [00:01, 29.35it/s] 56it [00:01, 29.46it/s] 59it [00:02, 29.54it/s] 62it [00:02, 29.49it/s] 65it [00:02, 29.55it/s] 68it [00:02, 29.56it/s] 71it [00:02, 29.64it/s] 74it [00:02, 29.55it/s] 77it [00:02, 29.51it/s] 80it [00:02, 29.59it/s] 83it [00:02, 29.54it/s] 86it [00:02, 29.52it/s] 89it [00:03, 29.46it/s] 92it [00:03, 29.58it/s] 95it [00:03, 29.53it/s] 98it [00:03, 29.56it/s]2025-05-26 05:28:27,293 - INFO - [Epoch 074 | Batch 0100] IWAE-loss 3936.8843 | mean log_px -0.0101 | KL -3227.75 + 101it [00:03, 29.69it/s] 104it [00:03, 29.67it/s] 107it [00:03, 29.63it/s] 110it [00:03, 29.49it/s] 113it [00:03, 29.53it/s] 116it [00:04, 29.50it/s] 119it [00:04, 29.53it/s] 122it [00:04, 29.53it/s] 125it [00:04, 29.56it/s] 128it [00:04, 29.59it/s] 131it [00:04, 29.66it/s] 134it [00:04, 29.65it/s] 137it [00:04, 29.64it/s] 140it [00:04, 29.73it/s] 143it [00:04, 29.70it/s] 146it [00:05, 29.71it/s] 149it [00:05, 29.71it/s]2025-05-26 05:28:28,980 - INFO - [Epoch 074 | Batch 0150] IWAE-loss 3922.8477 | mean log_px -0.0100 | KL -3221.75 + 152it [00:05, 29.62it/s] 155it [00:05, 29.63it/s] 158it [00:05, 29.70it/s] 161it [00:05, 29.62it/s] 164it [00:05, 29.64it/s] 167it [00:05, 29.67it/s] 170it [00:05, 29.27it/s] 174it [00:05, 29.58it/s] 177it [00:06, 29.36it/s] 181it [00:06, 30.29it/s] 185it [00:06, 29.55it/s] 189it [00:06, 29.47it/s] 193it [00:06, 29.54it/s] 196it [00:06, 29.48it/s] 196it [00:06, 29.02it/s] +2025-05-26 05:28:30,560 - INFO - Epoch: 74, Objective: tensor([4248.8350], device='cuda:0', grad_fn=), Loss: 0.01647838018834591, KL/n: 65.7720718383789 + 0it [00:00, ?it/s]2025-05-26 05:28:30,946 - INFO - [Epoch 075 | Batch 0000] IWAE-loss 3994.8215 | mean log_px -0.0110 | KL -3221.85 + 1it [00:00, 9.58it/s] 4it [00:00, 20.25it/s] 8it [00:00, 25.43it/s] 12it [00:00, 27.65it/s] 15it [00:00, 27.53it/s] 19it [00:00, 29.08it/s] 22it [00:00, 28.85it/s] 25it [00:00, 29.09it/s] 28it [00:01, 29.26it/s] 31it [00:01, 29.36it/s] 34it [00:01, 29.23it/s] 38it [00:01, 29.57it/s] 42it [00:01, 29.99it/s] 45it [00:01, 29.47it/s] 49it [00:01, 29.89it/s]2025-05-26 05:28:32,635 - INFO - [Epoch 075 | Batch 0050] IWAE-loss 4156.1499 | mean log_px -0.0134 | KL -3218.43 + 52it [00:01, 29.63it/s] 56it [00:01, 29.67it/s] 60it [00:02, 29.90it/s] 64it [00:02, 30.09it/s] 68it [00:02, 30.21it/s] 72it [00:02, 29.63it/s] 75it [00:02, 29.69it/s] 78it [00:02, 29.57it/s] 82it [00:02, 29.86it/s] 86it [00:02, 30.01it/s] 89it [00:03, 29.42it/s] 93it [00:03, 29.46it/s] 97it [00:03, 30.14it/s]2025-05-26 05:28:34,308 - INFO - [Epoch 075 | Batch 0100] IWAE-loss 4155.2363 | mean log_px -0.0134 | KL -3217.12 + 101it [00:03, 30.04it/s] 105it [00:03, 30.03it/s] 109it [00:03, 29.62it/s] 112it [00:03, 29.52it/s] 116it [00:03, 30.12it/s] 120it [00:04, 29.93it/s] 123it [00:04, 29.47it/s] 126it [00:04, 29.31it/s] 130it [00:04, 30.12it/s] 134it [00:04, 29.66it/s] 138it [00:04, 29.91it/s] 141it [00:04, 28.92it/s] 145it [00:04, 29.29it/s] 149it [00:05, 29.76it/s]2025-05-26 05:28:36,000 - INFO - [Epoch 075 | Batch 0150] IWAE-loss 4307.5762 | mean log_px -0.0156 | KL -3213.46 + 152it [00:05, 29.33it/s] 156it [00:05, 29.55it/s] 160it [00:05, 30.26it/s] 164it [00:05, 30.25it/s] 168it [00:05, 29.71it/s] 171it [00:05, 29.65it/s] 175it [00:05, 29.53it/s] 179it [00:06, 30.11it/s] 183it [00:06, 30.19it/s] 187it [00:06, 29.56it/s] 191it [00:06, 30.07it/s] 195it [00:06, 28.90it/s] 196it [00:06, 29.15it/s] +2025-05-26 05:28:37,579 - INFO - Epoch: 75, Objective: tensor([4054.9939], device='cuda:0', grad_fn=), Loss: 0.015226984396576881, KL/n: 65.55622863769531 + 0it [00:00, ?it/s]2025-05-26 05:28:37,792 - INFO - [Epoch 076 | Batch 0000] IWAE-loss 4398.7080 | mean log_px -0.0170 | KL -3212.21 + 1it [00:00, 9.91it/s] 4it [00:00, 20.84it/s] 8it [00:00, 26.11it/s] 12it [00:00, 27.65it/s] 15it [00:00, 27.72it/s] 19it [00:00, 28.66it/s] 22it [00:00, 28.86it/s] 26it [00:00, 29.31it/s] 29it [00:01, 29.11it/s] 33it [00:01, 29.63it/s] 36it [00:01, 29.25it/s] 40it [00:01, 30.04it/s] 43it [00:01, 29.33it/s] 47it [00:01, 30.15it/s]2025-05-26 05:28:39,475 - INFO - [Epoch 076 | Batch 0050] IWAE-loss 3982.2517 | mean log_px -0.0111 | KL -3203.45 + 51it [00:01, 29.98it/s] 54it [00:01, 29.41it/s] 58it [00:02, 30.17it/s] 62it [00:02, 29.98it/s] 65it [00:02, 29.62it/s] 68it [00:02, 29.47it/s] 71it [00:02, 29.55it/s] 75it [00:02, 30.27it/s] 79it [00:02, 29.61it/s] 83it [00:02, 29.62it/s] 87it [00:02, 29.88it/s] 90it [00:03, 29.43it/s] 94it [00:03, 29.97it/s] 98it [00:03, 29.91it/s]2025-05-26 05:28:41,158 - INFO - [Epoch 076 | Batch 0100] IWAE-loss 4387.0835 | mean log_px -0.0168 | KL -3208.08 + 101it [00:03, 29.55it/s] 104it [00:03, 29.35it/s] 107it [00:03, 29.35it/s] 110it [00:03, 29.11it/s] 114it [00:03, 29.63it/s] 117it [00:04, 29.39it/s] 121it [00:04, 30.00it/s] 124it [00:04, 29.51it/s] 127it [00:04, 29.54it/s] 131it [00:04, 30.07it/s] 134it [00:04, 29.38it/s] 138it [00:04, 29.79it/s] 141it [00:04, 29.30it/s] 144it [00:04, 29.40it/s] 147it [00:05, 29.39it/s]2025-05-26 05:28:42,854 - INFO - [Epoch 076 | Batch 0150] IWAE-loss 4277.3281 | mean log_px -0.0153 | KL -3205.26 + 151it [00:05, 29.35it/s] 155it [00:05, 29.99it/s] 158it [00:05, 29.33it/s] 162it [00:05, 29.70it/s] 165it [00:05, 29.52it/s] 169it [00:05, 29.73it/s] 172it [00:05, 29.58it/s] 176it [00:06, 29.85it/s] 180it [00:06, 30.00it/s] 183it [00:06, 29.45it/s] 187it [00:06, 30.09it/s] 190it [00:06, 29.08it/s] 193it [00:06, 29.09it/s] 196it [00:06, 29.10it/s] +2025-05-26 05:28:44,440 - INFO - Epoch: 76, Objective: tensor([4605.1011], device='cuda:0', grad_fn=), Loss: 0.01954031176865101, KL/n: 65.336181640625 + 0it [00:00, ?it/s]2025-05-26 05:28:44,817 - INFO - [Epoch 077 | Batch 0000] IWAE-loss 4094.0244 | mean log_px -0.0127 | KL -3207.36 + 2it [00:00, 15.67it/s] 5it [00:00, 21.89it/s] 9it [00:00, 26.16it/s] 12it [00:00, 26.76it/s] 16it [00:00, 27.18it/s] 20it [00:00, 27.89it/s] 23it [00:00, 28.30it/s] 27it [00:00, 29.10it/s] 30it [00:01, 28.56it/s] 34it [00:01, 29.54it/s] 37it [00:01, 28.92it/s] 41it [00:01, 29.17it/s] 45it [00:01, 29.58it/s] 48it [00:01, 22.09it/s]2025-05-26 05:28:46,651 - INFO - [Epoch 077 | Batch 0050] IWAE-loss 4307.3828 | mean log_px -0.0159 | KL -3194.49 + 52it [00:01, 24.45it/s] 55it [00:02, 25.35it/s] 59it [00:02, 27.13it/s] 62it [00:02, 27.36it/s] 65it [00:02, 27.28it/s] 69it [00:02, 28.29it/s] 72it [00:02, 28.57it/s] 76it [00:02, 29.48it/s] 79it [00:02, 29.11it/s] 82it [00:02, 29.17it/s] 86it [00:03, 29.35it/s] 90it [00:03, 30.18it/s] 94it [00:03, 29.81it/s] 97it [00:03, 29.68it/s]2025-05-26 05:28:48,338 - INFO - [Epoch 077 | Batch 0100] IWAE-loss 3981.6162 | mean log_px -0.0112 | KL -3195.93 + 101it [00:03, 29.65it/s] 105it [00:03, 29.97it/s] 108it [00:03, 29.71it/s] 111it [00:03, 29.69it/s] 115it [00:04, 29.92it/s] 118it [00:04, 29.74it/s] 122it [00:04, 29.67it/s] 126it [00:04, 29.92it/s] 130it [00:04, 29.74it/s] 134it [00:04, 29.96it/s] 137it [00:04, 29.66it/s] 141it [00:04, 29.85it/s] 144it [00:05, 29.88it/s] 147it [00:05, 29.83it/s] 150it [00:05, 29.72it/s]2025-05-26 05:28:50,011 - INFO - [Epoch 077 | Batch 0150] IWAE-loss 4071.9658 | mean log_px -0.0126 | KL -3189.92 + 154it [00:05, 29.59it/s] 158it [00:05, 30.21it/s] 162it [00:05, 30.14it/s] 166it [00:05, 29.39it/s] 170it [00:05, 29.50it/s] 174it [00:06, 29.80it/s] 178it [00:06, 30.09it/s] 182it [00:06, 30.18it/s] 186it [00:06, 29.42it/s] 190it [00:06, 29.73it/s] 193it [00:06, 29.65it/s] 196it [00:06, 28.53it/s] +2025-05-26 05:28:51,602 - INFO - Epoch: 77, Objective: tensor([4465.7988], device='cuda:0', grad_fn=), Loss: 0.030269712209701538, KL/n: 65.11568450927734 + 0it [00:00, ?it/s]2025-05-26 05:28:51,996 - INFO - [Epoch 078 | Batch 0000] IWAE-loss 3828.5244 | mean log_px -0.0091 | KL -3190.22 + 1it [00:00, 9.83it/s] 4it [00:00, 20.83it/s] 8it [00:00, 26.50it/s] 12it [00:00, 27.57it/s] 16it [00:00, 29.05it/s] 19it [00:00, 28.70it/s] 23it [00:00, 29.75it/s] 26it [00:00, 29.22it/s] 30it [00:01, 29.15it/s] 34it [00:01, 29.88it/s] 38it [00:01, 29.81it/s] 41it [00:01, 29.51it/s] 44it [00:01, 29.56it/s] 48it [00:01, 30.08it/s]2025-05-26 05:28:53,672 - INFO - [Epoch 078 | Batch 0050] IWAE-loss 4657.2725 | mean log_px -0.0210 | KL -3189.41 + 51it [00:01, 29.39it/s] 55it [00:01, 29.78it/s] 59it [00:02, 29.85it/s] 63it [00:02, 30.12it/s] 67it [00:02, 30.50it/s] 71it [00:02, 29.70it/s] 75it [00:02, 30.29it/s] 79it [00:02, 29.48it/s] 83it [00:02, 30.31it/s] 87it [00:02, 30.07it/s] 91it [00:03, 29.31it/s] 95it [00:03, 29.47it/s] 99it [00:03, 29.97it/s]2025-05-26 05:28:55,347 - INFO - [Epoch 078 | Batch 0100] IWAE-loss 3990.4695 | mean log_px -0.0115 | KL -3183.60 + 103it [00:03, 30.06it/s] 107it [00:03, 30.07it/s] 111it [00:03, 30.06it/s] 115it [00:03, 29.63it/s] 118it [00:04, 29.56it/s] 122it [00:04, 29.92it/s] 125it [00:04, 29.76it/s] 129it [00:04, 30.30it/s] 133it [00:04, 29.92it/s] 136it [00:04, 29.76it/s] 139it [00:04, 29.76it/s] 143it [00:04, 30.12it/s] 147it [00:04, 30.32it/s]2025-05-26 05:28:57,009 - INFO - [Epoch 078 | Batch 0150] IWAE-loss 3825.6169 | mean log_px -0.0092 | KL -3182.13 + 151it [00:05, 30.17it/s] 155it [00:05, 29.58it/s] 159it [00:05, 29.86it/s] 162it [00:05, 29.73it/s] 166it [00:05, 29.77it/s] 170it [00:05, 30.34it/s] 174it [00:05, 30.26it/s] 178it [00:06, 29.84it/s] 181it [00:06, 29.77it/s] 184it [00:06, 29.67it/s] 188it [00:06, 30.36it/s] 192it [00:06, 30.36it/s] 196it [00:06, 29.07it/s] 196it [00:06, 29.27it/s] +2025-05-26 05:28:58,603 - INFO - Epoch: 78, Objective: tensor([5545.3887], device='cuda:0', grad_fn=), Loss: 0.030365370213985443, KL/n: 64.92745971679688 + 0it [00:00, ?it/s]2025-05-26 05:28:58,811 - INFO - [Epoch 079 | Batch 0000] IWAE-loss 4194.7300 | mean log_px -0.0145 | KL -3176.73 + 2it [00:00, 15.43it/s] 6it [00:00, 24.43it/s] 9it [00:00, 25.75it/s] 13it [00:00, 28.10it/s] 16it [00:00, 27.08it/s] 19it [00:00, 27.88it/s] 22it [00:00, 27.50it/s] 25it [00:00, 27.64it/s] 29it [00:01, 28.23it/s] 32it [00:01, 27.57it/s] 36it [00:01, 28.31it/s] 39it [00:01, 27.65it/s] 42it [00:01, 28.18it/s] 45it [00:01, 28.07it/s] 48it [00:01, 27.74it/s]2025-05-26 05:29:00,570 - INFO - [Epoch 079 | Batch 0050] IWAE-loss 4827.3843 | mean log_px -0.0235 | KL -3179.10 + 52it [00:01, 28.14it/s] 56it [00:02, 28.48it/s] 59it [00:02, 27.80it/s] 62it [00:02, 28.05it/s] 65it [00:02, 27.74it/s] 68it [00:02, 27.85it/s] 71it [00:02, 28.37it/s] 74it [00:02, 27.78it/s] 77it [00:02, 28.32it/s] 80it [00:02, 27.63it/s] 83it [00:03, 28.28it/s] 86it [00:03, 27.72it/s] 89it [00:03, 28.28it/s] 92it [00:03, 27.46it/s] 95it [00:03, 28.02it/s] 98it [00:03, 27.50it/s]2025-05-26 05:29:02,370 - INFO - [Epoch 079 | Batch 0100] IWAE-loss 4317.6353 | mean log_px -0.0163 | KL -3175.41 + 101it [00:03, 27.50it/s] 104it [00:03, 28.20it/s] 107it [00:03, 27.97it/s] 111it [00:03, 29.15it/s] 114it [00:04, 28.70it/s] 118it [00:04, 29.33it/s] 122it [00:04, 29.93it/s] 125it [00:04, 29.41it/s] 128it [00:04, 29.37it/s] 132it [00:04, 29.70it/s] 136it [00:04, 30.01it/s] 140it [00:04, 30.14it/s] 144it [00:05, 29.57it/s] 147it [00:05, 29.61it/s] 150it [00:05, 29.70it/s]2025-05-26 05:29:04,051 - INFO - [Epoch 079 | Batch 0150] IWAE-loss 4311.8350 | mean log_px -0.0163 | KL -3172.05 + 153it [00:05, 29.49it/s] 157it [00:05, 29.78it/s] 160it [00:05, 29.57it/s] 164it [00:05, 30.15it/s] 168it [00:05, 30.09it/s] 172it [00:06, 29.35it/s] 175it [00:06, 28.96it/s] 178it [00:06, 28.72it/s] 182it [00:06, 29.00it/s] 185it [00:06, 28.31it/s] 188it [00:06, 28.62it/s] 191it [00:06, 28.85it/s] 194it [00:06, 27.84it/s] 196it [00:06, 28.16it/s] +2025-05-26 05:29:05,690 - INFO - Epoch: 79, Objective: tensor([5860.7207], device='cuda:0', grad_fn=), Loss: 0.04421786218881607, KL/n: 64.694091796875 + 0it [00:00, ?it/s]2025-05-26 05:29:05,902 - INFO - [Epoch 080 | Batch 0000] IWAE-loss 4088.6172 | mean log_px -0.0132 | KL -3164.99 + 1it [00:00, 9.89it/s] 4it [00:00, 21.00it/s] 8it [00:00, 26.72it/s] 11it [00:00, 27.16it/s] 15it [00:00, 29.35it/s] 19it [00:00, 29.13it/s] 23it [00:00, 29.60it/s] 27it [00:00, 29.89it/s] 31it [00:01, 30.55it/s] 35it [00:01, 30.56it/s] 39it [00:01, 30.55it/s] 43it [00:01, 30.18it/s] 47it [00:01, 30.31it/s]2025-05-26 05:29:07,551 - INFO - [Epoch 080 | Batch 0050] IWAE-loss 4526.7085 | mean log_px -0.0194 | KL -3168.81 + 51it [00:01, 30.06it/s] 55it [00:01, 30.74it/s] 59it [00:02, 30.46it/s] 63it [00:02, 30.48it/s] 67it [00:02, 30.14it/s] 71it [00:02, 30.26it/s] 75it [00:02, 30.37it/s] 79it [00:02, 30.40it/s] 83it [00:02, 30.45it/s] 87it [00:02, 30.45it/s] 91it [00:03, 30.47it/s] 95it [00:03, 30.29it/s] 99it [00:03, 30.84it/s]2025-05-26 05:29:09,192 - INFO - [Epoch 080 | Batch 0100] IWAE-loss 4312.2236 | mean log_px -0.0164 | KL -3163.00 + 103it [00:03, 30.88it/s] 107it [00:03, 30.13it/s] 111it [00:03, 30.28it/s] 115it [00:03, 30.37it/s] 119it [00:03, 29.93it/s] 122it [00:04, 29.62it/s] 125it [00:04, 29.64it/s] 129it [00:04, 29.85it/s] 133it [00:04, 30.15it/s] 137it [00:04, 30.31it/s] 141it [00:04, 30.38it/s] 145it [00:04, 30.46it/s] 149it [00:04, 30.51it/s]2025-05-26 05:29:10,844 - INFO - [Epoch 080 | Batch 0150] IWAE-loss 4863.0352 | mean log_px -0.0243 | KL -3160.10 + 153it [00:05, 30.48it/s] 157it [00:05, 30.53it/s] 161it [00:05, 30.52it/s] 165it [00:05, 30.51it/s] 169it [00:05, 30.55it/s] 173it [00:05, 30.56it/s] 177it [00:05, 30.57it/s] 181it [00:06, 30.56it/s] 185it [00:06, 30.60it/s] 189it [00:06, 30.61it/s] 193it [00:06, 30.57it/s] 196it [00:06, 29.81it/s] +2025-05-26 05:29:12,389 - INFO - Epoch: 80, Objective: tensor([3650.3477], device='cuda:0', grad_fn=), Loss: 0.007161382120102644, KL/n: 64.47715759277344 + 0it [00:00, ?it/s]2025-05-26 05:29:12,908 - INFO - [Epoch 081 | Batch 0000] IWAE-loss 3828.7778 | mean log_px -0.0096 | KL -3157.30 + 1it [00:00, 4.18it/s] 5it [00:00, 15.76it/s] 8it [00:00, 20.17it/s] 12it [00:00, 24.29it/s] 15it [00:00, 25.70it/s] 18it [00:00, 26.92it/s] 21it [00:00, 27.51it/s] 25it [00:01, 28.85it/s] 28it [00:01, 28.59it/s] 32it [00:01, 29.22it/s] 35it [00:01, 29.28it/s] 38it [00:01, 29.34it/s] 42it [00:01, 30.17it/s] 46it [00:01, 30.08it/s] 50it [00:01, 29.29it/s]2025-05-26 05:29:14,580 - INFO - [Epoch 081 | Batch 0050] IWAE-loss 4764.0112 | mean log_px -0.0230 | KL -3154.63 + 53it [00:01, 29.45it/s] 57it [00:02, 29.82it/s] 61it [00:02, 29.74it/s] 64it [00:02, 29.39it/s] 68it [00:02, 29.52it/s] 72it [00:02, 29.83it/s] 75it [00:02, 29.30it/s] 79it [00:02, 29.89it/s] 82it [00:02, 29.37it/s] 86it [00:03, 29.55it/s] 90it [00:03, 29.91it/s] 94it [00:03, 30.07it/s] 98it [00:03, 30.26it/s]2025-05-26 05:29:16,269 - INFO - [Epoch 081 | Batch 0100] IWAE-loss 3924.3594 | mean log_px -0.0110 | KL -3151.29 + 102it [00:03, 30.10it/s] 106it [00:03, 29.32it/s] 110it [00:03, 29.66it/s] 113it [00:04, 29.31it/s] 116it [00:04, 28.38it/s] 119it [00:04, 28.06it/s] 122it [00:04, 28.28it/s] 126it [00:04, 28.88it/s] 130it [00:04, 29.49it/s] 133it [00:04, 29.18it/s] 136it [00:04, 28.77it/s] 140it [00:04, 29.27it/s] 143it [00:05, 29.37it/s] 146it [00:05, 29.26it/s] 149it [00:05, 29.26it/s]2025-05-26 05:29:17,984 - INFO - [Epoch 081 | Batch 0150] IWAE-loss 5447.3198 | mean log_px -0.0328 | KL -3154.13 + 153it [00:05, 29.24it/s] 157it [00:05, 29.90it/s] 160it [00:05, 29.31it/s] 164it [00:05, 29.75it/s] 168it [00:05, 30.08it/s] 171it [00:05, 29.52it/s] 174it [00:06, 29.47it/s] 178it [00:06, 29.51it/s] 182it [00:06, 30.07it/s] 186it [00:06, 30.11it/s] 190it [00:06, 29.23it/s] 194it [00:06, 29.64it/s] 196it [00:06, 28.41it/s] +2025-05-26 05:29:19,584 - INFO - Epoch: 81, Objective: tensor([4252.6670], device='cuda:0', grad_fn=), Loss: 0.01819196157157421, KL/n: 64.2647933959961 + 0it [00:00, ?it/s]2025-05-26 05:29:19,953 - INFO - [Epoch 082 | Batch 0000] IWAE-loss 3831.3748 | mean log_px -0.0098 | KL -3145.42 + 2it [00:00, 18.81it/s] 5it [00:00, 23.73it/s] 9it [00:00, 27.50it/s] 12it [00:00, 27.98it/s] 15it [00:00, 28.56it/s] 18it [00:00, 28.97it/s] 21it [00:00, 29.07it/s] 25it [00:00, 29.32it/s] 29it [00:01, 30.01it/s] 32it [00:01, 29.40it/s] 35it [00:01, 29.36it/s] 38it [00:01, 29.46it/s] 41it [00:01, 28.85it/s] 45it [00:01, 29.19it/s] 49it [00:01, 29.64it/s]2025-05-26 05:29:21,647 - INFO - [Epoch 082 | Batch 0050] IWAE-loss 4389.9233 | mean log_px -0.0178 | KL -3142.92 + 52it [00:01, 29.55it/s] 56it [00:01, 30.21it/s] 60it [00:02, 30.19it/s] 64it [00:02, 29.68it/s] 67it [00:02, 29.59it/s] 71it [00:02, 30.24it/s] 75it [00:02, 30.00it/s] 78it [00:02, 29.70it/s] 81it [00:02, 29.51it/s] 85it [00:02, 29.97it/s] 89it [00:03, 30.20it/s] 93it [00:03, 29.79it/s] 96it [00:03, 29.70it/s] 100it [00:03, 29.77it/s]2025-05-26 05:29:23,317 - INFO - [Epoch 082 | Batch 0100] IWAE-loss 4631.8896 | mean log_px -0.0213 | KL -3140.99 + 103it [00:03, 29.75it/s] 106it [00:03, 29.66it/s] 110it [00:03, 29.78it/s] 114it [00:03, 30.12it/s] 118it [00:04, 29.62it/s] 121it [00:04, 29.30it/s] 124it [00:04, 28.47it/s] 127it [00:04, 28.18it/s] 131it [00:04, 28.96it/s] 134it [00:04, 28.65it/s] 138it [00:04, 29.36it/s] 141it [00:04, 28.85it/s] 145it [00:04, 29.52it/s] 148it [00:05, 28.88it/s]2025-05-26 05:29:25,031 - INFO - [Epoch 082 | Batch 0150] IWAE-loss 4407.9258 | mean log_px -0.0181 | KL -3138.42 + 152it [00:05, 29.11it/s] 156it [00:05, 29.66it/s] 159it [00:05, 29.03it/s] 163it [00:05, 29.25it/s] 167it [00:05, 29.75it/s] 170it [00:05, 29.25it/s] 174it [00:05, 29.72it/s] 178it [00:06, 30.17it/s] 182it [00:06, 30.19it/s] 186it [00:06, 29.43it/s] 190it [00:06, 30.22it/s] 194it [00:06, 30.13it/s] 196it [00:06, 29.12it/s] +2025-05-26 05:29:26,621 - INFO - Epoch: 82, Objective: tensor([5252.1035], device='cuda:0', grad_fn=), Loss: 0.024639014154672623, KL/n: 64.05130004882812 + 0it [00:00, ?it/s]2025-05-26 05:29:26,834 - INFO - [Epoch 083 | Batch 0000] IWAE-loss 4420.0698 | mean log_px -0.0183 | KL -3139.32 + 1it [00:00, 9.93it/s] 4it [00:00, 21.10it/s] 8it [00:00, 26.41it/s] 11it [00:00, 27.42it/s] 15it [00:00, 28.78it/s] 18it [00:00, 28.95it/s] 22it [00:00, 30.07it/s] 26it [00:00, 29.75it/s] 29it [00:01, 29.64it/s] 32it [00:01, 29.64it/s] 36it [00:01, 29.96it/s] 40it [00:01, 30.08it/s] 44it [00:01, 30.49it/s] 48it [00:01, 30.38it/s]2025-05-26 05:29:28,497 - INFO - [Epoch 083 | Batch 0050] IWAE-loss 3860.5254 | mean log_px -0.0104 | KL -3132.13 + 52it [00:01, 30.29it/s] 56it [00:01, 30.30it/s] 60it [00:02, 30.25it/s] 64it [00:02, 29.90it/s] 67it [00:02, 29.51it/s] 71it [00:02, 29.94it/s] 74it [00:02, 29.81it/s] 78it [00:02, 30.49it/s] 82it [00:02, 30.50it/s] 86it [00:02, 30.40it/s] 90it [00:03, 30.35it/s] 94it [00:03, 30.19it/s] 98it [00:03, 30.18it/s]2025-05-26 05:29:30,157 - INFO - [Epoch 083 | Batch 0100] IWAE-loss 3594.4180 | mean log_px -0.0066 | KL -3132.04 + 102it [00:03, 30.17it/s] 106it [00:03, 29.45it/s] 110it [00:03, 29.72it/s] 114it [00:03, 30.40it/s] 118it [00:03, 30.22it/s] 122it [00:04, 30.20it/s] 126it [00:04, 30.26it/s] 130it [00:04, 29.89it/s] 134it [00:04, 29.68it/s] 138it [00:04, 30.41it/s] 142it [00:04, 29.97it/s] 146it [00:04, 30.42it/s] 150it [00:05, 29.79it/s]2025-05-26 05:29:31,811 - INFO - [Epoch 083 | Batch 0150] IWAE-loss 4050.9419 | mean log_px -0.0132 | KL -3127.14 + 153it [00:05, 29.84it/s] 157it [00:05, 30.17it/s] 161it [00:05, 29.96it/s] 164it [00:05, 29.82it/s] 168it [00:05, 30.37it/s] 172it [00:05, 29.81it/s] 175it [00:05, 29.37it/s] 179it [00:06, 29.86it/s] 182it [00:06, 29.40it/s] 186it [00:06, 29.79it/s] 190it [00:06, 29.89it/s] 193it [00:06, 29.74it/s] 196it [00:06, 29.49it/s] +2025-05-26 05:29:33,393 - INFO - Epoch: 83, Objective: tensor([4091.2358], device='cuda:0', grad_fn=), Loss: 0.012145907618105412, KL/n: 63.854610443115234 + 0it [00:00, ?it/s]2025-05-26 05:29:33,609 - INFO - [Epoch 084 | Batch 0000] IWAE-loss 3726.4863 | mean log_px -0.0086 | KL -3123.17 + 1it [00:00, 9.55it/s] 4it [00:00, 20.85it/s] 8it [00:00, 25.95it/s] 11it [00:00, 27.35it/s] 14it [00:00, 28.07it/s] 18it [00:00, 28.83it/s] 22it [00:00, 29.53it/s] 25it [00:00, 29.49it/s] 29it [00:01, 29.93it/s] 32it [00:01, 29.77it/s] 36it [00:01, 30.44it/s] 40it [00:01, 30.27it/s] 44it [00:01, 30.22it/s] 48it [00:01, 30.20it/s]2025-05-26 05:29:35,277 - INFO - [Epoch 084 | Batch 0050] IWAE-loss 3458.3462 | mean log_px -0.0048 | KL -3125.33 + 52it [00:01, 29.51it/s] 56it [00:01, 29.78it/s] 60it [00:02, 30.20it/s] 64it [00:02, 30.51it/s] 68it [00:02, 30.00it/s] 72it [00:02, 30.55it/s] 76it [00:02, 30.51it/s] 80it [00:02, 30.46it/s] 84it [00:02, 30.35it/s] 88it [00:02, 30.41it/s] 92it [00:03, 29.77it/s] 95it [00:03, 29.10it/s] 98it [00:03, 29.32it/s]2025-05-26 05:29:36,939 - INFO - [Epoch 084 | Batch 0100] IWAE-loss 4976.4111 | mean log_px -0.0265 | KL -3121.79 + 102it [00:03, 30.20it/s] 106it [00:03, 29.87it/s] 110it [00:03, 29.85it/s] 114it [00:03, 30.57it/s] 118it [00:03, 30.21it/s] 122it [00:04, 30.07it/s] 126it [00:04, 30.76it/s] 130it [00:04, 30.71it/s] 134it [00:04, 30.33it/s] 138it [00:04, 30.23it/s] 142it [00:04, 30.24it/s] 146it [00:04, 30.74it/s] 150it [00:05, 30.34it/s]2025-05-26 05:29:38,583 - INFO - [Epoch 084 | Batch 0150] IWAE-loss 4088.7295 | mean log_px -0.0139 | KL -3118.40 + 154it [00:05, 30.22it/s] 158it [00:05, 30.74it/s] 162it [00:05, 30.32it/s] 166it [00:05, 30.11it/s] 170it [00:05, 30.81it/s] 174it [00:05, 30.73it/s] 178it [00:05, 30.41it/s] 182it [00:06, 30.24it/s] 186it [00:06, 30.18it/s] 190it [00:06, 30.85it/s] 194it [00:06, 30.38it/s] 196it [00:06, 29.62it/s] +2025-05-26 05:29:40,135 - INFO - Epoch: 84, Objective: tensor([3801.6511], device='cuda:0', grad_fn=), Loss: 0.011263754218816757, KL/n: 63.63286590576172 + 0it [00:00, ?it/s]2025-05-26 05:29:40,510 - INFO - [Epoch 085 | Batch 0000] IWAE-loss 3941.2964 | mean log_px -0.0119 | KL -3110.52 + 2it [00:00, 15.48it/s] 6it [00:00, 24.44it/s] 9it [00:00, 26.51it/s] 13it [00:00, 27.50it/s] 17it [00:00, 28.94it/s] 21it [00:00, 29.45it/s] 25it [00:00, 30.05it/s] 29it [00:01, 30.28it/s] 33it [00:01, 30.04it/s] 37it [00:01, 29.56it/s] 41it [00:01, 30.13it/s] 45it [00:01, 30.54it/s] 49it [00:01, 30.49it/s]2025-05-26 05:29:42,165 - INFO - [Epoch 085 | Batch 0050] IWAE-loss 4162.5371 | mean log_px -0.0150 | KL -3114.51 + 53it [00:01, 30.10it/s] 57it [00:01, 30.25it/s] 61it [00:02, 30.74it/s] 65it [00:02, 30.47it/s] 69it [00:02, 30.56it/s] 73it [00:02, 30.56it/s] 77it [00:02, 30.91it/s] 81it [00:02, 30.82it/s] 85it [00:02, 30.22it/s] 89it [00:02, 30.65it/s] 93it [00:03, 30.96it/s] 97it [00:03, 30.87it/s]2025-05-26 05:29:43,794 - INFO - [Epoch 085 | Batch 0100] IWAE-loss 4253.9092 | mean log_px -0.0163 | KL -3112.00 + 101it [00:03, 30.43it/s] 105it [00:03, 30.66it/s] 109it [00:03, 30.21it/s] 113it [00:03, 30.04it/s] 117it [00:03, 30.21it/s] 121it [00:04, 30.56it/s] 125it [00:04, 29.88it/s] 128it [00:04, 29.73it/s] 132it [00:04, 29.91it/s] 136it [00:04, 30.37it/s] 140it [00:04, 30.37it/s] 144it [00:04, 30.30it/s] 148it [00:04, 30.04it/s]2025-05-26 05:29:45,454 - INFO - [Epoch 085 | Batch 0150] IWAE-loss 3706.9902 | mean log_px -0.0086 | KL -3108.36 + 152it [00:05, 30.16it/s] 156it [00:05, 30.49it/s] 160it [00:05, 30.18it/s] 164it [00:05, 30.24it/s] 168it [00:05, 30.60it/s] 172it [00:05, 30.26it/s] 176it [00:05, 30.56it/s] 180it [00:05, 30.52it/s] 184it [00:06, 30.20it/s] 188it [00:06, 30.27it/s] 192it [00:06, 30.07it/s] 196it [00:06, 29.93it/s] 196it [00:06, 29.73it/s] +2025-05-26 05:29:47,021 - INFO - Epoch: 85, Objective: tensor([4067.0212], device='cuda:0', grad_fn=), Loss: 0.014330035075545311, KL/n: 63.40304946899414 + 0it [00:00, ?it/s]2025-05-26 05:29:47,214 - INFO - [Epoch 086 | Batch 0000] IWAE-loss 4068.9893 | mean log_px -0.0138 | KL -3106.09 + 2it [00:00, 18.40it/s] 5it [00:00, 24.78it/s] 8it [00:00, 26.47it/s] 12it [00:00, 28.34it/s] 15it [00:00, 28.21it/s] 19it [00:00, 29.04it/s] 23it [00:00, 29.57it/s] 26it [00:00, 28.73it/s] 30it [00:01, 28.78it/s] 33it [00:01, 29.04it/s] 36it [00:01, 28.86it/s] 39it [00:01, 28.89it/s] 43it [00:01, 29.64it/s] 46it [00:01, 29.73it/s] 49it [00:01, 29.15it/s]2025-05-26 05:29:48,918 - INFO - [Epoch 086 | Batch 0050] IWAE-loss 3675.7251 | mean log_px -0.0082 | KL -3102.51 + 52it [00:01, 29.30it/s] 56it [00:01, 29.63it/s] 59it [00:02, 29.70it/s] 62it [00:02, 29.28it/s] 65it [00:02, 29.14it/s] 69it [00:02, 29.98it/s] 73it [00:02, 29.90it/s] 76it [00:02, 29.68it/s] 79it [00:02, 29.63it/s] 83it [00:02, 29.62it/s] 87it [00:02, 29.65it/s] 91it [00:03, 30.27it/s] 95it [00:03, 29.64it/s] 99it [00:03, 29.69it/s]2025-05-26 05:29:50,591 - INFO - [Epoch 086 | Batch 0100] IWAE-loss 3924.1753 | mean log_px -0.0118 | KL -3100.22 + 103it [00:03, 30.05it/s] 107it [00:03, 30.27it/s] 111it [00:03, 29.90it/s] 114it [00:03, 29.65it/s] 118it [00:04, 30.08it/s] 122it [00:04, 30.33it/s] 126it [00:04, 29.94it/s] 130it [00:04, 30.23it/s] 134it [00:04, 29.69it/s] 138it [00:04, 30.27it/s] 142it [00:04, 30.00it/s] 146it [00:04, 30.32it/s] 150it [00:05, 29.88it/s]2025-05-26 05:29:52,260 - INFO - [Epoch 086 | Batch 0150] IWAE-loss 3893.2014 | mean log_px -0.0114 | KL -3093.64 + 153it [00:05, 29.88it/s] 157it [00:05, 29.95it/s] 161it [00:05, 30.07it/s] 165it [00:05, 30.19it/s] 169it [00:05, 30.04it/s] 173it [00:05, 30.13it/s] 177it [00:05, 30.09it/s] 181it [00:06, 30.11it/s] 185it [00:06, 30.03it/s] 189it [00:06, 30.09it/s] 193it [00:06, 30.13it/s] 196it [00:06, 29.32it/s] +2025-05-26 05:29:53,835 - INFO - Epoch: 86, Objective: tensor([4236.9863], device='cuda:0', grad_fn=), Loss: 0.012787101790308952, KL/n: 63.176753997802734 + 0it [00:00, ?it/s]2025-05-26 05:29:54,350 - INFO - [Epoch 087 | Batch 0000] IWAE-loss 4358.9453 | mean log_px -0.0181 | KL -3089.78 + 1it [00:00, 4.28it/s] 4it [00:00, 13.66it/s] 8it [00:00, 21.00it/s] 11it [00:00, 23.34it/s] 14it [00:00, 25.24it/s] 17it [00:00, 26.00it/s] 20it [00:00, 26.35it/s] 23it [00:00, 27.11it/s] 26it [00:01, 26.63it/s] 29it [00:01, 27.14it/s] 32it [00:01, 26.41it/s] 35it [00:01, 26.68it/s] 38it [00:01, 27.28it/s] 41it [00:01, 27.95it/s] 45it [00:01, 29.40it/s] 48it [00:01, 28.99it/s]2025-05-26 05:29:56,100 - INFO - [Epoch 087 | Batch 0050] IWAE-loss 3764.6992 | mean log_px -0.0097 | KL -3087.79 + 52it [00:02, 29.63it/s] 56it [00:02, 30.13it/s] 60it [00:02, 29.71it/s] 64it [00:02, 30.26it/s] 68it [00:02, 30.28it/s] 72it [00:02, 30.28it/s] 76it [00:02, 30.22it/s] 80it [00:02, 30.18it/s] 84it [00:03, 30.16it/s] 88it [00:03, 29.94it/s] 92it [00:03, 30.26it/s] 96it [00:03, 30.10it/s] 100it [00:03, 30.06it/s]2025-05-26 05:29:57,756 - INFO - [Epoch 087 | Batch 0100] IWAE-loss 4102.3193 | mean log_px -0.0145 | KL -3086.62 + 104it [00:03, 29.79it/s] 108it [00:03, 30.27it/s] 112it [00:04, 30.32it/s] 116it [00:04, 30.36it/s] 120it [00:04, 30.30it/s] 124it [00:04, 30.31it/s] 128it [00:04, 30.27it/s] 132it [00:04, 30.26it/s] 136it [00:04, 30.26it/s] 140it [00:04, 30.29it/s] 144it [00:05, 29.94it/s] 147it [00:05, 29.62it/s]2025-05-26 05:29:59,409 - INFO - [Epoch 087 | Batch 0150] IWAE-loss 3752.8010 | mean log_px -0.0095 | KL -3086.34 + 151it [00:05, 30.35it/s] 155it [00:05, 30.40it/s] 159it [00:05, 30.37it/s] 163it [00:05, 30.25it/s] 167it [00:05, 30.19it/s] 171it [00:05, 30.20it/s] 175it [00:06, 30.22it/s] 179it [00:06, 30.24it/s] 183it [00:06, 30.26it/s] 187it [00:06, 29.94it/s] 191it [00:06, 30.30it/s] 195it [00:06, 28.69it/s] 196it [00:06, 28.63it/s] +2025-05-26 05:30:00,977 - INFO - Epoch: 87, Objective: tensor([4625.4038], device='cuda:0', grad_fn=), Loss: 0.026148444041609764, KL/n: 62.9666748046875 + 0it [00:00, ?it/s]2025-05-26 05:30:01,362 - INFO - [Epoch 088 | Batch 0000] IWAE-loss 3669.1304 | mean log_px -0.0084 | KL -3084.35 + 2it [00:00, 15.66it/s] 6it [00:00, 24.23it/s] 10it [00:00, 27.07it/s] 13it [00:00, 27.64it/s] 16it [00:00, 28.10it/s] 19it [00:00, 28.54it/s] 22it [00:00, 27.32it/s] 26it [00:00, 27.56it/s] 29it [00:01, 27.78it/s] 33it [00:01, 29.17it/s] 36it [00:01, 28.94it/s] 40it [00:01, 29.23it/s] 44it [00:01, 30.27it/s] 48it [00:01, 29.73it/s]2025-05-26 05:30:03,082 - INFO - [Epoch 088 | Batch 0050] IWAE-loss 3723.8115 | mean log_px -0.0092 | KL -3081.36 + 51it [00:01, 28.46it/s] 55it [00:01, 28.91it/s] 59it [00:02, 29.24it/s] 63it [00:02, 29.76it/s] 67it [00:02, 29.91it/s] 71it [00:02, 29.78it/s] 75it [00:02, 30.62it/s] 79it [00:02, 30.66it/s] 83it [00:02, 30.19it/s] 87it [00:03, 30.26it/s] 91it [00:03, 30.34it/s] 95it [00:03, 30.36it/s] 99it [00:03, 30.72it/s]2025-05-26 05:30:04,733 - INFO - [Epoch 088 | Batch 0100] IWAE-loss 4192.2432 | mean log_px -0.0159 | KL -3077.38 + 103it [00:03, 30.18it/s] 107it [00:03, 30.21it/s] 111it [00:03, 30.24it/s] 115it [00:03, 30.16it/s] 119it [00:04, 30.81it/s] 123it [00:04, 30.68it/s] 127it [00:04, 30.59it/s] 131it [00:04, 29.98it/s] 135it [00:04, 29.99it/s] 139it [00:04, 30.39it/s] 143it [00:04, 30.74it/s] 147it [00:04, 30.64it/s]2025-05-26 05:30:06,371 - INFO - [Epoch 088 | Batch 0150] IWAE-loss 3817.7671 | mean log_px -0.0106 | KL -3075.39 + 151it [00:05, 30.54it/s] 155it [00:05, 30.60it/s] 159it [00:05, 30.50it/s] 163it [00:05, 30.40it/s] 167it [00:05, 29.55it/s] 171it [00:05, 29.68it/s] 175it [00:05, 30.42it/s] 179it [00:06, 30.33it/s] 183it [00:06, 30.44it/s] 187it [00:06, 30.11it/s] 191it [00:06, 30.00it/s] 195it [00:06, 28.88it/s] 196it [00:06, 29.39it/s] +2025-05-26 05:30:07,950 - INFO - Epoch: 88, Objective: tensor([3927.5105], device='cuda:0', grad_fn=), Loss: 0.013497211039066315, KL/n: 62.73975372314453 + 0it [00:00, ?it/s]2025-05-26 05:30:08,163 - INFO - [Epoch 089 | Batch 0000] IWAE-loss 4610.1006 | mean log_px -0.0220 | KL -3071.57 + 2it [00:00, 15.82it/s] 5it [00:00, 22.24it/s] 9it [00:00, 26.03it/s] 13it [00:00, 28.12it/s] 16it [00:00, 28.14it/s] 20it [00:00, 28.76it/s] 24it [00:00, 29.75it/s] 27it [00:00, 29.24it/s] 30it [00:01, 29.27it/s] 34it [00:01, 29.47it/s] 38it [00:01, 30.20it/s] 42it [00:01, 30.13it/s] 46it [00:01, 29.42it/s] 49it [00:01, 29.41it/s]2025-05-26 05:30:09,851 - INFO - [Epoch 089 | Batch 0050] IWAE-loss 3911.0552 | mean log_px -0.0120 | KL -3070.09 + 53it [00:01, 29.51it/s] 56it [00:01, 29.40it/s] 60it [00:02, 29.57it/s] 64it [00:02, 29.83it/s] 67it [00:02, 29.67it/s] 71it [00:02, 29.96it/s] 75it [00:02, 30.15it/s] 79it [00:02, 29.76it/s] 83it [00:02, 30.15it/s] 87it [00:02, 30.17it/s] 91it [00:03, 30.14it/s] 95it [00:03, 29.42it/s] 99it [00:03, 30.20it/s]2025-05-26 05:30:11,521 - INFO - [Epoch 089 | Batch 0100] IWAE-loss 3895.0288 | mean log_px -0.0118 | KL -3070.19 + 103it [00:03, 30.05it/s] 107it [00:03, 30.04it/s] 111it [00:03, 29.98it/s] 115it [00:03, 29.41it/s] 119it [00:04, 29.57it/s] 123it [00:04, 30.14it/s] 127it [00:04, 30.10it/s] 131it [00:04, 30.11it/s] 135it [00:04, 30.12it/s] 139it [00:04, 29.98it/s] 142it [00:04, 29.48it/s] 146it [00:04, 30.28it/s] 150it [00:05, 30.26it/s]2025-05-26 05:30:13,182 - INFO - [Epoch 089 | Batch 0150] IWAE-loss 4188.3027 | mean log_px -0.0160 | KL -3065.17 + 154it [00:05, 29.95it/s] 158it [00:05, 30.26it/s] 162it [00:05, 30.32it/s] 166it [00:05, 29.52it/s] 170it [00:05, 30.20it/s] 174it [00:05, 29.89it/s] 178it [00:06, 29.98it/s] 182it [00:06, 30.06it/s] 186it [00:06, 30.30it/s] 190it [00:06, 30.40it/s] 194it [00:06, 29.84it/s] 196it [00:06, 29.37it/s] +2025-05-26 05:30:14,753 - INFO - Epoch: 89, Objective: tensor([5425.4277], device='cuda:0', grad_fn=), Loss: 0.03324078023433685, KL/n: 62.52193069458008 + 0it [00:00, ?it/s]2025-05-26 05:30:15,145 - INFO - [Epoch 090 | Batch 0000] IWAE-loss 3676.2129 | mean log_px -0.0088 | KL -3063.65 + 1it [00:00, 9.84it/s] 4it [00:00, 20.79it/s] 8it [00:00, 26.49it/s] 12it [00:00, 28.01it/s] 15it [00:00, 27.93it/s] 19it [00:00, 29.00it/s] 23it [00:00, 29.32it/s] 27it [00:00, 29.70it/s] 31it [00:01, 29.87it/s] 35it [00:01, 29.98it/s] 39it [00:01, 30.04it/s] 42it [00:01, 30.01it/s] 46it [00:01, 30.30it/s] 50it [00:01, 30.21it/s]2025-05-26 05:30:16,806 - INFO - [Epoch 090 | Batch 0050] IWAE-loss 3673.1714 | mean log_px -0.0088 | KL -3056.10 + 54it [00:01, 29.63it/s] 58it [00:01, 30.23it/s] 62it [00:02, 30.40it/s] 66it [00:02, 30.36it/s] 70it [00:02, 30.29it/s] 74it [00:02, 29.71it/s] 78it [00:02, 30.10it/s] 82it [00:02, 30.36it/s] 86it [00:02, 30.25it/s] 90it [00:03, 29.81it/s] 94it [00:03, 29.79it/s] 97it [00:03, 29.63it/s]2025-05-26 05:30:18,466 - INFO - [Epoch 090 | Batch 0100] IWAE-loss 3575.1206 | mean log_px -0.0074 | KL -3054.40 + 101it [00:03, 30.47it/s] 105it [00:03, 29.92it/s] 109it [00:03, 29.98it/s] 113it [00:03, 30.16it/s] 117it [00:03, 31.05it/s] 121it [00:04, 30.25it/s] 125it [00:04, 30.48it/s] 129it [00:04, 30.92it/s] 133it [00:04, 29.97it/s] 137it [00:04, 29.90it/s] 140it [00:04, 29.49it/s] 143it [00:04, 28.78it/s] 147it [00:04, 29.91it/s]2025-05-26 05:30:20,140 - INFO - [Epoch 090 | Batch 0150] IWAE-loss 4007.3735 | mean log_px -0.0137 | KL -3051.20 + 151it [00:05, 29.45it/s] 155it [00:05, 29.87it/s] 158it [00:05, 29.86it/s] 162it [00:05, 30.49it/s] 166it [00:05, 29.87it/s] 170it [00:05, 29.85it/s] 174it [00:05, 30.42it/s] 178it [00:05, 30.75it/s] 182it [00:06, 30.39it/s] 186it [00:06, 30.16it/s] 190it [00:06, 29.63it/s] 194it [00:06, 30.35it/s] 196it [00:06, 29.47it/s] +2025-05-26 05:30:21,708 - INFO - Epoch: 90, Objective: tensor([4207.4912], device='cuda:0', grad_fn=), Loss: 0.01723044365644455, KL/n: 62.30411911010742 + 0it [00:00, ?it/s]2025-05-26 05:30:21,901 - INFO - [Epoch 091 | Batch 0000] IWAE-loss 3952.2444 | mean log_px -0.0129 | KL -3050.70 + 2it [00:00, 18.05it/s] 5it [00:00, 23.50it/s] 9it [00:00, 27.01it/s] 12it [00:00, 27.93it/s] 16it [00:00, 28.74it/s] 19it [00:00, 28.99it/s] 23it [00:00, 29.45it/s] 26it [00:00, 29.48it/s] 30it [00:01, 29.80it/s] 34it [00:01, 30.25it/s] 38it [00:01, 30.16it/s] 42it [00:01, 30.23it/s] 46it [00:01, 29.71it/s] 50it [00:01, 30.22it/s]2025-05-26 05:30:23,570 - INFO - [Epoch 091 | Batch 0050] IWAE-loss 3891.5623 | mean log_px -0.0121 | KL -3045.28 + 54it [00:01, 29.82it/s] 58it [00:01, 30.37it/s] 62it [00:02, 29.91it/s] 66it [00:02, 30.38it/s] 70it [00:02, 29.94it/s] 73it [00:02, 29.79it/s] 77it [00:02, 30.04it/s] 81it [00:02, 30.48it/s] 85it [00:02, 30.40it/s] 89it [00:03, 30.34it/s] 93it [00:03, 29.82it/s] 97it [00:03, 30.35it/s]2025-05-26 05:30:25,227 - INFO - [Epoch 091 | Batch 0100] IWAE-loss 4361.3638 | mean log_px -0.0188 | KL -3045.56 + 101it [00:03, 30.28it/s] 105it [00:03, 29.77it/s] 109it [00:03, 30.32it/s] 113it [00:03, 29.79it/s] 117it [00:03, 30.25it/s] 121it [00:04, 29.85it/s] 124it [00:04, 29.70it/s] 128it [00:04, 30.53it/s] 132it [00:04, 30.37it/s] 136it [00:04, 29.87it/s] 140it [00:04, 30.07it/s] 144it [00:04, 30.58it/s] 148it [00:04, 30.44it/s]2025-05-26 05:30:26,889 - INFO - [Epoch 091 | Batch 0150] IWAE-loss 4017.5464 | mean log_px -0.0139 | KL -3046.43 + 152it [00:05, 29.90it/s] 156it [00:05, 30.47it/s] 160it [00:05, 29.74it/s] 164it [00:05, 30.02it/s] 168it [00:05, 30.53it/s] 172it [00:05, 29.92it/s] 175it [00:05, 29.92it/s] 179it [00:06, 29.70it/s] 183it [00:06, 29.85it/s] 187it [00:06, 30.48it/s] 191it [00:06, 30.53it/s] 195it [00:06, 28.81it/s] 196it [00:06, 29.59it/s] +2025-05-26 05:30:28,455 - INFO - Epoch: 91, Objective: tensor([4768.0332], device='cuda:0', grad_fn=), Loss: 0.024673206731677055, KL/n: 62.10816955566406 + 0it [00:00, ?it/s]2025-05-26 05:30:28,673 - INFO - [Epoch 092 | Batch 0000] IWAE-loss 4199.7969 | mean log_px -0.0165 | KL -3043.09 + 1it [00:00, 9.93it/s] 4it [00:00, 20.66it/s] 8it [00:00, 25.72it/s] 11it [00:00, 27.03it/s] 15it [00:00, 28.03it/s] 19it [00:00, 29.22it/s] 23it [00:00, 29.51it/s] 26it [00:00, 28.94it/s] 30it [00:01, 29.37it/s] 33it [00:01, 29.02it/s] 36it [00:01, 28.97it/s] 40it [00:01, 29.12it/s] 44it [00:01, 29.36it/s] 48it [00:01, 30.02it/s]2025-05-26 05:30:30,372 - INFO - [Epoch 092 | Batch 0050] IWAE-loss 3716.8953 | mean log_px -0.0097 | KL -3039.14 + 51it [00:01, 29.14it/s] 55it [00:01, 29.42it/s] 58it [00:02, 29.14it/s] 61it [00:02, 29.34it/s] 64it [00:02, 29.27it/s] 67it [00:02, 29.28it/s] 71it [00:02, 29.72it/s] 74it [00:02, 29.50it/s] 78it [00:02, 29.77it/s] 81it [00:02, 29.50it/s] 85it [00:02, 29.67it/s] 89it [00:03, 29.85it/s] 93it [00:03, 30.15it/s] 97it [00:03, 30.14it/s]2025-05-26 05:30:32,052 - INFO - [Epoch 092 | Batch 0100] IWAE-loss 5064.5151 | mean log_px -0.0290 | KL -3037.68 + 101it [00:03, 29.95it/s] 104it [00:03, 29.23it/s] 108it [00:03, 29.67it/s] 111it [00:03, 29.53it/s] 115it [00:03, 30.14it/s] 119it [00:04, 29.97it/s] 122it [00:04, 29.28it/s] 125it [00:04, 29.16it/s] 129it [00:04, 29.65it/s] 132it [00:04, 29.44it/s] 136it [00:04, 29.43it/s] 140it [00:04, 29.79it/s] 143it [00:04, 29.53it/s] 147it [00:05, 29.53it/s]2025-05-26 05:30:33,743 - INFO - [Epoch 092 | Batch 0150] IWAE-loss 4017.4958 | mean log_px -0.0140 | KL -3035.12 + 151it [00:05, 29.79it/s] 154it [00:05, 29.57it/s] 158it [00:05, 29.79it/s] 161it [00:05, 29.53it/s] 165it [00:05, 29.56it/s] 169it [00:05, 29.80it/s] 172it [00:05, 29.75it/s] 175it [00:05, 29.27it/s] 178it [00:06, 29.25it/s] 181it [00:06, 29.27it/s] 185it [00:06, 29.64it/s] 188it [00:06, 29.10it/s] 192it [00:06, 29.55it/s] 195it [00:06, 28.51it/s] 196it [00:06, 29.03it/s] +2025-05-26 05:30:35,338 - INFO - Epoch: 92, Objective: tensor([3728.2188], device='cuda:0', grad_fn=), Loss: 0.00990612618625164, KL/n: 61.91209030151367 + 0it [00:00, ?it/s]2025-05-26 05:30:35,721 - INFO - [Epoch 093 | Batch 0000] IWAE-loss 3929.0991 | mean log_px -0.0129 | KL -3029.58 + 2it [00:00, 15.72it/s] 5it [00:00, 23.10it/s] 8it [00:00, 25.56it/s] 12it [00:00, 27.56it/s] 15it [00:00, 28.29it/s] 19it [00:00, 28.99it/s] 22it [00:00, 29.26it/s] 26it [00:00, 29.58it/s] 29it [00:01, 29.68it/s] 32it [00:01, 29.74it/s] 36it [00:01, 30.25it/s] 40it [00:01, 29.56it/s] 44it [00:01, 29.99it/s] 48it [00:01, 30.35it/s]2025-05-26 05:30:37,388 - INFO - [Epoch 093 | Batch 0050] IWAE-loss 3707.9614 | mean log_px -0.0096 | KL -3034.37 + 52it [00:01, 30.37it/s] 56it [00:01, 29.71it/s] 60it [00:02, 29.75it/s] 64it [00:02, 30.44it/s] 68it [00:02, 29.93it/s] 72it [00:02, 30.36it/s] 76it [00:02, 29.77it/s] 80it [00:02, 29.95it/s] 84it [00:02, 30.30it/s] 88it [00:02, 29.92it/s] 92it [00:03, 30.30it/s] 96it [00:03, 30.18it/s] 100it [00:03, 29.58it/s]2025-05-26 05:30:39,048 - INFO - [Epoch 093 | Batch 0100] IWAE-loss 4339.8755 | mean log_px -0.0188 | KL -3026.79 + 104it [00:03, 29.64it/s] 108it [00:03, 30.30it/s] 112it [00:03, 30.36it/s] 116it [00:03, 29.92it/s] 120it [00:04, 30.08it/s] 124it [00:04, 30.27it/s] 128it [00:04, 29.62it/s] 132it [00:04, 30.18it/s] 136it [00:04, 30.18it/s] 140it [00:04, 29.57it/s] 144it [00:04, 29.83it/s] 147it [00:04, 29.70it/s]2025-05-26 05:30:40,720 - INFO - [Epoch 093 | Batch 0150] IWAE-loss 4476.9248 | mean log_px -0.0208 | KL -3023.78 + 151it [00:05, 29.64it/s] 155it [00:05, 29.84it/s] 159it [00:05, 30.47it/s] 163it [00:05, 30.23it/s] 167it [00:05, 29.83it/s] 170it [00:05, 29.31it/s] 173it [00:05, 29.45it/s] 177it [00:05, 29.64it/s] 181it [00:06, 29.76it/s] 184it [00:06, 29.73it/s] 187it [00:06, 29.77it/s] 191it [00:06, 29.83it/s] 194it [00:06, 29.82it/s] 196it [00:06, 29.35it/s] +2025-05-26 05:30:42,312 - INFO - Epoch: 93, Objective: tensor([3971.8271], device='cuda:0', grad_fn=), Loss: 0.013218323700129986, KL/n: 61.70732498168945 + 0it [00:00, ?it/s]2025-05-26 05:30:42,519 - INFO - [Epoch 094 | Batch 0000] IWAE-loss 3692.0515 | mean log_px -0.0096 | KL -3019.28 + 2it [00:00, 15.88it/s] 5it [00:00, 22.67it/s] 8it [00:00, 25.54it/s] 12it [00:00, 27.75it/s] 15it [00:00, 27.72it/s] 19it [00:00, 29.22it/s] 22it [00:00, 28.82it/s] 26it [00:00, 29.33it/s] 29it [00:01, 29.30it/s] 33it [00:01, 30.08it/s] 36it [00:01, 29.45it/s] 40it [00:01, 30.09it/s] 43it [00:01, 29.58it/s] 47it [00:01, 29.84it/s] 50it [00:01, 29.83it/s]2025-05-26 05:30:44,196 - INFO - [Epoch 094 | Batch 0050] IWAE-loss 3415.6335 | mean log_px -0.0057 | KL -3018.58 + 53it [00:01, 29.74it/s] 56it [00:01, 29.65it/s] 60it [00:02, 30.24it/s] 64it [00:02, 30.15it/s] 68it [00:02, 30.05it/s] 72it [00:02, 30.02it/s] 76it [00:02, 29.58it/s] 79it [00:02, 29.48it/s] 83it [00:02, 29.66it/s] 87it [00:02, 29.99it/s] 90it [00:03, 29.37it/s] 94it [00:03, 29.64it/s] 98it [00:03, 30.30it/s]2025-05-26 05:30:45,879 - INFO - [Epoch 094 | Batch 0100] IWAE-loss 4501.3726 | mean log_px -0.0212 | KL -3014.79 + 102it [00:03, 30.04it/s] 106it [00:03, 29.65it/s] 109it [00:03, 29.53it/s] 113it [00:03, 30.09it/s] 117it [00:03, 30.06it/s] 121it [00:04, 30.18it/s] 125it [00:04, 29.47it/s] 129it [00:04, 30.24it/s] 133it [00:04, 30.10it/s] 137it [00:04, 29.69it/s] 140it [00:04, 29.74it/s] 143it [00:04, 29.64it/s] 147it [00:04, 29.72it/s]2025-05-26 05:30:47,544 - INFO - [Epoch 094 | Batch 0150] IWAE-loss 4486.3765 | mean log_px -0.0210 | KL -3018.51 + 151it [00:05, 29.99it/s] 154it [00:05, 29.45it/s] 158it [00:05, 29.74it/s] 161it [00:05, 29.48it/s] 164it [00:05, 29.57it/s] 167it [00:05, 29.26it/s] 171it [00:05, 29.99it/s] 174it [00:05, 29.34it/s] 178it [00:06, 29.50it/s] 182it [00:06, 30.11it/s] 186it [00:06, 29.30it/s] 190it [00:06, 30.09it/s] 194it [00:06, 29.95it/s] 196it [00:06, 29.25it/s] +2025-05-26 05:30:49,137 - INFO - Epoch: 94, Objective: tensor([3698.0793], device='cuda:0', grad_fn=), Loss: 0.011440644972026348, KL/n: 61.510562896728516 + 0it [00:00, ?it/s]2025-05-26 05:30:49,515 - INFO - [Epoch 095 | Batch 0000] IWAE-loss 3977.1692 | mean log_px -0.0138 | KL -3011.00 + 2it [00:00, 15.20it/s] 5it [00:00, 21.63it/s] 9it [00:00, 25.68it/s] 12it [00:00, 26.94it/s] 15it [00:00, 27.90it/s] 18it [00:00, 28.48it/s] 21it [00:00, 28.88it/s] 25it [00:00, 29.61it/s] 28it [00:01, 28.69it/s] 32it [00:01, 28.86it/s] 36it [00:01, 29.24it/s] 39it [00:01, 28.50it/s] 43it [00:01, 29.12it/s] 46it [00:01, 27.59it/s] 49it [00:01, 27.79it/s]2025-05-26 05:30:51,253 - INFO - [Epoch 095 | Batch 0050] IWAE-loss 4243.2178 | mean log_px -0.0177 | KL -3007.56 + 52it [00:01, 28.04it/s] 55it [00:01, 28.18it/s] 59it [00:02, 28.63it/s] 63it [00:02, 29.17it/s] 67it [00:02, 29.66it/s] 70it [00:02, 29.03it/s] 73it [00:02, 29.16it/s] 77it [00:02, 29.77it/s] 80it [00:02, 28.96it/s] 83it [00:02, 29.02it/s] 87it [00:03, 29.70it/s] 90it [00:03, 29.13it/s] 93it [00:03, 28.78it/s] 97it [00:03, 29.32it/s] 100it [00:03, 29.38it/s]2025-05-26 05:30:52,962 - INFO - [Epoch 095 | Batch 0100] IWAE-loss 4067.2896 | mean log_px -0.0152 | KL -3005.44 + 103it [00:03, 29.02it/s] 106it [00:03, 29.08it/s] 110it [00:03, 29.56it/s] 113it [00:03, 29.44it/s] 117it [00:04, 29.58it/s] 121it [00:04, 30.18it/s] 125it [00:04, 30.21it/s] 129it [00:04, 29.49it/s] 133it [00:04, 30.07it/s] 137it [00:04, 30.00it/s] 141it [00:04, 29.94it/s] 144it [00:04, 29.49it/s] 147it [00:05, 29.41it/s] 150it [00:05, 29.48it/s]2025-05-26 05:30:54,642 - INFO - [Epoch 095 | Batch 0150] IWAE-loss 4149.8564 | mean log_px -0.0164 | KL -3004.71 + 153it [00:05, 29.27it/s] 157it [00:05, 30.15it/s] 161it [00:05, 30.04it/s] 164it [00:05, 29.39it/s] 168it [00:05, 29.47it/s] 171it [00:05, 28.83it/s] 174it [00:06, 29.02it/s] 177it [00:06, 28.48it/s] 181it [00:06, 29.15it/s] 185it [00:06, 29.38it/s] 189it [00:06, 29.88it/s] 192it [00:06, 29.26it/s] 195it [00:06, 28.61it/s] 196it [00:06, 28.74it/s] +2025-05-26 05:30:56,249 - INFO - Epoch: 95, Objective: tensor([3720.6602], device='cuda:0', grad_fn=), Loss: 0.011292683891952038, KL/n: 61.2777214050293 + 0it [00:00, ?it/s]2025-05-26 05:30:56,469 - INFO - [Epoch 096 | Batch 0000] IWAE-loss 3823.0386 | mean log_px -0.0118 | KL -2996.26 + 1it [00:00, 9.15it/s] 4it [00:00, 19.87it/s] 8it [00:00, 25.18it/s] 11it [00:00, 26.43it/s] 15it [00:00, 28.07it/s] 19it [00:00, 28.96it/s] 22it [00:00, 28.61it/s] 26it [00:00, 29.31it/s] 29it [00:01, 28.84it/s] 32it [00:01, 29.08it/s] 36it [00:01, 29.29it/s] 40it [00:01, 29.61it/s] 43it [00:01, 28.93it/s] 47it [00:01, 29.15it/s]2025-05-26 05:30:58,171 - INFO - [Epoch 096 | Batch 0050] IWAE-loss 4019.6848 | mean log_px -0.0146 | KL -2995.68 + 51it [00:01, 29.36it/s] 55it [00:01, 29.73it/s] 58it [00:02, 29.05it/s] 62it [00:02, 29.29it/s] 65it [00:02, 28.81it/s] 69it [00:02, 29.16it/s] 72it [00:02, 28.95it/s] 75it [00:02, 29.10it/s] 78it [00:02, 28.86it/s] 81it [00:02, 29.08it/s] 84it [00:02, 28.67it/s] 88it [00:03, 28.86it/s] 91it [00:03, 28.94it/s] 94it [00:03, 29.18it/s] 97it [00:03, 28.74it/s] 100it [00:03, 29.03it/s]2025-05-26 05:30:59,896 - INFO - [Epoch 096 | Batch 0100] IWAE-loss 3780.0317 | mean log_px -0.0112 | KL -2998.08 + 103it [00:03, 29.16it/s] 107it [00:03, 29.61it/s] 110it [00:03, 28.83it/s] 113it [00:03, 29.02it/s] 116it [00:04, 28.85it/s] 120it [00:04, 29.17it/s] 124it [00:04, 29.59it/s] 127it [00:04, 28.67it/s] 131it [00:04, 28.84it/s] 135it [00:04, 29.43it/s] 138it [00:04, 28.86it/s] 142it [00:04, 28.80it/s] 145it [00:05, 28.66it/s] 149it [00:05, 28.57it/s]2025-05-26 05:31:01,627 - INFO - [Epoch 096 | Batch 0150] IWAE-loss 3605.9509 | mean log_px -0.0087 | KL -2993.60 + 153it [00:05, 28.86it/s] 156it [00:05, 28.25it/s] 159it [00:05, 28.59it/s] 162it [00:05, 27.68it/s] 165it [00:05, 28.03it/s] 168it [00:05, 28.04it/s] 171it [00:05, 27.37it/s] 175it [00:06, 28.02it/s] 178it [00:06, 28.02it/s] 181it [00:06, 27.37it/s] 185it [00:06, 27.68it/s] 189it [00:06, 28.40it/s] 192it [00:06, 28.36it/s] 195it [00:06, 26.67it/s] 196it [00:06, 28.24it/s] +2025-05-26 05:31:03,313 - INFO - Epoch: 96, Objective: tensor([3576.1594], device='cuda:0', grad_fn=), Loss: 0.007815864868462086, KL/n: 61.08281326293945 + 0it [00:00, ?it/s]2025-05-26 05:31:03,667 - INFO - [Epoch 097 | Batch 0000] IWAE-loss 3672.9385 | mean log_px -0.0097 | KL -2993.12 + 2it [00:00, 16.32it/s] 6it [00:00, 24.66it/s] 9it [00:00, 26.66it/s] 12it [00:00, 18.21it/s] 16it [00:00, 22.07it/s] 20it [00:00, 24.53it/s] 24it [00:00, 26.25it/s] 27it [00:01, 27.03it/s] 31it [00:01, 28.44it/s] 34it [00:01, 28.26it/s] 38it [00:01, 28.95it/s] 41it [00:01, 28.94it/s] 44it [00:01, 28.52it/s] 47it [00:01, 28.73it/s]2025-05-26 05:31:05,509 - INFO - [Epoch 097 | Batch 0050] IWAE-loss 4370.7178 | mean log_px -0.0198 | KL -2987.52 + 51it [00:01, 29.00it/s] 55it [00:02, 29.09it/s] 58it [00:02, 29.21it/s] 61it [00:02, 28.76it/s] 65it [00:02, 28.63it/s] 69it [00:02, 29.24it/s] 72it [00:02, 28.60it/s] 76it [00:02, 29.04it/s] 80it [00:02, 29.23it/s] 83it [00:03, 28.81it/s] 87it [00:03, 29.54it/s] 90it [00:03, 28.84it/s] 94it [00:03, 29.52it/s] 97it [00:03, 28.98it/s]2025-05-26 05:31:07,233 - INFO - [Epoch 097 | Batch 0100] IWAE-loss 3778.5891 | mean log_px -0.0113 | KL -2986.04 + 101it [00:03, 28.79it/s] 105it [00:03, 28.90it/s] 109it [00:03, 29.14it/s] 112it [00:04, 28.92it/s] 115it [00:04, 29.12it/s] 118it [00:04, 28.62it/s] 122it [00:04, 28.45it/s] 125it [00:04, 28.66it/s] 128it [00:04, 27.77it/s] 131it [00:04, 28.05it/s] 134it [00:04, 28.36it/s] 137it [00:04, 27.54it/s] 140it [00:05, 27.54it/s] 144it [00:05, 27.50it/s] 147it [00:05, 27.51it/s] 150it [00:05, 28.04it/s]2025-05-26 05:31:09,011 - INFO - [Epoch 097 | Batch 0150] IWAE-loss 3849.5334 | mean log_px -0.0124 | KL -2983.99 + 153it [00:05, 28.11it/s] 156it [00:05, 27.89it/s] 159it [00:05, 27.61it/s] 162it [00:05, 27.08it/s] 165it [00:05, 27.58it/s] 168it [00:06, 25.85it/s] 171it [00:06, 24.62it/s] 174it [00:06, 24.08it/s] 177it [00:06, 24.88it/s] 180it [00:06, 26.09it/s] 183it [00:06, 26.48it/s] 187it [00:06, 27.69it/s] 190it [00:06, 27.37it/s] 194it [00:07, 28.76it/s] 196it [00:07, 27.36it/s] +2025-05-26 05:31:10,770 - INFO - Epoch: 97, Objective: tensor([3655.8162], device='cuda:0', grad_fn=), Loss: 0.007865343242883682, KL/n: 60.88451385498047 + 0it [00:00, ?it/s]2025-05-26 05:31:11,159 - INFO - [Epoch 098 | Batch 0000] IWAE-loss 3445.0972 | mean log_px -0.0066 | KL -2981.72 + 2it [00:00, 14.71it/s] 6it [00:00, 23.82it/s] 9it [00:00, 25.22it/s] 13it [00:00, 28.09it/s] 16it [00:00, 27.84it/s] 20it [00:00, 28.38it/s] 24it [00:00, 29.38it/s] 27it [00:00, 28.70it/s] 31it [00:01, 29.28it/s] 34it [00:01, 29.39it/s] 37it [00:01, 28.91it/s] 40it [00:01, 29.05it/s] 44it [00:01, 30.20it/s] 48it [00:01, 29.59it/s]2025-05-26 05:31:12,854 - INFO - [Epoch 098 | Batch 0050] IWAE-loss 3896.7939 | mean log_px -0.0132 | KL -2973.53 + 51it [00:01, 29.60it/s] 55it [00:01, 29.21it/s] 59it [00:02, 29.41it/s] 63it [00:02, 30.24it/s] 67it [00:02, 29.79it/s] 71it [00:02, 29.91it/s] 74it [00:02, 29.79it/s] 77it [00:02, 29.48it/s] 81it [00:02, 30.18it/s] 85it [00:02, 30.07it/s] 89it [00:03, 29.56it/s] 93it [00:03, 29.82it/s] 96it [00:03, 29.75it/s] 99it [00:03, 29.69it/s]2025-05-26 05:31:14,531 - INFO - [Epoch 098 | Batch 0100] IWAE-loss 3905.4084 | mean log_px -0.0133 | KL -2975.83 + 102it [00:03, 29.33it/s] 106it [00:03, 30.35it/s] 110it [00:03, 30.07it/s] 114it [00:03, 30.18it/s] 118it [00:04, 29.58it/s] 122it [00:04, 29.73it/s] 125it [00:04, 29.74it/s] 128it [00:04, 29.45it/s] 131it [00:04, 29.40it/s] 135it [00:04, 29.60it/s] 138it [00:04, 29.56it/s] 142it [00:04, 29.78it/s] 146it [00:04, 30.17it/s] 150it [00:05, 29.78it/s]2025-05-26 05:31:16,213 - INFO - [Epoch 098 | Batch 0150] IWAE-loss 4004.4780 | mean log_px -0.0147 | KL -2976.23 + 153it [00:05, 29.69it/s] 156it [00:05, 29.10it/s] 159it [00:05, 28.60it/s] 163it [00:05, 28.70it/s] 166it [00:05, 28.35it/s] 169it [00:05, 27.87it/s] 172it [00:05, 28.26it/s] 175it [00:06, 27.83it/s] 178it [00:06, 28.14it/s] 181it [00:06, 27.31it/s] 185it [00:06, 28.12it/s] 188it [00:06, 27.43it/s] 191it [00:06, 27.77it/s] 194it [00:06, 27.51it/s] 196it [00:06, 28.72it/s] +2025-05-26 05:31:17,899 - INFO - Epoch: 98, Objective: tensor([4241.2046], device='cuda:0', grad_fn=), Loss: 0.014962981455028057, KL/n: 60.67826843261719 + 0it [00:00, ?it/s]2025-05-26 05:31:18,113 - INFO - [Epoch 099 | Batch 0000] IWAE-loss 4390.7607 | mean log_px -0.0203 | KL -2969.95 + 2it [00:00, 15.78it/s] 5it [00:00, 22.29it/s] 9it [00:00, 25.96it/s] 13it [00:00, 27.70it/s] 16it [00:00, 27.61it/s] 20it [00:00, 28.45it/s] 24it [00:00, 29.36it/s] 28it [00:01, 29.43it/s] 31it [00:01, 28.88it/s] 35it [00:01, 29.67it/s] 39it [00:01, 29.32it/s] 42it [00:01, 29.30it/s] 46it [00:01, 29.91it/s] 49it [00:01, 29.37it/s]2025-05-26 05:31:19,795 - INFO - [Epoch 099 | Batch 0050] IWAE-loss 3797.9841 | mean log_px -0.0119 | KL -2966.91 + 53it [00:01, 29.84it/s] 57it [00:01, 30.06it/s] 60it [00:02, 29.24it/s] 64it [00:02, 29.79it/s] 67it [00:02, 29.55it/s] 71it [00:02, 29.72it/s] 75it [00:02, 29.76it/s] 78it [00:02, 29.51it/s] 81it [00:02, 29.30it/s] 85it [00:02, 29.70it/s] 88it [00:03, 29.21it/s] 92it [00:03, 29.93it/s] 95it [00:03, 29.91it/s] 98it [00:03, 29.09it/s]2025-05-26 05:31:21,486 - INFO - [Epoch 099 | Batch 0100] IWAE-loss 3583.3040 | mean log_px -0.0088 | KL -2966.69 + 102it [00:03, 29.49it/s] 106it [00:03, 29.82it/s] 109it [00:03, 29.23it/s] 113it [00:03, 29.75it/s] 116it [00:03, 29.48it/s] 120it [00:04, 29.72it/s] 123it [00:04, 29.55it/s] 126it [00:04, 29.29it/s] 129it [00:04, 29.01it/s] 132it [00:04, 28.67it/s] 135it [00:04, 28.66it/s] 138it [00:04, 28.74it/s] 141it [00:04, 29.10it/s] 144it [00:04, 28.98it/s] 147it [00:05, 28.48it/s] 150it [00:05, 28.26it/s]2025-05-26 05:31:23,216 - INFO - [Epoch 099 | Batch 0150] IWAE-loss 3738.5691 | mean log_px -0.0111 | KL -2963.81 + 154it [00:05, 28.83it/s] 157it [00:05, 28.29it/s] 160it [00:05, 28.40it/s] 163it [00:05, 28.76it/s] 166it [00:05, 28.50it/s] 170it [00:05, 28.85it/s] 174it [00:05, 29.62it/s] 177it [00:06, 29.05it/s] 181it [00:06, 29.22it/s] 185it [00:06, 29.45it/s] 189it [00:06, 29.74it/s] 193it [00:06, 29.18it/s] 196it [00:06, 29.05it/s] 196it [00:06, 28.79it/s] +2025-05-26 05:31:24,833 - INFO - Epoch: 99, Objective: tensor([3932.8035], device='cuda:0', grad_fn=), Loss: 0.01374893356114626, KL/n: 60.47543716430664 +2025-05-26 05:31:24,836 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 2it [00:00, 15.52it/s] 5it [00:00, 22.70it/s] 9it [00:00, 26.33it/s] 12it [00:00, 27.58it/s] 15it [00:00, 28.35it/s] 18it [00:00, 28.88it/s] 21it [00:00, 29.19it/s] 24it [00:00, 29.43it/s] 27it [00:00, 29.56it/s] 30it [00:01, 29.66it/s] 33it [00:01, 29.69it/s] 36it [00:01, 29.73it/s] 39it [00:01, 29.77it/s] 42it [00:01, 29.75it/s] 45it [00:01, 29.76it/s] 48it [00:01, 29.47it/s] 51it [00:01, 29.24it/s] 55it [00:01, 29.49it/s] 58it [00:02, 29.57it/s] 61it [00:02, 29.66it/s] 64it [00:02, 29.62it/s] 67it [00:02, 29.71it/s] 70it [00:02, 29.72it/s] 73it [00:02, 29.79it/s] 76it [00:02, 29.75it/s] 79it [00:02, 29.77it/s] 82it [00:02, 29.82it/s] 85it [00:02, 29.79it/s] 89it [00:03, 29.89it/s] 92it [00:03, 29.82it/s] 96it [00:03, 29.90it/s] 100it [00:03, 29.91it/s] 103it [00:03, 29.90it/s] 106it [00:03, 29.74it/s] 109it [00:03, 29.69it/s] 112it [00:03, 29.62it/s] 115it [00:03, 29.59it/s] 118it [00:04, 29.67it/s] 121it [00:04, 29.67it/s] 124it [00:04, 29.73it/s] 127it [00:04, 29.73it/s] 131it [00:04, 29.81it/s] 134it [00:04, 29.75it/s] 137it [00:04, 29.73it/s] 140it [00:04, 29.80it/s] 143it [00:04, 29.75it/s] 146it [00:04, 29.79it/s] 149it [00:05, 29.73it/s] 152it [00:05, 29.65it/s] 155it [00:05, 29.65it/s] 158it [00:05, 29.67it/s] 161it [00:05, 29.68it/s] 164it [00:05, 29.52it/s] 168it [00:05, 29.81it/s] 171it [00:05, 29.82it/s] 174it [00:05, 29.79it/s] 177it [00:06, 29.70it/s] 180it [00:06, 29.76it/s] 183it [00:06, 29.76it/s] 186it [00:06, 29.73it/s] 189it [00:06, 29.68it/s] 192it [00:06, 29.71it/s] 195it [00:06, 29.67it/s] 198it [00:06, 29.59it/s] 201it [00:06, 29.60it/s] 204it [00:06, 29.56it/s] 207it [00:07, 29.63it/s] 210it [00:07, 29.69it/s] 213it [00:07, 29.74it/s] 216it [00:07, 29.46it/s] 219it [00:07, 29.53it/s] 222it [00:07, 29.57it/s] 225it [00:07, 29.50it/s] 228it [00:07, 29.56it/s] 231it [00:07, 29.60it/s] 234it [00:07, 29.65it/s] 237it [00:08, 29.60it/s] 240it [00:08, 29.59it/s] 243it [00:08, 29.62it/s] 246it [00:08, 29.69it/s] 249it [00:08, 29.73it/s] 252it [00:08, 29.74it/s] 255it [00:08, 29.75it/s] 258it [00:08, 29.56it/s] 261it [00:08, 29.62it/s] 264it [00:08, 29.66it/s] 267it [00:09, 29.70it/s] 270it [00:09, 29.73it/s] 273it [00:09, 29.72it/s] 276it [00:09, 29.66it/s] 279it [00:09, 26.89it/s] 280it [00:09, 29.28it/s] +2025-05-26 05:31:34,736 - INFO - Epoch: 0, Objective: 0.028284952044487, Loss: 0.025774501264095306, KL/n: 0.002510451478883624 + 0%| | 0/84 [00:00), Loss: 0.43466299772262573, KL/n: 68.75403594970703 + 0it [00:00, ?it/s]2025-05-26 05:34:05,702 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 28074.5488 | mean log_px -0.3577 | KL -3369.96 + 1it [00:00, 5.46it/s] 2it [00:00, 7.22it/s] 3it [00:00, 8.11it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.70it/s] 6it [00:00, 8.70it/s] 7it [00:00, 8.98it/s] 8it [00:00, 9.09it/s] 9it [00:01, 9.17it/s] 10it [00:01, 9.23it/s] 11it [00:01, 9.18it/s] 12it [00:01, 9.22it/s] 13it [00:01, 9.26it/s] 14it [00:01, 9.28it/s] 15it [00:01, 9.34it/s] 16it [00:01, 9.36it/s] 17it [00:01, 9.37it/s] 18it [00:02, 9.32it/s] 19it [00:02, 9.36it/s] 20it [00:02, 9.40it/s] 21it [00:02, 9.42it/s] 22it [00:02, 9.37it/s] 23it [00:02, 9.38it/s] 24it [00:02, 9.31it/s] 25it [00:02, 9.35it/s] 26it [00:02, 9.40it/s] 27it [00:02, 9.35it/s] 28it [00:03, 9.38it/s] 29it [00:03, 9.39it/s] 30it [00:03, 9.41it/s] 31it [00:03, 9.41it/s] 32it [00:03, 9.44it/s] 33it [00:03, 9.38it/s] 34it [00:03, 9.33it/s] 35it [00:03, 9.42it/s] 36it [00:03, 9.45it/s] 37it [00:04, 9.43it/s] 38it [00:04, 9.37it/s] 39it [00:04, 9.40it/s] 40it [00:04, 9.37it/s] 41it [00:04, 9.37it/s] 42it [00:04, 9.38it/s] 43it [00:04, 9.42it/s] 44it [00:04, 9.40it/s] 45it [00:04, 9.36it/s] 46it [00:04, 9.44it/s] 47it [00:05, 9.49it/s] 48it [00:05, 9.45it/s] 49it [00:05, 9.43it/s] 50it [00:05, 9.44it/s]2025-05-26 05:34:11,038 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 26761.6230 | mean log_px -0.3389 | KL -3393.95 + 51it [00:05, 9.47it/s] 52it [00:05, 9.41it/s] 53it [00:05, 9.44it/s] 54it [00:05, 9.42it/s] 55it [00:05, 9.46it/s] 56it [00:06, 9.42it/s] 57it [00:06, 9.43it/s] 58it [00:06, 9.42it/s] 59it [00:06, 9.43it/s] 60it [00:06, 9.47it/s] 61it [00:06, 9.44it/s] 62it [00:06, 9.40it/s] 63it [00:06, 9.32it/s] 64it [00:06, 9.34it/s] 65it [00:07, 9.34it/s] 66it [00:07, 9.35it/s] 67it [00:07, 9.39it/s] 68it [00:07, 9.41it/s] 69it [00:07, 9.41it/s] 70it [00:07, 9.41it/s] 71it [00:07, 9.36it/s] 72it [00:07, 9.39it/s] 73it [00:07, 9.41it/s] 74it [00:07, 9.35it/s] 75it [00:08, 9.35it/s] 76it [00:08, 9.37it/s] 77it [00:08, 9.37it/s] 78it [00:08, 9.35it/s] 79it [00:08, 9.36it/s] 80it [00:08, 9.37it/s] 81it [00:08, 9.38it/s] 82it [00:08, 9.35it/s] 83it [00:08, 9.41it/s] 84it [00:09, 9.41it/s] 85it [00:09, 9.45it/s] 86it [00:09, 9.41it/s] 87it [00:09, 9.41it/s] 88it [00:09, 9.37it/s] 89it [00:09, 9.38it/s] 90it [00:09, 9.36it/s] 91it [00:09, 9.39it/s] 92it [00:09, 9.40it/s] 93it [00:09, 9.46it/s] 94it [00:10, 9.50it/s] 95it [00:10, 9.47it/s] 96it [00:10, 9.41it/s] 97it [00:10, 9.40it/s] 98it [00:10, 9.37it/s] 99it [00:10, 9.36it/s] 100it [00:10, 9.38it/s]2025-05-26 05:34:16,361 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 28285.6133 | mean log_px -0.3769 | KL -3410.21 + 101it [00:10, 9.35it/s] 102it [00:10, 9.36it/s] 103it [00:11, 9.38it/s] 104it [00:11, 9.38it/s] 105it [00:11, 9.45it/s] 106it [00:11, 9.48it/s] 107it [00:11, 9.48it/s] 108it [00:11, 9.49it/s] 109it [00:11, 9.48it/s] 110it [00:11, 9.48it/s] 111it [00:11, 9.48it/s] 112it [00:12, 9.44it/s] 113it [00:12, 9.36it/s] 114it [00:12, 9.24it/s] 115it [00:12, 9.36it/s] 116it [00:12, 9.37it/s] 117it [00:12, 9.40it/s] 118it [00:12, 9.34it/s] 119it [00:12, 9.37it/s] 120it [00:12, 9.32it/s] 121it [00:12, 9.38it/s] 122it [00:13, 9.35it/s] 123it [00:13, 9.39it/s] 124it [00:13, 9.43it/s] 125it [00:13, 9.41it/s] 126it [00:13, 9.39it/s] 127it [00:13, 9.40it/s] 128it [00:13, 9.41it/s] 129it [00:13, 9.37it/s] 130it [00:13, 9.39it/s] 131it [00:14, 9.33it/s] 132it [00:14, 9.39it/s] 133it [00:14, 9.40it/s] 134it [00:14, 9.39it/s] 135it [00:14, 9.41it/s] 136it [00:14, 9.42it/s] 137it [00:14, 9.38it/s] 138it [00:14, 9.33it/s] 139it [00:14, 9.17it/s] 140it [00:15, 9.23it/s] 141it [00:15, 9.33it/s] 142it [00:15, 9.36it/s] 143it [00:15, 9.29it/s] 144it [00:15, 9.36it/s] 145it [00:15, 9.39it/s] 146it [00:15, 9.42it/s] 147it [00:15, 9.39it/s] 148it [00:15, 9.41it/s] 149it [00:15, 9.42it/s] 150it [00:16, 9.46it/s]2025-05-26 05:34:21,687 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 24188.4082 | mean log_px -0.3034 | KL -3424.15 + 151it [00:16, 9.47it/s] 152it [00:16, 9.43it/s] 153it [00:16, 9.13it/s] 154it [00:16, 9.22it/s] 155it [00:16, 9.30it/s] 156it [00:16, 9.34it/s] 157it [00:16, 9.38it/s] 158it [00:16, 9.37it/s] 159it [00:17, 9.40it/s] 160it [00:17, 9.40it/s] 161it [00:17, 9.42it/s] 162it [00:17, 9.41it/s] 163it [00:17, 9.42it/s] 164it [00:17, 9.41it/s] 165it [00:17, 9.41it/s] 166it [00:17, 9.42it/s] 167it [00:17, 9.46it/s] 168it [00:17, 9.45it/s] 169it [00:18, 9.40it/s] 170it [00:18, 9.38it/s] 171it [00:18, 9.38it/s] 172it [00:18, 9.43it/s] 173it [00:18, 9.41it/s] 174it [00:18, 9.37it/s] 175it [00:18, 9.34it/s] 176it [00:18, 9.33it/s] 177it [00:18, 9.36it/s] 178it [00:19, 9.37it/s] 179it [00:19, 9.40it/s] 180it [00:19, 9.40it/s] 181it [00:19, 9.37it/s] 182it [00:19, 9.39it/s] 183it [00:19, 9.42it/s] 184it [00:19, 9.43it/s] 185it [00:19, 9.41it/s] 186it [00:19, 9.41it/s] 187it [00:20, 9.40it/s] 188it [00:20, 9.40it/s] 189it [00:20, 9.40it/s] 190it [00:20, 9.37it/s] 191it [00:20, 9.36it/s] 192it [00:20, 9.38it/s] 193it [00:20, 9.41it/s] 194it [00:20, 9.40it/s] 195it [00:20, 8.95it/s] 196it [00:20, 9.10it/s] 196it [00:21, 9.31it/s] +2025-05-26 05:34:26,606 - INFO - Epoch: 1, Objective: tensor([25134.6309], device='cuda:0', grad_fn=), Loss: 0.3120049238204956, KL/n: 70.07382202148438 + 0it [00:00, ?it/s]2025-05-26 05:34:26,876 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 26034.8926 | mean log_px -0.3319 | KL -3429.36 + 1it [00:00, 4.75it/s] 2it [00:00, 6.71it/s] 3it [00:00, 7.83it/s] 4it [00:00, 8.38it/s] 5it [00:00, 8.69it/s] 6it [00:00, 8.91it/s] 7it [00:00, 9.09it/s] 8it [00:00, 9.21it/s] 9it [00:01, 9.31it/s] 10it [00:01, 9.38it/s] 11it [00:01, 8.84it/s] 12it [00:01, 9.03it/s] 13it [00:01, 9.15it/s] 14it [00:01, 9.24it/s] 15it [00:01, 9.30it/s] 16it [00:01, 9.33it/s] 17it [00:01, 8.95it/s] 18it [00:02, 9.09it/s] 19it [00:02, 9.21it/s] 20it [00:02, 9.27it/s] 21it [00:02, 9.31it/s] 22it [00:02, 9.24it/s] 23it [00:02, 9.25it/s] 24it [00:02, 9.28it/s] 25it [00:02, 9.31it/s] 26it [00:02, 9.37it/s] 27it [00:03, 9.44it/s] 28it [00:03, 9.46it/s] 29it [00:03, 8.93it/s] 30it [00:03, 8.91it/s] 31it [00:03, 9.05it/s] 32it [00:03, 9.18it/s] 33it [00:03, 9.29it/s] 34it [00:03, 9.31it/s] 35it [00:03, 9.38it/s] 36it [00:04, 8.67it/s] 37it [00:04, 8.64it/s] 38it [00:04, 8.85it/s] 39it [00:04, 8.97it/s] 40it [00:04, 9.09it/s] 41it [00:04, 9.19it/s] 42it [00:04, 9.25it/s] 43it [00:04, 9.34it/s] 44it [00:04, 9.31it/s] 45it [00:04, 9.28it/s] 46it [00:05, 9.28it/s] 47it [00:05, 9.00it/s] 48it [00:05, 9.15it/s] 49it [00:05, 9.23it/s] 50it [00:05, 9.29it/s]2025-05-26 05:34:32,327 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 24607.2324 | mean log_px -0.3063 | KL -3444.27 + 51it [00:05, 9.37it/s] 52it [00:05, 9.38it/s] 53it [00:05, 9.39it/s] 54it [00:05, 9.40it/s] 55it [00:06, 9.42it/s] 56it [00:06, 9.42it/s] 57it [00:06, 9.45it/s] 58it [00:06, 9.48it/s] 59it [00:06, 9.45it/s] 60it [00:06, 9.43it/s] 61it [00:06, 9.47it/s] 62it [00:06, 9.06it/s] 63it [00:06, 8.68it/s] 64it [00:07, 8.87it/s] 65it [00:07, 8.54it/s] 66it [00:07, 8.91it/s] 67it [00:07, 9.20it/s] 68it [00:07, 9.37it/s] 69it [00:07, 8.96it/s] 70it [00:07, 9.23it/s] 71it [00:07, 9.43it/s] 72it [00:07, 9.59it/s] 73it [00:08, 9.71it/s] 74it [00:08, 9.77it/s] 76it [00:08, 9.89it/s] 77it [00:08, 9.48it/s] 78it [00:08, 9.59it/s] 80it [00:08, 9.76it/s] 81it [00:08, 9.81it/s] 82it [00:08, 9.83it/s] 83it [00:09, 9.86it/s] 84it [00:09, 9.88it/s] 85it [00:09, 9.91it/s] 86it [00:09, 9.92it/s] 87it [00:09, 9.56it/s] 88it [00:09, 9.51it/s] 89it [00:09, 9.59it/s] 90it [00:09, 9.58it/s] 91it [00:09, 9.63it/s] 92it [00:09, 9.55it/s] 93it [00:10, 9.01it/s] 94it [00:10, 9.21it/s] 95it [00:10, 9.35it/s] 96it [00:10, 9.44it/s] 97it [00:10, 9.53it/s] 98it [00:10, 9.55it/s] 99it [00:10, 9.61it/s] 100it [00:10, 9.67it/s]2025-05-26 05:34:37,608 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 20464.7461 | mean log_px -0.2492 | KL -3452.10 + 101it [00:10, 9.00it/s] 102it [00:11, 9.22it/s] 103it [00:11, 9.29it/s] 104it [00:11, 9.34it/s] 105it [00:11, 9.39it/s] 106it [00:11, 9.39it/s] 107it [00:11, 9.47it/s] 108it [00:11, 6.30it/s] 109it [00:11, 6.76it/s] 110it [00:12, 7.44it/s] 111it [00:12, 7.99it/s] 112it [00:12, 8.37it/s] 113it [00:12, 8.75it/s] 114it [00:12, 8.90it/s] 115it [00:12, 9.11it/s] 116it [00:12, 9.32it/s] 117it [00:12, 9.42it/s] 118it [00:12, 9.50it/s] 119it [00:13, 9.58it/s] 120it [00:13, 9.64it/s] 121it [00:13, 9.61it/s] 122it [00:13, 9.66it/s] 123it [00:13, 9.61it/s] 124it [00:13, 9.66it/s] 125it [00:13, 8.98it/s] 126it [00:13, 9.15it/s] 127it [00:13, 9.27it/s] 128it [00:13, 9.32it/s] 129it [00:14, 8.94it/s] 130it [00:14, 9.16it/s] 131it [00:14, 9.29it/s] 132it [00:14, 9.48it/s] 133it [00:14, 9.62it/s] 134it [00:14, 9.72it/s] 136it [00:14, 9.85it/s] 137it [00:14, 9.87it/s] 138it [00:15, 9.89it/s] 139it [00:15, 9.92it/s] 140it [00:15, 9.93it/s] 141it [00:15, 9.95it/s] 142it [00:15, 9.94it/s] 143it [00:15, 9.95it/s] 144it [00:15, 9.92it/s] 145it [00:15, 9.93it/s] 146it [00:15, 9.94it/s] 148it [00:16, 9.96it/s] 149it [00:16, 9.97it/s] 150it [00:16, 9.97it/s]2025-05-26 05:34:43,001 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 18063.8633 | mean log_px -0.2179 | KL -3453.99 + 151it [00:16, 9.36it/s] 152it [00:16, 9.01it/s] 153it [00:16, 9.27it/s] 155it [00:16, 9.57it/s] 156it [00:16, 9.66it/s] 157it [00:16, 9.72it/s] 158it [00:17, 9.20it/s] 159it [00:17, 9.40it/s] 160it [00:17, 9.53it/s] 161it [00:17, 9.62it/s] 162it [00:17, 9.65it/s] 163it [00:17, 9.13it/s] 164it [00:17, 9.35it/s] 165it [00:17, 9.45it/s] 166it [00:17, 9.50it/s] 167it [00:18, 9.00it/s] 168it [00:18, 9.20it/s] 169it [00:18, 9.41it/s] 170it [00:18, 9.50it/s] 171it [00:18, 9.64it/s] 172it [00:18, 9.73it/s] 173it [00:18, 9.80it/s] 174it [00:18, 9.23it/s] 175it [00:18, 9.45it/s] 176it [00:18, 9.55it/s] 177it [00:19, 9.67it/s] 178it [00:19, 9.75it/s] 179it [00:19, 9.76it/s] 180it [00:19, 9.75it/s] 181it [00:19, 9.81it/s] 182it [00:19, 9.87it/s] 183it [00:19, 9.88it/s] 184it [00:19, 9.91it/s] 185it [00:19, 9.92it/s] 186it [00:19, 9.92it/s] 187it [00:20, 9.94it/s] 188it [00:20, 9.92it/s] 189it [00:20, 9.95it/s] 190it [00:20, 9.93it/s] 192it [00:20, 9.48it/s] 193it [00:20, 9.59it/s] 194it [00:20, 9.14it/s] 195it [00:20, 8.97it/s] 196it [00:21, 9.28it/s] +2025-05-26 05:34:47,847 - INFO - Epoch: 2, Objective: tensor([23773.6406], device='cuda:0', grad_fn=), Loss: 0.30370157957077026, KL/n: 70.60922241210938 + 0it [00:00, ?it/s]2025-05-26 05:34:48,117 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 22127.6270 | mean log_px -0.2715 | KL -3458.96 + 1it [00:00, 4.68it/s] 3it [00:00, 7.77it/s] 5it [00:00, 8.77it/s] 7it [00:00, 9.29it/s] 9it [00:01, 9.58it/s] 10it [00:01, 9.24it/s] 12it [00:01, 9.54it/s] 14it [00:01, 9.36it/s] 16it [00:01, 9.59it/s] 18it [00:01, 9.74it/s] 20it [00:02, 9.82it/s] 22it [00:02, 9.88it/s] 24it [00:02, 9.92it/s] 26it [00:02, 9.97it/s] 28it [00:02, 9.99it/s] 30it [00:03, 9.97it/s] 31it [00:03, 9.93it/s] 32it [00:03, 9.90it/s] 33it [00:03, 9.88it/s] 34it [00:03, 9.85it/s] 35it [00:03, 9.82it/s] 37it [00:03, 9.90it/s] 38it [00:03, 9.29it/s] 39it [00:04, 9.38it/s] 40it [00:04, 9.48it/s] 41it [00:04, 9.58it/s] 42it [00:04, 9.64it/s] 43it [00:04, 9.13it/s] 44it [00:04, 9.07it/s] 45it [00:04, 9.11it/s] 46it [00:04, 9.08it/s] 47it [00:04, 9.20it/s] 48it [00:05, 9.21it/s] 49it [00:05, 9.29it/s] 50it [00:05, 8.91it/s]2025-05-26 05:34:53,330 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 18690.7363 | mean log_px -0.2205 | KL -3462.40 + 51it [00:05, 9.04it/s] 52it [00:05, 9.18it/s] 53it [00:05, 9.22it/s] 54it [00:05, 9.19it/s] 55it [00:05, 9.27it/s] 56it [00:05, 9.26it/s] 57it [00:06, 9.22it/s] 58it [00:06, 9.20it/s] 59it [00:06, 9.17it/s] 60it [00:06, 9.22it/s] 61it [00:06, 9.24it/s] 62it [00:06, 8.83it/s] 63it [00:06, 8.93it/s] 64it [00:06, 9.05it/s] 65it [00:06, 9.15it/s] 66it [00:07, 9.24it/s] 67it [00:07, 9.37it/s] 68it [00:07, 9.48it/s] 69it [00:07, 9.59it/s] 70it [00:07, 9.66it/s] 71it [00:07, 9.73it/s] 72it [00:07, 9.75it/s] 73it [00:07, 9.80it/s] 74it [00:07, 9.81it/s] 75it [00:07, 9.83it/s] 76it [00:08, 9.84it/s] 77it [00:08, 9.85it/s] 78it [00:08, 9.85it/s] 79it [00:08, 9.23it/s] 80it [00:08, 9.40it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.62it/s] 83it [00:08, 9.68it/s] 84it [00:08, 9.73it/s] 85it [00:08, 9.74it/s] 86it [00:09, 9.77it/s] 87it [00:09, 9.79it/s] 88it [00:09, 9.80it/s] 89it [00:09, 9.84it/s] 90it [00:09, 9.83it/s] 91it [00:09, 9.85it/s] 92it [00:09, 9.83it/s] 93it [00:09, 9.85it/s] 94it [00:09, 9.84it/s] 95it [00:10, 9.85it/s] 96it [00:10, 9.18it/s] 97it [00:10, 9.33it/s] 98it [00:10, 9.45it/s] 99it [00:10, 9.55it/s] 100it [00:10, 9.02it/s]2025-05-26 05:34:58,597 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 22098.5781 | mean log_px -0.2703 | KL -3471.58 + 101it [00:10, 9.20it/s] 102it [00:10, 9.41it/s] 103it [00:10, 9.51it/s] 104it [00:10, 9.59it/s] 105it [00:11, 9.65it/s] 106it [00:11, 9.10it/s] 107it [00:11, 9.32it/s] 108it [00:11, 9.47it/s] 109it [00:11, 9.58it/s] 110it [00:11, 9.66it/s] 111it [00:11, 9.73it/s] 112it [00:11, 9.78it/s] 113it [00:11, 9.81it/s] 114it [00:12, 9.82it/s] 115it [00:12, 9.83it/s] 116it [00:12, 9.85it/s] 117it [00:12, 9.22it/s] 118it [00:12, 9.38it/s] 119it [00:12, 9.52it/s] 120it [00:12, 9.61it/s] 121it [00:12, 9.70it/s] 122it [00:12, 9.73it/s] 123it [00:12, 9.78it/s] 124it [00:13, 9.78it/s] 125it [00:13, 9.81it/s] 126it [00:13, 9.80it/s] 127it [00:13, 9.81it/s] 128it [00:13, 9.81it/s] 129it [00:13, 9.82it/s] 130it [00:13, 9.70it/s] 131it [00:13, 9.70it/s] 132it [00:13, 9.54it/s] 133it [00:13, 9.57it/s] 134it [00:14, 9.60it/s] 135it [00:14, 9.54it/s] 136it [00:14, 9.28it/s] 137it [00:14, 9.24it/s] 138it [00:14, 9.30it/s] 139it [00:14, 8.72it/s] 140it [00:14, 8.82it/s] 141it [00:14, 8.79it/s] 142it [00:14, 8.85it/s] 143it [00:15, 8.90it/s] 144it [00:15, 8.94it/s] 145it [00:15, 8.49it/s] 146it [00:15, 8.67it/s] 147it [00:15, 8.80it/s] 148it [00:15, 9.07it/s] 149it [00:15, 9.24it/s] 150it [00:15, 9.28it/s]2025-05-26 05:35:03,904 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 23228.7480 | mean log_px -0.2856 | KL -3470.63 + 151it [00:15, 8.85it/s] 152it [00:16, 9.08it/s] 153it [00:16, 9.30it/s] 154it [00:16, 9.45it/s] 155it [00:16, 9.56it/s] 156it [00:16, 9.62it/s] 157it [00:16, 9.65it/s] 158it [00:16, 9.69it/s] 159it [00:16, 9.09it/s] 160it [00:16, 9.26it/s] 161it [00:17, 9.39it/s] 162it [00:17, 9.49it/s] 163it [00:17, 8.99it/s] 164it [00:17, 9.19it/s] 165it [00:17, 9.34it/s] 166it [00:17, 9.44it/s] 167it [00:17, 8.96it/s] 168it [00:17, 9.17it/s] 169it [00:17, 9.35it/s] 170it [00:18, 9.43it/s] 171it [00:18, 9.53it/s] 172it [00:18, 9.59it/s] 173it [00:18, 9.62it/s] 174it [00:18, 9.62it/s] 175it [00:18, 9.70it/s] 176it [00:18, 9.73it/s] 177it [00:18, 9.53it/s] 178it [00:18, 8.88it/s] 179it [00:18, 8.98it/s] 180it [00:19, 9.20it/s] 181it [00:19, 9.39it/s] 182it [00:19, 9.51it/s] 183it [00:19, 9.59it/s] 184it [00:19, 9.06it/s] 185it [00:19, 9.29it/s] 186it [00:19, 9.39it/s] 187it [00:19, 9.51it/s] 188it [00:19, 9.62it/s] 189it [00:20, 9.58it/s] 190it [00:20, 9.61it/s] 191it [00:20, 9.07it/s] 192it [00:20, 9.27it/s] 193it [00:20, 9.37it/s] 194it [00:20, 9.46it/s] 195it [00:20, 9.07it/s] 196it [00:20, 9.32it/s] 196it [00:20, 9.41it/s] +2025-05-26 05:35:08,799 - INFO - Epoch: 3, Objective: tensor([23300.8750], device='cuda:0', grad_fn=), Loss: 0.2900332510471344, KL/n: 70.9906005859375 + 0it [00:00, ?it/s]2025-05-26 05:35:09,257 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 12282.2793 | mean log_px -0.1411 | KL -3474.90 + 1it [00:00, 5.41it/s] 2it [00:00, 7.21it/s] 3it [00:00, 7.57it/s] 4it [00:00, 8.24it/s] 5it [00:00, 8.74it/s] 6it [00:00, 9.02it/s] 7it [00:00, 9.26it/s] 8it [00:00, 9.40it/s] 9it [00:01, 9.49it/s] 10it [00:01, 9.54it/s] 11it [00:01, 9.62it/s] 12it [00:01, 9.63it/s] 13it [00:01, 9.68it/s] 14it [00:01, 9.67it/s] 15it [00:01, 9.67it/s] 16it [00:01, 8.98it/s] 17it [00:01, 8.99it/s] 18it [00:01, 9.16it/s] 19it [00:02, 9.34it/s] 20it [00:02, 9.45it/s] 21it [00:02, 9.55it/s] 22it [00:02, 9.03it/s] 23it [00:02, 9.27it/s] 24it [00:02, 9.41it/s] 25it [00:02, 9.49it/s] 26it [00:02, 9.56it/s] 27it [00:02, 9.60it/s] 28it [00:03, 9.63it/s] 29it [00:03, 9.67it/s] 30it [00:03, 9.69it/s] 31it [00:03, 9.74it/s] 32it [00:03, 9.76it/s] 33it [00:03, 9.79it/s] 34it [00:03, 9.79it/s] 35it [00:03, 9.81it/s] 36it [00:03, 9.80it/s] 37it [00:03, 9.78it/s] 38it [00:04, 9.13it/s] 39it [00:04, 9.31it/s] 40it [00:04, 9.43it/s] 41it [00:04, 9.53it/s] 42it [00:04, 9.57it/s] 43it [00:04, 9.63it/s] 44it [00:04, 9.61it/s] 45it [00:04, 9.67it/s] 46it [00:04, 9.67it/s] 47it [00:05, 9.67it/s] 48it [00:05, 9.71it/s] 49it [00:05, 9.75it/s] 50it [00:05, 9.77it/s]2025-05-26 05:35:14,498 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 23196.6523 | mean log_px -0.2816 | KL -3483.42 + 51it [00:05, 9.77it/s] 52it [00:05, 9.76it/s] 53it [00:05, 9.24it/s] 54it [00:05, 9.21it/s] 55it [00:05, 9.05it/s] 56it [00:06, 8.50it/s] 57it [00:06, 8.42it/s] 58it [00:06, 8.61it/s] 59it [00:06, 8.79it/s] 60it [00:06, 8.43it/s] 61it [00:06, 8.70it/s] 62it [00:06, 9.00it/s] 63it [00:06, 9.22it/s] 64it [00:06, 9.39it/s] 65it [00:07, 8.95it/s] 66it [00:07, 9.22it/s] 67it [00:07, 9.44it/s] 68it [00:07, 9.56it/s] 70it [00:07, 9.76it/s] 72it [00:07, 9.43it/s] 74it [00:07, 9.64it/s] 75it [00:08, 9.70it/s] 76it [00:08, 9.75it/s] 77it [00:08, 9.81it/s] 78it [00:08, 9.82it/s] 79it [00:08, 9.86it/s] 80it [00:08, 9.87it/s] 82it [00:08, 9.94it/s] 83it [00:08, 9.91it/s] 84it [00:08, 9.73it/s] 85it [00:09, 9.38it/s] 86it [00:09, 9.51it/s] 87it [00:09, 9.63it/s] 88it [00:09, 9.47it/s] 89it [00:09, 9.46it/s] 90it [00:09, 9.58it/s] 91it [00:09, 9.69it/s] 92it [00:09, 9.73it/s] 93it [00:09, 9.29it/s] 94it [00:10, 9.46it/s] 95it [00:10, 9.60it/s] 96it [00:10, 9.68it/s] 97it [00:10, 9.71it/s] 98it [00:10, 9.76it/s] 99it [00:10, 9.83it/s] 100it [00:10, 9.87it/s]2025-05-26 05:35:19,794 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 22043.1543 | mean log_px -0.2736 | KL -3483.78 + 101it [00:10, 9.23it/s] 102it [00:10, 9.37it/s] 103it [00:10, 9.55it/s] 104it [00:11, 9.60it/s] 106it [00:11, 9.19it/s] 107it [00:11, 9.35it/s] 108it [00:11, 9.48it/s] 109it [00:11, 9.58it/s] 110it [00:11, 9.08it/s] 111it [00:11, 9.29it/s] 112it [00:11, 9.43it/s] 113it [00:12, 9.50it/s] 114it [00:12, 9.62it/s] 115it [00:12, 9.69it/s] 116it [00:12, 9.75it/s] 118it [00:12, 9.88it/s] 119it [00:12, 9.89it/s] 120it [00:12, 9.91it/s] 122it [00:12, 9.95it/s] 123it [00:13, 9.96it/s] 124it [00:13, 9.94it/s] 125it [00:13, 9.94it/s] 126it [00:13, 9.92it/s] 127it [00:13, 9.92it/s] 128it [00:13, 9.92it/s] 129it [00:13, 9.92it/s] 130it [00:13, 9.92it/s] 131it [00:13, 9.91it/s] 132it [00:13, 9.87it/s] 133it [00:14, 9.84it/s] 134it [00:14, 9.81it/s] 135it [00:14, 9.82it/s] 136it [00:14, 9.81it/s] 137it [00:14, 9.83it/s] 138it [00:14, 9.84it/s] 139it [00:14, 9.87it/s] 140it [00:14, 9.88it/s] 141it [00:14, 9.86it/s] 142it [00:14, 9.84it/s] 143it [00:15, 9.23it/s] 144it [00:15, 9.43it/s] 145it [00:15, 9.59it/s] 146it [00:15, 9.69it/s] 147it [00:15, 9.77it/s] 148it [00:15, 9.15it/s] 149it [00:15, 9.29it/s] 150it [00:15, 9.44it/s]2025-05-26 05:35:24,976 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 22188.4727 | mean log_px -0.2672 | KL -3485.55 + 151it [00:15, 9.52it/s] 152it [00:16, 9.62it/s] 153it [00:16, 9.69it/s] 154it [00:16, 9.73it/s] 155it [00:16, 9.77it/s] 156it [00:16, 9.81it/s] 157it [00:16, 9.82it/s] 158it [00:16, 9.84it/s] 159it [00:16, 9.85it/s] 160it [00:16, 9.88it/s] 161it [00:16, 9.89it/s] 162it [00:17, 9.89it/s] 163it [00:17, 9.90it/s] 164it [00:17, 9.88it/s] 165it [00:17, 9.88it/s] 166it [00:17, 9.88it/s] 167it [00:17, 9.82it/s] 168it [00:17, 9.71it/s] 169it [00:17, 8.97it/s] 170it [00:17, 9.10it/s] 171it [00:17, 9.30it/s] 172it [00:18, 9.44it/s] 173it [00:18, 9.55it/s] 174it [00:18, 9.64it/s] 175it [00:18, 9.68it/s] 176it [00:18, 9.74it/s] 177it [00:18, 9.81it/s] 178it [00:18, 9.81it/s] 179it [00:18, 9.86it/s] 180it [00:18, 9.78it/s] 181it [00:18, 9.82it/s] 182it [00:19, 9.81it/s] 183it [00:19, 9.83it/s] 184it [00:19, 9.85it/s] 185it [00:19, 9.87it/s] 186it [00:19, 9.30it/s] 187it [00:19, 9.32it/s] 188it [00:19, 9.46it/s] 189it [00:19, 9.52it/s] 190it [00:19, 9.16it/s] 191it [00:20, 9.35it/s] 192it [00:20, 9.48it/s] 193it [00:20, 9.59it/s] 194it [00:20, 9.67it/s] 195it [00:20, 9.31it/s] 196it [00:20, 9.07it/s] 196it [00:20, 9.49it/s] +2025-05-26 05:35:29,765 - INFO - Epoch: 4, Objective: tensor([19702.6348], device='cuda:0', grad_fn=), Loss: 0.23782320320606232, KL/n: 71.2601089477539 + 0it [00:00, ?it/s]2025-05-26 05:35:30,043 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 16530.5488 | mean log_px -0.1878 | KL -3492.38 + 1it [00:00, 5.40it/s] 2it [00:00, 6.78it/s] 3it [00:00, 7.93it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.96it/s] 6it [00:00, 9.24it/s] 7it [00:00, 9.42it/s] 8it [00:00, 9.56it/s] 9it [00:01, 9.66it/s] 10it [00:01, 9.70it/s] 11it [00:01, 9.74it/s] 12it [00:01, 9.77it/s] 13it [00:01, 9.84it/s] 14it [00:01, 9.87it/s] 15it [00:01, 9.89it/s] 16it [00:01, 9.91it/s] 17it [00:01, 9.89it/s] 18it [00:01, 9.88it/s] 19it [00:02, 9.90it/s] 20it [00:02, 9.90it/s] 21it [00:02, 9.90it/s] 22it [00:02, 9.85it/s] 23it [00:02, 9.65it/s] 24it [00:02, 9.04it/s] 25it [00:02, 8.71it/s] 26it [00:02, 8.88it/s] 27it [00:02, 9.14it/s] 28it [00:03, 9.34it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.03it/s] 31it [00:03, 9.27it/s] 32it [00:03, 9.46it/s] 33it [00:03, 9.60it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.21it/s] 36it [00:03, 8.65it/s] 38it [00:04, 9.21it/s] 39it [00:04, 9.35it/s] 40it [00:04, 9.46it/s] 41it [00:04, 9.56it/s] 42it [00:04, 9.09it/s] 43it [00:04, 9.28it/s] 44it [00:04, 9.43it/s] 45it [00:04, 9.52it/s] 46it [00:04, 9.63it/s] 48it [00:05, 9.79it/s] 49it [00:05, 9.73it/s] 50it [00:05, 9.65it/s]2025-05-26 05:35:35,301 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 17774.5938 | mean log_px -0.2058 | KL -3492.53 + 51it [00:05, 9.09it/s] 52it [00:05, 9.31it/s] 53it [00:05, 9.45it/s] 54it [00:05, 9.55it/s] 55it [00:05, 9.60it/s] 56it [00:05, 9.67it/s] 57it [00:06, 9.71it/s] 58it [00:06, 9.76it/s] 59it [00:06, 9.81it/s] 60it [00:06, 9.82it/s] 61it [00:06, 9.84it/s] 62it [00:06, 9.68it/s] 63it [00:06, 9.64it/s] 64it [00:06, 9.73it/s] 65it [00:06, 9.79it/s] 66it [00:06, 9.82it/s] 67it [00:07, 9.86it/s] 68it [00:07, 9.87it/s] 69it [00:07, 9.88it/s] 70it [00:07, 9.88it/s] 71it [00:07, 9.24it/s] 72it [00:07, 9.44it/s] 73it [00:07, 9.60it/s] 74it [00:07, 9.66it/s] 75it [00:07, 9.72it/s] 76it [00:08, 9.79it/s] 77it [00:08, 9.72it/s] 78it [00:08, 9.78it/s] 79it [00:08, 9.80it/s] 80it [00:08, 9.83it/s] 81it [00:08, 9.88it/s] 82it [00:08, 9.88it/s] 83it [00:08, 9.92it/s] 84it [00:08, 9.93it/s] 86it [00:09, 9.96it/s] 88it [00:09, 9.94it/s] 89it [00:09, 9.95it/s] 90it [00:09, 9.96it/s] 91it [00:09, 9.52it/s] 92it [00:09, 9.62it/s] 93it [00:09, 9.72it/s] 94it [00:09, 9.77it/s] 95it [00:09, 9.83it/s] 96it [00:10, 9.84it/s] 97it [00:10, 9.87it/s] 98it [00:10, 9.87it/s] 99it [00:10, 9.86it/s] 100it [00:10, 9.83it/s]2025-05-26 05:35:40,428 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 13819.5430 | mean log_px -0.1567 | KL -3497.92 + 101it [00:10, 9.20it/s] 102it [00:10, 9.41it/s] 103it [00:10, 9.56it/s] 104it [00:10, 9.63it/s] 105it [00:10, 9.68it/s] 106it [00:11, 9.69it/s] 107it [00:11, 9.74it/s] 108it [00:11, 9.75it/s] 109it [00:11, 9.80it/s] 110it [00:11, 9.82it/s] 111it [00:11, 9.84it/s] 112it [00:11, 9.85it/s] 113it [00:11, 9.88it/s] 114it [00:11, 9.87it/s] 115it [00:12, 9.87it/s] 116it [00:12, 9.85it/s] 117it [00:12, 9.88it/s] 118it [00:12, 9.87it/s] 119it [00:12, 9.86it/s] 120it [00:12, 9.89it/s] 121it [00:12, 9.91it/s] 122it [00:12, 9.90it/s] 123it [00:12, 9.91it/s] 124it [00:12, 9.89it/s] 125it [00:13, 9.90it/s] 126it [00:13, 9.81it/s] 127it [00:13, 9.83it/s] 128it [00:13, 9.79it/s] 130it [00:13, 9.88it/s] 131it [00:13, 9.89it/s] 132it [00:13, 9.89it/s] 133it [00:13, 9.88it/s] 134it [00:13, 9.25it/s] 135it [00:14, 9.44it/s] 136it [00:14, 9.57it/s] 137it [00:14, 9.67it/s] 138it [00:14, 9.74it/s] 139it [00:14, 9.77it/s] 140it [00:14, 9.79it/s] 141it [00:14, 9.84it/s] 142it [00:14, 9.84it/s] 144it [00:14, 9.91it/s] 145it [00:15, 9.91it/s] 146it [00:15, 9.94it/s] 147it [00:15, 9.93it/s] 148it [00:15, 9.37it/s] 149it [00:15, 9.52it/s] 150it [00:15, 9.62it/s]2025-05-26 05:35:45,556 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 18954.9707 | mean log_px -0.2272 | KL -3503.50 + 151it [00:15, 9.71it/s] 152it [00:15, 9.16it/s] 153it [00:15, 9.38it/s] 154it [00:16, 9.51it/s] 155it [00:16, 9.60it/s] 156it [00:16, 9.68it/s] 157it [00:16, 9.76it/s] 158it [00:16, 9.79it/s] 159it [00:16, 9.80it/s] 160it [00:16, 9.83it/s] 161it [00:16, 9.84it/s] 162it [00:16, 9.86it/s] 163it [00:16, 9.85it/s] 164it [00:17, 9.84it/s] 165it [00:17, 9.86it/s] 166it [00:17, 9.85it/s] 167it [00:17, 9.84it/s] 168it [00:17, 9.85it/s] 169it [00:17, 9.85it/s] 170it [00:17, 9.84it/s] 171it [00:17, 9.84it/s] 172it [00:17, 9.87it/s] 173it [00:17, 9.89it/s] 174it [00:18, 9.88it/s] 175it [00:18, 9.90it/s] 176it [00:18, 9.87it/s] 177it [00:18, 9.87it/s] 178it [00:18, 9.85it/s] 179it [00:18, 9.84it/s] 180it [00:18, 9.81it/s] 181it [00:18, 9.82it/s] 182it [00:18, 9.82it/s] 183it [00:18, 9.86it/s] 184it [00:19, 9.83it/s] 185it [00:19, 9.87it/s] 186it [00:19, 9.89it/s] 187it [00:19, 9.92it/s] 188it [00:19, 9.90it/s] 189it [00:19, 9.78it/s] 190it [00:19, 9.73it/s] 191it [00:19, 9.74it/s] 192it [00:19, 9.76it/s] 193it [00:19, 9.81it/s] 194it [00:20, 9.85it/s] 195it [00:20, 9.45it/s] 196it [00:20, 9.63it/s] +2025-05-26 05:35:50,256 - INFO - Epoch: 5, Objective: tensor([12165.8643], device='cuda:0', grad_fn=), Loss: 0.1356792002916336, KL/n: 71.50433349609375 + 0it [00:00, ?it/s]2025-05-26 05:35:50,711 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 17046.0859 | mean log_px -0.1989 | KL -3502.32 + 1it [00:00, 4.75it/s] 2it [00:00, 6.87it/s] 4it [00:00, 8.57it/s] 5it [00:00, 8.94it/s] 6it [00:00, 9.22it/s] 7it [00:00, 8.96it/s] 8it [00:00, 9.24it/s] 10it [00:01, 9.59it/s] 12it [00:01, 9.76it/s] 13it [00:01, 9.81it/s] 14it [00:01, 9.84it/s] 16it [00:01, 9.91it/s] 18it [00:01, 9.96it/s] 20it [00:02, 9.98it/s] 21it [00:02, 9.98it/s] 22it [00:02, 9.97it/s] 23it [00:02, 9.97it/s] 24it [00:02, 9.88it/s] 25it [00:02, 9.30it/s] 26it [00:02, 9.45it/s] 27it [00:02, 9.59it/s] 28it [00:02, 9.69it/s] 30it [00:03, 9.85it/s] 32it [00:03, 9.92it/s] 33it [00:03, 9.93it/s] 34it [00:03, 9.94it/s] 35it [00:03, 9.51it/s] 36it [00:03, 9.62it/s] 38it [00:03, 9.45it/s] 40it [00:04, 9.67it/s] 42it [00:04, 9.79it/s] 44it [00:04, 9.86it/s] 46it [00:04, 9.91it/s] 48it [00:04, 9.96it/s] 50it [00:05, 9.71it/s]2025-05-26 05:35:55,840 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 15465.3457 | mean log_px -0.1867 | KL -3503.66 + 51it [00:05, 9.74it/s] 52it [00:05, 9.77it/s] 54it [00:05, 9.46it/s] 55it [00:05, 9.57it/s] 56it [00:05, 9.66it/s] 58it [00:06, 9.82it/s] 59it [00:06, 9.47it/s] 60it [00:06, 9.59it/s] 62it [00:06, 9.77it/s] 64it [00:06, 9.46it/s] 66it [00:06, 9.66it/s] 68it [00:07, 9.79it/s] 70it [00:07, 9.87it/s] 72it [00:07, 9.90it/s] 73it [00:07, 9.91it/s] 74it [00:07, 9.55it/s] 75it [00:07, 9.65it/s] 76it [00:07, 9.73it/s] 78it [00:08, 9.85it/s] 80it [00:08, 9.59it/s] 82it [00:08, 9.75it/s] 84it [00:08, 9.84it/s] 86it [00:08, 9.91it/s] 87it [00:09, 9.90it/s] 88it [00:09, 9.82it/s] 89it [00:09, 9.83it/s] 90it [00:09, 9.87it/s] 92it [00:09, 9.94it/s] 93it [00:09, 9.95it/s] 94it [00:09, 9.95it/s] 96it [00:09, 10.00it/s] 98it [00:10, 10.02it/s] 100it [00:10, 9.55it/s]2025-05-26 05:36:00,968 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 16232.7539 | mean log_px -0.1872 | KL -3505.36 + 101it [00:10, 9.64it/s] 102it [00:10, 9.68it/s] 103it [00:10, 9.71it/s] 104it [00:10, 9.77it/s] 105it [00:10, 9.82it/s] 107it [00:11, 9.91it/s] 109it [00:11, 9.92it/s] 110it [00:11, 9.93it/s] 112it [00:11, 9.96it/s] 114it [00:11, 9.98it/s] 116it [00:11, 10.00it/s] 118it [00:12, 10.02it/s] 120it [00:12, 10.03it/s] 122it [00:12, 9.77it/s] 123it [00:12, 9.79it/s] 124it [00:12, 9.81it/s] 126it [00:12, 9.91it/s] 127it [00:13, 9.53it/s] 128it [00:13, 9.63it/s] 129it [00:13, 9.71it/s] 130it [00:13, 9.78it/s] 132it [00:13, 9.89it/s] 134it [00:13, 9.96it/s] 135it [00:13, 9.96it/s] 136it [00:13, 9.97it/s] 138it [00:14, 9.99it/s] 139it [00:14, 9.96it/s] 140it [00:14, 9.23it/s] 141it [00:14, 9.19it/s] 142it [00:14, 9.32it/s] 143it [00:14, 9.04it/s] 144it [00:14, 9.23it/s] 145it [00:14, 9.39it/s] 146it [00:15, 9.49it/s] 147it [00:15, 9.00it/s] 148it [00:15, 9.21it/s] 149it [00:15, 9.39it/s] 150it [00:15, 9.50it/s]2025-05-26 05:36:06,114 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 16457.2578 | mean log_px -0.1880 | KL -3506.98 + 151it [00:15, 9.56it/s] 152it [00:15, 9.64it/s] 154it [00:15, 9.82it/s] 156it [00:16, 9.91it/s] 157it [00:16, 9.92it/s] 159it [00:16, 9.97it/s] 160it [00:16, 9.98it/s] 162it [00:16, 9.99it/s] 163it [00:16, 9.96it/s] 165it [00:16, 9.99it/s] 167it [00:17, 9.98it/s] 169it [00:17, 10.01it/s] 170it [00:17, 10.00it/s] 171it [00:17, 9.88it/s] 172it [00:17, 9.51it/s] 174it [00:17, 9.68it/s] 175it [00:18, 9.71it/s] 177it [00:18, 9.83it/s] 178it [00:18, 9.86it/s] 180it [00:18, 9.92it/s] 181it [00:18, 9.43it/s] 183it [00:18, 9.67it/s] 184it [00:18, 9.73it/s] 186it [00:19, 9.86it/s] 188it [00:19, 9.93it/s] 189it [00:19, 9.94it/s] 191it [00:19, 9.58it/s] 192it [00:19, 9.65it/s] 194it [00:19, 9.79it/s] 195it [00:20, 9.51it/s] 196it [00:20, 9.28it/s] 196it [00:20, 9.68it/s] +2025-05-26 05:36:10,825 - INFO - Epoch: 6, Objective: tensor([15376.6016], device='cuda:0', grad_fn=), Loss: 0.17358337342739105, KL/n: 71.75361633300781 + 0it [00:00, ?it/s]2025-05-26 05:36:11,097 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 17575.0977 | mean log_px -0.2084 | KL -3514.32 + 1it [00:00, 5.47it/s] 2it [00:00, 6.65it/s] 3it [00:00, 7.84it/s] 4it [00:00, 8.55it/s] 5it [00:00, 9.01it/s] 6it [00:00, 9.28it/s] 7it [00:00, 9.50it/s] 8it [00:00, 9.60it/s] 9it [00:01, 9.71it/s] 10it [00:01, 9.75it/s] 11it [00:01, 9.63it/s] 12it [00:01, 9.67it/s] 13it [00:01, 9.69it/s] 14it [00:01, 9.67it/s] 15it [00:01, 9.76it/s] 16it [00:01, 9.17it/s] 17it [00:01, 9.39it/s] 18it [00:01, 9.51it/s] 19it [00:02, 9.57it/s] 20it [00:02, 9.02it/s] 21it [00:02, 9.26it/s] 22it [00:02, 9.45it/s] 23it [00:02, 9.60it/s] 24it [00:02, 9.69it/s] 25it [00:02, 9.74it/s] 26it [00:02, 9.78it/s] 27it [00:02, 9.82it/s] 28it [00:02, 9.84it/s] 29it [00:03, 9.87it/s] 30it [00:03, 9.88it/s] 31it [00:03, 9.90it/s] 32it [00:03, 9.89it/s] 33it [00:03, 9.92it/s] 34it [00:03, 9.91it/s] 35it [00:03, 9.92it/s] 36it [00:03, 9.91it/s] 37it [00:03, 9.93it/s] 38it [00:04, 9.93it/s] 40it [00:04, 9.96it/s] 41it [00:04, 9.95it/s] 42it [00:04, 9.94it/s] 43it [00:04, 9.95it/s] 44it [00:04, 9.94it/s] 45it [00:04, 9.94it/s] 46it [00:04, 9.92it/s] 47it [00:04, 9.92it/s] 48it [00:05, 9.91it/s] 49it [00:05, 9.44it/s] 50it [00:05, 9.56it/s]2025-05-26 05:36:16,248 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 11222.3057 | mean log_px -0.1177 | KL -3518.79 + 51it [00:05, 9.66it/s] 52it [00:05, 9.73it/s] 53it [00:05, 9.78it/s] 54it [00:05, 9.82it/s] 55it [00:05, 9.86it/s] 56it [00:05, 9.86it/s] 57it [00:05, 9.87it/s] 58it [00:06, 9.87it/s] 59it [00:06, 9.89it/s] 60it [00:06, 9.89it/s] 61it [00:06, 9.89it/s] 62it [00:06, 9.90it/s] 63it [00:06, 9.91it/s] 64it [00:06, 9.92it/s] 65it [00:06, 9.92it/s] 66it [00:06, 9.92it/s] 67it [00:06, 9.93it/s] 68it [00:07, 9.94it/s] 69it [00:07, 9.95it/s] 70it [00:07, 9.94it/s] 71it [00:07, 9.96it/s] 72it [00:07, 9.95it/s] 73it [00:07, 9.94it/s] 74it [00:07, 9.91it/s] 76it [00:07, 9.93it/s] 77it [00:07, 9.94it/s] 78it [00:08, 9.93it/s] 79it [00:08, 9.94it/s] 80it [00:08, 9.91it/s] 81it [00:08, 9.91it/s] 82it [00:08, 9.92it/s] 83it [00:08, 9.92it/s] 84it [00:08, 9.92it/s] 85it [00:08, 9.91it/s] 86it [00:08, 9.87it/s] 87it [00:08, 9.90it/s] 88it [00:09, 9.90it/s] 89it [00:09, 9.93it/s] 90it [00:09, 9.92it/s] 91it [00:09, 9.92it/s] 92it [00:09, 9.90it/s] 93it [00:09, 9.89it/s] 94it [00:09, 9.88it/s] 96it [00:09, 9.94it/s] 97it [00:09, 9.93it/s] 98it [00:10, 9.92it/s] 99it [00:10, 9.91it/s] 100it [00:10, 9.90it/s]2025-05-26 05:36:21,291 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 15323.3848 | mean log_px -0.1767 | KL -3517.25 + 101it [00:10, 9.90it/s] 102it [00:10, 9.91it/s] 103it [00:10, 9.93it/s] 104it [00:10, 9.91it/s] 105it [00:10, 9.93it/s] 106it [00:10, 9.92it/s] 107it [00:10, 9.92it/s] 108it [00:11, 9.92it/s] 110it [00:11, 9.94it/s] 111it [00:11, 9.94it/s] 112it [00:11, 9.93it/s] 113it [00:11, 9.94it/s] 114it [00:11, 9.95it/s] 115it [00:11, 9.96it/s] 116it [00:11, 9.94it/s] 118it [00:12, 9.97it/s] 119it [00:12, 9.96it/s] 120it [00:12, 9.91it/s] 121it [00:12, 9.93it/s] 122it [00:12, 9.87it/s] 123it [00:12, 9.82it/s] 124it [00:12, 9.84it/s] 125it [00:12, 9.88it/s] 126it [00:12, 9.88it/s] 128it [00:13, 9.92it/s] 130it [00:13, 9.95it/s] 131it [00:13, 9.95it/s] 132it [00:13, 9.54it/s] 133it [00:13, 9.64it/s] 134it [00:13, 9.66it/s] 135it [00:13, 9.63it/s] 136it [00:13, 9.69it/s] 137it [00:14, 9.77it/s] 138it [00:14, 9.81it/s] 139it [00:14, 9.85it/s] 140it [00:14, 9.87it/s] 141it [00:14, 9.90it/s] 142it [00:14, 9.90it/s] 143it [00:14, 9.93it/s] 144it [00:14, 9.92it/s] 145it [00:14, 9.92it/s] 146it [00:14, 9.92it/s] 147it [00:15, 9.94it/s] 148it [00:15, 9.94it/s] 149it [00:15, 9.94it/s] 150it [00:15, 9.94it/s]2025-05-26 05:36:26,351 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 19223.7129 | mean log_px -0.2297 | KL -3526.62 + 151it [00:15, 9.92it/s] 152it [00:15, 9.93it/s] 153it [00:15, 9.94it/s] 154it [00:15, 9.94it/s] 156it [00:15, 9.97it/s] 157it [00:16, 9.96it/s] 158it [00:16, 9.96it/s] 159it [00:16, 9.96it/s] 160it [00:16, 9.94it/s] 161it [00:16, 9.95it/s] 162it [00:16, 9.95it/s] 163it [00:16, 9.94it/s] 164it [00:16, 9.95it/s] 165it [00:16, 9.96it/s] 166it [00:16, 9.97it/s] 167it [00:17, 9.89it/s] 168it [00:17, 9.90it/s] 169it [00:17, 9.89it/s] 170it [00:17, 9.89it/s] 171it [00:17, 9.25it/s] 172it [00:17, 9.42it/s] 173it [00:17, 9.55it/s] 174it [00:17, 9.61it/s] 175it [00:17, 9.70it/s] 176it [00:17, 9.74it/s] 177it [00:18, 9.80it/s] 178it [00:18, 9.81it/s] 179it [00:18, 9.86it/s] 180it [00:18, 9.87it/s] 181it [00:18, 9.25it/s] 182it [00:18, 9.42it/s] 183it [00:18, 9.57it/s] 184it [00:18, 9.65it/s] 185it [00:18, 9.75it/s] 186it [00:19, 9.78it/s] 187it [00:19, 9.81it/s] 188it [00:19, 9.82it/s] 189it [00:19, 9.86it/s] 190it [00:19, 9.85it/s] 191it [00:19, 9.85it/s] 192it [00:19, 9.84it/s] 193it [00:19, 9.78it/s] 194it [00:19, 9.19it/s] 195it [00:19, 9.01it/s] 196it [00:20, 9.74it/s] +2025-05-26 05:36:31,079 - INFO - Epoch: 7, Objective: tensor([11751.9316], device='cuda:0', grad_fn=), Loss: 0.11317390948534012, KL/n: 71.94717407226562 + 0it [00:00, ?it/s]2025-05-26 05:36:31,541 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 14055.2070 | mean log_px -0.1545 | KL -3523.18 + 1it [00:00, 5.26it/s] 2it [00:00, 7.25it/s] 4it [00:00, 8.76it/s] 6it [00:00, 9.27it/s] 8it [00:00, 9.55it/s] 9it [00:00, 9.63it/s] 10it [00:01, 9.70it/s] 11it [00:01, 9.74it/s] 12it [00:01, 9.76it/s] 13it [00:01, 9.82it/s] 14it [00:01, 9.82it/s] 15it [00:01, 9.83it/s] 16it [00:01, 9.87it/s] 17it [00:01, 9.87it/s] 18it [00:01, 9.85it/s] 20it [00:02, 9.92it/s] 22it [00:02, 9.91it/s] 23it [00:02, 9.56it/s] 24it [00:02, 9.64it/s] 25it [00:02, 9.72it/s] 26it [00:02, 9.77it/s] 27it [00:02, 9.81it/s] 28it [00:02, 9.83it/s] 29it [00:03, 9.85it/s] 30it [00:03, 9.86it/s] 31it [00:03, 9.89it/s] 32it [00:03, 9.89it/s] 34it [00:03, 9.88it/s] 35it [00:03, 9.83it/s] 36it [00:03, 9.85it/s] 37it [00:03, 9.87it/s] 38it [00:03, 9.88it/s] 39it [00:04, 9.87it/s] 40it [00:04, 9.87it/s] 41it [00:04, 9.86it/s] 42it [00:04, 9.83it/s] 43it [00:04, 9.84it/s] 44it [00:04, 9.84it/s] 45it [00:04, 9.87it/s] 46it [00:04, 9.86it/s] 47it [00:04, 9.89it/s] 48it [00:04, 9.78it/s] 49it [00:05, 9.06it/s] 50it [00:05, 9.03it/s]2025-05-26 05:36:36,658 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 12810.5664 | mean log_px -0.1418 | KL -3528.74 + 51it [00:05, 9.14it/s] 52it [00:05, 9.25it/s] 53it [00:05, 9.35it/s] 54it [00:05, 9.43it/s] 55it [00:05, 9.52it/s] 56it [00:05, 9.53it/s] 57it [00:05, 9.57it/s] 58it [00:06, 9.55it/s] 59it [00:06, 9.59it/s] 60it [00:06, 9.49it/s] 61it [00:06, 9.55it/s] 62it [00:06, 9.62it/s] 63it [00:06, 9.71it/s] 64it [00:06, 9.75it/s] 65it [00:06, 9.80it/s] 66it [00:06, 9.82it/s] 67it [00:06, 9.81it/s] 68it [00:07, 9.80it/s] 69it [00:07, 9.79it/s] 70it [00:07, 9.81it/s] 71it [00:07, 9.81it/s] 72it [00:07, 9.82it/s] 73it [00:07, 9.84it/s] 74it [00:07, 9.85it/s] 75it [00:07, 9.48it/s] 76it [00:07, 9.54it/s] 77it [00:08, 9.15it/s] 78it [00:08, 9.37it/s] 79it [00:08, 9.50it/s] 80it [00:08, 9.62it/s] 81it [00:08, 9.71it/s] 82it [00:08, 9.74it/s] 83it [00:08, 9.79it/s] 84it [00:08, 9.80it/s] 85it [00:08, 9.80it/s] 86it [00:08, 9.81it/s] 87it [00:09, 9.83it/s] 88it [00:09, 9.84it/s] 89it [00:09, 9.88it/s] 90it [00:09, 9.88it/s] 91it [00:09, 9.88it/s] 92it [00:09, 9.85it/s] 93it [00:09, 9.18it/s] 94it [00:09, 9.37it/s] 95it [00:09, 9.53it/s] 96it [00:09, 9.63it/s] 97it [00:10, 9.73it/s] 98it [00:10, 9.78it/s] 99it [00:10, 9.82it/s] 100it [00:10, 9.20it/s]2025-05-26 05:36:41,842 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 9847.4746 | mean log_px -0.0930 | KL -3528.36 + 101it [00:10, 9.37it/s] 102it [00:10, 9.50it/s] 103it [00:10, 9.61it/s] 104it [00:10, 9.68it/s] 105it [00:10, 9.75it/s] 106it [00:11, 9.15it/s] 107it [00:11, 9.34it/s] 108it [00:11, 9.51it/s] 109it [00:11, 9.63it/s] 110it [00:11, 9.72it/s] 111it [00:11, 9.78it/s] 112it [00:11, 9.69it/s] 113it [00:11, 9.76it/s] 114it [00:11, 9.75it/s] 115it [00:11, 9.81it/s] 116it [00:12, 9.84it/s] 117it [00:12, 9.87it/s] 118it [00:12, 9.85it/s] 119it [00:12, 9.83it/s] 120it [00:12, 9.81it/s] 121it [00:12, 9.82it/s] 122it [00:12, 9.84it/s] 123it [00:12, 9.86it/s] 124it [00:12, 9.85it/s] 125it [00:12, 9.87it/s] 126it [00:13, 9.35it/s] 127it [00:13, 9.51it/s] 128it [00:13, 9.60it/s] 129it [00:13, 9.68it/s] 130it [00:13, 9.76it/s] 131it [00:13, 9.79it/s] 132it [00:13, 9.19it/s] 133it [00:13, 9.39it/s] 134it [00:13, 9.53it/s] 135it [00:14, 9.64it/s] 136it [00:14, 9.69it/s] 137it [00:14, 9.73it/s] 138it [00:14, 9.12it/s] 139it [00:14, 9.34it/s] 140it [00:14, 9.48it/s] 141it [00:14, 9.60it/s] 142it [00:14, 9.65it/s] 143it [00:14, 9.70it/s] 144it [00:14, 8.98it/s] 145it [00:15, 9.13it/s] 146it [00:15, 9.32it/s] 147it [00:15, 9.49it/s] 148it [00:15, 9.61it/s] 149it [00:15, 9.70it/s] 150it [00:15, 9.74it/s]2025-05-26 05:36:47,038 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 11725.8896 | mean log_px -0.1225 | KL -3532.75 + 151it [00:15, 9.72it/s] 152it [00:15, 9.76it/s] 153it [00:15, 9.78it/s] 154it [00:15, 9.80it/s] 155it [00:16, 9.80it/s] 156it [00:16, 9.76it/s] 157it [00:16, 9.78it/s] 158it [00:16, 9.80it/s] 159it [00:16, 9.81it/s] 160it [00:16, 9.82it/s] 161it [00:16, 9.86it/s] 162it [00:16, 9.83it/s] 163it [00:16, 9.86it/s] 164it [00:17, 9.90it/s] 165it [00:17, 9.93it/s] 166it [00:17, 9.92it/s] 168it [00:17, 9.95it/s] 169it [00:17, 9.95it/s] 170it [00:17, 9.94it/s] 171it [00:17, 9.95it/s] 172it [00:17, 9.94it/s] 173it [00:17, 9.93it/s] 174it [00:18, 9.93it/s] 175it [00:18, 9.83it/s] 176it [00:18, 9.82it/s] 177it [00:18, 9.70it/s] 178it [00:18, 9.76it/s] 179it [00:18, 9.81it/s] 180it [00:18, 9.83it/s] 181it [00:18, 9.88it/s] 182it [00:18, 9.88it/s] 183it [00:18, 9.92it/s] 184it [00:19, 9.93it/s] 185it [00:19, 9.94it/s] 186it [00:19, 9.96it/s] 187it [00:19, 9.90it/s] 188it [00:19, 9.88it/s] 189it [00:19, 9.89it/s] 190it [00:19, 9.88it/s] 192it [00:19, 9.93it/s] 193it [00:19, 9.93it/s] 194it [00:20, 9.92it/s] 195it [00:20, 9.51it/s] 196it [00:20, 9.65it/s] +2025-05-26 05:36:51,694 - INFO - Epoch: 8, Objective: tensor([19531.0215], device='cuda:0', grad_fn=), Loss: 0.22876138985157013, KL/n: 72.13713073730469 + 0it [00:00, ?it/s]2025-05-26 05:36:51,972 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 15139.6064 | mean log_px -0.1711 | KL -3532.32 + 1it [00:00, 4.66it/s] 2it [00:00, 6.78it/s] 3it [00:00, 7.89it/s] 4it [00:00, 8.54it/s] 5it [00:00, 8.33it/s] 6it [00:00, 8.78it/s] 7it [00:00, 9.12it/s] 8it [00:00, 9.37it/s] 9it [00:01, 9.55it/s] 10it [00:01, 9.65it/s] 12it [00:01, 9.81it/s] 13it [00:01, 9.85it/s] 14it [00:01, 9.82it/s] 16it [00:01, 9.91it/s] 18it [00:01, 9.96it/s] 19it [00:02, 9.96it/s] 20it [00:02, 9.97it/s] 21it [00:02, 9.97it/s] 22it [00:02, 9.96it/s] 23it [00:02, 9.97it/s] 24it [00:02, 9.93it/s] 25it [00:02, 9.92it/s] 26it [00:02, 9.91it/s] 27it [00:02, 9.92it/s] 28it [00:02, 9.94it/s] 29it [00:03, 9.95it/s] 30it [00:03, 9.94it/s] 31it [00:03, 9.96it/s] 32it [00:03, 9.20it/s] 33it [00:03, 9.39it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.63it/s] 36it [00:03, 9.07it/s] 37it [00:03, 9.31it/s] 38it [00:04, 9.40it/s] 39it [00:04, 9.54it/s] 40it [00:04, 9.63it/s] 41it [00:04, 9.51it/s] 42it [00:04, 9.37it/s] 43it [00:04, 9.49it/s] 44it [00:04, 8.98it/s] 45it [00:04, 9.20it/s] 46it [00:04, 9.32it/s] 47it [00:04, 9.45it/s] 48it [00:05, 9.53it/s] 49it [00:05, 9.65it/s] 50it [00:05, 9.69it/s]2025-05-26 05:36:57,171 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 10535.8184 | mean log_px -0.1103 | KL -3535.26 + 51it [00:05, 9.72it/s] 52it [00:05, 9.75it/s] 53it [00:05, 9.79it/s] 54it [00:05, 9.80it/s] 55it [00:05, 9.68it/s] 56it [00:05, 9.66it/s] 57it [00:06, 9.71it/s] 58it [00:06, 9.68it/s] 59it [00:06, 9.59it/s] 60it [00:06, 9.10it/s] 61it [00:06, 9.33it/s] 62it [00:06, 9.46it/s] 63it [00:06, 9.57it/s] 64it [00:06, 9.58it/s] 65it [00:06, 9.51it/s] 66it [00:06, 9.12it/s] 67it [00:07, 9.35it/s] 68it [00:07, 9.50it/s] 69it [00:07, 9.59it/s] 70it [00:07, 9.66it/s] 71it [00:07, 9.74it/s] 72it [00:07, 9.78it/s] 73it [00:07, 9.83it/s] 74it [00:07, 9.84it/s] 75it [00:07, 9.87it/s] 76it [00:07, 9.86it/s] 77it [00:08, 9.88it/s] 78it [00:08, 9.88it/s] 79it [00:08, 9.87it/s] 80it [00:08, 9.84it/s] 81it [00:08, 9.83it/s] 82it [00:08, 9.84it/s] 83it [00:08, 9.86it/s] 84it [00:08, 9.89it/s] 85it [00:08, 9.85it/s] 86it [00:08, 9.87it/s] 88it [00:09, 9.93it/s] 89it [00:09, 9.91it/s] 90it [00:09, 9.91it/s] 91it [00:09, 9.87it/s] 92it [00:09, 9.87it/s] 93it [00:09, 9.86it/s] 94it [00:09, 9.79it/s] 95it [00:09, 9.81it/s] 96it [00:10, 9.82it/s] 97it [00:10, 9.86it/s] 98it [00:10, 9.87it/s] 100it [00:10, 9.40it/s]2025-05-26 05:37:02,326 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 12649.1650 | mean log_px -0.1434 | KL -3534.93 + 101it [00:10, 9.54it/s] 102it [00:10, 9.59it/s] 103it [00:10, 9.69it/s] 104it [00:10, 9.70it/s] 105it [00:10, 9.76it/s] 106it [00:11, 9.80it/s] 107it [00:11, 9.84it/s] 108it [00:11, 9.82it/s] 109it [00:11, 9.83it/s] 110it [00:11, 9.83it/s] 111it [00:11, 9.85it/s] 112it [00:11, 9.86it/s] 113it [00:11, 9.88it/s] 114it [00:11, 9.88it/s] 115it [00:11, 9.91it/s] 116it [00:12, 9.91it/s] 117it [00:12, 9.92it/s] 118it [00:12, 9.90it/s] 119it [00:12, 9.90it/s] 120it [00:12, 9.90it/s] 121it [00:12, 9.91it/s] 122it [00:12, 9.90it/s] 123it [00:12, 9.91it/s] 124it [00:12, 9.87it/s] 125it [00:12, 9.90it/s] 126it [00:13, 9.93it/s] 127it [00:13, 9.93it/s] 128it [00:13, 9.94it/s] 129it [00:13, 9.93it/s] 130it [00:13, 9.36it/s] 131it [00:13, 9.50it/s] 132it [00:13, 9.60it/s] 133it [00:13, 9.70it/s] 134it [00:13, 9.76it/s] 135it [00:13, 9.80it/s] 136it [00:14, 9.82it/s] 137it [00:14, 9.86it/s] 138it [00:14, 9.86it/s] 139it [00:14, 9.88it/s] 140it [00:14, 9.89it/s] 141it [00:14, 9.90it/s] 142it [00:14, 9.90it/s] 143it [00:14, 9.90it/s] 144it [00:14, 9.86it/s] 145it [00:15, 9.88it/s] 146it [00:15, 9.88it/s] 147it [00:15, 9.90it/s] 148it [00:15, 9.89it/s] 149it [00:15, 9.91it/s] 150it [00:15, 9.89it/s]2025-05-26 05:37:07,400 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 14599.3418 | mean log_px -0.1665 | KL -3540.62 + 151it [00:15, 9.87it/s] 152it [00:15, 9.85it/s] 153it [00:15, 9.86it/s] 154it [00:15, 9.80it/s] 155it [00:16, 9.10it/s] 156it [00:16, 9.12it/s] 157it [00:16, 9.32it/s] 158it [00:16, 9.48it/s] 159it [00:16, 9.60it/s] 160it [00:16, 9.69it/s] 161it [00:16, 9.75it/s] 162it [00:16, 9.77it/s] 163it [00:16, 9.79it/s] 164it [00:16, 9.79it/s] 165it [00:17, 9.79it/s] 166it [00:17, 9.77it/s] 167it [00:17, 9.79it/s] 168it [00:17, 9.80it/s] 169it [00:17, 9.83it/s] 170it [00:17, 9.67it/s] 171it [00:17, 9.68it/s] 172it [00:17, 9.68it/s] 173it [00:17, 9.75it/s] 174it [00:17, 9.79it/s] 175it [00:18, 9.85it/s] 176it [00:18, 9.87it/s] 177it [00:18, 9.87it/s] 178it [00:18, 9.87it/s] 179it [00:18, 9.81it/s] 180it [00:18, 9.80it/s] 181it [00:18, 9.84it/s] 182it [00:18, 9.86it/s] 183it [00:18, 9.88it/s] 184it [00:19, 9.88it/s] 185it [00:19, 9.90it/s] 186it [00:19, 9.87it/s] 187it [00:19, 9.86it/s] 188it [00:19, 9.84it/s] 189it [00:19, 9.87it/s] 190it [00:19, 9.84it/s] 191it [00:19, 9.85it/s] 192it [00:19, 9.86it/s] 193it [00:19, 9.88it/s] 194it [00:20, 9.91it/s] 195it [00:20, 9.47it/s] 196it [00:20, 9.66it/s] +2025-05-26 05:37:12,119 - INFO - Epoch: 9, Objective: tensor([12982.9697], device='cuda:0', grad_fn=), Loss: 0.14898112416267395, KL/n: 72.30970001220703 + 0it [00:00, ?it/s]2025-05-26 05:37:12,577 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 13698.6484 | mean log_px -0.1451 | KL -3541.10 + 1it [00:00, 4.70it/s] 2it [00:00, 6.79it/s] 3it [00:00, 7.94it/s] 4it [00:00, 8.64it/s] 5it [00:00, 9.03it/s] 6it [00:00, 9.02it/s] 7it [00:00, 8.72it/s] 8it [00:00, 9.07it/s] 9it [00:01, 9.33it/s] 10it [00:01, 9.46it/s] 11it [00:01, 9.60it/s] 12it [00:01, 9.17it/s] 13it [00:01, 9.39it/s] 14it [00:01, 9.53it/s] 15it [00:01, 9.65it/s] 16it [00:01, 9.72it/s] 17it [00:01, 9.79it/s] 18it [00:01, 9.82it/s] 19it [00:02, 9.85it/s] 20it [00:02, 9.85it/s] 21it [00:02, 9.75it/s] 22it [00:02, 9.78it/s] 23it [00:02, 9.82it/s] 24it [00:02, 9.84it/s] 25it [00:02, 9.86it/s] 26it [00:02, 9.90it/s] 27it [00:02, 9.27it/s] 28it [00:03, 9.45it/s] 29it [00:03, 9.58it/s] 30it [00:03, 9.68it/s] 31it [00:03, 9.76it/s] 32it [00:03, 9.81it/s] 33it [00:03, 9.85it/s] 34it [00:03, 9.86it/s] 35it [00:03, 9.89it/s] 36it [00:03, 9.25it/s] 37it [00:03, 9.45it/s] 38it [00:04, 9.57it/s] 39it [00:04, 9.67it/s] 40it [00:04, 9.14it/s] 42it [00:04, 9.53it/s] 43it [00:04, 9.61it/s] 44it [00:04, 9.68it/s] 45it [00:04, 9.77it/s] 46it [00:04, 9.81it/s] 47it [00:04, 9.86it/s] 48it [00:05, 9.86it/s] 49it [00:05, 9.88it/s] 50it [00:05, 9.85it/s]2025-05-26 05:37:17,772 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 15355.1699 | mean log_px -0.1796 | KL -3543.84 + 51it [00:05, 9.87it/s] 52it [00:05, 9.89it/s] 53it [00:05, 9.91it/s] 54it [00:05, 9.86it/s] 55it [00:05, 9.87it/s] 56it [00:05, 9.87it/s] 57it [00:05, 9.89it/s] 58it [00:06, 9.88it/s] 59it [00:06, 9.90it/s] 60it [00:06, 9.89it/s] 62it [00:06, 9.94it/s] 63it [00:06, 9.93it/s] 64it [00:06, 9.94it/s] 65it [00:06, 9.94it/s] 66it [00:06, 9.95it/s] 67it [00:06, 9.92it/s] 68it [00:07, 9.92it/s] 69it [00:07, 9.92it/s] 70it [00:07, 9.93it/s] 71it [00:07, 9.94it/s] 72it [00:07, 9.93it/s] 73it [00:07, 9.95it/s] 74it [00:07, 9.93it/s] 75it [00:07, 9.33it/s] 76it [00:07, 9.47it/s] 77it [00:08, 9.58it/s] 78it [00:08, 9.69it/s] 79it [00:08, 9.73it/s] 80it [00:08, 9.06it/s] 81it [00:08, 9.28it/s] 82it [00:08, 9.46it/s] 83it [00:08, 9.59it/s] 84it [00:08, 9.66it/s] 85it [00:08, 9.75it/s] 86it [00:08, 9.76it/s] 87it [00:09, 9.81it/s] 88it [00:09, 9.83it/s] 89it [00:09, 9.86it/s] 90it [00:09, 9.86it/s] 91it [00:09, 9.89it/s] 92it [00:09, 9.89it/s] 93it [00:09, 9.28it/s] 94it [00:09, 9.41it/s] 95it [00:09, 9.55it/s] 96it [00:09, 9.65it/s] 97it [00:10, 9.73it/s] 98it [00:10, 9.74it/s] 99it [00:10, 9.29it/s] 100it [00:10, 9.47it/s]2025-05-26 05:37:22,913 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 10181.3457 | mean log_px -0.1026 | KL -3547.27 + 101it [00:10, 9.60it/s] 102it [00:10, 9.68it/s] 103it [00:10, 9.48it/s] 104it [00:10, 9.16it/s] 105it [00:10, 9.37it/s] 106it [00:11, 9.51it/s] 107it [00:11, 9.62it/s] 108it [00:11, 9.09it/s] 109it [00:11, 9.34it/s] 110it [00:11, 9.51it/s] 111it [00:11, 9.64it/s] 112it [00:11, 9.71it/s] 113it [00:11, 9.79it/s] 114it [00:11, 9.84it/s] 115it [00:11, 9.88it/s] 116it [00:12, 9.88it/s] 118it [00:12, 9.53it/s] 119it [00:12, 9.62it/s] 120it [00:12, 9.69it/s] 121it [00:12, 9.76it/s] 122it [00:12, 9.80it/s] 124it [00:12, 9.40it/s] 125it [00:13, 9.53it/s] 126it [00:13, 9.63it/s] 128it [00:13, 9.79it/s] 129it [00:13, 9.82it/s] 130it [00:13, 9.82it/s] 131it [00:13, 9.85it/s] 132it [00:13, 9.50it/s] 133it [00:13, 9.61it/s] 134it [00:13, 9.69it/s] 135it [00:14, 9.74it/s] 136it [00:14, 9.73it/s] 137it [00:14, 9.79it/s] 138it [00:14, 9.34it/s] 139it [00:14, 9.51it/s] 140it [00:14, 9.58it/s] 141it [00:14, 9.68it/s] 142it [00:14, 9.70it/s] 143it [00:14, 9.74it/s] 144it [00:14, 9.81it/s] 145it [00:15, 9.86it/s] 146it [00:15, 9.88it/s] 148it [00:15, 9.89it/s] 149it [00:15, 9.92it/s] 150it [00:15, 9.89it/s]2025-05-26 05:37:28,081 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 12556.6738 | mean log_px -0.1344 | KL -3543.33 + 151it [00:15, 9.87it/s] 152it [00:15, 9.86it/s] 153it [00:15, 9.89it/s] 154it [00:16, 9.44it/s] 155it [00:16, 9.57it/s] 156it [00:16, 9.67it/s] 157it [00:16, 9.73it/s] 158it [00:16, 9.78it/s] 159it [00:16, 9.82it/s] 160it [00:16, 9.84it/s] 161it [00:16, 9.86it/s] 162it [00:16, 9.88it/s] 163it [00:16, 9.90it/s] 164it [00:17, 9.89it/s] 165it [00:17, 9.89it/s] 166it [00:17, 9.89it/s] 167it [00:17, 9.92it/s] 168it [00:17, 9.91it/s] 169it [00:17, 9.91it/s] 170it [00:17, 9.93it/s] 171it [00:17, 9.92it/s] 172it [00:17, 9.90it/s] 173it [00:17, 9.90it/s] 174it [00:18, 9.90it/s] 175it [00:18, 9.90it/s] 176it [00:18, 9.90it/s] 177it [00:18, 9.91it/s] 178it [00:18, 9.91it/s] 179it [00:18, 9.92it/s] 180it [00:18, 9.91it/s] 181it [00:18, 9.27it/s] 182it [00:18, 9.44it/s] 183it [00:18, 9.59it/s] 184it [00:19, 9.68it/s] 185it [00:19, 9.77it/s] 186it [00:19, 9.18it/s] 187it [00:19, 9.39it/s] 188it [00:19, 9.49it/s] 189it [00:19, 9.60it/s] 190it [00:19, 9.68it/s] 191it [00:19, 9.53it/s] 192it [00:19, 9.64it/s] 193it [00:20, 9.71it/s] 194it [00:20, 9.76it/s] 195it [00:20, 9.38it/s] 196it [00:20, 9.62it/s] +2025-05-26 05:37:32,815 - INFO - Epoch: 10, Objective: tensor([15107.3916], device='cuda:0', grad_fn=), Loss: 0.16303861141204834, KL/n: 72.43524169921875 + 0it [00:00, ?it/s]2025-05-26 05:37:33,091 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 10246.0049 | mean log_px -0.1013 | KL -3548.55 + 1it [00:00, 4.64it/s] 2it [00:00, 6.71it/s] 3it [00:00, 7.88it/s] 4it [00:00, 8.55it/s] 5it [00:00, 8.37it/s] 6it [00:00, 8.80it/s] 7it [00:00, 9.11it/s] 8it [00:00, 9.34it/s] 9it [00:01, 9.52it/s] 10it [00:01, 9.62it/s] 11it [00:01, 9.69it/s] 12it [00:01, 9.74it/s] 13it [00:01, 9.77it/s] 14it [00:01, 9.77it/s] 16it [00:01, 9.88it/s] 17it [00:01, 9.91it/s] 18it [00:01, 9.90it/s] 20it [00:02, 9.95it/s] 21it [00:02, 9.96it/s] 22it [00:02, 9.95it/s] 23it [00:02, 9.94it/s] 24it [00:02, 9.91it/s] 25it [00:02, 9.92it/s] 26it [00:02, 9.89it/s] 28it [00:02, 9.91it/s] 29it [00:03, 9.92it/s] 30it [00:03, 9.89it/s] 31it [00:03, 9.89it/s] 32it [00:03, 9.91it/s] 33it [00:03, 9.92it/s] 34it [00:03, 9.90it/s] 35it [00:03, 9.91it/s] 36it [00:03, 9.90it/s] 37it [00:03, 9.88it/s] 38it [00:03, 9.91it/s] 39it [00:04, 9.89it/s] 40it [00:04, 9.90it/s] 41it [00:04, 9.91it/s] 42it [00:04, 9.92it/s] 43it [00:04, 9.93it/s] 44it [00:04, 9.95it/s] 45it [00:04, 9.95it/s] 46it [00:04, 9.95it/s] 48it [00:04, 9.98it/s] 49it [00:05, 9.96it/s] 50it [00:05, 9.96it/s]2025-05-26 05:37:38,189 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 13919.8701 | mean log_px -0.1529 | KL -3551.17 + 51it [00:05, 9.94it/s] 52it [00:05, 9.90it/s] 53it [00:05, 9.88it/s] 54it [00:05, 9.88it/s] 55it [00:05, 9.90it/s] 56it [00:05, 9.93it/s] 57it [00:05, 9.95it/s] 58it [00:05, 9.95it/s] 60it [00:06, 10.00it/s] 61it [00:06, 9.86it/s] 62it [00:06, 9.72it/s] 63it [00:06, 9.47it/s] 64it [00:06, 9.52it/s] 65it [00:06, 9.58it/s] 66it [00:06, 9.57it/s] 67it [00:06, 9.61it/s] 68it [00:07, 9.58it/s] 69it [00:07, 9.59it/s] 70it [00:07, 9.59it/s] 71it [00:07, 9.58it/s] 72it [00:07, 9.57it/s] 73it [00:07, 9.58it/s] 74it [00:07, 9.59it/s] 75it [00:07, 9.62it/s] 76it [00:07, 9.64it/s] 77it [00:07, 9.50it/s] 78it [00:08, 9.50it/s] 79it [00:08, 9.39it/s] 80it [00:08, 9.48it/s] 81it [00:08, 9.56it/s] 82it [00:08, 9.59it/s] 83it [00:08, 9.61it/s] 84it [00:08, 9.61it/s] 85it [00:08, 9.62it/s] 86it [00:08, 9.63it/s] 87it [00:09, 9.66it/s] 88it [00:09, 9.63it/s] 89it [00:09, 9.62it/s] 90it [00:09, 9.61it/s] 91it [00:09, 9.60it/s] 92it [00:09, 9.62it/s] 93it [00:09, 9.64it/s] 94it [00:09, 9.66it/s] 95it [00:09, 9.66it/s] 96it [00:09, 9.62it/s] 97it [00:10, 9.61it/s] 98it [00:10, 9.64it/s] 99it [00:10, 9.54it/s] 100it [00:10, 9.56it/s]2025-05-26 05:37:43,379 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 11395.6230 | mean log_px -0.1321 | KL -3551.43 + 101it [00:10, 9.56it/s] 102it [00:10, 9.56it/s] 103it [00:10, 9.44it/s] 104it [00:10, 9.47it/s] 105it [00:10, 9.51it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.55it/s] 108it [00:11, 9.57it/s] 109it [00:11, 9.58it/s] 110it [00:11, 9.61it/s] 111it [00:11, 9.63it/s] 112it [00:11, 9.63it/s] 113it [00:11, 9.64it/s] 114it [00:11, 9.64it/s] 115it [00:11, 9.65it/s] 116it [00:12, 9.65it/s] 117it [00:12, 9.62it/s] 118it [00:12, 9.63it/s] 119it [00:12, 9.64it/s] 120it [00:12, 9.64it/s] 121it [00:12, 9.63it/s] 122it [00:12, 9.60it/s] 123it [00:12, 9.64it/s] 124it [00:12, 9.65it/s] 125it [00:12, 9.66it/s] 126it [00:13, 9.64it/s] 127it [00:13, 9.64it/s] 128it [00:13, 9.61it/s] 129it [00:13, 9.59it/s] 130it [00:13, 9.60it/s] 131it [00:13, 9.63it/s] 132it [00:13, 9.63it/s] 133it [00:13, 9.66it/s] 134it [00:13, 9.64it/s] 135it [00:14, 9.64it/s] 136it [00:14, 9.62it/s] 137it [00:14, 9.66it/s] 138it [00:14, 9.63it/s] 139it [00:14, 9.64it/s] 140it [00:14, 9.64it/s] 141it [00:14, 9.68it/s] 142it [00:14, 9.68it/s] 143it [00:14, 9.69it/s] 144it [00:14, 9.69it/s] 145it [00:15, 9.66it/s] 146it [00:15, 9.63it/s] 147it [00:15, 9.61it/s] 148it [00:15, 9.60it/s] 149it [00:15, 9.62it/s] 150it [00:15, 9.65it/s]2025-05-26 05:37:48,575 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 14350.5879 | mean log_px -0.1595 | KL -3548.78 + 151it [00:15, 9.63it/s] 152it [00:15, 9.62it/s] 153it [00:15, 9.63it/s] 154it [00:15, 9.62it/s] 155it [00:16, 9.63it/s] 156it [00:16, 9.64it/s] 157it [00:16, 9.63it/s] 158it [00:16, 9.62it/s] 159it [00:16, 9.63it/s] 160it [00:16, 9.60it/s] 161it [00:16, 9.61it/s] 162it [00:16, 9.59it/s] 163it [00:16, 9.63it/s] 164it [00:17, 9.62it/s] 165it [00:17, 9.65it/s] 166it [00:17, 9.64it/s] 167it [00:17, 9.62it/s] 168it [00:17, 9.62it/s] 169it [00:17, 9.66it/s] 170it [00:17, 9.65it/s] 171it [00:17, 9.63it/s] 172it [00:17, 9.64it/s] 173it [00:17, 9.63it/s] 174it [00:18, 9.62it/s] 175it [00:18, 9.63it/s] 176it [00:18, 9.62it/s] 177it [00:18, 9.61it/s] 178it [00:18, 9.60it/s] 179it [00:18, 9.62it/s] 180it [00:18, 9.64it/s] 181it [00:18, 9.66it/s] 182it [00:18, 9.66it/s] 183it [00:18, 9.65it/s] 184it [00:19, 9.63it/s] 185it [00:19, 9.66it/s] 186it [00:19, 9.65it/s] 187it [00:19, 9.64it/s] 188it [00:19, 9.63it/s] 189it [00:19, 9.66it/s] 190it [00:19, 9.64it/s] 191it [00:19, 9.64it/s] 192it [00:19, 9.63it/s] 193it [00:20, 9.43it/s] 194it [00:20, 9.46it/s] 195it [00:20, 9.19it/s] 196it [00:20, 9.41it/s] 196it [00:20, 9.60it/s] +2025-05-26 05:37:53,363 - INFO - Epoch: 11, Objective: tensor([10451.8135], device='cuda:0', grad_fn=), Loss: 0.1001165509223938, KL/n: 72.5517807006836 + 0it [00:00, ?it/s]2025-05-26 05:37:53,822 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 8402.5049 | mean log_px -0.0712 | KL -3554.51 + 1it [00:00, 5.44it/s] 2it [00:00, 7.28it/s] 3it [00:00, 8.21it/s] 4it [00:00, 8.69it/s] 5it [00:00, 9.05it/s] 6it [00:00, 9.21it/s] 7it [00:00, 9.40it/s] 8it [00:00, 9.52it/s] 9it [00:01, 9.54it/s] 10it [00:01, 9.58it/s] 11it [00:01, 9.60it/s] 12it [00:01, 9.65it/s] 13it [00:01, 9.55it/s] 14it [00:01, 9.06it/s] 15it [00:01, 9.28it/s] 16it [00:01, 9.49it/s] 17it [00:01, 9.58it/s] 18it [00:01, 9.67it/s] 19it [00:02, 9.75it/s] 20it [00:02, 9.80it/s] 21it [00:02, 9.85it/s] 22it [00:02, 9.85it/s] 23it [00:02, 9.89it/s] 24it [00:02, 9.88it/s] 26it [00:02, 9.95it/s] 27it [00:02, 9.51it/s] 28it [00:02, 9.61it/s] 29it [00:03, 9.68it/s] 30it [00:03, 9.76it/s] 31it [00:03, 9.80it/s] 32it [00:03, 9.83it/s] 33it [00:03, 9.25it/s] 34it [00:03, 9.43it/s] 36it [00:03, 9.69it/s] 37it [00:03, 9.76it/s] 38it [00:04, 9.81it/s] 39it [00:04, 9.85it/s] 40it [00:04, 9.87it/s] 41it [00:04, 9.88it/s] 42it [00:04, 9.90it/s] 43it [00:04, 9.90it/s] 44it [00:04, 9.90it/s] 45it [00:04, 9.59it/s] 46it [00:04, 9.70it/s] 47it [00:04, 9.78it/s] 48it [00:05, 9.82it/s] 49it [00:05, 9.86it/s] 50it [00:05, 9.86it/s]2025-05-26 05:37:58,973 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 10922.4316 | mean log_px -0.1087 | KL -3553.06 + 51it [00:05, 9.23it/s] 52it [00:05, 9.25it/s] 54it [00:05, 9.57it/s] 55it [00:05, 9.66it/s] 56it [00:05, 9.73it/s] 57it [00:05, 9.80it/s] 58it [00:06, 9.83it/s] 59it [00:06, 9.86it/s] 60it [00:06, 9.88it/s] 61it [00:06, 9.88it/s] 62it [00:06, 9.21it/s] 63it [00:06, 9.41it/s] 64it [00:06, 9.56it/s] 65it [00:06, 9.68it/s] 66it [00:06, 9.64it/s] 67it [00:07, 9.04it/s] 68it [00:07, 9.28it/s] 69it [00:07, 9.46it/s] 70it [00:07, 9.61it/s] 71it [00:07, 9.71it/s] 72it [00:07, 9.79it/s] 73it [00:07, 9.85it/s] 74it [00:07, 9.37it/s] 75it [00:07, 9.54it/s] 76it [00:07, 9.57it/s] 78it [00:08, 9.77it/s] 79it [00:08, 9.82it/s] 80it [00:08, 9.86it/s] 82it [00:08, 9.94it/s] 83it [00:08, 9.95it/s] 84it [00:08, 9.96it/s] 86it [00:08, 9.98it/s] 88it [00:09, 9.99it/s] 89it [00:09, 9.99it/s] 90it [00:09, 9.99it/s] 91it [00:09, 9.96it/s] 92it [00:09, 9.93it/s] 94it [00:09, 9.97it/s] 96it [00:09, 9.57it/s] 98it [00:10, 9.72it/s] 99it [00:10, 9.77it/s] 100it [00:10, 9.80it/s]2025-05-26 05:38:04,126 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 11670.1055 | mean log_px -0.1183 | KL -3560.71 + 101it [00:10, 9.18it/s] 102it [00:10, 9.13it/s] 103it [00:10, 9.32it/s] 104it [00:10, 9.44it/s] 105it [00:10, 9.58it/s] 106it [00:11, 9.07it/s] 107it [00:11, 9.28it/s] 108it [00:11, 9.46it/s] 109it [00:11, 9.61it/s] 110it [00:11, 9.69it/s] 112it [00:11, 9.34it/s] 113it [00:11, 9.49it/s] 114it [00:11, 9.57it/s] 115it [00:11, 9.67it/s] 116it [00:12, 9.58it/s] 117it [00:12, 9.64it/s] 118it [00:12, 9.69it/s] 119it [00:12, 9.77it/s] 120it [00:12, 9.81it/s] 122it [00:12, 9.82it/s] 123it [00:12, 9.84it/s] 124it [00:12, 9.86it/s] 125it [00:12, 9.85it/s] 126it [00:13, 9.85it/s] 128it [00:13, 9.94it/s] 130it [00:13, 9.98it/s] 131it [00:13, 9.97it/s] 132it [00:13, 9.44it/s] 133it [00:13, 9.56it/s] 134it [00:13, 9.62it/s] 135it [00:14, 9.71it/s] 136it [00:14, 9.77it/s] 137it [00:14, 9.82it/s] 138it [00:14, 9.83it/s] 139it [00:14, 9.88it/s] 140it [00:14, 9.86it/s] 141it [00:14, 9.85it/s] 142it [00:14, 9.84it/s] 143it [00:14, 9.76it/s] 144it [00:14, 9.75it/s] 145it [00:15, 9.78it/s] 146it [00:15, 9.73it/s] 147it [00:15, 9.73it/s] 148it [00:15, 9.72it/s] 149it [00:15, 9.73it/s] 150it [00:15, 9.67it/s]2025-05-26 05:38:09,304 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 9823.7705 | mean log_px -0.0984 | KL -3558.63 + 151it [00:15, 9.63it/s] 152it [00:15, 9.66it/s] 153it [00:15, 9.73it/s] 154it [00:15, 9.74it/s] 155it [00:16, 9.70it/s] 156it [00:16, 9.68it/s] 157it [00:16, 9.65it/s] 158it [00:16, 9.65it/s] 159it [00:16, 9.65it/s] 160it [00:16, 9.63it/s] 161it [00:16, 9.62it/s] 162it [00:16, 9.59it/s] 163it [00:16, 9.54it/s] 164it [00:17, 9.31it/s] 165it [00:17, 8.70it/s] 166it [00:17, 8.88it/s] 167it [00:17, 9.00it/s] 168it [00:17, 9.10it/s] 169it [00:17, 9.21it/s] 170it [00:17, 9.28it/s] 171it [00:17, 9.31it/s] 172it [00:17, 9.34it/s] 173it [00:18, 9.36it/s] 174it [00:18, 9.38it/s] 175it [00:18, 9.36it/s] 176it [00:18, 9.26it/s] 177it [00:18, 9.24it/s] 178it [00:18, 9.26it/s] 179it [00:18, 9.26it/s] 180it [00:18, 9.31it/s] 181it [00:18, 9.32it/s] 182it [00:18, 9.29it/s] 183it [00:19, 9.36it/s] 184it [00:19, 9.44it/s] 185it [00:19, 9.40it/s] 186it [00:19, 9.37it/s] 187it [00:19, 9.34it/s] 188it [00:19, 9.32it/s] 189it [00:19, 9.35it/s] 190it [00:19, 9.41it/s] 191it [00:19, 9.43it/s] 192it [00:20, 9.43it/s] 193it [00:20, 9.44it/s] 194it [00:20, 9.05it/s] 195it [00:20, 8.65it/s] 196it [00:20, 8.90it/s] 196it [00:20, 9.53it/s] +2025-05-26 05:38:14,246 - INFO - Epoch: 12, Objective: tensor([11959.2480], device='cuda:0', grad_fn=), Loss: 0.12528853118419647, KL/n: 72.63204193115234 + 0it [00:00, ?it/s]2025-05-26 05:38:14,546 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 10673.3086 | mean log_px -0.1125 | KL -3559.28 + 1it [00:00, 4.29it/s] 2it [00:00, 6.25it/s] 3it [00:00, 7.44it/s] 4it [00:00, 8.14it/s] 5it [00:00, 8.61it/s] 6it [00:00, 8.25it/s] 7it [00:00, 8.62it/s] 8it [00:00, 8.84it/s] 9it [00:01, 9.04it/s] 10it [00:01, 8.64it/s] 11it [00:01, 8.91it/s] 12it [00:01, 9.06it/s] 13it [00:01, 9.22it/s] 14it [00:01, 8.86it/s] 15it [00:01, 9.03it/s] 16it [00:01, 9.15it/s] 17it [00:01, 9.28it/s] 18it [00:02, 9.39it/s] 19it [00:02, 9.45it/s] 20it [00:02, 9.49it/s] 21it [00:02, 9.50it/s] 22it [00:02, 9.52it/s] 23it [00:02, 9.55it/s] 24it [00:02, 9.52it/s] 25it [00:02, 9.53it/s] 26it [00:02, 9.53it/s] 27it [00:03, 9.57it/s] 28it [00:03, 9.58it/s] 29it [00:03, 9.59it/s] 30it [00:03, 9.51it/s] 31it [00:03, 9.48it/s] 32it [00:03, 8.97it/s] 33it [00:03, 9.14it/s] 34it [00:03, 9.26it/s] 35it [00:03, 9.31it/s] 36it [00:03, 9.40it/s] 37it [00:04, 9.45it/s] 38it [00:04, 9.49it/s] 39it [00:04, 9.53it/s] 40it [00:04, 9.50it/s] 41it [00:04, 9.52it/s] 42it [00:04, 9.50it/s] 43it [00:04, 9.50it/s] 44it [00:04, 9.50it/s] 45it [00:04, 9.57it/s] 46it [00:05, 9.53it/s] 47it [00:05, 9.53it/s] 48it [00:05, 9.56it/s] 49it [00:05, 9.60it/s] 50it [00:05, 9.59it/s]2025-05-26 05:38:19,905 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 14811.1055 | mean log_px -0.1740 | KL -3564.73 + 51it [00:05, 9.57it/s] 52it [00:05, 9.57it/s] 53it [00:05, 9.61it/s] 54it [00:05, 9.54it/s] 55it [00:05, 9.54it/s] 56it [00:06, 9.53it/s] 57it [00:06, 9.53it/s] 58it [00:06, 9.51it/s] 59it [00:06, 9.55it/s] 60it [00:06, 9.49it/s] 61it [00:06, 9.53it/s] 62it [00:06, 9.56it/s] 63it [00:06, 9.53it/s] 64it [00:06, 9.55it/s] 65it [00:07, 9.55it/s] 66it [00:07, 9.00it/s] 67it [00:07, 9.14it/s] 68it [00:07, 9.26it/s] 69it [00:07, 9.32it/s] 70it [00:07, 9.36it/s] 71it [00:07, 9.38it/s] 72it [00:07, 9.43it/s] 73it [00:07, 9.51it/s] 74it [00:07, 9.52it/s] 75it [00:08, 9.50it/s] 76it [00:08, 9.55it/s] 77it [00:08, 9.58it/s] 78it [00:08, 9.64it/s] 79it [00:08, 9.65it/s] 80it [00:08, 9.62it/s] 81it [00:08, 9.61it/s] 82it [00:08, 9.56it/s] 83it [00:08, 9.56it/s] 84it [00:09, 9.56it/s] 85it [00:09, 9.54it/s] 86it [00:09, 9.50it/s] 87it [00:09, 9.50it/s] 88it [00:09, 9.51it/s] 89it [00:09, 9.54it/s] 90it [00:09, 9.57it/s] 91it [00:09, 9.03it/s] 92it [00:09, 9.18it/s] 93it [00:10, 9.32it/s] 94it [00:10, 9.38it/s] 95it [00:10, 9.44it/s] 96it [00:10, 9.43it/s] 97it [00:10, 9.51it/s] 98it [00:10, 9.50it/s] 99it [00:10, 9.01it/s] 100it [00:10, 9.15it/s]2025-05-26 05:38:25,205 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 11084.1914 | mean log_px -0.1101 | KL -3557.34 + 101it [00:10, 9.24it/s] 102it [00:10, 9.36it/s] 103it [00:11, 9.43it/s] 104it [00:11, 9.45it/s] 105it [00:11, 8.97it/s] 106it [00:11, 9.11it/s] 107it [00:11, 9.26it/s] 108it [00:11, 9.36it/s] 109it [00:11, 8.87it/s] 110it [00:11, 9.11it/s] 111it [00:11, 9.26it/s] 112it [00:12, 9.30it/s] 113it [00:12, 9.34it/s] 114it [00:12, 9.38it/s] 115it [00:12, 9.43it/s] 116it [00:12, 9.44it/s] 117it [00:12, 9.50it/s] 118it [00:12, 8.95it/s] 119it [00:12, 9.12it/s] 120it [00:12, 9.27it/s] 121it [00:13, 9.38it/s] 122it [00:13, 9.46it/s] 123it [00:13, 9.48it/s] 124it [00:13, 9.53it/s] 125it [00:13, 9.55it/s] 126it [00:13, 9.56it/s] 127it [00:13, 9.54it/s] 128it [00:13, 9.57it/s] 129it [00:13, 9.57it/s] 130it [00:13, 9.59it/s] 131it [00:14, 9.62it/s] 132it [00:14, 9.60it/s] 133it [00:14, 9.56it/s] 134it [00:14, 9.51it/s] 135it [00:14, 9.55it/s] 136it [00:14, 9.53it/s] 137it [00:14, 9.52it/s] 138it [00:14, 9.50it/s] 139it [00:14, 8.89it/s] 140it [00:15, 9.10it/s] 141it [00:15, 9.22it/s] 142it [00:15, 9.29it/s] 143it [00:15, 9.27it/s] 144it [00:15, 9.38it/s] 145it [00:15, 9.46it/s] 146it [00:15, 9.44it/s] 147it [00:15, 9.49it/s] 148it [00:15, 9.45it/s] 149it [00:15, 9.46it/s] 150it [00:16, 9.49it/s]2025-05-26 05:38:30,530 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 8056.9863 | mean log_px -0.0642 | KL -3562.25 + 151it [00:16, 9.54it/s] 152it [00:16, 9.51it/s] 153it [00:16, 9.55it/s] 154it [00:16, 9.54it/s] 155it [00:16, 9.57it/s] 156it [00:16, 9.45it/s] 157it [00:16, 9.52it/s] 158it [00:16, 9.52it/s] 159it [00:17, 9.55it/s] 160it [00:17, 9.48it/s] 161it [00:17, 9.51it/s] 162it [00:17, 9.53it/s] 163it [00:17, 9.48it/s] 164it [00:17, 9.54it/s] 165it [00:17, 9.57it/s] 166it [00:17, 9.54it/s] 167it [00:17, 9.57it/s] 168it [00:17, 9.54it/s] 169it [00:18, 9.57it/s] 170it [00:18, 9.58it/s] 171it [00:18, 9.41it/s] 172it [00:18, 9.44it/s] 173it [00:18, 9.45it/s] 174it [00:18, 9.47it/s] 175it [00:18, 9.53it/s] 176it [00:18, 9.56it/s] 177it [00:18, 9.51it/s] 178it [00:19, 9.50it/s] 179it [00:19, 9.52it/s] 180it [00:19, 9.54it/s] 181it [00:19, 9.53it/s] 182it [00:19, 9.54it/s] 183it [00:19, 9.59it/s] 184it [00:19, 9.56it/s] 185it [00:19, 9.55it/s] 186it [00:19, 9.52it/s] 187it [00:19, 9.55it/s] 188it [00:20, 9.58it/s] 189it [00:20, 9.17it/s] 190it [00:20, 9.30it/s] 191it [00:20, 9.38it/s] 192it [00:20, 8.86it/s] 193it [00:20, 9.07it/s] 194it [00:20, 9.12it/s] 195it [00:20, 8.65it/s] 196it [00:20, 8.89it/s] 196it [00:21, 9.32it/s] +2025-05-26 05:38:35,417 - INFO - Epoch: 13, Objective: tensor([13255.1807], device='cuda:0', grad_fn=), Loss: 0.15383651852607727, KL/n: 72.70011138916016 + 0it [00:00, ?it/s]2025-05-26 05:38:35,882 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 11022.1055 | mean log_px -0.1185 | KL -3559.76 + 1it [00:00, 2.70it/s] 2it [00:00, 4.64it/s] 3it [00:00, 6.09it/s] 4it [00:00, 7.14it/s] 5it [00:00, 7.85it/s] 6it [00:00, 8.36it/s] 7it [00:00, 8.73it/s] 8it [00:01, 8.96it/s] 9it [00:01, 9.16it/s] 10it [00:01, 9.30it/s] 11it [00:01, 9.37it/s] 12it [00:01, 9.44it/s] 13it [00:01, 9.49it/s] 14it [00:01, 9.43it/s] 15it [00:01, 9.47it/s] 16it [00:01, 9.48it/s] 17it [00:02, 9.48it/s] 18it [00:02, 9.49it/s] 19it [00:02, 9.47it/s] 20it [00:02, 9.49it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.46it/s] 23it [00:02, 9.50it/s] 24it [00:02, 9.49it/s] 25it [00:02, 9.54it/s] 26it [00:02, 9.50it/s] 27it [00:03, 9.51it/s] 28it [00:03, 9.46it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.51it/s] 31it [00:03, 9.47it/s] 32it [00:03, 8.94it/s] 33it [00:03, 9.11it/s] 34it [00:03, 9.22it/s] 35it [00:03, 9.27it/s] 36it [00:04, 9.34it/s] 37it [00:04, 9.42it/s] 38it [00:04, 9.42it/s] 39it [00:04, 9.47it/s] 40it [00:04, 9.48it/s] 41it [00:04, 9.49it/s] 42it [00:04, 9.52it/s] 43it [00:04, 9.57it/s] 44it [00:04, 9.52it/s] 45it [00:05, 9.41it/s] 46it [00:05, 9.50it/s] 47it [00:05, 9.55it/s] 48it [00:05, 9.49it/s] 49it [00:05, 9.50it/s] 50it [00:05, 9.49it/s]2025-05-26 05:38:41,159 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 8267.6357 | mean log_px -0.0700 | KL -3559.77 + 51it [00:05, 9.54it/s] 52it [00:05, 9.51it/s] 53it [00:05, 9.48it/s] 54it [00:05, 9.43it/s] 55it [00:06, 9.46it/s] 56it [00:06, 9.49it/s] 57it [00:06, 9.52it/s] 58it [00:06, 9.48it/s] 59it [00:06, 9.30it/s] 60it [00:06, 8.76it/s] 61it [00:06, 8.94it/s] 62it [00:06, 9.11it/s] 63it [00:06, 9.22it/s] 64it [00:07, 9.32it/s] 65it [00:07, 9.40it/s] 66it [00:07, 9.44it/s] 67it [00:07, 9.47it/s] 68it [00:07, 9.49it/s] 69it [00:07, 9.54it/s] 70it [00:07, 9.46it/s] 71it [00:07, 9.46it/s] 72it [00:07, 8.93it/s] 73it [00:08, 9.05it/s] 74it [00:08, 9.14it/s] 75it [00:08, 9.28it/s] 76it [00:08, 9.31it/s] 77it [00:08, 9.37it/s] 78it [00:08, 9.38it/s] 79it [00:08, 9.41it/s] 80it [00:08, 9.43it/s] 81it [00:08, 9.46it/s] 82it [00:08, 9.47it/s] 83it [00:09, 8.89it/s] 84it [00:09, 8.91it/s] 85it [00:09, 9.01it/s] 86it [00:09, 9.15it/s] 87it [00:09, 9.24it/s] 88it [00:09, 9.31it/s] 89it [00:09, 9.38it/s] 90it [00:09, 9.45it/s] 91it [00:09, 9.46it/s] 92it [00:10, 9.49it/s] 93it [00:10, 9.52it/s] 94it [00:10, 9.49it/s] 95it [00:10, 9.50it/s] 96it [00:10, 9.48it/s] 97it [00:10, 9.52it/s] 98it [00:10, 9.50it/s] 99it [00:10, 9.49it/s] 100it [00:10, 9.52it/s]2025-05-26 05:38:46,510 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 13712.4199 | mean log_px -0.1565 | KL -3561.90 + 101it [00:10, 9.54it/s] 102it [00:11, 9.53it/s] 103it [00:11, 9.50it/s] 104it [00:11, 9.47it/s] 105it [00:11, 9.49it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.47it/s] 108it [00:11, 9.48it/s] 109it [00:11, 9.54it/s] 110it [00:11, 9.53it/s] 111it [00:12, 9.49it/s] 112it [00:12, 9.46it/s] 113it [00:12, 9.48it/s] 114it [00:12, 9.49it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.50it/s] 117it [00:12, 9.54it/s] 118it [00:12, 9.44it/s] 119it [00:12, 9.50it/s] 120it [00:12, 9.49it/s] 121it [00:13, 9.56it/s] 122it [00:13, 9.53it/s] 123it [00:13, 9.56it/s] 124it [00:13, 9.55it/s] 125it [00:13, 9.56it/s] 126it [00:13, 9.56it/s] 127it [00:13, 9.56it/s] 128it [00:13, 9.57it/s] 129it [00:13, 9.52it/s] 130it [00:14, 9.52it/s] 131it [00:14, 9.47it/s] 132it [00:14, 9.47it/s] 133it [00:14, 9.48it/s] 134it [00:14, 9.49it/s] 135it [00:14, 9.51it/s] 136it [00:14, 9.51it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.53it/s] 139it [00:14, 9.53it/s] 140it [00:15, 9.57it/s] 141it [00:15, 9.59it/s] 142it [00:15, 9.57it/s] 143it [00:15, 9.58it/s] 144it [00:15, 9.52it/s] 145it [00:15, 9.53it/s] 146it [00:15, 9.51it/s] 147it [00:15, 9.51it/s] 148it [00:15, 9.51it/s] 149it [00:16, 9.55it/s] 150it [00:16, 9.54it/s]2025-05-26 05:38:51,763 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 13030.7373 | mean log_px -0.1424 | KL -3557.82 + 151it [00:16, 8.97it/s] 152it [00:16, 9.14it/s] 153it [00:16, 9.13it/s] 154it [00:16, 9.26it/s] 155it [00:16, 9.35it/s] 156it [00:16, 9.40it/s] 157it [00:16, 9.47it/s] 158it [00:17, 9.48it/s] 159it [00:17, 9.54it/s] 160it [00:17, 9.56it/s] 161it [00:17, 9.58it/s] 162it [00:17, 9.56it/s] 163it [00:17, 9.61it/s] 164it [00:17, 9.55it/s] 165it [00:17, 9.58it/s] 166it [00:17, 9.61it/s] 167it [00:17, 9.60it/s] 168it [00:18, 9.53it/s] 169it [00:18, 9.55it/s] 170it [00:18, 9.53it/s] 171it [00:18, 9.49it/s] 172it [00:18, 9.49it/s] 173it [00:18, 9.01it/s] 174it [00:18, 9.16it/s] 175it [00:18, 9.30it/s] 176it [00:18, 9.41it/s] 177it [00:19, 9.46it/s] 178it [00:19, 9.39it/s] 179it [00:19, 9.46it/s] 180it [00:19, 9.51it/s] 181it [00:19, 9.54it/s] 182it [00:19, 9.51it/s] 183it [00:19, 9.51it/s] 184it [00:19, 9.47it/s] 185it [00:19, 9.48it/s] 186it [00:19, 9.50it/s] 187it [00:20, 9.54it/s] 188it [00:20, 9.47it/s] 189it [00:20, 9.51it/s] 190it [00:20, 9.49it/s] 191it [00:20, 9.57it/s] 192it [00:20, 9.50it/s] 193it [00:20, 9.51it/s] 194it [00:20, 9.51it/s] 195it [00:20, 8.45it/s] 196it [00:21, 8.75it/s] 196it [00:21, 9.28it/s] +2025-05-26 05:38:56,677 - INFO - Epoch: 14, Objective: tensor([11565.9922], device='cuda:0', grad_fn=), Loss: 0.11370649188756943, KL/n: 72.74580383300781 + 0it [00:00, ?it/s]2025-05-26 05:38:56,949 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 10721.7217 | mean log_px -0.1022 | KL -3567.32 + 1it [00:00, 5.64it/s] 2it [00:00, 7.36it/s] 3it [00:00, 8.24it/s] 4it [00:00, 8.65it/s] 5it [00:00, 8.35it/s] 6it [00:00, 8.65it/s] 7it [00:00, 8.93it/s] 8it [00:00, 9.09it/s] 9it [00:01, 9.18it/s] 10it [00:01, 9.31it/s] 11it [00:01, 9.35it/s] 12it [00:01, 8.99it/s] 13it [00:01, 9.09it/s] 14it [00:01, 9.18it/s] 15it [00:01, 9.27it/s] 16it [00:01, 9.30it/s] 17it [00:01, 9.36it/s] 18it [00:02, 9.39it/s] 19it [00:02, 9.43it/s] 20it [00:02, 9.47it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.48it/s] 23it [00:02, 9.49it/s] 24it [00:02, 9.10it/s] 25it [00:02, 9.21it/s] 26it [00:02, 9.30it/s] 27it [00:02, 9.31it/s] 28it [00:03, 9.30it/s] 29it [00:03, 9.37it/s] 30it [00:03, 9.38it/s] 31it [00:03, 9.42it/s] 32it [00:03, 9.41it/s] 33it [00:03, 9.46it/s] 34it [00:03, 8.99it/s] 35it [00:03, 9.11it/s] 36it [00:03, 9.19it/s] 37it [00:04, 9.29it/s] 38it [00:04, 9.32it/s] 39it [00:04, 9.38it/s] 40it [00:04, 8.84it/s] 41it [00:04, 9.05it/s] 42it [00:04, 9.14it/s] 43it [00:04, 9.21it/s] 44it [00:04, 9.27it/s] 45it [00:04, 9.35it/s] 46it [00:05, 9.43it/s] 47it [00:05, 9.47it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.45it/s] 50it [00:05, 9.42it/s]2025-05-26 05:39:02,329 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 11714.7119 | mean log_px -0.1263 | KL -3566.29 + 51it [00:05, 9.45it/s] 52it [00:05, 9.39it/s] 53it [00:05, 9.46it/s] 54it [00:05, 9.49it/s] 55it [00:05, 9.44it/s] 56it [00:06, 9.43it/s] 57it [00:06, 9.45it/s] 58it [00:06, 9.43it/s] 59it [00:06, 9.33it/s] 60it [00:06, 8.70it/s] 61it [00:06, 8.91it/s] 62it [00:06, 9.09it/s] 63it [00:06, 9.26it/s] 64it [00:06, 8.93it/s] 65it [00:07, 9.11it/s] 66it [00:07, 9.20it/s] 67it [00:07, 9.29it/s] 68it [00:07, 8.82it/s] 69it [00:07, 9.05it/s] 70it [00:07, 9.22it/s] 71it [00:07, 9.33it/s] 72it [00:07, 8.85it/s] 73it [00:07, 8.99it/s] 74it [00:08, 9.13it/s] 75it [00:08, 9.23it/s] 76it [00:08, 8.86it/s] 77it [00:08, 9.08it/s] 78it [00:08, 9.21it/s] 79it [00:08, 9.29it/s] 80it [00:08, 8.87it/s] 81it [00:08, 9.06it/s] 82it [00:08, 9.17it/s] 83it [00:09, 9.23it/s] 84it [00:09, 8.78it/s] 85it [00:09, 8.98it/s] 86it [00:09, 9.16it/s] 87it [00:09, 9.28it/s] 88it [00:09, 8.85it/s] 89it [00:09, 9.09it/s] 90it [00:09, 9.23it/s] 91it [00:09, 9.34it/s] 92it [00:10, 8.85it/s] 93it [00:10, 9.07it/s] 94it [00:10, 9.16it/s] 95it [00:10, 9.23it/s] 96it [00:10, 8.85it/s] 97it [00:10, 9.03it/s] 98it [00:10, 9.19it/s] 99it [00:10, 9.32it/s] 100it [00:10, 8.87it/s]2025-05-26 05:39:07,817 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 10056.2070 | mean log_px -0.1000 | KL -3566.32 + 101it [00:11, 9.04it/s] 102it [00:11, 9.14it/s] 103it [00:11, 9.24it/s] 104it [00:11, 8.80it/s] 105it [00:11, 9.01it/s] 106it [00:11, 9.16it/s] 107it [00:11, 9.25it/s] 108it [00:11, 8.80it/s] 109it [00:11, 8.86it/s] 110it [00:12, 9.06it/s] 111it [00:12, 9.22it/s] 112it [00:12, 8.79it/s] 113it [00:12, 9.02it/s] 114it [00:12, 9.15it/s] 115it [00:12, 9.05it/s] 116it [00:12, 8.82it/s] 117it [00:12, 8.50it/s] 118it [00:12, 8.77it/s] 119it [00:13, 9.02it/s] 120it [00:13, 9.20it/s] 121it [00:13, 9.24it/s] 122it [00:13, 9.32it/s] 123it [00:13, 9.41it/s] 124it [00:13, 9.45it/s] 125it [00:13, 9.15it/s] 126it [00:13, 9.25it/s] 127it [00:13, 8.86it/s] 128it [00:14, 9.00it/s] 129it [00:14, 9.16it/s] 130it [00:14, 9.29it/s] 131it [00:14, 8.86it/s] 132it [00:14, 9.08it/s] 133it [00:14, 9.20it/s] 134it [00:14, 9.29it/s] 135it [00:14, 8.89it/s] 136it [00:14, 9.05it/s] 137it [00:15, 9.16it/s] 138it [00:15, 9.26it/s] 139it [00:15, 8.84it/s] 140it [00:15, 9.04it/s] 141it [00:15, 9.19it/s] 142it [00:15, 9.32it/s] 143it [00:15, 8.92it/s] 144it [00:15, 9.08it/s] 145it [00:15, 9.23it/s] 146it [00:15, 9.33it/s] 147it [00:16, 8.93it/s] 148it [00:16, 9.09it/s] 149it [00:16, 9.15it/s] 150it [00:16, 9.31it/s]2025-05-26 05:39:13,311 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 9198.8525 | mean log_px -0.0873 | KL -3561.38 + 151it [00:16, 9.31it/s] 152it [00:16, 8.57it/s] 153it [00:16, 8.64it/s] 154it [00:16, 8.91it/s] 155it [00:17, 9.11it/s] 156it [00:17, 9.24it/s] 157it [00:17, 9.32it/s] 158it [00:17, 9.31it/s] 159it [00:17, 9.32it/s] 160it [00:17, 9.42it/s] 161it [00:17, 9.45it/s] 162it [00:17, 9.49it/s] 163it [00:17, 9.15it/s] 164it [00:17, 9.25it/s] 165it [00:18, 9.38it/s] 166it [00:18, 8.87it/s] 167it [00:18, 9.09it/s] 168it [00:18, 9.22it/s] 169it [00:18, 9.34it/s] 170it [00:18, 8.93it/s] 171it [00:18, 9.07it/s] 172it [00:18, 9.20it/s] 173it [00:18, 9.29it/s] 174it [00:19, 8.85it/s] 175it [00:19, 9.02it/s] 176it [00:19, 9.16it/s] 177it [00:19, 9.30it/s] 178it [00:19, 8.80it/s] 179it [00:19, 8.72it/s] 180it [00:19, 8.94it/s] 181it [00:19, 9.12it/s] 182it [00:19, 8.72it/s] 183it [00:20, 8.97it/s] 184it [00:20, 9.13it/s] 185it [00:20, 9.26it/s] 186it [00:20, 8.85it/s] 187it [00:20, 9.07it/s] 188it [00:20, 9.12it/s] 189it [00:20, 8.79it/s] 190it [00:20, 9.03it/s] 191it [00:20, 9.17it/s] 192it [00:21, 9.28it/s] 193it [00:21, 8.86it/s] 194it [00:21, 8.88it/s] 195it [00:21, 8.31it/s] 196it [00:21, 8.68it/s] 196it [00:21, 9.08it/s] +2025-05-26 05:39:18,392 - INFO - Epoch: 15, Objective: tensor([12319.4551], device='cuda:0', grad_fn=), Loss: 0.13309964537620544, KL/n: 72.79181671142578 + 0it [00:00, ?it/s]2025-05-26 05:39:18,670 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 7340.2905 | mean log_px -0.0581 | KL -3566.00 + 1it [00:00, 4.73it/s] 2it [00:00, 6.63it/s] 3it [00:00, 7.70it/s] 4it [00:00, 8.32it/s] 5it [00:00, 8.73it/s] 6it [00:00, 8.94it/s] 7it [00:00, 9.16it/s] 8it [00:00, 9.27it/s] 9it [00:01, 9.37it/s] 10it [00:01, 9.33it/s] 11it [00:01, 9.30it/s] 12it [00:01, 9.29it/s] 13it [00:01, 9.35it/s] 14it [00:01, 9.40it/s] 15it [00:01, 9.47it/s] 16it [00:01, 9.41it/s] 17it [00:01, 9.47it/s] 18it [00:02, 9.43it/s] 19it [00:02, 9.46it/s] 20it [00:02, 9.44it/s] 21it [00:02, 9.44it/s] 22it [00:02, 9.41it/s] 23it [00:02, 9.45it/s] 24it [00:02, 6.18it/s] 25it [00:02, 6.89it/s] 26it [00:03, 7.52it/s] 27it [00:03, 8.01it/s] 28it [00:03, 8.39it/s] 29it [00:03, 8.70it/s] 30it [00:03, 8.94it/s] 31it [00:03, 9.11it/s] 32it [00:03, 9.20it/s] 33it [00:03, 9.29it/s] 34it [00:03, 9.37it/s] 35it [00:03, 9.37it/s] 36it [00:04, 9.43it/s] 37it [00:04, 9.42it/s] 38it [00:04, 9.45it/s] 39it [00:04, 9.51it/s] 40it [00:04, 9.45it/s] 41it [00:04, 9.44it/s] 42it [00:04, 9.46it/s] 43it [00:04, 9.47it/s] 44it [00:04, 9.43it/s] 45it [00:05, 9.43it/s] 46it [00:05, 9.45it/s] 47it [00:05, 9.41it/s] 48it [00:05, 9.45it/s] 49it [00:05, 9.45it/s] 50it [00:05, 9.48it/s]2025-05-26 05:39:24,169 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 9277.7939 | mean log_px -0.0837 | KL -3565.87 + 51it [00:05, 8.95it/s] 52it [00:05, 9.10it/s] 53it [00:05, 9.26it/s] 54it [00:06, 9.27it/s] 55it [00:06, 9.34it/s] 56it [00:06, 9.41it/s] 57it [00:06, 9.48it/s] 58it [00:06, 9.47it/s] 59it [00:06, 9.51it/s] 60it [00:06, 9.53it/s] 61it [00:06, 9.49it/s] 62it [00:06, 8.96it/s] 63it [00:06, 9.11it/s] 64it [00:07, 9.22it/s] 65it [00:07, 9.32it/s] 66it [00:07, 9.40it/s] 67it [00:07, 9.36it/s] 68it [00:07, 9.40it/s] 69it [00:07, 9.36it/s] 70it [00:07, 9.38it/s] 71it [00:07, 9.29it/s] 72it [00:07, 9.36it/s] 73it [00:08, 9.36it/s] 74it [00:08, 9.42it/s] 75it [00:08, 9.48it/s] 76it [00:08, 9.46it/s] 77it [00:08, 9.50it/s] 78it [00:08, 9.48it/s] 79it [00:08, 9.51it/s] 80it [00:08, 9.45it/s] 81it [00:08, 9.47it/s] 82it [00:08, 9.44it/s] 83it [00:09, 9.41it/s] 84it [00:09, 9.41it/s] 85it [00:09, 9.44it/s] 86it [00:09, 9.45it/s] 87it [00:09, 9.41it/s] 88it [00:09, 8.87it/s] 89it [00:09, 9.06it/s] 90it [00:09, 9.13it/s] 91it [00:09, 9.19it/s] 92it [00:10, 9.26it/s] 93it [00:10, 9.29it/s] 94it [00:10, 8.93it/s] 95it [00:10, 9.10it/s] 96it [00:10, 9.21it/s] 97it [00:10, 9.24it/s] 98it [00:10, 9.30it/s] 99it [00:10, 9.41it/s] 100it [00:10, 9.42it/s]2025-05-26 05:39:29,537 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 11751.0801 | mean log_px -0.1212 | KL -3566.18 + 101it [00:11, 9.45it/s] 102it [00:11, 9.48it/s] 103it [00:11, 9.42it/s] 104it [00:11, 9.42it/s] 105it [00:11, 9.46it/s] 106it [00:11, 9.41it/s] 107it [00:11, 9.47it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.41it/s] 110it [00:12, 9.37it/s] 111it [00:12, 9.43it/s] 112it [00:12, 9.42it/s] 113it [00:12, 9.45it/s] 114it [00:12, 9.43it/s] 115it [00:12, 9.41it/s] 116it [00:12, 9.37it/s] 117it [00:12, 9.37it/s] 118it [00:12, 9.38it/s] 119it [00:12, 9.41it/s] 120it [00:13, 9.42it/s] 121it [00:13, 9.49it/s] 122it [00:13, 9.48it/s] 123it [00:13, 9.50it/s] 124it [00:13, 9.49it/s] 125it [00:13, 9.45it/s] 126it [00:13, 9.44it/s] 127it [00:13, 9.42it/s] 128it [00:13, 9.44it/s] 129it [00:14, 9.41it/s] 130it [00:14, 9.40it/s] 131it [00:14, 9.49it/s] 132it [00:14, 9.49it/s] 133it [00:14, 9.52it/s] 134it [00:14, 9.49it/s] 135it [00:14, 9.46it/s] 136it [00:14, 9.42it/s] 137it [00:14, 9.46it/s] 138it [00:14, 9.48it/s] 139it [00:15, 9.48it/s] 140it [00:15, 9.45it/s] 141it [00:15, 9.45it/s] 142it [00:15, 9.44it/s] 143it [00:15, 9.42it/s] 144it [00:15, 9.42it/s] 145it [00:15, 9.42it/s] 146it [00:15, 9.46it/s] 147it [00:15, 9.50it/s] 148it [00:16, 9.46it/s] 149it [00:16, 9.46it/s] 150it [00:16, 9.47it/s]2025-05-26 05:39:34,831 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 10209.6055 | mean log_px -0.0996 | KL -3564.47 + 151it [00:16, 9.48it/s] 152it [00:16, 9.44it/s] 153it [00:16, 9.44it/s] 154it [00:16, 9.47it/s] 155it [00:16, 9.49it/s] 156it [00:16, 9.49it/s] 157it [00:16, 9.47it/s] 158it [00:17, 9.47it/s] 159it [00:17, 9.46it/s] 160it [00:17, 9.46it/s] 161it [00:17, 9.46it/s] 162it [00:17, 9.39it/s] 163it [00:17, 9.48it/s] 164it [00:17, 9.43it/s] 165it [00:17, 9.43it/s] 166it [00:17, 9.44it/s] 167it [00:18, 9.48it/s] 168it [00:18, 9.47it/s] 169it [00:18, 9.43it/s] 170it [00:18, 9.43it/s] 171it [00:18, 9.46it/s] 172it [00:18, 9.45it/s] 173it [00:18, 9.49it/s] 174it [00:18, 9.47it/s] 175it [00:18, 9.48it/s] 176it [00:18, 9.45it/s] 177it [00:19, 9.49it/s] 178it [00:19, 9.45it/s] 179it [00:19, 9.33it/s] 180it [00:19, 9.37it/s] 181it [00:19, 8.89it/s] 182it [00:19, 9.08it/s] 183it [00:19, 9.20it/s] 184it [00:19, 9.26it/s] 185it [00:19, 9.34it/s] 186it [00:20, 9.39it/s] 187it [00:20, 9.41it/s] 188it [00:20, 9.39it/s] 189it [00:20, 9.42it/s] 190it [00:20, 9.45it/s] 191it [00:20, 9.46it/s] 192it [00:20, 9.45it/s] 193it [00:20, 9.46it/s] 194it [00:20, 9.48it/s] 195it [00:21, 8.89it/s] 196it [00:21, 9.11it/s] 196it [00:21, 9.24it/s] +2025-05-26 05:39:39,740 - INFO - Epoch: 16, Objective: tensor([10027.8145], device='cuda:0', grad_fn=), Loss: 0.09540171176195145, KL/n: 72.8223648071289 + 0it [00:00, ?it/s]2025-05-26 05:39:39,996 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 10231.7510 | mean log_px -0.0985 | KL -3565.85 + 1it [00:00, 6.04it/s] 2it [00:00, 7.61it/s] 3it [00:00, 8.41it/s] 4it [00:00, 8.84it/s] 5it [00:00, 9.08it/s] 6it [00:00, 9.23it/s] 7it [00:00, 9.33it/s] 8it [00:00, 9.34it/s] 9it [00:01, 9.43it/s] 10it [00:01, 9.47it/s] 11it [00:01, 9.46it/s] 12it [00:01, 9.49it/s] 13it [00:01, 9.54it/s] 14it [00:01, 9.50it/s] 15it [00:01, 9.52it/s] 16it [00:01, 9.51it/s] 17it [00:01, 9.49it/s] 18it [00:01, 9.46it/s] 19it [00:02, 9.47it/s] 20it [00:02, 9.50it/s] 21it [00:02, 9.55it/s] 22it [00:02, 9.53it/s] 23it [00:02, 9.56it/s] 24it [00:02, 9.53it/s] 25it [00:02, 9.55it/s] 26it [00:02, 9.52it/s] 27it [00:02, 9.54it/s] 28it [00:03, 9.50it/s] 29it [00:03, 9.46it/s] 30it [00:03, 9.45it/s] 31it [00:03, 9.41it/s] 32it [00:03, 9.46it/s] 33it [00:03, 9.51it/s] 34it [00:03, 9.54it/s] 35it [00:03, 9.56it/s] 36it [00:03, 9.52it/s] 37it [00:03, 9.54it/s] 38it [00:04, 9.50it/s] 39it [00:04, 9.54it/s] 40it [00:04, 9.50it/s] 41it [00:04, 9.50it/s] 42it [00:04, 9.48it/s] 43it [00:04, 9.50it/s] 44it [00:04, 9.53it/s] 45it [00:04, 9.01it/s] 46it [00:04, 9.17it/s] 47it [00:05, 9.16it/s] 48it [00:05, 9.11it/s] 49it [00:05, 9.02it/s] 50it [00:05, 9.16it/s]2025-05-26 05:39:45,293 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 8144.4380 | mean log_px -0.0670 | KL -3562.43 + 51it [00:05, 9.28it/s] 52it [00:05, 9.38it/s] 53it [00:05, 9.38it/s] 54it [00:05, 9.43it/s] 55it [00:05, 9.49it/s] 56it [00:05, 9.49it/s] 57it [00:06, 9.50it/s] 58it [00:06, 9.42it/s] 59it [00:06, 9.19it/s] 60it [00:06, 9.06it/s] 61it [00:06, 9.23it/s] 62it [00:06, 9.32it/s] 63it [00:06, 9.42it/s] 64it [00:06, 9.42it/s] 65it [00:06, 9.47it/s] 66it [00:07, 9.44it/s] 67it [00:07, 9.43it/s] 68it [00:07, 9.47it/s] 69it [00:07, 9.48it/s] 70it [00:07, 9.50it/s] 71it [00:07, 9.49it/s] 72it [00:07, 9.49it/s] 73it [00:07, 9.52it/s] 74it [00:07, 9.48it/s] 75it [00:08, 9.48it/s] 76it [00:08, 9.52it/s] 77it [00:08, 9.55it/s] 78it [00:08, 9.53it/s] 79it [00:08, 9.54it/s] 80it [00:08, 9.54it/s] 81it [00:08, 9.58it/s] 82it [00:08, 9.58it/s] 83it [00:08, 9.57it/s] 84it [00:08, 9.52it/s] 85it [00:09, 9.51it/s] 86it [00:09, 9.53it/s] 87it [00:09, 8.86it/s] 88it [00:09, 8.85it/s] 89it [00:09, 8.89it/s] 90it [00:09, 9.08it/s] 91it [00:09, 9.26it/s] 92it [00:09, 9.31it/s] 93it [00:09, 9.40it/s] 94it [00:10, 9.45it/s] 95it [00:10, 9.48it/s] 96it [00:10, 9.54it/s] 97it [00:10, 9.55it/s] 98it [00:10, 9.54it/s] 99it [00:10, 9.25it/s] 100it [00:10, 9.31it/s]2025-05-26 05:39:50,610 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 8396.8623 | mean log_px -0.0690 | KL -3563.99 + 101it [00:10, 8.85it/s] 102it [00:10, 9.03it/s] 103it [00:11, 9.20it/s] 104it [00:11, 9.32it/s] 105it [00:11, 9.38it/s] 106it [00:11, 8.97it/s] 107it [00:11, 9.15it/s] 108it [00:11, 9.23it/s] 109it [00:11, 9.32it/s] 110it [00:11, 9.40it/s] 111it [00:11, 9.47it/s] 112it [00:11, 9.45it/s] 113it [00:12, 9.44it/s] 114it [00:12, 9.35it/s] 115it [00:12, 9.42it/s] 116it [00:12, 9.47it/s] 117it [00:12, 9.53it/s] 118it [00:12, 9.50it/s] 119it [00:12, 9.41it/s] 120it [00:12, 9.31it/s] 121it [00:12, 9.38it/s] 122it [00:13, 9.45it/s] 123it [00:13, 9.49it/s] 124it [00:13, 9.54it/s] 125it [00:13, 9.01it/s] 126it [00:13, 9.17it/s] 127it [00:13, 9.24it/s] 128it [00:13, 9.22it/s] 129it [00:13, 9.27it/s] 130it [00:13, 9.31it/s] 131it [00:14, 9.32it/s] 132it [00:14, 9.38it/s] 133it [00:14, 9.46it/s] 134it [00:14, 9.49it/s] 135it [00:14, 9.50it/s] 136it [00:14, 9.54it/s] 137it [00:14, 9.52it/s] 138it [00:14, 9.54it/s] 139it [00:14, 9.56it/s] 140it [00:14, 9.56it/s] 141it [00:15, 9.59it/s] 142it [00:15, 9.50it/s] 143it [00:15, 9.48it/s] 144it [00:15, 9.47it/s] 145it [00:15, 9.43it/s] 146it [00:15, 9.47it/s] 147it [00:15, 9.51it/s] 148it [00:15, 9.52it/s] 149it [00:15, 9.53it/s] 150it [00:15, 9.46it/s]2025-05-26 05:39:55,938 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 9258.7881 | mean log_px -0.0835 | KL -3569.38 + 151it [00:16, 8.90it/s] 152it [00:16, 9.08it/s] 153it [00:16, 9.21it/s] 154it [00:16, 9.29it/s] 155it [00:16, 9.32it/s] 156it [00:16, 9.32it/s] 157it [00:16, 9.38it/s] 158it [00:16, 9.44it/s] 159it [00:16, 9.41it/s] 160it [00:17, 9.48it/s] 161it [00:17, 9.56it/s] 162it [00:17, 9.55it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.51it/s] 165it [00:17, 9.50it/s] 166it [00:17, 9.48it/s] 167it [00:17, 9.54it/s] 168it [00:17, 9.37it/s] 169it [00:18, 9.39it/s] 170it [00:18, 9.47it/s] 171it [00:18, 9.47it/s] 172it [00:18, 9.44it/s] 173it [00:18, 8.90it/s] 174it [00:18, 8.96it/s] 175it [00:18, 9.07it/s] 176it [00:18, 9.13it/s] 177it [00:18, 9.22it/s] 178it [00:19, 9.30it/s] 179it [00:19, 9.38it/s] 180it [00:19, 8.96it/s] 181it [00:19, 9.13it/s] 182it [00:19, 9.23it/s] 183it [00:19, 9.32it/s] 184it [00:19, 9.41it/s] 185it [00:19, 9.44it/s] 186it [00:19, 9.47it/s] 187it [00:19, 9.53it/s] 188it [00:20, 9.08it/s] 189it [00:20, 9.25it/s] 190it [00:20, 9.32it/s] 191it [00:20, 9.39it/s] 192it [00:20, 9.42it/s] 193it [00:20, 9.50it/s] 194it [00:20, 9.51it/s] 195it [00:20, 8.27it/s] 196it [00:20, 8.63it/s] 196it [00:21, 9.32it/s] +2025-05-26 05:40:00,912 - INFO - Epoch: 17, Objective: tensor([9598.7822], device='cuda:0', grad_fn=), Loss: 0.08933060616254807, KL/n: 72.83203125 + 0it [00:00, ?it/s]2025-05-26 05:40:01,192 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 12348.8164 | mean log_px -0.1254 | KL -3569.31 + 1it [00:00, 5.13it/s] 2it [00:00, 7.00it/s] 3it [00:00, 7.96it/s] 4it [00:00, 8.47it/s] 5it [00:00, 8.72it/s] 6it [00:00, 8.90it/s] 7it [00:00, 8.93it/s] 8it [00:00, 8.97it/s] 9it [00:01, 9.15it/s] 10it [00:01, 9.23it/s] 11it [00:01, 9.31it/s] 12it [00:01, 9.39it/s] 13it [00:01, 9.30it/s] 14it [00:01, 9.19it/s] 15it [00:01, 9.13it/s] 16it [00:01, 9.21it/s] 17it [00:01, 8.77it/s] 18it [00:02, 8.98it/s] 19it [00:02, 9.14it/s] 20it [00:02, 9.27it/s] 21it [00:02, 9.28it/s] 22it [00:02, 9.31it/s] 23it [00:02, 9.35it/s] 24it [00:02, 9.37it/s] 25it [00:02, 9.42it/s] 26it [00:02, 9.44it/s] 27it [00:02, 9.48it/s] 28it [00:03, 6.23it/s] 29it [00:03, 6.95it/s] 30it [00:03, 7.56it/s] 31it [00:03, 8.04it/s] 32it [00:03, 8.44it/s] 33it [00:03, 8.74it/s] 34it [00:03, 8.91it/s] 35it [00:04, 9.11it/s] 36it [00:04, 9.17it/s] 37it [00:04, 9.29it/s] 38it [00:04, 9.39it/s] 39it [00:04, 9.40it/s] 40it [00:04, 9.41it/s] 41it [00:04, 9.40it/s] 42it [00:04, 9.43it/s] 43it [00:04, 9.47it/s] 44it [00:04, 9.47it/s] 45it [00:05, 9.44it/s] 46it [00:05, 8.94it/s] 47it [00:05, 9.09it/s] 48it [00:05, 9.21it/s] 49it [00:05, 9.27it/s] 50it [00:05, 8.79it/s]2025-05-26 05:40:06,750 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 8044.7241 | mean log_px -0.0678 | KL -3567.06 + 51it [00:05, 8.98it/s] 52it [00:05, 9.10it/s] 53it [00:05, 9.28it/s] 54it [00:06, 9.36it/s] 55it [00:06, 9.41it/s] 56it [00:06, 9.06it/s] 57it [00:06, 9.20it/s] 58it [00:06, 9.29it/s] 59it [00:06, 9.32it/s] 60it [00:06, 9.39it/s] 61it [00:06, 9.43it/s] 62it [00:06, 9.44it/s] 63it [00:07, 9.44it/s] 64it [00:07, 9.45it/s] 65it [00:07, 9.51it/s] 66it [00:07, 9.55it/s] 67it [00:07, 9.57it/s] 68it [00:07, 9.00it/s] 69it [00:07, 9.15it/s] 70it [00:07, 9.27it/s] 71it [00:07, 9.36it/s] 72it [00:07, 9.35it/s] 73it [00:08, 9.40it/s] 74it [00:08, 9.39it/s] 75it [00:08, 9.45it/s] 76it [00:08, 9.47it/s] 77it [00:08, 8.98it/s] 78it [00:08, 9.11it/s] 79it [00:08, 9.25it/s] 80it [00:08, 9.33it/s] 81it [00:08, 9.34it/s] 82it [00:09, 9.39it/s] 83it [00:09, 9.36it/s] 84it [00:09, 8.95it/s] 85it [00:09, 9.12it/s] 86it [00:09, 9.22it/s] 87it [00:09, 8.87it/s] 88it [00:09, 9.09it/s] 89it [00:09, 9.20it/s] 90it [00:09, 9.23it/s] 91it [00:10, 9.30it/s] 92it [00:10, 8.90it/s] 93it [00:10, 9.08it/s] 94it [00:10, 9.14it/s] 95it [00:10, 9.29it/s] 96it [00:10, 9.30it/s] 97it [00:10, 9.39it/s] 98it [00:10, 9.40it/s] 99it [00:10, 9.38it/s] 100it [00:11, 9.22it/s]2025-05-26 05:40:12,132 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 8123.0947 | mean log_px -0.0684 | KL -3570.99 + 101it [00:11, 8.76it/s] 102it [00:11, 8.95it/s] 103it [00:11, 9.11it/s] 104it [00:11, 9.20it/s] 105it [00:11, 9.32it/s] 106it [00:11, 9.35it/s] 107it [00:11, 9.40it/s] 108it [00:11, 9.41it/s] 109it [00:12, 9.43it/s] 110it [00:12, 9.41it/s] 111it [00:12, 9.42it/s] 112it [00:12, 9.43it/s] 113it [00:12, 9.41it/s] 114it [00:12, 9.44it/s] 115it [00:12, 9.44it/s] 116it [00:12, 9.46it/s] 117it [00:12, 9.47it/s] 118it [00:12, 9.47it/s] 119it [00:13, 9.46it/s] 120it [00:13, 9.42it/s] 121it [00:13, 9.40it/s] 122it [00:13, 9.39it/s] 123it [00:13, 9.39it/s] 124it [00:13, 9.47it/s] 125it [00:13, 9.51it/s] 126it [00:13, 9.52it/s] 127it [00:13, 9.54it/s] 128it [00:14, 9.47it/s] 129it [00:14, 9.49it/s] 130it [00:14, 9.44it/s] 131it [00:14, 9.41it/s] 132it [00:14, 8.89it/s] 133it [00:14, 9.10it/s] 134it [00:14, 9.21it/s] 135it [00:14, 9.28it/s] 136it [00:14, 9.28it/s] 137it [00:14, 9.34it/s] 138it [00:15, 9.36it/s] 139it [00:15, 9.33it/s] 140it [00:15, 8.95it/s] 141it [00:15, 8.49it/s] 142it [00:15, 8.76it/s] 143it [00:15, 8.94it/s] 144it [00:15, 9.05it/s] 145it [00:15, 9.20it/s] 146it [00:15, 9.28it/s] 147it [00:16, 9.30it/s] 148it [00:16, 9.33it/s] 149it [00:16, 9.39it/s] 150it [00:16, 8.79it/s]2025-05-26 05:40:17,536 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 6793.8252 | mean log_px -0.0610 | KL -3563.42 + 151it [00:16, 8.88it/s] 152it [00:16, 9.06it/s] 153it [00:16, 9.14it/s] 154it [00:16, 9.25it/s] 155it [00:16, 9.27it/s] 156it [00:17, 9.34it/s] 157it [00:17, 9.37it/s] 158it [00:17, 9.43it/s] 159it [00:17, 9.45it/s] 160it [00:17, 9.44it/s] 161it [00:17, 9.42it/s] 162it [00:17, 9.42it/s] 163it [00:17, 8.86it/s] 164it [00:17, 9.03it/s] 165it [00:18, 9.19it/s] 166it [00:18, 9.25it/s] 167it [00:18, 9.33it/s] 168it [00:18, 8.83it/s] 169it [00:18, 9.00it/s] 170it [00:18, 9.12it/s] 171it [00:18, 9.23it/s] 172it [00:18, 9.16it/s] 173it [00:18, 8.70it/s] 174it [00:19, 8.95it/s] 175it [00:19, 9.09it/s] 176it [00:19, 9.21it/s] 177it [00:19, 9.27it/s] 178it [00:19, 9.33it/s] 179it [00:19, 9.37it/s] 180it [00:19, 9.46it/s] 181it [00:19, 9.44it/s] 182it [00:19, 9.50it/s] 183it [00:19, 9.53it/s] 184it [00:20, 8.92it/s] 185it [00:20, 9.10it/s] 186it [00:20, 9.19it/s] 187it [00:20, 9.27it/s] 188it [00:20, 8.92it/s] 189it [00:20, 9.10it/s] 190it [00:20, 9.19it/s] 191it [00:20, 9.29it/s] 192it [00:20, 9.32it/s] 193it [00:21, 9.34it/s] 194it [00:21, 9.38it/s] 195it [00:21, 8.87it/s] 196it [00:21, 9.11it/s] 196it [00:21, 9.12it/s] +2025-05-26 05:40:22,530 - INFO - Epoch: 18, Objective: tensor([8188.5557], device='cuda:0', grad_fn=), Loss: 0.07669003307819366, KL/n: 72.82756805419922 + 0it [00:00, ?it/s]2025-05-26 05:40:22,806 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 6962.9434 | mean log_px -0.0530 | KL -3566.80 + 1it [00:00, 4.78it/s] 2it [00:00, 6.67it/s] 3it [00:00, 7.73it/s] 4it [00:00, 8.32it/s] 5it [00:00, 8.72it/s] 6it [00:00, 8.87it/s] 7it [00:00, 9.08it/s] 8it [00:00, 9.20it/s] 9it [00:01, 9.30it/s] 10it [00:01, 9.32it/s] 11it [00:01, 9.31it/s] 12it [00:01, 9.30it/s] 13it [00:01, 9.35it/s] 14it [00:01, 9.35it/s] 15it [00:01, 9.41it/s] 16it [00:01, 9.34it/s] 17it [00:01, 9.40it/s] 18it [00:02, 9.40it/s] 19it [00:02, 9.45it/s] 20it [00:02, 9.39it/s] 21it [00:02, 9.37it/s] 22it [00:02, 9.36it/s] 23it [00:02, 9.44it/s] 24it [00:02, 9.46it/s] 25it [00:02, 9.46it/s] 26it [00:02, 8.91it/s] 27it [00:02, 9.04it/s] 28it [00:03, 9.14it/s] 29it [00:03, 9.24it/s] 30it [00:03, 9.33it/s] 31it [00:03, 9.39it/s] 32it [00:03, 9.42it/s] 33it [00:03, 9.04it/s] 34it [00:03, 9.16it/s] 35it [00:03, 9.25it/s] 36it [00:03, 9.32it/s] 37it [00:04, 9.34it/s] 38it [00:04, 9.35it/s] 39it [00:04, 9.42it/s] 40it [00:04, 9.36it/s] 41it [00:04, 9.34it/s] 42it [00:04, 9.36it/s] 43it [00:04, 9.43it/s] 44it [00:04, 9.41it/s] 45it [00:04, 9.45it/s] 46it [00:05, 9.45it/s] 47it [00:05, 9.46it/s] 48it [00:05, 9.47it/s] 49it [00:05, 9.45it/s] 50it [00:05, 9.47it/s]2025-05-26 05:40:28,171 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 11381.5762 | mean log_px -0.1166 | KL -3569.48 + 51it [00:05, 9.46it/s] 52it [00:05, 9.49it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.49it/s] 55it [00:05, 9.04it/s] 56it [00:06, 9.16it/s] 57it [00:06, 9.28it/s] 58it [00:06, 9.34it/s] 59it [00:06, 9.40it/s] 60it [00:06, 9.34it/s] 61it [00:06, 9.40it/s] 62it [00:06, 9.42it/s] 63it [00:06, 9.45it/s] 64it [00:06, 9.38it/s] 65it [00:07, 9.42it/s] 66it [00:07, 9.39it/s] 67it [00:07, 9.38it/s] 68it [00:07, 9.37it/s] 69it [00:07, 9.35it/s] 70it [00:07, 9.41it/s] 71it [00:07, 9.44it/s] 72it [00:07, 9.48it/s] 73it [00:07, 9.46it/s] 74it [00:07, 9.46it/s] 75it [00:08, 9.45it/s] 76it [00:08, 9.44it/s] 77it [00:08, 9.43it/s] 78it [00:08, 9.41it/s] 79it [00:08, 9.45it/s] 80it [00:08, 9.44it/s] 81it [00:08, 9.43it/s] 82it [00:08, 9.46it/s] 83it [00:08, 9.46it/s] 84it [00:09, 9.48it/s] 85it [00:09, 9.45it/s] 86it [00:09, 9.45it/s] 87it [00:09, 9.46it/s] 88it [00:09, 8.89it/s] 89it [00:09, 9.07it/s] 90it [00:09, 9.20it/s] 91it [00:09, 9.31it/s] 92it [00:09, 9.34it/s] 93it [00:10, 9.41it/s] 94it [00:10, 9.41it/s] 95it [00:10, 8.90it/s] 96it [00:10, 9.00it/s] 97it [00:10, 9.16it/s] 98it [00:10, 9.20it/s] 99it [00:10, 9.33it/s] 100it [00:10, 9.37it/s]2025-05-26 05:40:33,520 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 8565.3213 | mean log_px -0.0776 | KL -3569.59 + 101it [00:10, 9.39it/s] 102it [00:11, 9.38it/s] 103it [00:11, 9.43it/s] 104it [00:11, 9.48it/s] 105it [00:11, 9.44it/s] 106it [00:11, 9.42it/s] 107it [00:11, 9.45it/s] 108it [00:11, 9.46it/s] 109it [00:11, 9.46it/s] 110it [00:11, 9.43it/s] 111it [00:11, 9.35it/s] 112it [00:12, 9.36it/s] 113it [00:12, 9.24it/s] 114it [00:12, 9.31it/s] 115it [00:12, 9.36it/s] 116it [00:12, 9.39it/s] 117it [00:12, 9.45it/s] 118it [00:12, 9.17it/s] 119it [00:12, 9.28it/s] 120it [00:12, 9.34it/s] 121it [00:13, 9.38it/s] 122it [00:13, 9.42it/s] 123it [00:13, 9.44it/s] 124it [00:13, 9.43it/s] 125it [00:13, 9.46it/s] 126it [00:13, 9.48it/s] 127it [00:13, 8.98it/s] 128it [00:13, 8.86it/s] 129it [00:13, 9.06it/s] 130it [00:14, 9.16it/s] 131it [00:14, 8.82it/s] 132it [00:14, 9.04it/s] 133it [00:14, 9.21it/s] 134it [00:14, 9.34it/s] 135it [00:14, 9.41it/s] 136it [00:14, 9.45it/s] 137it [00:14, 9.51it/s] 138it [00:14, 9.53it/s] 139it [00:14, 9.58it/s] 140it [00:15, 9.60it/s] 141it [00:15, 9.62it/s] 142it [00:15, 9.63it/s] 143it [00:15, 9.66it/s] 144it [00:15, 9.65it/s] 145it [00:15, 9.66it/s] 146it [00:15, 9.64it/s] 147it [00:15, 9.66it/s] 148it [00:15, 9.66it/s] 149it [00:15, 9.66it/s] 150it [00:16, 9.64it/s]2025-05-26 05:40:38,833 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 7441.7295 | mean log_px -0.0628 | KL -3567.16 + 151it [00:16, 9.59it/s] 152it [00:16, 9.62it/s] 153it [00:16, 9.64it/s] 154it [00:16, 9.64it/s] 155it [00:16, 9.59it/s] 156it [00:16, 9.59it/s] 157it [00:16, 9.62it/s] 158it [00:16, 9.64it/s] 159it [00:17, 9.65it/s] 160it [00:17, 9.66it/s] 161it [00:17, 9.65it/s] 162it [00:17, 9.66it/s] 163it [00:17, 9.61it/s] 164it [00:17, 9.62it/s] 165it [00:17, 9.64it/s] 166it [00:17, 9.64it/s] 167it [00:17, 9.62it/s] 168it [00:17, 9.58it/s] 169it [00:18, 9.61it/s] 170it [00:18, 9.60it/s] 171it [00:18, 9.58it/s] 172it [00:18, 9.59it/s] 173it [00:18, 9.60it/s] 174it [00:18, 9.62it/s] 175it [00:18, 9.65it/s] 176it [00:18, 9.57it/s] 177it [00:18, 9.55it/s] 178it [00:19, 9.56it/s] 179it [00:19, 9.58it/s] 180it [00:19, 9.60it/s] 181it [00:19, 9.63it/s] 182it [00:19, 9.61it/s] 183it [00:19, 9.63it/s] 184it [00:19, 9.62it/s] 185it [00:19, 9.61it/s] 186it [00:19, 9.61it/s] 187it [00:19, 9.63it/s] 188it [00:20, 9.60it/s] 189it [00:20, 9.62it/s] 190it [00:20, 9.62it/s] 191it [00:20, 9.54it/s] 192it [00:20, 9.55it/s] 193it [00:20, 9.53it/s] 194it [00:20, 9.58it/s] 195it [00:20, 9.08it/s] 196it [00:20, 9.35it/s] +2025-05-26 05:40:43,633 - INFO - Epoch: 19, Objective: tensor([7893.3765], device='cuda:0', grad_fn=), Loss: 0.061493679881095886, KL/n: 72.83820343017578 + 0it [00:00, ?it/s]2025-05-26 05:40:43,921 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 6628.0117 | mean log_px -0.0495 | KL -3568.11 + 1it [00:00, 5.23it/s] 2it [00:00, 7.15it/s] 3it [00:00, 8.20it/s] 4it [00:00, 8.78it/s] 5it [00:00, 9.13it/s] 6it [00:00, 9.32it/s] 7it [00:00, 9.49it/s] 8it [00:00, 9.57it/s] 9it [00:01, 9.65it/s] 10it [00:01, 9.66it/s] 11it [00:01, 9.72it/s] 12it [00:01, 9.73it/s] 13it [00:01, 9.77it/s] 14it [00:01, 9.76it/s] 15it [00:01, 9.78it/s] 16it [00:01, 9.74it/s] 17it [00:01, 9.75it/s] 18it [00:01, 9.75it/s] 19it [00:02, 9.76it/s] 20it [00:02, 9.72it/s] 21it [00:02, 9.73it/s] 22it [00:02, 9.72it/s] 23it [00:02, 9.73it/s] 24it [00:02, 9.54it/s] 25it [00:02, 9.59it/s] 26it [00:02, 9.65it/s] 27it [00:02, 9.70it/s] 28it [00:02, 9.72it/s] 29it [00:03, 9.72it/s] 30it [00:03, 9.71it/s] 31it [00:03, 9.20it/s] 32it [00:03, 9.36it/s] 33it [00:03, 9.48it/s] 34it [00:03, 9.56it/s] 35it [00:03, 9.64it/s] 36it [00:03, 9.51it/s] 37it [00:03, 9.36it/s] 38it [00:04, 9.25it/s] 39it [00:04, 9.42it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.61it/s] 42it [00:04, 9.67it/s] 43it [00:04, 6.37it/s] 44it [00:04, 7.11it/s] 45it [00:04, 7.76it/s] 46it [00:05, 8.23it/s] 47it [00:05, 8.61it/s] 48it [00:05, 8.93it/s] 49it [00:05, 9.18it/s] 50it [00:05, 8.80it/s]2025-05-26 05:40:49,295 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 7019.3750 | mean log_px -0.0534 | KL -3567.79 + 51it [00:05, 9.04it/s] 52it [00:05, 9.23it/s] 53it [00:05, 9.39it/s] 54it [00:05, 9.49it/s] 55it [00:05, 9.61it/s] 56it [00:06, 9.67it/s] 57it [00:06, 9.73it/s] 58it [00:06, 9.74it/s] 59it [00:06, 9.78it/s] 60it [00:06, 9.79it/s] 61it [00:06, 9.81it/s] 62it [00:06, 9.81it/s] 63it [00:06, 9.80it/s] 64it [00:06, 9.79it/s] 65it [00:06, 9.81it/s] 66it [00:07, 9.81it/s] 67it [00:07, 9.79it/s] 68it [00:07, 9.80it/s] 69it [00:07, 9.80it/s] 70it [00:07, 9.32it/s] 71it [00:07, 9.46it/s] 72it [00:07, 9.55it/s] 73it [00:07, 9.63it/s] 74it [00:07, 9.68it/s] 75it [00:08, 9.72it/s] 76it [00:08, 9.74it/s] 77it [00:08, 9.76it/s] 78it [00:08, 9.77it/s] 79it [00:08, 9.78it/s] 80it [00:08, 9.78it/s] 81it [00:08, 9.80it/s] 82it [00:08, 9.81it/s] 83it [00:08, 9.83it/s] 84it [00:08, 9.82it/s] 85it [00:09, 9.80it/s] 86it [00:09, 9.79it/s] 87it [00:09, 9.81it/s] 88it [00:09, 9.80it/s] 89it [00:09, 9.80it/s] 90it [00:09, 9.80it/s] 91it [00:09, 9.20it/s] 92it [00:09, 9.37it/s] 93it [00:09, 9.50it/s] 94it [00:09, 9.58it/s] 95it [00:10, 9.66it/s] 96it [00:10, 9.72it/s] 97it [00:10, 9.73it/s] 98it [00:10, 9.75it/s] 99it [00:10, 9.26it/s] 100it [00:10, 9.39it/s]2025-05-26 05:40:54,455 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 9756.4814 | mean log_px -0.0918 | KL -3565.89 + 101it [00:10, 9.45it/s] 102it [00:10, 9.54it/s] 103it [00:10, 9.15it/s] 104it [00:11, 9.32it/s] 105it [00:11, 9.45it/s] 106it [00:11, 9.53it/s] 107it [00:11, 9.61it/s] 108it [00:11, 9.65it/s] 109it [00:11, 9.68it/s] 110it [00:11, 9.14it/s] 111it [00:11, 9.32it/s] 112it [00:11, 9.46it/s] 113it [00:11, 9.58it/s] 114it [00:12, 9.66it/s] 115it [00:12, 9.68it/s] 116it [00:12, 9.63it/s] 117it [00:12, 9.27it/s] 118it [00:12, 9.42it/s] 119it [00:12, 9.51it/s] 120it [00:12, 9.59it/s] 121it [00:12, 9.67it/s] 122it [00:12, 9.70it/s] 123it [00:13, 9.73it/s] 124it [00:13, 9.72it/s] 125it [00:13, 9.71it/s] 126it [00:13, 9.72it/s] 127it [00:13, 9.15it/s] 128it [00:13, 9.34it/s] 129it [00:13, 9.33it/s] 130it [00:13, 9.27it/s] 131it [00:13, 9.19it/s] 132it [00:14, 9.10it/s] 133it [00:14, 9.21it/s] 134it [00:14, 9.32it/s] 135it [00:14, 9.40it/s] 136it [00:14, 8.85it/s] 137it [00:14, 9.05it/s] 138it [00:14, 9.16it/s] 139it [00:14, 9.29it/s] 140it [00:14, 9.37it/s] 141it [00:14, 8.85it/s] 142it [00:15, 9.04it/s] 143it [00:15, 9.14it/s] 144it [00:15, 9.28it/s] 145it [00:15, 9.42it/s] 146it [00:15, 9.52it/s] 147it [00:15, 9.23it/s] 148it [00:15, 9.32it/s] 149it [00:15, 9.37it/s] 150it [00:15, 9.49it/s]2025-05-26 05:40:59,780 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 6741.2627 | mean log_px -0.0465 | KL -3565.47 + 151it [00:16, 9.56it/s] 152it [00:16, 9.61it/s] 153it [00:16, 9.66it/s] 154it [00:16, 9.68it/s] 155it [00:16, 9.70it/s] 156it [00:16, 9.72it/s] 157it [00:16, 9.73it/s] 158it [00:16, 9.73it/s] 159it [00:16, 9.69it/s] 160it [00:16, 9.72it/s] 161it [00:17, 9.71it/s] 162it [00:17, 9.73it/s] 163it [00:17, 9.76it/s] 164it [00:17, 9.73it/s] 165it [00:17, 9.76it/s] 166it [00:17, 9.72it/s] 167it [00:17, 9.73it/s] 168it [00:17, 9.73it/s] 169it [00:17, 9.76it/s] 170it [00:17, 9.76it/s] 171it [00:18, 9.77it/s] 172it [00:18, 9.73it/s] 173it [00:18, 9.73it/s] 174it [00:18, 9.75it/s] 175it [00:18, 9.75it/s] 176it [00:18, 9.14it/s] 177it [00:18, 9.33it/s] 178it [00:18, 9.46it/s] 179it [00:18, 9.57it/s] 180it [00:19, 9.64it/s] 181it [00:19, 9.71it/s] 182it [00:19, 9.75it/s] 183it [00:19, 9.76it/s] 184it [00:19, 9.13it/s] 185it [00:19, 9.34it/s] 186it [00:19, 9.46it/s] 187it [00:19, 9.56it/s] 188it [00:19, 9.62it/s] 189it [00:19, 9.67it/s] 190it [00:20, 9.68it/s] 191it [00:20, 9.69it/s] 192it [00:20, 9.71it/s] 193it [00:20, 9.35it/s] 194it [00:20, 9.48it/s] 195it [00:20, 9.17it/s] 196it [00:20, 9.43it/s] +2025-05-26 05:41:04,566 - INFO - Epoch: 20, Objective: tensor([5954.1396], device='cuda:0', grad_fn=), Loss: 0.034850478172302246, KL/n: 72.82156372070312 + 0it [00:00, ?it/s]2025-05-26 05:41:04,837 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 7638.6367 | mean log_px -0.0598 | KL -3567.85 + 1it [00:00, 4.98it/s] 2it [00:00, 6.92it/s] 3it [00:00, 7.97it/s] 4it [00:00, 8.61it/s] 5it [00:00, 9.03it/s] 6it [00:00, 8.66it/s] 7it [00:00, 9.00it/s] 8it [00:00, 9.24it/s] 9it [00:01, 9.40it/s] 10it [00:01, 8.90it/s] 11it [00:01, 9.17it/s] 12it [00:01, 9.35it/s] 13it [00:01, 9.50it/s] 14it [00:01, 9.57it/s] 15it [00:01, 9.63it/s] 16it [00:01, 9.67it/s] 17it [00:01, 9.72it/s] 18it [00:01, 9.73it/s] 19it [00:02, 9.76it/s] 20it [00:02, 9.76it/s] 21it [00:02, 9.78it/s] 22it [00:02, 9.78it/s] 23it [00:02, 9.79it/s] 24it [00:02, 9.79it/s] 25it [00:02, 9.79it/s] 26it [00:02, 9.29it/s] 27it [00:02, 9.45it/s] 28it [00:03, 9.53it/s] 29it [00:03, 9.63it/s] 30it [00:03, 9.61it/s] 31it [00:03, 9.67it/s] 32it [00:03, 9.70it/s] 33it [00:03, 9.75it/s] 34it [00:03, 9.75it/s] 35it [00:03, 9.77it/s] 36it [00:03, 9.30it/s] 37it [00:03, 9.45it/s] 38it [00:04, 9.54it/s] 39it [00:04, 9.13it/s] 40it [00:04, 9.29it/s] 41it [00:04, 9.44it/s] 42it [00:04, 8.95it/s] 43it [00:04, 9.19it/s] 44it [00:04, 9.36it/s] 45it [00:04, 9.48it/s] 46it [00:04, 9.54it/s] 47it [00:05, 9.61it/s] 48it [00:05, 9.66it/s] 49it [00:05, 9.73it/s] 50it [00:05, 9.10it/s]2025-05-26 05:41:10,118 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 12824.7617 | mean log_px -0.1392 | KL -3568.71 + 51it [00:05, 9.26it/s] 52it [00:05, 9.36it/s] 53it [00:05, 9.30it/s] 54it [00:05, 9.40it/s] 55it [00:05, 9.51it/s] 56it [00:05, 9.56it/s] 57it [00:06, 9.61it/s] 58it [00:06, 9.66it/s] 59it [00:06, 9.22it/s] 60it [00:06, 9.38it/s] 61it [00:06, 9.50it/s] 62it [00:06, 9.59it/s] 63it [00:06, 9.66it/s] 64it [00:06, 9.08it/s] 65it [00:06, 9.28it/s] 66it [00:07, 9.41it/s] 67it [00:07, 9.53it/s] 68it [00:07, 9.60it/s] 69it [00:07, 9.63it/s] 70it [00:07, 9.66it/s] 71it [00:07, 9.70it/s] 72it [00:07, 9.72it/s] 73it [00:07, 9.74it/s] 74it [00:07, 9.77it/s] 75it [00:07, 9.77it/s] 76it [00:08, 9.77it/s] 77it [00:08, 9.77it/s] 78it [00:08, 9.78it/s] 79it [00:08, 9.78it/s] 80it [00:08, 9.29it/s] 81it [00:08, 9.42it/s] 82it [00:08, 9.52it/s] 83it [00:08, 9.02it/s] 84it [00:08, 9.25it/s] 85it [00:09, 9.39it/s] 86it [00:09, 9.50it/s] 87it [00:09, 9.60it/s] 88it [00:09, 9.64it/s] 89it [00:09, 9.69it/s] 90it [00:09, 9.71it/s] 91it [00:09, 9.75it/s] 92it [00:09, 9.77it/s] 93it [00:09, 9.77it/s] 94it [00:09, 9.77it/s] 95it [00:10, 9.80it/s] 96it [00:10, 9.79it/s] 97it [00:10, 9.79it/s] 98it [00:10, 9.80it/s] 99it [00:10, 9.20it/s] 100it [00:10, 9.37it/s]2025-05-26 05:41:15,344 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 9816.6523 | mean log_px -0.1053 | KL -3570.17 + 101it [00:10, 9.46it/s] 102it [00:10, 9.54it/s] 103it [00:10, 9.58it/s] 104it [00:11, 9.15it/s] 105it [00:11, 9.24it/s] 106it [00:11, 9.39it/s] 107it [00:11, 9.51it/s] 108it [00:11, 9.58it/s] 109it [00:11, 9.65it/s] 110it [00:11, 9.67it/s] 111it [00:11, 9.71it/s] 112it [00:11, 9.72it/s] 113it [00:11, 9.75it/s] 114it [00:12, 9.27it/s] 115it [00:12, 9.43it/s] 116it [00:12, 9.50it/s] 117it [00:12, 9.57it/s] 118it [00:12, 9.16it/s] 119it [00:12, 9.34it/s] 120it [00:12, 9.49it/s] 121it [00:12, 8.96it/s] 122it [00:12, 9.19it/s] 123it [00:13, 9.35it/s] 124it [00:13, 9.46it/s] 125it [00:13, 9.57it/s] 126it [00:13, 9.63it/s] 127it [00:13, 9.69it/s] 128it [00:13, 9.10it/s] 129it [00:13, 9.26it/s] 130it [00:13, 9.41it/s] 131it [00:13, 9.54it/s] 132it [00:13, 9.58it/s] 133it [00:14, 9.63it/s] 134it [00:14, 9.66it/s] 135it [00:14, 9.71it/s] 136it [00:14, 9.01it/s] 137it [00:14, 9.05it/s] 138it [00:14, 9.17it/s] 139it [00:14, 9.33it/s] 140it [00:14, 8.88it/s] 141it [00:14, 9.14it/s] 142it [00:15, 9.32it/s] 143it [00:15, 9.46it/s] 144it [00:15, 9.55it/s] 145it [00:15, 9.62it/s] 146it [00:15, 9.66it/s] 147it [00:15, 9.08it/s] 148it [00:15, 9.24it/s] 149it [00:15, 9.40it/s] 150it [00:15, 9.51it/s]2025-05-26 05:41:20,655 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 6365.2271 | mean log_px -0.0422 | KL -3569.45 + 151it [00:16, 8.93it/s] 152it [00:16, 9.15it/s] 153it [00:16, 9.31it/s] 154it [00:16, 9.42it/s] 155it [00:16, 9.51it/s] 156it [00:16, 9.58it/s] 157it [00:16, 9.62it/s] 158it [00:16, 9.66it/s] 159it [00:16, 9.69it/s] 160it [00:16, 9.65it/s] 161it [00:17, 9.51it/s] 162it [00:17, 9.49it/s] 163it [00:17, 9.55it/s] 164it [00:17, 9.61it/s] 165it [00:17, 9.69it/s] 166it [00:17, 9.71it/s] 167it [00:17, 9.70it/s] 168it [00:17, 9.73it/s] 169it [00:17, 9.74it/s] 170it [00:17, 9.74it/s] 171it [00:18, 9.70it/s] 172it [00:18, 9.72it/s] 173it [00:18, 9.73it/s] 174it [00:18, 9.72it/s] 175it [00:18, 9.72it/s] 176it [00:18, 9.72it/s] 177it [00:18, 9.72it/s] 178it [00:18, 9.24it/s] 179it [00:18, 9.40it/s] 180it [00:19, 9.51it/s] 181it [00:19, 9.57it/s] 182it [00:19, 9.60it/s] 183it [00:19, 9.65it/s] 184it [00:19, 9.67it/s] 185it [00:19, 9.25it/s] 186it [00:19, 9.37it/s] 187it [00:19, 9.46it/s] 188it [00:19, 8.83it/s] 189it [00:20, 9.06it/s] 190it [00:20, 9.22it/s] 191it [00:20, 9.35it/s] 192it [00:20, 9.45it/s] 193it [00:20, 9.55it/s] 194it [00:20, 9.62it/s] 195it [00:20, 9.24it/s] 196it [00:20, 9.43it/s] +2025-05-26 05:41:25,490 - INFO - Epoch: 21, Objective: tensor([6160.0498], device='cuda:0', grad_fn=), Loss: 0.040021877735853195, KL/n: 72.79065704345703 + 0it [00:00, ?it/s]2025-05-26 05:41:25,762 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 9817.3037 | mean log_px -0.0940 | KL -3564.62 + 1it [00:00, 4.78it/s] 2it [00:00, 6.78it/s] 3it [00:00, 7.91it/s] 4it [00:00, 8.50it/s] 5it [00:00, 8.93it/s] 6it [00:00, 9.16it/s] 7it [00:00, 8.76it/s] 8it [00:00, 9.06it/s] 9it [00:01, 9.29it/s] 10it [00:01, 9.41it/s] 11it [00:01, 9.52it/s] 12it [00:01, 9.59it/s] 13it [00:01, 9.65it/s] 14it [00:01, 9.10it/s] 15it [00:01, 9.30it/s] 16it [00:01, 9.43it/s] 17it [00:01, 9.53it/s] 18it [00:01, 9.60it/s] 19it [00:02, 9.64it/s] 20it [00:02, 9.69it/s] 21it [00:02, 9.70it/s] 22it [00:02, 9.01it/s] 23it [00:02, 9.09it/s] 24it [00:02, 9.28it/s] 25it [00:02, 9.43it/s] 26it [00:02, 9.48it/s] 27it [00:02, 9.57it/s] 28it [00:03, 9.52it/s] 29it [00:03, 9.58it/s] 30it [00:03, 9.58it/s] 31it [00:03, 9.14it/s] 32it [00:03, 9.30it/s] 33it [00:03, 9.42it/s] 34it [00:03, 9.52it/s] 35it [00:03, 9.59it/s] 36it [00:03, 9.10it/s] 37it [00:04, 9.29it/s] 38it [00:04, 9.42it/s] 39it [00:04, 9.53it/s] 40it [00:04, 9.62it/s] 41it [00:04, 9.08it/s] 42it [00:04, 9.27it/s] 43it [00:04, 9.40it/s] 44it [00:04, 9.37it/s] 45it [00:04, 8.78it/s] 46it [00:05, 8.92it/s] 47it [00:05, 9.09it/s] 48it [00:05, 9.24it/s] 49it [00:05, 9.35it/s] 50it [00:05, 9.41it/s]2025-05-26 05:41:31,110 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 8459.5879 | mean log_px -0.0763 | KL -3567.08 + 51it [00:05, 8.83it/s] 52it [00:05, 9.03it/s] 53it [00:05, 9.17it/s] 54it [00:05, 9.19it/s] 55it [00:05, 9.25it/s] 56it [00:06, 9.35it/s] 57it [00:06, 9.36it/s] 58it [00:06, 9.38it/s] 59it [00:06, 9.39it/s] 60it [00:06, 9.44it/s] 61it [00:06, 9.48it/s] 62it [00:06, 9.51it/s] 63it [00:06, 9.16it/s] 64it [00:07, 6.15it/s] 65it [00:07, 6.92it/s] 66it [00:07, 7.58it/s] 67it [00:07, 8.03it/s] 68it [00:07, 8.27it/s] 69it [00:07, 8.30it/s] 70it [00:07, 8.67it/s] 71it [00:07, 8.96it/s] 72it [00:07, 9.18it/s] 73it [00:08, 9.35it/s] 74it [00:08, 9.46it/s] 75it [00:08, 9.56it/s] 76it [00:08, 9.60it/s] 77it [00:08, 9.66it/s] 78it [00:08, 9.69it/s] 79it [00:08, 9.70it/s] 80it [00:08, 9.73it/s] 81it [00:08, 9.73it/s] 82it [00:08, 9.73it/s] 83it [00:09, 9.76it/s] 84it [00:09, 9.77it/s] 85it [00:09, 9.79it/s] 86it [00:09, 9.77it/s] 87it [00:09, 9.77it/s] 88it [00:09, 9.76it/s] 89it [00:09, 9.77it/s] 90it [00:09, 9.76it/s] 91it [00:09, 9.78it/s] 92it [00:10, 9.16it/s] 93it [00:10, 9.35it/s] 94it [00:10, 9.50it/s] 95it [00:10, 9.60it/s] 96it [00:10, 9.67it/s] 97it [00:10, 9.29it/s] 98it [00:10, 9.42it/s] 99it [00:10, 9.52it/s] 100it [00:10, 9.58it/s]2025-05-26 05:41:36,558 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 9265.9893 | mean log_px -0.0819 | KL -3570.15 + 101it [00:11, 9.04it/s] 102it [00:11, 9.27it/s] 103it [00:11, 9.42it/s] 104it [00:11, 9.53it/s] 105it [00:11, 9.63it/s] 106it [00:11, 9.69it/s] 107it [00:11, 9.74it/s] 108it [00:11, 9.75it/s] 109it [00:11, 9.76it/s] 110it [00:11, 9.77it/s] 111it [00:12, 9.77it/s] 112it [00:12, 9.75it/s] 113it [00:12, 9.78it/s] 114it [00:12, 9.79it/s] 115it [00:12, 9.81it/s] 116it [00:12, 9.82it/s] 117it [00:12, 9.21it/s] 118it [00:12, 9.37it/s] 119it [00:12, 9.49it/s] 120it [00:12, 9.58it/s] 121it [00:13, 9.65it/s] 122it [00:13, 9.68it/s] 123it [00:13, 9.73it/s] 124it [00:13, 9.75it/s] 125it [00:13, 9.79it/s] 126it [00:13, 9.78it/s] 127it [00:13, 9.80it/s] 128it [00:13, 9.80it/s] 129it [00:13, 9.78it/s] 130it [00:13, 9.78it/s] 131it [00:14, 9.80it/s] 132it [00:14, 9.80it/s] 133it [00:14, 9.82it/s] 134it [00:14, 9.82it/s] 135it [00:14, 9.79it/s] 136it [00:14, 9.79it/s] 137it [00:14, 9.79it/s] 138it [00:14, 9.80it/s] 139it [00:14, 9.81it/s] 140it [00:15, 9.80it/s] 141it [00:15, 9.18it/s] 142it [00:15, 9.35it/s] 143it [00:15, 9.49it/s] 144it [00:15, 9.58it/s] 145it [00:15, 9.66it/s] 146it [00:15, 9.70it/s] 147it [00:15, 9.74it/s] 148it [00:15, 9.76it/s] 149it [00:15, 9.76it/s] 150it [00:16, 9.75it/s]2025-05-26 05:41:41,728 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 8519.6299 | mean log_px -0.0768 | KL -3566.00 + 151it [00:16, 9.22it/s] 152it [00:16, 9.39it/s] 153it [00:16, 9.51it/s] 154it [00:16, 9.61it/s] 155it [00:16, 9.66it/s] 156it [00:16, 9.69it/s] 157it [00:16, 9.70it/s] 158it [00:16, 9.72it/s] 159it [00:16, 9.75it/s] 160it [00:17, 9.77it/s] 161it [00:17, 9.78it/s] 162it [00:17, 9.78it/s] 163it [00:17, 9.79it/s] 164it [00:17, 9.79it/s] 165it [00:17, 9.74it/s] 166it [00:17, 9.76it/s] 167it [00:17, 9.75it/s] 168it [00:17, 9.15it/s] 169it [00:18, 9.35it/s] 170it [00:18, 9.44it/s] 171it [00:18, 9.55it/s] 172it [00:18, 9.62it/s] 173it [00:18, 9.65it/s] 174it [00:18, 9.69it/s] 175it [00:18, 9.75it/s] 176it [00:18, 9.77it/s] 177it [00:18, 9.76it/s] 178it [00:18, 9.67it/s] 179it [00:19, 9.72it/s] 180it [00:19, 9.73it/s] 181it [00:19, 9.75it/s] 182it [00:19, 9.77it/s] 183it [00:19, 9.79it/s] 184it [00:19, 9.79it/s] 185it [00:19, 9.80it/s] 186it [00:19, 9.79it/s] 187it [00:19, 9.19it/s] 188it [00:19, 9.36it/s] 189it [00:20, 9.47it/s] 190it [00:20, 9.53it/s] 191it [00:20, 9.15it/s] 192it [00:20, 9.35it/s] 193it [00:20, 9.42it/s] 194it [00:20, 9.51it/s] 195it [00:20, 9.19it/s] 196it [00:20, 8.96it/s] 196it [00:20, 9.36it/s] +2025-05-26 05:41:46,550 - INFO - Epoch: 22, Objective: tensor([8000.1289], device='cuda:0', grad_fn=), Loss: 0.06485095620155334, KL/n: 72.75353240966797 + 0it [00:00, ?it/s]2025-05-26 05:41:46,849 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 10706.0791 | mean log_px -0.1055 | KL -3565.08 + 1it [00:00, 4.89it/s] 2it [00:00, 6.39it/s] 3it [00:00, 7.64it/s] 4it [00:00, 8.39it/s] 5it [00:00, 8.89it/s] 6it [00:00, 9.20it/s] 7it [00:00, 8.81it/s] 8it [00:00, 9.11it/s] 9it [00:01, 9.27it/s] 10it [00:01, 9.36it/s] 11it [00:01, 9.51it/s] 12it [00:01, 9.60it/s] 13it [00:01, 9.67it/s] 14it [00:01, 9.71it/s] 15it [00:01, 9.76it/s] 16it [00:01, 9.78it/s] 17it [00:01, 9.82it/s] 18it [00:01, 9.84it/s] 19it [00:02, 9.83it/s] 20it [00:02, 9.82it/s] 21it [00:02, 9.34it/s] 22it [00:02, 9.49it/s] 23it [00:02, 9.61it/s] 24it [00:02, 9.68it/s] 25it [00:02, 9.70it/s] 26it [00:02, 9.12it/s] 27it [00:02, 9.13it/s] 28it [00:03, 9.33it/s] 29it [00:03, 9.49it/s] 30it [00:03, 9.60it/s] 31it [00:03, 9.69it/s] 32it [00:03, 9.72it/s] 33it [00:03, 9.77it/s] 34it [00:03, 9.73it/s] 35it [00:03, 9.58it/s] 36it [00:03, 8.76it/s] 37it [00:04, 8.81it/s] 38it [00:04, 9.09it/s] 39it [00:04, 9.31it/s] 40it [00:04, 9.46it/s] 41it [00:04, 9.57it/s] 42it [00:04, 9.63it/s] 43it [00:04, 9.70it/s] 44it [00:04, 9.74it/s] 45it [00:04, 9.17it/s] 46it [00:04, 9.36it/s] 47it [00:05, 9.46it/s] 48it [00:05, 9.54it/s] 49it [00:05, 9.65it/s] 50it [00:05, 9.70it/s]2025-05-26 05:41:52,105 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 6445.8760 | mean log_px -0.0427 | KL -3562.69 + 51it [00:05, 9.14it/s] 52it [00:05, 9.34it/s] 53it [00:05, 9.46it/s] 54it [00:05, 9.57it/s] 55it [00:05, 9.68it/s] 56it [00:06, 9.13it/s] 57it [00:06, 9.33it/s] 58it [00:06, 9.47it/s] 59it [00:06, 9.59it/s] 60it [00:06, 9.67it/s] 61it [00:06, 9.70it/s] 62it [00:06, 9.74it/s] 63it [00:06, 9.78it/s] 64it [00:06, 9.21it/s] 65it [00:06, 9.39it/s] 66it [00:07, 9.47it/s] 67it [00:07, 9.59it/s] 68it [00:07, 9.66it/s] 69it [00:07, 9.24it/s] 70it [00:07, 9.43it/s] 71it [00:07, 9.56it/s] 72it [00:07, 9.64it/s] 73it [00:07, 9.70it/s] 74it [00:07, 9.76it/s] 75it [00:07, 9.79it/s] 76it [00:08, 9.80it/s] 77it [00:08, 9.82it/s] 78it [00:08, 9.84it/s] 79it [00:08, 9.25it/s] 80it [00:08, 9.42it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.65it/s] 83it [00:08, 9.71it/s] 84it [00:08, 9.75it/s] 85it [00:09, 9.20it/s] 86it [00:09, 9.39it/s] 87it [00:09, 9.39it/s] 88it [00:09, 9.51it/s] 89it [00:09, 9.13it/s] 90it [00:09, 9.34it/s] 91it [00:09, 9.50it/s] 92it [00:09, 9.60it/s] 93it [00:09, 9.68it/s] 94it [00:09, 9.74it/s] 95it [00:10, 9.79it/s] 96it [00:10, 9.80it/s] 97it [00:10, 9.82it/s] 98it [00:10, 9.82it/s] 99it [00:10, 9.82it/s] 100it [00:10, 9.84it/s]2025-05-26 05:41:57,331 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 9278.5117 | mean log_px -0.0849 | KL -3567.39 + 101it [00:10, 9.28it/s] 102it [00:10, 9.44it/s] 103it [00:10, 9.58it/s] 104it [00:11, 9.66it/s] 105it [00:11, 9.72it/s] 106it [00:11, 9.76it/s] 107it [00:11, 9.80it/s] 108it [00:11, 9.82it/s] 109it [00:11, 9.82it/s] 110it [00:11, 9.80it/s] 111it [00:11, 9.82it/s] 112it [00:11, 9.84it/s] 113it [00:11, 9.83it/s] 114it [00:12, 9.35it/s] 115it [00:12, 9.50it/s] 116it [00:12, 9.61it/s] 117it [00:12, 9.70it/s] 118it [00:12, 9.74it/s] 119it [00:12, 9.77it/s] 120it [00:12, 9.79it/s] 121it [00:12, 9.82it/s] 122it [00:12, 9.83it/s] 123it [00:12, 9.84it/s] 124it [00:13, 9.85it/s] 125it [00:13, 9.86it/s] 126it [00:13, 9.85it/s] 127it [00:13, 9.86it/s] 128it [00:13, 9.77it/s] 129it [00:13, 9.81it/s] 130it [00:13, 9.77it/s] 131it [00:13, 9.81it/s] 132it [00:13, 9.83it/s] 133it [00:13, 9.84it/s] 134it [00:14, 9.85it/s] 135it [00:14, 9.84it/s] 136it [00:14, 9.22it/s] 137it [00:14, 9.40it/s] 138it [00:14, 9.53it/s] 139it [00:14, 9.63it/s] 140it [00:14, 9.68it/s] 141it [00:14, 9.12it/s] 142it [00:14, 9.33it/s] 143it [00:15, 9.49it/s] 144it [00:15, 9.60it/s] 145it [00:15, 9.68it/s] 146it [00:15, 9.64it/s] 147it [00:15, 9.69it/s] 148it [00:15, 9.05it/s] 149it [00:15, 9.26it/s] 150it [00:15, 9.43it/s]2025-05-26 05:42:02,523 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 9398.9590 | mean log_px -0.0833 | KL -3566.49 + 151it [00:15, 8.98it/s] 152it [00:15, 9.21it/s] 153it [00:16, 9.39it/s] 154it [00:16, 9.53it/s] 155it [00:16, 9.63it/s] 156it [00:16, 9.69it/s] 157it [00:16, 9.73it/s] 158it [00:16, 9.76it/s] 159it [00:16, 9.80it/s] 160it [00:16, 9.79it/s] 161it [00:16, 9.81it/s] 162it [00:17, 9.82it/s] 163it [00:17, 9.40it/s] 164it [00:17, 9.49it/s] 165it [00:17, 9.59it/s] 166it [00:17, 9.07it/s] 167it [00:17, 9.22it/s] 168it [00:17, 9.35it/s] 169it [00:17, 9.50it/s] 170it [00:17, 9.49it/s] 171it [00:17, 9.57it/s] 172it [00:18, 9.65it/s] 173it [00:18, 9.71it/s] 174it [00:18, 9.76it/s] 175it [00:18, 9.79it/s] 176it [00:18, 9.36it/s] 177it [00:18, 9.51it/s] 178it [00:18, 9.59it/s] 179it [00:18, 9.08it/s] 180it [00:18, 9.29it/s] 181it [00:19, 9.46it/s] 182it [00:19, 9.57it/s] 183it [00:19, 9.66it/s] 184it [00:19, 9.73it/s] 185it [00:19, 9.77it/s] 186it [00:19, 9.19it/s] 187it [00:19, 9.28it/s] 188it [00:19, 9.45it/s] 189it [00:19, 9.56it/s] 190it [00:19, 9.63it/s] 191it [00:20, 9.67it/s] 192it [00:20, 9.73it/s] 193it [00:20, 9.76it/s] 194it [00:20, 9.59it/s] 195it [00:20, 9.25it/s] 196it [00:20, 9.00it/s] 196it [00:20, 9.48it/s] +2025-05-26 05:42:07,357 - INFO - Epoch: 23, Objective: tensor([7036.1016], device='cuda:0', grad_fn=), Loss: 0.05605386570096016, KL/n: 72.70604705810547 + 0it [00:00, ?it/s]2025-05-26 05:42:07,819 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 10053.7881 | mean log_px -0.0965 | KL -3562.36 + 1it [00:00, 5.33it/s] 2it [00:00, 7.16it/s] 3it [00:00, 8.17it/s] 4it [00:00, 8.41it/s] 5it [00:00, 8.39it/s] 6it [00:00, 8.79it/s] 7it [00:00, 9.10it/s] 8it [00:00, 9.29it/s] 9it [00:01, 9.44it/s] 10it [00:01, 9.53it/s] 11it [00:01, 9.55it/s] 12it [00:01, 9.13it/s] 13it [00:01, 9.33it/s] 14it [00:01, 9.46it/s] 15it [00:01, 9.55it/s] 16it [00:01, 8.97it/s] 17it [00:01, 9.21it/s] 18it [00:02, 9.36it/s] 19it [00:02, 9.48it/s] 20it [00:02, 9.56it/s] 21it [00:02, 9.64it/s] 22it [00:02, 9.69it/s] 23it [00:02, 9.74it/s] 24it [00:02, 9.24it/s] 25it [00:02, 9.42it/s] 26it [00:02, 9.50it/s] 27it [00:02, 9.59it/s] 28it [00:03, 9.64it/s] 29it [00:03, 9.70it/s] 30it [00:03, 9.73it/s] 31it [00:03, 9.75it/s] 32it [00:03, 9.74it/s] 33it [00:03, 9.76it/s] 34it [00:03, 9.76it/s] 35it [00:03, 9.77it/s] 36it [00:03, 9.16it/s] 37it [00:03, 9.36it/s] 38it [00:04, 9.47it/s] 39it [00:04, 9.56it/s] 40it [00:04, 9.14it/s] 41it [00:04, 9.33it/s] 42it [00:04, 9.48it/s] 43it [00:04, 9.00it/s] 44it [00:04, 9.20it/s] 45it [00:04, 9.36it/s] 46it [00:04, 9.47it/s] 47it [00:05, 9.59it/s] 48it [00:05, 9.63it/s] 49it [00:05, 9.69it/s] 50it [00:05, 9.69it/s]2025-05-26 05:42:13,094 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 7944.3613 | mean log_px -0.0672 | KL -3565.10 + 51it [00:05, 9.06it/s] 52it [00:05, 9.26it/s] 53it [00:05, 9.43it/s] 54it [00:05, 9.50it/s] 55it [00:05, 9.59it/s] 56it [00:05, 9.61it/s] 57it [00:06, 9.65it/s] 58it [00:06, 9.67it/s] 59it [00:06, 9.09it/s] 60it [00:06, 9.29it/s] 61it [00:06, 9.44it/s] 62it [00:06, 9.51it/s] 63it [00:06, 9.58it/s] 64it [00:06, 9.58it/s] 65it [00:06, 9.53it/s] 66it [00:07, 9.53it/s] 67it [00:07, 9.61it/s] 68it [00:07, 9.65it/s] 69it [00:07, 9.69it/s] 70it [00:07, 9.72it/s] 71it [00:07, 9.76it/s] 72it [00:07, 9.74it/s] 73it [00:07, 9.76it/s] 74it [00:07, 9.76it/s] 75it [00:07, 9.77it/s] 76it [00:08, 9.16it/s] 77it [00:08, 9.34it/s] 78it [00:08, 9.44it/s] 79it [00:08, 9.54it/s] 80it [00:08, 9.56it/s] 81it [00:08, 9.63it/s] 82it [00:08, 9.66it/s] 83it [00:08, 9.64it/s] 84it [00:08, 9.10it/s] 85it [00:09, 9.30it/s] 86it [00:09, 9.38it/s] 87it [00:09, 9.42it/s] 88it [00:09, 9.52it/s] 89it [00:09, 9.62it/s] 90it [00:09, 9.67it/s] 91it [00:09, 9.72it/s] 92it [00:09, 9.73it/s] 93it [00:09, 9.13it/s] 94it [00:09, 9.32it/s] 95it [00:10, 9.44it/s] 96it [00:10, 9.54it/s] 97it [00:10, 9.65it/s] 98it [00:10, 9.70it/s] 99it [00:10, 9.72it/s] 100it [00:10, 9.71it/s]2025-05-26 05:42:18,343 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 6554.0537 | mean log_px -0.0452 | KL -3559.28 + 101it [00:10, 9.12it/s] 102it [00:10, 9.30it/s] 103it [00:10, 9.43it/s] 104it [00:11, 9.52it/s] 105it [00:11, 9.43it/s] 106it [00:11, 9.44it/s] 107it [00:11, 9.53it/s] 108it [00:11, 9.60it/s] 109it [00:11, 9.65it/s] 110it [00:11, 9.69it/s] 111it [00:11, 9.72it/s] 112it [00:11, 9.13it/s] 113it [00:11, 9.29it/s] 114it [00:12, 9.42it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.61it/s] 117it [00:12, 9.67it/s] 118it [00:12, 9.71it/s] 119it [00:12, 9.72it/s] 120it [00:12, 9.73it/s] 121it [00:12, 9.75it/s] 122it [00:12, 9.75it/s] 123it [00:13, 9.76it/s] 124it [00:13, 9.75it/s] 125it [00:13, 9.77it/s] 126it [00:13, 9.76it/s] 127it [00:13, 9.79it/s] 128it [00:13, 9.78it/s] 129it [00:13, 9.75it/s] 130it [00:13, 9.77it/s] 131it [00:13, 9.17it/s] 132it [00:13, 9.29it/s] 133it [00:14, 9.42it/s] 134it [00:14, 9.50it/s] 135it [00:14, 8.87it/s] 136it [00:14, 8.84it/s] 137it [00:14, 9.06it/s] 138it [00:14, 9.26it/s] 139it [00:14, 9.40it/s] 140it [00:14, 9.50it/s] 141it [00:14, 9.61it/s] 142it [00:15, 9.16it/s] 143it [00:15, 9.33it/s] 144it [00:15, 9.46it/s] 145it [00:15, 9.55it/s] 146it [00:15, 9.54it/s] 147it [00:15, 9.54it/s] 148it [00:15, 9.62it/s] 149it [00:15, 9.67it/s] 150it [00:15, 9.71it/s]2025-05-26 05:42:23,605 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 11166.3877 | mean log_px -0.1161 | KL -3563.05 + 151it [00:15, 9.72it/s] 152it [00:16, 9.75it/s] 153it [00:16, 9.77it/s] 154it [00:16, 9.77it/s] 155it [00:16, 9.80it/s] 156it [00:16, 9.78it/s] 157it [00:16, 9.73it/s] 158it [00:16, 9.12it/s] 159it [00:16, 9.31it/s] 160it [00:16, 9.46it/s] 161it [00:17, 9.56it/s] 162it [00:17, 9.06it/s] 163it [00:17, 9.25it/s] 164it [00:17, 9.39it/s] 165it [00:17, 9.49it/s] 166it [00:17, 8.99it/s] 167it [00:17, 9.23it/s] 168it [00:17, 9.38it/s] 169it [00:17, 9.51it/s] 170it [00:17, 9.58it/s] 171it [00:18, 9.65it/s] 172it [00:18, 9.69it/s] 173it [00:18, 9.71it/s] 174it [00:18, 9.73it/s] 175it [00:18, 9.75it/s] 176it [00:18, 9.74it/s] 177it [00:18, 9.74it/s] 178it [00:18, 9.73it/s] 179it [00:18, 9.12it/s] 180it [00:19, 9.30it/s] 181it [00:19, 9.42it/s] 182it [00:19, 9.52it/s] 183it [00:19, 9.60it/s] 184it [00:19, 9.65it/s] 185it [00:19, 9.68it/s] 186it [00:19, 9.72it/s] 187it [00:19, 9.73it/s] 188it [00:19, 9.75it/s] 189it [00:19, 9.75it/s] 190it [00:20, 9.75it/s] 191it [00:20, 9.79it/s] 192it [00:20, 9.77it/s] 193it [00:20, 9.77it/s] 194it [00:20, 9.76it/s] 195it [00:20, 9.34it/s] 196it [00:20, 9.07it/s] 196it [00:20, 9.44it/s] +2025-05-26 05:42:28,440 - INFO - Epoch: 24, Objective: tensor([7781.2070], device='cuda:0', grad_fn=), Loss: 0.06895510107278824, KL/n: 72.64373779296875 +2025-05-26 05:42:28,446 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 2it [00:00, 16.62it/s] 5it [00:00, 22.98it/s] 8it [00:00, 25.85it/s] 11it [00:00, 27.42it/s] 15it [00:00, 28.62it/s] 19it [00:00, 29.31it/s] 23it [00:00, 29.67it/s] 27it [00:00, 30.08it/s] 31it [00:01, 30.14it/s] 35it [00:01, 30.16it/s] 39it [00:01, 30.55it/s] 43it [00:01, 30.61it/s] 47it [00:01, 30.29it/s] 51it [00:01, 30.03it/s] 55it [00:01, 30.24it/s] 59it [00:02, 30.39it/s] 63it [00:02, 30.51it/s] 67it [00:02, 30.40it/s] 71it [00:02, 30.72it/s] 75it [00:02, 30.74it/s] 79it [00:02, 30.75it/s] 83it [00:02, 30.77it/s] 87it [00:02, 30.78it/s] 91it [00:03, 30.76it/s] 95it [00:03, 30.55it/s] 99it [00:03, 30.65it/s] 103it [00:03, 30.72it/s] 107it [00:03, 30.52it/s] 111it [00:03, 30.56it/s] 115it [00:03, 30.83it/s] 119it [00:03, 30.83it/s] 123it [00:04, 30.82it/s] 127it [00:04, 30.59it/s] 131it [00:04, 30.63it/s] 135it [00:04, 30.84it/s] 139it [00:04, 30.84it/s] 143it [00:04, 30.83it/s] 147it [00:04, 30.84it/s] 151it [00:04, 30.83it/s] 155it [00:05, 30.81it/s] 159it [00:05, 30.61it/s] 163it [00:05, 30.73it/s] 167it [00:05, 30.83it/s] 171it [00:05, 30.74it/s] 175it [00:05, 30.72it/s] 179it [00:05, 30.73it/s] 183it [00:06, 30.71it/s] 187it [00:06, 30.70it/s] 191it [00:06, 30.71it/s] 195it [00:06, 30.68it/s] 199it [00:06, 30.75it/s] 203it [00:06, 30.69it/s] 207it [00:06, 30.72it/s] 211it [00:06, 30.70it/s] 215it [00:07, 30.61it/s] 219it [00:07, 30.67it/s] 223it [00:07, 30.69it/s] 227it [00:07, 30.74it/s] 231it [00:07, 30.73it/s] 235it [00:07, 30.73it/s] 239it [00:07, 30.69it/s] 243it [00:07, 30.71it/s] 247it [00:08, 30.71it/s] 251it [00:08, 30.69it/s] 255it [00:08, 30.71it/s] 259it [00:08, 30.71it/s] 263it [00:08, 30.72it/s] 267it [00:08, 30.69it/s] 271it [00:08, 30.69it/s] 275it [00:09, 30.70it/s] 279it [00:09, 28.17it/s] 280it [00:09, 30.19it/s] +2025-05-26 05:42:37,884 - INFO - Epoch: 0, Objective: 0.06987767666578293, Loss: 0.06753052026033401, KL/n: 0.0023471589665859938 + 0%| | 0/84 [00:00), Loss: 0.43466299772262573, KL/n: 68.75403594970703 + 0it [00:00, ?it/s]2025-05-26 05:45:12,610 - INFO - [Epoch 001 | Batch 0000] IWAE-loss 28074.5488 | mean log_px -0.3577 | KL -3369.96 + 1it [00:00, 5.54it/s] 2it [00:00, 6.87it/s] 3it [00:00, 7.95it/s] 4it [00:00, 8.56it/s] 5it [00:00, 8.92it/s] 6it [00:00, 9.16it/s] 7it [00:00, 9.35it/s] 8it [00:00, 9.01it/s] 9it [00:01, 9.28it/s] 10it [00:01, 9.41it/s] 11it [00:01, 9.56it/s] 12it [00:01, 9.58it/s] 13it [00:01, 9.67it/s] 14it [00:01, 9.67it/s] 15it [00:01, 9.73it/s] 16it [00:01, 9.74it/s] 17it [00:01, 9.75it/s] 18it [00:01, 9.74it/s] 19it [00:02, 9.79it/s] 20it [00:02, 9.79it/s] 21it [00:02, 9.82it/s] 22it [00:02, 9.75it/s] 23it [00:02, 9.77it/s] 24it [00:02, 9.78it/s] 25it [00:02, 9.77it/s] 26it [00:02, 9.75it/s] 27it [00:02, 9.78it/s] 28it [00:02, 9.78it/s] 29it [00:03, 9.77it/s] 30it [00:03, 9.16it/s] 31it [00:03, 9.36it/s] 32it [00:03, 9.48it/s] 33it [00:03, 9.56it/s] 34it [00:03, 9.59it/s] 35it [00:03, 9.62it/s] 36it [00:03, 9.02it/s] 37it [00:03, 9.25it/s] 38it [00:04, 9.40it/s] 39it [00:04, 9.51it/s] 40it [00:04, 9.57it/s] 41it [00:04, 9.60it/s] 42it [00:04, 9.65it/s] 43it [00:04, 9.72it/s] 44it [00:04, 9.71it/s] 45it [00:04, 9.72it/s] 46it [00:04, 9.75it/s] 47it [00:04, 9.75it/s] 48it [00:05, 9.78it/s] 49it [00:05, 9.17it/s] 50it [00:05, 9.35it/s]2025-05-26 05:45:17,836 - INFO - [Epoch 001 | Batch 0050] IWAE-loss 26761.6230 | mean log_px -0.3389 | KL -3393.95 + 51it [00:05, 9.46it/s] 52it [00:05, 9.52it/s] 53it [00:05, 9.60it/s] 54it [00:05, 9.64it/s] 55it [00:05, 9.65it/s] 56it [00:05, 9.06it/s] 57it [00:06, 9.28it/s] 58it [00:06, 9.40it/s] 59it [00:06, 9.52it/s] 60it [00:06, 9.60it/s] 61it [00:06, 9.67it/s] 62it [00:06, 9.66it/s] 63it [00:06, 9.69it/s] 64it [00:06, 9.74it/s] 65it [00:06, 9.73it/s] 66it [00:06, 9.74it/s] 67it [00:07, 9.77it/s] 68it [00:07, 9.13it/s] 69it [00:07, 9.34it/s] 70it [00:07, 9.48it/s] 71it [00:07, 9.54it/s] 72it [00:07, 9.55it/s] 73it [00:07, 9.56it/s] 74it [00:07, 9.64it/s] 75it [00:07, 9.71it/s] 76it [00:08, 9.25it/s] 77it [00:08, 9.13it/s] 78it [00:08, 9.18it/s] 79it [00:08, 9.29it/s] 80it [00:08, 9.42it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.57it/s] 83it [00:08, 9.65it/s] 84it [00:08, 9.66it/s] 85it [00:08, 9.66it/s] 86it [00:09, 9.66it/s] 87it [00:09, 9.66it/s] 88it [00:09, 9.38it/s] 89it [00:09, 9.52it/s] 90it [00:09, 9.58it/s] 91it [00:09, 9.66it/s] 92it [00:09, 9.66it/s] 93it [00:09, 9.70it/s] 94it [00:09, 9.71it/s] 95it [00:10, 9.68it/s] 96it [00:10, 9.71it/s] 97it [00:10, 9.74it/s] 98it [00:10, 9.75it/s] 99it [00:10, 9.76it/s] 100it [00:10, 9.71it/s]2025-05-26 05:45:23,061 - INFO - [Epoch 001 | Batch 0100] IWAE-loss 28285.6133 | mean log_px -0.3769 | KL -3410.21 + 101it [00:10, 9.68it/s] 102it [00:10, 9.70it/s] 103it [00:10, 9.69it/s] 104it [00:10, 9.68it/s] 105it [00:11, 9.70it/s] 106it [00:11, 9.17it/s] 107it [00:11, 9.36it/s] 108it [00:11, 9.44it/s] 109it [00:11, 9.54it/s] 110it [00:11, 9.60it/s] 111it [00:11, 9.65it/s] 112it [00:11, 9.69it/s] 113it [00:11, 9.72it/s] 114it [00:11, 9.74it/s] 115it [00:12, 9.72it/s] 116it [00:12, 9.71it/s] 117it [00:12, 9.70it/s] 118it [00:12, 9.71it/s] 119it [00:12, 9.75it/s] 120it [00:12, 9.72it/s] 121it [00:12, 9.15it/s] 122it [00:12, 9.29it/s] 123it [00:12, 9.42it/s] 124it [00:13, 9.54it/s] 125it [00:13, 9.62it/s] 126it [00:13, 9.13it/s] 127it [00:13, 9.29it/s] 128it [00:13, 9.41it/s] 129it [00:13, 9.54it/s] 130it [00:13, 9.60it/s] 131it [00:13, 9.67it/s] 132it [00:13, 9.70it/s] 133it [00:13, 9.70it/s] 134it [00:14, 9.28it/s] 135it [00:14, 9.45it/s] 136it [00:14, 9.53it/s] 137it [00:14, 9.58it/s] 138it [00:14, 9.60it/s] 139it [00:14, 9.66it/s] 140it [00:14, 9.70it/s] 141it [00:14, 9.73it/s] 142it [00:14, 9.75it/s] 143it [00:15, 9.73it/s] 144it [00:15, 9.72it/s] 145it [00:15, 9.72it/s] 146it [00:15, 9.17it/s] 147it [00:15, 9.36it/s] 148it [00:15, 9.47it/s] 149it [00:15, 9.56it/s] 150it [00:15, 9.58it/s]2025-05-26 05:45:28,291 - INFO - [Epoch 001 | Batch 0150] IWAE-loss 24188.4082 | mean log_px -0.3034 | KL -3424.15 + 151it [00:15, 9.61it/s] 152it [00:15, 9.62it/s] 153it [00:16, 9.69it/s] 154it [00:16, 9.68it/s] 155it [00:16, 9.70it/s] 156it [00:16, 9.69it/s] 157it [00:16, 9.72it/s] 158it [00:16, 9.76it/s] 159it [00:16, 9.78it/s] 160it [00:16, 9.75it/s] 161it [00:16, 9.33it/s] 162it [00:17, 9.46it/s] 163it [00:17, 9.54it/s] 164it [00:17, 9.61it/s] 165it [00:17, 9.68it/s] 166it [00:17, 9.71it/s] 167it [00:17, 9.73it/s] 168it [00:17, 9.70it/s] 169it [00:17, 9.54it/s] 170it [00:17, 9.37it/s] 171it [00:17, 9.24it/s] 172it [00:18, 9.32it/s] 173it [00:18, 9.41it/s] 174it [00:18, 9.46it/s] 175it [00:18, 9.51it/s] 176it [00:18, 9.54it/s] 177it [00:18, 9.56it/s] 178it [00:18, 9.57it/s] 179it [00:18, 9.59it/s] 180it [00:18, 9.61it/s] 181it [00:18, 9.60it/s] 182it [00:19, 9.63it/s] 183it [00:19, 9.30it/s] 184it [00:19, 9.44it/s] 185it [00:19, 9.56it/s] 186it [00:19, 9.58it/s] 187it [00:19, 9.54it/s] 188it [00:19, 9.63it/s] 189it [00:19, 9.64it/s] 190it [00:19, 9.65it/s] 191it [00:20, 9.70it/s] 192it [00:20, 9.69it/s] 193it [00:20, 9.74it/s] 194it [00:20, 9.75it/s] 195it [00:20, 9.29it/s] 196it [00:20, 9.50it/s] +2025-05-26 05:45:33,097 - INFO - Epoch: 1, Objective: tensor([25134.6309], device='cuda:0', grad_fn=), Loss: 0.3120049238204956, KL/n: 70.07382202148438 + 0it [00:00, ?it/s]2025-05-26 05:45:33,375 - INFO - [Epoch 002 | Batch 0000] IWAE-loss 26034.8926 | mean log_px -0.3319 | KL -3429.36 + 1it [00:00, 5.11it/s] 2it [00:00, 7.06it/s] 3it [00:00, 7.51it/s] 4it [00:00, 8.28it/s] 5it [00:00, 8.81it/s] 6it [00:00, 9.14it/s] 7it [00:00, 9.35it/s] 8it [00:00, 9.51it/s] 9it [00:01, 9.21it/s] 10it [00:01, 9.23it/s] 11it [00:01, 9.42it/s] 12it [00:01, 9.50it/s] 13it [00:01, 8.93it/s] 14it [00:01, 9.17it/s] 15it [00:01, 9.37it/s] 16it [00:01, 9.43it/s] 17it [00:01, 9.50it/s] 18it [00:02, 9.54it/s] 19it [00:02, 9.65it/s] 20it [00:02, 9.71it/s] 21it [00:02, 9.77it/s] 22it [00:02, 9.10it/s] 23it [00:02, 9.20it/s] 24it [00:02, 9.37it/s] 25it [00:02, 9.14it/s] 26it [00:02, 9.32it/s] 27it [00:02, 9.46it/s] 28it [00:03, 9.53it/s] 29it [00:03, 9.60it/s] 30it [00:03, 9.65it/s] 31it [00:03, 9.69it/s] 32it [00:03, 9.71it/s] 33it [00:03, 9.74it/s] 34it [00:03, 9.77it/s] 35it [00:03, 9.80it/s] 36it [00:03, 9.81it/s] 37it [00:03, 9.83it/s] 38it [00:04, 9.83it/s] 39it [00:04, 9.87it/s] 40it [00:04, 9.86it/s] 41it [00:04, 9.12it/s] 42it [00:04, 9.30it/s] 43it [00:04, 9.47it/s] 44it [00:04, 9.57it/s] 45it [00:04, 9.66it/s] 46it [00:04, 9.70it/s] 47it [00:05, 9.76it/s] 48it [00:05, 9.71it/s] 49it [00:05, 9.53it/s] 50it [00:05, 9.21it/s]2025-05-26 05:45:38,636 - INFO - [Epoch 002 | Batch 0050] IWAE-loss 24607.2324 | mean log_px -0.3063 | KL -3444.27 + 51it [00:05, 9.37it/s] 52it [00:05, 9.50it/s] 53it [00:05, 9.59it/s] 54it [00:05, 9.66it/s] 55it [00:05, 9.70it/s] 56it [00:05, 9.70it/s] 57it [00:06, 9.59it/s] 58it [00:06, 9.65it/s] 59it [00:06, 9.68it/s] 60it [00:06, 9.15it/s] 61it [00:06, 9.35it/s] 62it [00:06, 9.48it/s] 63it [00:06, 9.60it/s] 64it [00:06, 9.67it/s] 65it [00:06, 9.74it/s] 66it [00:07, 9.75it/s] 67it [00:07, 9.78it/s] 68it [00:07, 9.77it/s] 69it [00:07, 9.77it/s] 70it [00:07, 9.71it/s] 71it [00:07, 9.76it/s] 72it [00:07, 9.75it/s] 73it [00:07, 9.79it/s] 74it [00:07, 9.80it/s] 75it [00:07, 9.23it/s] 76it [00:08, 9.40it/s] 77it [00:08, 9.54it/s] 78it [00:08, 9.62it/s] 79it [00:08, 9.68it/s] 80it [00:08, 9.31it/s] 81it [00:08, 9.47it/s] 82it [00:08, 9.17it/s] 83it [00:08, 9.37it/s] 84it [00:08, 9.50it/s] 85it [00:08, 9.59it/s] 86it [00:09, 9.65it/s] 87it [00:09, 9.71it/s] 88it [00:09, 9.75it/s] 89it [00:09, 9.79it/s] 90it [00:09, 9.79it/s] 91it [00:09, 9.81it/s] 92it [00:09, 9.82it/s] 93it [00:09, 9.69it/s] 94it [00:09, 9.63it/s] 95it [00:10, 9.55it/s] 96it [00:10, 6.26it/s] 97it [00:10, 6.67it/s] 98it [00:10, 7.33it/s] 99it [00:10, 7.95it/s] 100it [00:10, 8.43it/s]2025-05-26 05:45:44,040 - INFO - [Epoch 002 | Batch 0100] IWAE-loss 20464.7461 | mean log_px -0.2492 | KL -3452.10 + 101it [00:10, 8.66it/s] 102it [00:10, 8.83it/s] 103it [00:11, 9.08it/s] 104it [00:11, 9.26it/s] 105it [00:11, 8.96it/s] 106it [00:11, 9.10it/s] 107it [00:11, 9.30it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.56it/s] 110it [00:11, 9.63it/s] 111it [00:11, 9.69it/s] 112it [00:12, 9.73it/s] 113it [00:12, 9.15it/s] 114it [00:12, 9.33it/s] 115it [00:12, 9.49it/s] 116it [00:12, 9.51it/s] 117it [00:12, 9.53it/s] 118it [00:12, 9.60it/s] 119it [00:12, 9.67it/s] 120it [00:12, 9.73it/s] 121it [00:12, 9.78it/s] 122it [00:13, 9.78it/s] 123it [00:13, 9.26it/s] 124it [00:13, 9.42it/s] 125it [00:13, 9.56it/s] 126it [00:13, 9.26it/s] 127it [00:13, 9.45it/s] 128it [00:13, 9.56it/s] 129it [00:13, 9.66it/s] 130it [00:13, 9.71it/s] 131it [00:14, 9.76it/s] 132it [00:14, 9.79it/s] 133it [00:14, 9.81it/s] 134it [00:14, 9.82it/s] 135it [00:14, 9.83it/s] 136it [00:14, 9.84it/s] 137it [00:14, 9.85it/s] 138it [00:14, 9.83it/s] 139it [00:14, 9.85it/s] 140it [00:14, 9.84it/s] 141it [00:15, 9.85it/s] 142it [00:15, 9.84it/s] 143it [00:15, 9.84it/s] 144it [00:15, 9.83it/s] 145it [00:15, 9.82it/s] 147it [00:15, 9.93it/s] 149it [00:15, 10.00it/s] 150it [00:15, 10.00it/s]2025-05-26 05:45:49,204 - INFO - [Epoch 002 | Batch 0150] IWAE-loss 18063.8633 | mean log_px -0.2179 | KL -3453.99 + 151it [00:16, 9.99it/s] 153it [00:16, 10.01it/s] 155it [00:16, 9.65it/s] 157it [00:16, 9.80it/s] 159it [00:16, 9.87it/s] 160it [00:16, 9.64it/s] 162it [00:17, 9.80it/s] 164it [00:17, 9.89it/s] 166it [00:17, 9.95it/s] 168it [00:17, 10.00it/s] 170it [00:17, 10.03it/s] 172it [00:18, 10.05it/s] 174it [00:18, 10.06it/s] 176it [00:18, 9.79it/s] 178it [00:18, 9.88it/s] 180it [00:18, 9.95it/s] 182it [00:19, 9.99it/s] 184it [00:19, 10.03it/s] 186it [00:19, 10.05it/s] 188it [00:19, 10.06it/s] 190it [00:19, 10.06it/s] 192it [00:20, 10.06it/s] 194it [00:20, 9.81it/s] 195it [00:20, 9.53it/s] 196it [00:20, 9.50it/s] +2025-05-26 05:45:53,862 - INFO - Epoch: 2, Objective: tensor([23773.6406], device='cuda:0', grad_fn=), Loss: 0.30370157957077026, KL/n: 70.60922241210938 + 0it [00:00, ?it/s]2025-05-26 05:45:54,149 - INFO - [Epoch 003 | Batch 0000] IWAE-loss 22127.6270 | mean log_px -0.2715 | KL -3458.96 + 1it [00:00, 4.43it/s] 2it [00:00, 6.54it/s] 4it [00:00, 8.39it/s] 6it [00:00, 8.69it/s] 7it [00:00, 8.91it/s] 8it [00:00, 9.14it/s] 9it [00:01, 9.35it/s] 10it [00:01, 9.47it/s] 11it [00:01, 9.59it/s] 12it [00:01, 9.19it/s] 13it [00:01, 9.40it/s] 14it [00:01, 9.54it/s] 15it [00:01, 9.08it/s] 16it [00:01, 9.30it/s] 18it [00:02, 9.60it/s] 19it [00:02, 9.27it/s] 20it [00:02, 9.42it/s] 21it [00:02, 9.57it/s] 22it [00:02, 9.64it/s] 23it [00:02, 9.72it/s] 24it [00:02, 9.76it/s] 25it [00:02, 9.80it/s] 26it [00:02, 9.19it/s] 27it [00:02, 9.35it/s] 28it [00:03, 9.49it/s] 29it [00:03, 9.61it/s] 30it [00:03, 9.67it/s] 31it [00:03, 9.75it/s] 32it [00:03, 9.75it/s] 33it [00:03, 9.29it/s] 34it [00:03, 9.44it/s] 35it [00:03, 9.56it/s] 36it [00:03, 9.61it/s] 37it [00:03, 9.70it/s] 38it [00:04, 9.75it/s] 39it [00:04, 9.78it/s] 40it [00:04, 9.77it/s] 41it [00:04, 9.82it/s] 42it [00:04, 9.82it/s] 43it [00:04, 9.84it/s] 44it [00:04, 9.82it/s] 45it [00:04, 9.85it/s] 46it [00:04, 9.84it/s] 47it [00:05, 9.86it/s] 48it [00:05, 9.84it/s] 49it [00:05, 9.86it/s] 50it [00:05, 9.85it/s]2025-05-26 05:45:59,364 - INFO - [Epoch 003 | Batch 0050] IWAE-loss 18690.7363 | mean log_px -0.2205 | KL -3462.40 + 51it [00:05, 9.17it/s] 52it [00:05, 9.23it/s] 53it [00:05, 9.39it/s] 54it [00:05, 9.52it/s] 55it [00:05, 9.63it/s] 56it [00:05, 9.70it/s] 57it [00:06, 9.76it/s] 58it [00:06, 9.78it/s] 59it [00:06, 9.79it/s] 60it [00:06, 9.32it/s] 61it [00:06, 9.48it/s] 62it [00:06, 9.47it/s] 63it [00:06, 9.61it/s] 64it [00:06, 9.66it/s] 65it [00:06, 9.74it/s] 66it [00:06, 9.78it/s] 67it [00:07, 9.82it/s] 68it [00:07, 9.82it/s] 69it [00:07, 9.84it/s] 70it [00:07, 9.85it/s] 71it [00:07, 9.82it/s] 72it [00:07, 9.05it/s] 73it [00:07, 9.14it/s] 74it [00:07, 9.18it/s] 75it [00:07, 9.38it/s] 76it [00:08, 9.51it/s] 77it [00:08, 8.92it/s] 78it [00:08, 9.17it/s] 79it [00:08, 9.34it/s] 80it [00:08, 9.48it/s] 81it [00:08, 9.60it/s] 82it [00:08, 9.65it/s] 83it [00:08, 9.72it/s] 84it [00:08, 9.69it/s] 85it [00:09, 9.19it/s] 86it [00:09, 9.36it/s] 87it [00:09, 9.50it/s] 88it [00:09, 9.58it/s] 89it [00:09, 9.66it/s] 90it [00:09, 9.71it/s] 91it [00:09, 9.72it/s] 92it [00:09, 9.71it/s] 93it [00:09, 9.71it/s] 94it [00:09, 9.69it/s] 95it [00:10, 9.72it/s] 96it [00:10, 9.73it/s] 97it [00:10, 9.68it/s] 98it [00:10, 9.66it/s] 99it [00:10, 9.11it/s] 100it [00:10, 9.28it/s]2025-05-26 05:46:04,621 - INFO - [Epoch 003 | Batch 0100] IWAE-loss 22098.5781 | mean log_px -0.2703 | KL -3471.58 + 101it [00:10, 9.40it/s] 102it [00:10, 9.46it/s] 103it [00:10, 9.53it/s] 104it [00:10, 9.11it/s] 105it [00:11, 9.23it/s] 106it [00:11, 9.26it/s] 107it [00:11, 9.42it/s] 108it [00:11, 9.50it/s] 109it [00:11, 9.01it/s] 110it [00:11, 9.17it/s] 111it [00:11, 9.31it/s] 112it [00:11, 9.40it/s] 113it [00:11, 8.90it/s] 114it [00:12, 9.02it/s] 115it [00:12, 9.16it/s] 116it [00:12, 9.12it/s] 117it [00:12, 9.24it/s] 118it [00:12, 9.28it/s] 119it [00:12, 9.37it/s] 120it [00:12, 9.37it/s] 121it [00:12, 9.39it/s] 122it [00:12, 9.43it/s] 123it [00:13, 9.48it/s] 124it [00:13, 9.42it/s] 125it [00:13, 9.43it/s] 126it [00:13, 9.48it/s] 127it [00:13, 9.45it/s] 128it [00:13, 9.49it/s] 129it [00:13, 9.09it/s] 130it [00:13, 9.18it/s] 131it [00:13, 9.29it/s] 132it [00:14, 9.35it/s] 133it [00:14, 9.36it/s] 134it [00:14, 9.37it/s] 135it [00:14, 9.39it/s] 136it [00:14, 8.86it/s] 137it [00:14, 9.05it/s] 138it [00:14, 9.16it/s] 139it [00:14, 9.29it/s] 140it [00:14, 9.37it/s] 141it [00:14, 9.47it/s] 142it [00:15, 9.42it/s] 143it [00:15, 9.43it/s] 144it [00:15, 9.42it/s] 145it [00:15, 9.43it/s] 146it [00:15, 9.44it/s] 147it [00:15, 8.89it/s] 148it [00:15, 9.05it/s] 149it [00:15, 9.21it/s] 150it [00:15, 9.34it/s]2025-05-26 05:46:10,001 - INFO - [Epoch 003 | Batch 0150] IWAE-loss 23228.7480 | mean log_px -0.2856 | KL -3470.63 + 151it [00:16, 9.43it/s] 152it [00:16, 9.40it/s] 153it [00:16, 9.45it/s] 154it [00:16, 9.48it/s] 155it [00:16, 9.49it/s] 156it [00:16, 9.49it/s] 157it [00:16, 9.48it/s] 158it [00:16, 9.52it/s] 159it [00:16, 9.58it/s] 160it [00:16, 9.49it/s] 161it [00:17, 9.50it/s] 162it [00:17, 9.43it/s] 163it [00:17, 9.45it/s] 164it [00:17, 9.44it/s] 165it [00:17, 9.50it/s] 166it [00:17, 9.45it/s] 167it [00:17, 9.48it/s] 168it [00:17, 9.48it/s] 169it [00:17, 9.07it/s] 170it [00:18, 9.19it/s] 171it [00:18, 9.25it/s] 172it [00:18, 9.30it/s] 173it [00:18, 9.39it/s] 174it [00:18, 9.40it/s] 175it [00:18, 9.49it/s] 176it [00:18, 9.53it/s] 177it [00:18, 9.59it/s] 178it [00:18, 9.53it/s] 179it [00:19, 9.54it/s] 180it [00:19, 9.56it/s] 181it [00:19, 9.55it/s] 182it [00:19, 9.52it/s] 183it [00:19, 9.51it/s] 184it [00:19, 9.44it/s] 185it [00:19, 8.92it/s] 186it [00:19, 9.04it/s] 187it [00:19, 9.15it/s] 188it [00:19, 9.23it/s] 189it [00:20, 9.28it/s] 190it [00:20, 9.31it/s] 191it [00:20, 9.41it/s] 192it [00:20, 9.42it/s] 193it [00:20, 9.45it/s] 194it [00:20, 9.48it/s] 195it [00:20, 8.53it/s] 196it [00:20, 8.82it/s] 196it [00:20, 9.36it/s] +2025-05-26 05:46:14,920 - INFO - Epoch: 3, Objective: tensor([23300.8750], device='cuda:0', grad_fn=), Loss: 0.2900332510471344, KL/n: 70.9906005859375 + 0it [00:00, ?it/s]2025-05-26 05:46:15,373 - INFO - [Epoch 004 | Batch 0000] IWAE-loss 12282.2793 | mean log_px -0.1411 | KL -3474.90 + 1it [00:00, 5.45it/s] 2it [00:00, 7.24it/s] 3it [00:00, 7.54it/s] 4it [00:00, 8.22it/s] 5it [00:00, 8.64it/s] 6it [00:00, 8.91it/s] 7it [00:00, 9.14it/s] 8it [00:00, 9.23it/s] 9it [00:01, 9.32it/s] 10it [00:01, 9.36it/s] 11it [00:01, 9.41it/s] 12it [00:01, 9.42it/s] 13it [00:01, 9.46it/s] 14it [00:01, 9.47it/s] 15it [00:01, 9.53it/s] 16it [00:01, 9.49it/s] 17it [00:01, 9.46it/s] 18it [00:01, 9.47it/s] 19it [00:02, 9.53it/s] 20it [00:02, 9.54it/s] 21it [00:02, 9.60it/s] 22it [00:02, 9.54it/s] 23it [00:02, 9.43it/s] 24it [00:02, 9.45it/s] 25it [00:02, 9.45it/s] 26it [00:02, 9.43it/s] 27it [00:02, 8.91it/s] 28it [00:03, 9.06it/s] 29it [00:03, 9.18it/s] 30it [00:03, 9.30it/s] 31it [00:03, 9.36it/s] 32it [00:03, 9.35it/s] 33it [00:03, 9.37it/s] 34it [00:03, 9.39it/s] 35it [00:03, 9.36it/s] 36it [00:03, 9.35it/s] 37it [00:04, 9.36it/s] 38it [00:04, 9.40it/s] 39it [00:04, 9.42it/s] 40it [00:04, 9.42it/s] 41it [00:04, 8.89it/s] 42it [00:04, 9.05it/s] 43it [00:04, 9.16it/s] 44it [00:04, 9.24it/s] 45it [00:04, 9.34it/s] 46it [00:04, 9.38it/s] 47it [00:05, 8.99it/s] 48it [00:05, 9.10it/s] 49it [00:05, 9.21it/s] 50it [00:05, 9.24it/s]2025-05-26 05:46:20,737 - INFO - [Epoch 004 | Batch 0050] IWAE-loss 23196.6523 | mean log_px -0.2816 | KL -3483.42 + 51it [00:05, 8.76it/s] 52it [00:05, 8.89it/s] 53it [00:05, 9.08it/s] 54it [00:05, 9.17it/s] 55it [00:05, 9.27it/s] 56it [00:06, 9.31it/s] 57it [00:06, 9.32it/s] 58it [00:06, 9.33it/s] 59it [00:06, 8.82it/s] 60it [00:06, 8.98it/s] 61it [00:06, 9.13it/s] 62it [00:06, 9.21it/s] 63it [00:06, 9.30it/s] 64it [00:06, 9.33it/s] 65it [00:07, 9.36it/s] 66it [00:07, 9.30it/s] 67it [00:07, 9.38it/s] 68it [00:07, 9.39it/s] 69it [00:07, 9.43it/s] 70it [00:07, 9.44it/s] 71it [00:07, 9.52it/s] 72it [00:07, 9.53it/s] 73it [00:07, 9.51it/s] 74it [00:08, 9.48it/s] 75it [00:08, 9.50it/s] 76it [00:08, 9.47it/s] 77it [00:08, 9.31it/s] 78it [00:08, 8.85it/s] 79it [00:08, 8.71it/s] 80it [00:08, 8.83it/s] 81it [00:08, 9.01it/s] 82it [00:08, 9.16it/s] 83it [00:09, 9.32it/s] 84it [00:09, 9.34it/s] 85it [00:09, 9.36it/s] 86it [00:09, 9.35it/s] 87it [00:09, 9.35it/s] 88it [00:09, 9.37it/s] 89it [00:09, 9.42it/s] 90it [00:09, 9.39it/s] 91it [00:09, 9.47it/s] 92it [00:09, 9.44it/s] 93it [00:10, 9.44it/s] 94it [00:10, 9.47it/s] 95it [00:10, 9.45it/s] 96it [00:10, 8.99it/s] 97it [00:10, 9.12it/s] 98it [00:10, 9.21it/s] 99it [00:10, 9.35it/s] 100it [00:10, 9.43it/s]2025-05-26 05:46:26,130 - INFO - [Epoch 004 | Batch 0100] IWAE-loss 22043.1543 | mean log_px -0.2736 | KL -3483.78 + 101it [00:10, 9.46it/s] 102it [00:11, 9.46it/s] 103it [00:11, 9.50it/s] 104it [00:11, 9.02it/s] 105it [00:11, 9.15it/s] 106it [00:11, 9.25it/s] 107it [00:11, 9.32it/s] 108it [00:11, 9.34it/s] 109it [00:11, 9.40it/s] 110it [00:11, 9.39it/s] 111it [00:12, 9.37it/s] 112it [00:12, 9.38it/s] 113it [00:12, 9.44it/s] 114it [00:12, 9.19it/s] 115it [00:12, 8.74it/s] 116it [00:12, 8.96it/s] 117it [00:12, 9.03it/s] 118it [00:12, 9.01it/s] 119it [00:12, 9.10it/s] 120it [00:13, 9.11it/s] 121it [00:13, 9.12it/s] 122it [00:13, 9.18it/s] 123it [00:13, 9.22it/s] 124it [00:13, 9.34it/s] 125it [00:13, 9.43it/s] 126it [00:13, 9.44it/s] 127it [00:13, 8.96it/s] 128it [00:13, 9.08it/s] 129it [00:13, 9.10it/s] 130it [00:14, 9.20it/s] 131it [00:14, 9.28it/s] 132it [00:14, 9.38it/s] 133it [00:14, 8.88it/s] 134it [00:14, 9.01it/s] 135it [00:14, 9.14it/s] 136it [00:14, 9.27it/s] 137it [00:14, 9.37it/s] 138it [00:14, 9.35it/s] 139it [00:15, 9.42it/s] 140it [00:15, 9.44it/s] 141it [00:15, 9.50it/s] 142it [00:15, 9.53it/s] 143it [00:15, 9.50it/s] 144it [00:15, 9.48it/s] 145it [00:15, 9.48it/s] 146it [00:15, 9.52it/s] 147it [00:15, 9.52it/s] 148it [00:16, 9.49it/s] 149it [00:16, 9.51it/s] 150it [00:16, 9.47it/s]2025-05-26 05:46:31,516 - INFO - [Epoch 004 | Batch 0150] IWAE-loss 22188.4727 | mean log_px -0.2672 | KL -3485.55 + 151it [00:16, 9.50it/s] 152it [00:16, 9.02it/s] 153it [00:16, 9.12it/s] 154it [00:16, 9.24it/s] 155it [00:16, 9.34it/s] 156it [00:16, 9.35it/s] 157it [00:16, 9.43it/s] 158it [00:17, 9.39it/s] 159it [00:17, 8.95it/s] 160it [00:17, 9.11it/s] 161it [00:17, 9.18it/s] 162it [00:17, 9.25it/s] 163it [00:17, 9.30it/s] 164it [00:17, 9.31it/s] 165it [00:17, 8.73it/s] 166it [00:17, 8.76it/s] 167it [00:18, 8.84it/s] 168it [00:18, 8.93it/s] 169it [00:18, 9.05it/s] 170it [00:18, 9.17it/s] 171it [00:18, 9.11it/s] 172it [00:18, 9.03it/s] 173it [00:18, 8.79it/s] 174it [00:18, 8.60it/s] 175it [00:18, 8.69it/s] 176it [00:19, 8.71it/s] 177it [00:19, 8.87it/s] 178it [00:19, 9.04it/s] 179it [00:19, 8.62it/s] 180it [00:19, 8.85it/s] 181it [00:19, 9.01it/s] 182it [00:19, 9.10it/s] 183it [00:19, 9.16it/s] 184it [00:19, 9.28it/s] 185it [00:20, 9.38it/s] 186it [00:20, 9.38it/s] 187it [00:20, 9.42it/s] 188it [00:20, 8.85it/s] 189it [00:20, 8.95it/s] 190it [00:20, 9.09it/s] 191it [00:20, 9.16it/s] 192it [00:20, 9.24it/s] 193it [00:20, 9.27it/s] 194it [00:21, 9.30it/s] 195it [00:21, 8.80it/s] 196it [00:21, 9.03it/s] 196it [00:21, 9.17it/s] +2025-05-26 05:46:36,602 - INFO - Epoch: 4, Objective: tensor([19702.6348], device='cuda:0', grad_fn=), Loss: 0.23782320320606232, KL/n: 71.2601089477539 + 0it [00:00, ?it/s]2025-05-26 05:46:36,890 - INFO - [Epoch 005 | Batch 0000] IWAE-loss 16530.5488 | mean log_px -0.1878 | KL -3492.38 + 1it [00:00, 5.15it/s] 2it [00:00, 7.04it/s] 3it [00:00, 7.98it/s] 4it [00:00, 8.52it/s] 5it [00:00, 8.88it/s] 6it [00:00, 9.07it/s] 7it [00:00, 9.22it/s] 8it [00:00, 8.74it/s] 9it [00:01, 8.98it/s] 10it [00:01, 9.12it/s] 11it [00:01, 9.23it/s] 12it [00:01, 9.31it/s] 13it [00:01, 8.83it/s] 14it [00:01, 9.04it/s] 15it [00:01, 9.14it/s] 16it [00:01, 9.25it/s] 17it [00:01, 9.36it/s] 18it [00:02, 9.43it/s] 19it [00:02, 9.46it/s] 20it [00:02, 9.43it/s] 21it [00:02, 8.91it/s] 22it [00:02, 9.08it/s] 23it [00:02, 9.22it/s] 24it [00:02, 9.29it/s] 25it [00:02, 9.37it/s] 26it [00:02, 8.86it/s] 27it [00:03, 9.06it/s] 28it [00:03, 9.15it/s] 29it [00:03, 9.27it/s] 30it [00:03, 9.34it/s] 31it [00:03, 8.98it/s] 32it [00:03, 9.13it/s] 33it [00:03, 9.28it/s] 34it [00:03, 9.21it/s] 35it [00:03, 9.26it/s] 36it [00:03, 9.31it/s] 37it [00:04, 9.39it/s] 38it [00:04, 9.43it/s] 39it [00:04, 9.48it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.54it/s] 42it [00:04, 9.48it/s] 43it [00:04, 9.48it/s] 44it [00:04, 9.45it/s] 45it [00:04, 8.93it/s] 46it [00:05, 9.05it/s] 47it [00:05, 9.18it/s] 48it [00:05, 9.26it/s] 49it [00:05, 9.37it/s] 50it [00:05, 9.39it/s]2025-05-26 05:46:42,281 - INFO - [Epoch 005 | Batch 0050] IWAE-loss 17774.5938 | mean log_px -0.2058 | KL -3492.53 + 51it [00:05, 9.45it/s] 52it [00:05, 9.42it/s] 53it [00:05, 9.41it/s] 54it [00:05, 9.38it/s] 55it [00:06, 9.47it/s] 56it [00:06, 9.53it/s] 57it [00:06, 9.53it/s] 58it [00:06, 8.95it/s] 59it [00:06, 9.12it/s] 60it [00:06, 9.25it/s] 61it [00:06, 9.33it/s] 62it [00:06, 8.88it/s] 63it [00:06, 9.02it/s] 64it [00:06, 9.16it/s] 65it [00:07, 9.27it/s] 66it [00:07, 9.30it/s] 67it [00:07, 9.41it/s] 68it [00:07, 9.40it/s] 69it [00:07, 9.46it/s] 70it [00:07, 8.81it/s] 71it [00:07, 8.90it/s] 72it [00:07, 8.89it/s] 73it [00:07, 9.05it/s] 74it [00:08, 8.64it/s] 75it [00:08, 8.91it/s] 76it [00:08, 8.95it/s] 77it [00:08, 9.15it/s] 78it [00:08, 8.75it/s] 79it [00:08, 8.96it/s] 80it [00:08, 9.12it/s] 81it [00:08, 9.17it/s] 82it [00:08, 9.23it/s] 83it [00:09, 9.37it/s] 84it [00:09, 9.34it/s] 85it [00:09, 8.86it/s] 86it [00:09, 9.05it/s] 87it [00:09, 9.08it/s] 88it [00:09, 9.24it/s] 89it [00:09, 9.31it/s] 90it [00:09, 9.41it/s] 91it [00:09, 9.43it/s] 92it [00:10, 9.04it/s] 93it [00:10, 9.19it/s] 94it [00:10, 9.30it/s] 95it [00:10, 9.37it/s] 96it [00:10, 8.87it/s] 97it [00:10, 9.05it/s] 98it [00:10, 9.18it/s] 99it [00:10, 9.29it/s] 100it [00:10, 9.37it/s]2025-05-26 05:46:47,731 - INFO - [Epoch 005 | Batch 0100] IWAE-loss 13819.5430 | mean log_px -0.1567 | KL -3497.92 + 101it [00:11, 8.99it/s] 102it [00:11, 9.14it/s] 103it [00:11, 9.27it/s] 104it [00:11, 9.36it/s] 105it [00:11, 8.90it/s] 106it [00:11, 9.08it/s] 107it [00:11, 9.18it/s] 108it [00:11, 9.30it/s] 109it [00:11, 9.37it/s] 110it [00:12, 9.42it/s] 111it [00:12, 9.46it/s] 112it [00:12, 9.48it/s] 113it [00:12, 9.51it/s] 114it [00:12, 9.39it/s] 115it [00:12, 9.40it/s] 116it [00:12, 9.47it/s] 117it [00:12, 9.40it/s] 118it [00:12, 9.37it/s] 119it [00:12, 9.23it/s] 120it [00:13, 9.20it/s] 121it [00:13, 9.35it/s] 122it [00:13, 9.39it/s] 123it [00:13, 9.42it/s] 124it [00:13, 9.45it/s] 125it [00:13, 9.45it/s] 126it [00:13, 9.51it/s] 127it [00:13, 9.58it/s] 128it [00:13, 9.57it/s] 129it [00:14, 9.57it/s] 130it [00:14, 9.53it/s] 131it [00:14, 9.49it/s] 132it [00:14, 9.50it/s] 133it [00:14, 9.45it/s] 134it [00:14, 9.39it/s] 135it [00:14, 9.47it/s] 136it [00:14, 9.53it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.48it/s] 139it [00:15, 9.52it/s] 140it [00:15, 9.34it/s] 141it [00:15, 9.44it/s] 142it [00:15, 9.51it/s] 143it [00:15, 9.52it/s] 144it [00:15, 8.98it/s] 145it [00:15, 9.12it/s] 146it [00:15, 9.27it/s] 147it [00:15, 9.35it/s] 148it [00:16, 9.39it/s] 149it [00:16, 9.40it/s] 150it [00:16, 9.46it/s]2025-05-26 05:46:53,063 - INFO - [Epoch 005 | Batch 0150] IWAE-loss 18954.9707 | mean log_px -0.2272 | KL -3503.50 + 151it [00:16, 9.43it/s] 152it [00:16, 9.44it/s] 153it [00:16, 9.50it/s] 154it [00:16, 9.54it/s] 155it [00:16, 9.51it/s] 156it [00:16, 9.10it/s] 157it [00:17, 9.22it/s] 158it [00:17, 9.34it/s] 159it [00:17, 9.00it/s] 160it [00:17, 9.15it/s] 161it [00:17, 9.28it/s] 162it [00:17, 9.33it/s] 163it [00:17, 9.40it/s] 164it [00:17, 9.42it/s] 165it [00:17, 9.49it/s] 166it [00:17, 9.49it/s] 167it [00:18, 9.52it/s] 168it [00:18, 9.46it/s] 169it [00:18, 9.52it/s] 170it [00:18, 9.48it/s] 171it [00:18, 9.50it/s] 172it [00:18, 8.96it/s] 173it [00:18, 9.10it/s] 174it [00:18, 9.27it/s] 175it [00:18, 9.33it/s] 176it [00:19, 9.37it/s] 177it [00:19, 9.43it/s] 178it [00:19, 9.48it/s] 179it [00:19, 9.45it/s] 180it [00:19, 9.46it/s] 181it [00:19, 9.53it/s] 182it [00:19, 8.97it/s] 183it [00:19, 9.10it/s] 184it [00:19, 9.22it/s] 185it [00:20, 9.34it/s] 186it [00:20, 9.42it/s] 187it [00:20, 9.05it/s] 188it [00:20, 9.18it/s] 189it [00:20, 9.32it/s] 190it [00:20, 9.38it/s] 191it [00:20, 9.43it/s] 192it [00:20, 9.42it/s] 193it [00:20, 9.52it/s] 194it [00:20, 9.47it/s] 195it [00:21, 8.88it/s] 196it [00:21, 9.04it/s] 196it [00:21, 9.22it/s] +2025-05-26 05:46:58,001 - INFO - Epoch: 5, Objective: tensor([12165.8643], device='cuda:0', grad_fn=), Loss: 0.1356792002916336, KL/n: 71.50433349609375 + 0it [00:00, ?it/s]2025-05-26 05:46:58,464 - INFO - [Epoch 006 | Batch 0000] IWAE-loss 17046.0859 | mean log_px -0.1989 | KL -3502.32 + 1it [00:00, 4.62it/s] 2it [00:00, 6.59it/s] 3it [00:00, 7.71it/s] 4it [00:00, 8.27it/s] 5it [00:00, 8.55it/s] 6it [00:00, 8.78it/s] 7it [00:00, 9.06it/s] 8it [00:00, 9.21it/s] 9it [00:01, 8.72it/s] 10it [00:01, 8.90it/s] 11it [00:01, 9.10it/s] 12it [00:01, 9.24it/s] 13it [00:01, 9.37it/s] 14it [00:01, 9.35it/s] 15it [00:01, 9.39it/s] 16it [00:01, 9.40it/s] 17it [00:01, 9.41it/s] 18it [00:02, 8.89it/s] 19it [00:02, 9.10it/s] 20it [00:02, 9.22it/s] 21it [00:02, 9.24it/s] 22it [00:02, 8.88it/s] 23it [00:02, 9.06it/s] 24it [00:02, 9.13it/s] 25it [00:02, 9.18it/s] 26it [00:02, 9.19it/s] 27it [00:03, 9.25it/s] 28it [00:03, 9.22it/s] 29it [00:03, 9.33it/s] 30it [00:03, 9.30it/s] 31it [00:03, 9.33it/s] 32it [00:03, 9.34it/s] 33it [00:03, 9.44it/s] 34it [00:03, 9.47it/s] 35it [00:03, 9.52it/s] 36it [00:03, 9.46it/s] 37it [00:04, 9.45it/s] 38it [00:04, 9.48it/s] 39it [00:04, 9.45it/s] 40it [00:04, 9.44it/s] 41it [00:04, 9.45it/s] 42it [00:04, 9.49it/s] 43it [00:04, 9.52it/s] 44it [00:04, 9.47it/s] 45it [00:04, 9.48it/s] 46it [00:05, 9.44it/s] 47it [00:05, 9.45it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.54it/s] 50it [00:05, 9.57it/s]2025-05-26 05:47:03,842 - INFO - [Epoch 006 | Batch 0050] IWAE-loss 15465.3457 | mean log_px -0.1867 | KL -3503.66 + 51it [00:05, 9.48it/s] 52it [00:05, 9.49it/s] 53it [00:05, 9.54it/s] 54it [00:05, 9.61it/s] 55it [00:05, 9.66it/s] 56it [00:06, 9.66it/s] 57it [00:06, 9.51it/s] 58it [00:06, 9.20it/s] 59it [00:06, 9.24it/s] 60it [00:06, 9.37it/s] 61it [00:06, 9.50it/s] 62it [00:06, 9.59it/s] 63it [00:06, 9.67it/s] 64it [00:06, 9.65it/s] 65it [00:07, 9.49it/s] 66it [00:07, 9.54it/s] 67it [00:07, 9.60it/s] 68it [00:07, 9.62it/s] 69it [00:07, 9.65it/s] 70it [00:07, 9.65it/s] 71it [00:07, 9.70it/s] 72it [00:07, 9.72it/s] 73it [00:07, 9.75it/s] 74it [00:07, 9.72it/s] 75it [00:08, 9.68it/s] 76it [00:08, 9.69it/s] 77it [00:08, 9.73it/s] 78it [00:08, 9.76it/s] 79it [00:08, 9.75it/s] 80it [00:08, 9.75it/s] 81it [00:08, 9.76it/s] 82it [00:08, 9.73it/s] 83it [00:08, 9.73it/s] 84it [00:08, 9.72it/s] 85it [00:09, 9.72it/s] 86it [00:09, 9.70it/s] 87it [00:09, 9.74it/s] 88it [00:09, 9.71it/s] 89it [00:09, 9.74it/s] 90it [00:09, 9.76it/s] 91it [00:09, 9.79it/s] 92it [00:09, 9.79it/s] 93it [00:09, 9.81it/s] 94it [00:10, 9.80it/s] 95it [00:10, 9.81it/s] 96it [00:10, 9.81it/s] 97it [00:10, 9.82it/s] 98it [00:10, 9.78it/s] 99it [00:10, 9.75it/s] 100it [00:10, 9.76it/s]2025-05-26 05:47:09,010 - INFO - [Epoch 006 | Batch 0100] IWAE-loss 16232.7539 | mean log_px -0.1872 | KL -3505.36 + 101it [00:10, 9.76it/s] 102it [00:10, 9.76it/s] 103it [00:10, 9.75it/s] 104it [00:11, 9.77it/s] 105it [00:11, 9.77it/s] 106it [00:11, 9.76it/s] 107it [00:11, 9.77it/s] 108it [00:11, 9.76it/s] 109it [00:11, 9.76it/s] 110it [00:11, 9.76it/s] 111it [00:11, 9.79it/s] 112it [00:11, 9.62it/s] 113it [00:11, 9.60it/s] 114it [00:12, 9.50it/s] 115it [00:12, 9.48it/s] 116it [00:12, 9.45it/s] 117it [00:12, 9.41it/s] 118it [00:12, 9.39it/s] 119it [00:12, 9.43it/s] 120it [00:12, 9.40it/s] 121it [00:12, 9.41it/s] 122it [00:12, 9.41it/s] 123it [00:13, 9.47it/s] 124it [00:13, 9.42it/s] 125it [00:13, 9.46it/s] 126it [00:13, 9.47it/s] 127it [00:13, 9.46it/s] 128it [00:13, 9.41it/s] 129it [00:13, 9.47it/s] 130it [00:13, 9.44it/s] 131it [00:13, 9.45it/s] 132it [00:13, 9.44it/s] 133it [00:14, 9.43it/s] 134it [00:14, 9.48it/s] 135it [00:14, 9.51it/s] 136it [00:14, 9.50it/s] 137it [00:14, 9.49it/s] 138it [00:14, 9.49it/s] 139it [00:14, 9.54it/s] 140it [00:14, 9.52it/s] 141it [00:14, 9.51it/s] 142it [00:15, 9.51it/s] 143it [00:15, 9.53it/s] 144it [00:15, 9.46it/s] 145it [00:15, 9.50it/s] 146it [00:15, 9.44it/s] 147it [00:15, 9.45it/s] 148it [00:15, 9.44it/s] 149it [00:15, 9.45it/s] 150it [00:15, 9.40it/s]2025-05-26 05:47:14,267 - INFO - [Epoch 006 | Batch 0150] IWAE-loss 16457.2578 | mean log_px -0.1880 | KL -3506.98 + 151it [00:15, 9.40it/s] 152it [00:16, 9.36it/s] 153it [00:16, 9.38it/s] 154it [00:16, 8.78it/s] 155it [00:16, 8.95it/s] 156it [00:16, 8.96it/s] 157it [00:16, 9.10it/s] 158it [00:16, 9.20it/s] 159it [00:16, 9.30it/s] 160it [00:16, 9.32it/s] 161it [00:17, 9.36it/s] 162it [00:17, 9.39it/s] 163it [00:17, 9.35it/s] 164it [00:17, 9.35it/s] 165it [00:17, 9.37it/s] 166it [00:17, 9.40it/s] 167it [00:17, 9.42it/s] 168it [00:17, 9.41it/s] 169it [00:17, 9.43it/s] 170it [00:18, 9.44it/s] 171it [00:18, 9.46it/s] 172it [00:18, 9.38it/s] 173it [00:18, 9.42it/s] 174it [00:18, 9.42it/s] 175it [00:18, 9.48it/s] 176it [00:18, 9.43it/s] 177it [00:18, 9.45it/s] 178it [00:18, 9.45it/s] 179it [00:18, 9.48it/s] 180it [00:19, 9.48it/s] 181it [00:19, 9.51it/s] 182it [00:19, 9.48it/s] 183it [00:19, 9.59it/s] 184it [00:19, 9.64it/s] 185it [00:19, 9.66it/s] 186it [00:19, 9.66it/s] 187it [00:19, 9.71it/s] 188it [00:19, 9.75it/s] 189it [00:20, 9.77it/s] 190it [00:20, 9.74it/s] 191it [00:20, 9.76it/s] 192it [00:20, 9.76it/s] 193it [00:20, 9.79it/s] 194it [00:20, 9.76it/s] 195it [00:20, 9.18it/s] 196it [00:20, 9.41it/s] +2025-05-26 05:47:19,144 - INFO - Epoch: 6, Objective: tensor([15376.6016], device='cuda:0', grad_fn=), Loss: 0.17358337342739105, KL/n: 71.75361633300781 + 0it [00:00, ?it/s]2025-05-26 05:47:19,427 - INFO - [Epoch 007 | Batch 0000] IWAE-loss 17575.0977 | mean log_px -0.2084 | KL -3514.32 + 1it [00:00, 5.20it/s] 2it [00:00, 7.18it/s] 3it [00:00, 8.18it/s] 4it [00:00, 8.74it/s] 5it [00:00, 9.06it/s] 6it [00:00, 8.64it/s] 7it [00:00, 8.97it/s] 8it [00:00, 9.14it/s] 9it [00:01, 9.27it/s] 10it [00:01, 9.37it/s] 11it [00:01, 9.53it/s] 12it [00:01, 9.55it/s] 13it [00:01, 9.65it/s] 14it [00:01, 9.66it/s] 15it [00:01, 9.72it/s] 16it [00:01, 9.72it/s] 17it [00:01, 9.78it/s] 18it [00:01, 9.77it/s] 19it [00:02, 9.78it/s] 20it [00:02, 9.15it/s] 21it [00:02, 9.34it/s] 22it [00:02, 9.41it/s] 23it [00:02, 9.52it/s] 24it [00:02, 9.58it/s] 25it [00:02, 9.65it/s] 26it [00:02, 9.66it/s] 27it [00:02, 9.70it/s] 28it [00:03, 9.70it/s] 29it [00:03, 9.75it/s] 30it [00:03, 9.76it/s] 31it [00:03, 9.75it/s] 32it [00:03, 9.75it/s] 33it [00:03, 9.78it/s] 34it [00:03, 9.76it/s] 35it [00:03, 9.14it/s] 36it [00:03, 9.29it/s] 37it [00:03, 9.45it/s] 38it [00:04, 9.51it/s] 39it [00:04, 9.59it/s] 40it [00:04, 9.63it/s] 41it [00:04, 9.06it/s] 42it [00:04, 9.26it/s] 43it [00:04, 9.45it/s] 44it [00:04, 9.51it/s] 45it [00:04, 9.58it/s] 46it [00:04, 9.63it/s] 47it [00:05, 9.67it/s] 48it [00:05, 9.69it/s] 49it [00:05, 9.73it/s] 50it [00:05, 9.74it/s]2025-05-26 05:47:24,650 - INFO - [Epoch 007 | Batch 0050] IWAE-loss 11222.3057 | mean log_px -0.1177 | KL -3518.79 + 51it [00:05, 9.73it/s] 52it [00:05, 9.72it/s] 53it [00:05, 9.76it/s] 54it [00:05, 9.73it/s] 55it [00:05, 9.72it/s] 56it [00:05, 9.72it/s] 57it [00:06, 9.74it/s] 58it [00:06, 9.74it/s] 59it [00:06, 9.77it/s] 60it [00:06, 9.77it/s] 61it [00:06, 9.78it/s] 62it [00:06, 9.77it/s] 63it [00:06, 9.14it/s] 64it [00:06, 9.29it/s] 65it [00:06, 9.44it/s] 66it [00:06, 9.42it/s] 67it [00:07, 9.56it/s] 68it [00:07, 9.64it/s] 69it [00:07, 9.74it/s] 70it [00:07, 9.78it/s] 71it [00:07, 9.83it/s] 72it [00:07, 9.21it/s] 73it [00:07, 9.40it/s] 74it [00:07, 9.52it/s] 75it [00:07, 9.64it/s] 76it [00:08, 9.09it/s] 77it [00:08, 9.30it/s] 78it [00:08, 9.44it/s] 79it [00:08, 9.57it/s] 80it [00:08, 9.07it/s] 81it [00:08, 9.31it/s] 82it [00:08, 9.44it/s] 83it [00:08, 9.56it/s] 84it [00:08, 9.07it/s] 85it [00:08, 9.29it/s] 86it [00:09, 9.42it/s] 87it [00:09, 8.97it/s] 88it [00:09, 9.20it/s] 89it [00:09, 9.39it/s] 90it [00:09, 9.51it/s] 91it [00:09, 9.02it/s] 92it [00:09, 9.24it/s] 93it [00:09, 9.42it/s] 94it [00:09, 9.53it/s] 95it [00:10, 9.11it/s] 96it [00:10, 9.11it/s] 97it [00:10, 9.23it/s] 98it [00:10, 8.76it/s] 99it [00:10, 8.92it/s] 100it [00:10, 9.11it/s]2025-05-26 05:47:29,972 - INFO - [Epoch 007 | Batch 0100] IWAE-loss 15323.3848 | mean log_px -0.1767 | KL -3517.25 + 101it [00:10, 9.26it/s] 102it [00:10, 8.84it/s] 103it [00:10, 9.10it/s] 104it [00:11, 8.75it/s] 105it [00:11, 9.01it/s] 106it [00:11, 9.20it/s] 107it [00:11, 9.36it/s] 108it [00:11, 8.89it/s] 109it [00:11, 9.14it/s] 110it [00:11, 9.35it/s] 111it [00:11, 9.49it/s] 112it [00:11, 9.58it/s] 113it [00:12, 9.66it/s] 114it [00:12, 9.71it/s] 115it [00:12, 9.75it/s] 116it [00:12, 9.79it/s] 117it [00:12, 9.83it/s] 118it [00:12, 9.81it/s] 119it [00:12, 9.19it/s] 120it [00:12, 9.37it/s] 121it [00:12, 9.50it/s] 122it [00:12, 9.60it/s] 123it [00:13, 9.69it/s] 124it [00:13, 9.73it/s] 125it [00:13, 9.77it/s] 126it [00:13, 9.79it/s] 127it [00:13, 9.80it/s] 128it [00:13, 9.79it/s] 129it [00:13, 9.81it/s] 130it [00:13, 9.81it/s] 131it [00:13, 9.80it/s] 132it [00:13, 9.82it/s] 133it [00:14, 9.76it/s] 134it [00:14, 9.60it/s] 135it [00:14, 9.60it/s] 136it [00:14, 9.02it/s] 137it [00:14, 9.22it/s] 138it [00:14, 9.26it/s] 139it [00:14, 9.36it/s] 140it [00:14, 9.41it/s] 141it [00:14, 9.47it/s] 142it [00:15, 9.49it/s] 143it [00:15, 9.57it/s] 144it [00:15, 9.55it/s] 145it [00:15, 9.52it/s] 146it [00:15, 9.52it/s] 147it [00:15, 9.51it/s] 148it [00:15, 8.94it/s] 149it [00:15, 9.09it/s] 150it [00:15, 9.19it/s]2025-05-26 05:47:35,258 - INFO - [Epoch 007 | Batch 0150] IWAE-loss 19223.7129 | mean log_px -0.2297 | KL -3526.62 + 151it [00:16, 9.27it/s] 152it [00:16, 8.78it/s] 153it [00:16, 9.00it/s] 154it [00:16, 9.17it/s] 155it [00:16, 9.27it/s] 156it [00:16, 9.25it/s] 157it [00:16, 8.66it/s] 158it [00:16, 8.59it/s] 159it [00:16, 8.83it/s] 160it [00:17, 8.99it/s] 161it [00:17, 9.14it/s] 162it [00:17, 9.23it/s] 163it [00:17, 9.31it/s] 164it [00:17, 9.40it/s] 165it [00:17, 9.40it/s] 166it [00:17, 9.40it/s] 167it [00:17, 9.41it/s] 168it [00:17, 8.94it/s] 169it [00:18, 9.10it/s] 170it [00:18, 9.22it/s] 171it [00:18, 9.29it/s] 172it [00:18, 9.39it/s] 173it [00:18, 8.88it/s] 174it [00:18, 9.07it/s] 175it [00:18, 9.28it/s] 176it [00:18, 9.39it/s] 177it [00:18, 9.47it/s] 178it [00:18, 9.54it/s] 179it [00:19, 9.55it/s] 180it [00:19, 9.56it/s] 181it [00:19, 9.59it/s] 182it [00:19, 9.03it/s] 183it [00:19, 9.17it/s] 184it [00:19, 9.25it/s] 185it [00:19, 9.31it/s] 186it [00:19, 9.38it/s] 187it [00:19, 9.43it/s] 188it [00:20, 9.47it/s] 189it [00:20, 9.48it/s] 190it [00:20, 9.46it/s] 191it [00:20, 9.41it/s] 192it [00:20, 9.49it/s] 193it [00:20, 9.51it/s] 194it [00:20, 9.52it/s] 195it [00:20, 8.91it/s] 196it [00:20, 9.11it/s] 196it [00:20, 9.35it/s] +2025-05-26 05:47:40,237 - INFO - Epoch: 7, Objective: tensor([11751.9316], device='cuda:0', grad_fn=), Loss: 0.11317390948534012, KL/n: 71.94717407226562 + 0it [00:00, ?it/s]2025-05-26 05:47:40,687 - INFO - [Epoch 008 | Batch 0000] IWAE-loss 14055.2070 | mean log_px -0.1545 | KL -3523.18 + 1it [00:00, 4.83it/s] 2it [00:00, 6.67it/s] 3it [00:00, 7.40it/s] 4it [00:00, 7.89it/s] 5it [00:00, 8.35it/s] 6it [00:00, 8.66it/s] 7it [00:00, 9.01it/s] 8it [00:00, 9.22it/s] 9it [00:01, 9.39it/s] 10it [00:01, 8.94it/s] 11it [00:01, 9.20it/s] 12it [00:01, 9.35it/s] 13it [00:01, 9.47it/s] 14it [00:01, 9.44it/s] 15it [00:01, 9.39it/s] 16it [00:01, 9.35it/s] 17it [00:01, 9.53it/s] 18it [00:02, 9.65it/s] 20it [00:02, 9.82it/s] 22it [00:02, 9.90it/s] 24it [00:02, 9.95it/s] 26it [00:02, 9.98it/s] 28it [00:03, 9.99it/s] 29it [00:03, 9.58it/s] 30it [00:03, 9.66it/s] 32it [00:03, 9.80it/s] 34it [00:03, 9.88it/s] 36it [00:03, 9.93it/s] 38it [00:04, 9.99it/s] 40it [00:04, 10.02it/s] 42it [00:04, 10.05it/s] 44it [00:04, 9.99it/s] 45it [00:04, 9.98it/s] 46it [00:04, 9.93it/s] 47it [00:04, 9.91it/s] 48it [00:05, 9.89it/s] 49it [00:05, 9.33it/s]2025-05-26 05:47:45,877 - INFO - [Epoch 008 | Batch 0050] IWAE-loss 12810.5664 | mean log_px -0.1418 | KL -3528.74 + 51it [00:05, 9.64it/s] 53it [00:05, 9.82it/s] 55it [00:05, 9.93it/s] 57it [00:05, 10.00it/s] 59it [00:06, 10.04it/s] 61it [00:06, 10.07it/s] 63it [00:06, 10.09it/s] 65it [00:06, 10.10it/s] 67it [00:06, 10.11it/s] 69it [00:07, 9.86it/s] 71it [00:07, 9.95it/s] 73it [00:07, 10.00it/s] 75it [00:07, 10.05it/s] 77it [00:07, 10.08it/s] 79it [00:08, 10.08it/s] 81it [00:08, 10.09it/s] 83it [00:08, 9.66it/s] 85it [00:08, 9.79it/s] 87it [00:08, 9.90it/s] 89it [00:09, 9.63it/s] 91it [00:09, 9.77it/s] 92it [00:09, 9.51it/s] 94it [00:09, 9.69it/s] 96it [00:09, 9.81it/s] 98it [00:10, 9.91it/s] 100it [00:10, 9.97it/s]2025-05-26 05:47:50,906 - INFO - [Epoch 008 | Batch 0100] IWAE-loss 9847.4746 | mean log_px -0.0930 | KL -3528.36 + 101it [00:10, 9.67it/s] 103it [00:10, 9.81it/s] 105it [00:10, 9.91it/s] 107it [00:11, 9.97it/s] 109it [00:11, 10.01it/s] 111it [00:11, 10.04it/s] 113it [00:11, 10.06it/s] 115it [00:11, 10.09it/s] 117it [00:11, 10.10it/s] 119it [00:12, 10.10it/s] 121it [00:12, 10.10it/s] 123it [00:12, 10.11it/s] 125it [00:12, 9.84it/s] 127it [00:13, 9.89it/s] 128it [00:13, 9.54it/s] 130it [00:13, 9.73it/s] 132it [00:13, 9.85it/s] 134it [00:13, 9.91it/s] 136it [00:13, 9.97it/s] 138it [00:14, 9.67it/s] 140it [00:14, 9.81it/s] 142it [00:14, 9.90it/s] 144it [00:14, 9.97it/s] 146it [00:14, 10.01it/s] 148it [00:15, 9.89it/s] 150it [00:15, 9.96it/s]2025-05-26 05:47:55,945 - INFO - [Epoch 008 | Batch 0150] IWAE-loss 11725.8896 | mean log_px -0.1225 | KL -3532.75 + 152it [00:15, 9.99it/s] 154it [00:15, 10.02it/s] 156it [00:15, 10.05it/s] 158it [00:16, 10.07it/s] 160it [00:16, 10.08it/s] 162it [00:16, 10.09it/s] 164it [00:16, 10.10it/s] 166it [00:16, 10.10it/s] 168it [00:17, 10.10it/s] 170it [00:17, 10.11it/s] 172it [00:17, 10.12it/s] 174it [00:17, 10.12it/s] 176it [00:17, 10.11it/s] 178it [00:18, 10.11it/s] 180it [00:18, 10.11it/s] 182it [00:18, 10.11it/s] 184it [00:18, 10.11it/s] 186it [00:18, 10.10it/s] 188it [00:19, 10.10it/s] 190it [00:19, 10.11it/s] 192it [00:19, 10.12it/s] 194it [00:19, 10.11it/s] 196it [00:19, 9.75it/s] 196it [00:19, 9.81it/s] +2025-05-26 05:48:00,529 - INFO - Epoch: 8, Objective: tensor([19531.0215], device='cuda:0', grad_fn=), Loss: 0.22876138985157013, KL/n: 72.13713073730469 + 0it [00:00, ?it/s]2025-05-26 05:48:00,806 - INFO - [Epoch 009 | Batch 0000] IWAE-loss 15139.6064 | mean log_px -0.1711 | KL -3532.32 + 1it [00:00, 5.29it/s] 3it [00:00, 8.16it/s] 4it [00:00, 8.71it/s] 6it [00:00, 9.27it/s] 7it [00:00, 9.43it/s] 8it [00:00, 9.10it/s] 10it [00:01, 9.47it/s] 12it [00:01, 9.67it/s] 14it [00:01, 9.78it/s] 16it [00:01, 9.58it/s] 18it [00:01, 9.72it/s] 20it [00:02, 9.82it/s] 22it [00:02, 9.89it/s] 24it [00:02, 9.93it/s] 26it [00:02, 9.95it/s] 28it [00:02, 9.63it/s] 29it [00:03, 9.68it/s] 30it [00:03, 9.70it/s] 31it [00:03, 9.77it/s] 32it [00:03, 9.81it/s] 34it [00:03, 9.91it/s] 36it [00:03, 9.94it/s] 38it [00:03, 9.92it/s] 39it [00:04, 9.90it/s] 40it [00:04, 9.91it/s] 42it [00:04, 9.95it/s] 44it [00:04, 9.94it/s] 46it [00:04, 9.81it/s] 47it [00:04, 9.44it/s] 48it [00:04, 9.51it/s] 49it [00:05, 9.62it/s] 50it [00:05, 9.71it/s]2025-05-26 05:48:05,911 - INFO - [Epoch 009 | Batch 0050] IWAE-loss 10535.8184 | mean log_px -0.1103 | KL -3535.26 + 51it [00:05, 9.77it/s] 52it [00:05, 9.83it/s] 54it [00:05, 9.93it/s] 56it [00:05, 9.62it/s] 58it [00:06, 9.76it/s] 60it [00:06, 9.85it/s] 61it [00:06, 9.85it/s] 62it [00:06, 9.87it/s] 64it [00:06, 9.89it/s] 65it [00:06, 9.46it/s] 66it [00:06, 9.29it/s] 68it [00:07, 9.18it/s] 69it [00:07, 9.34it/s] 70it [00:07, 9.49it/s] 72it [00:07, 9.72it/s] 73it [00:07, 9.78it/s] 74it [00:07, 9.83it/s] 76it [00:07, 9.51it/s] 77it [00:07, 9.60it/s] 78it [00:08, 9.69it/s] 80it [00:08, 9.82it/s] 82it [00:08, 9.89it/s] 84it [00:08, 9.94it/s] 86it [00:08, 9.95it/s] 88it [00:09, 9.96it/s] 90it [00:09, 9.98it/s] 92it [00:09, 9.98it/s] 93it [00:09, 9.85it/s] 94it [00:09, 9.56it/s] 96it [00:09, 9.73it/s] 97it [00:10, 9.35it/s] 98it [00:10, 9.49it/s] 100it [00:10, 9.69it/s]2025-05-26 05:48:11,055 - INFO - [Epoch 009 | Batch 0100] IWAE-loss 12649.1650 | mean log_px -0.1434 | KL -3534.93 + 101it [00:10, 9.75it/s] 102it [00:10, 9.81it/s] 103it [00:10, 9.86it/s] 104it [00:10, 9.87it/s] 106it [00:10, 9.95it/s] 107it [00:11, 9.55it/s] 108it [00:11, 9.53it/s] 109it [00:11, 9.63it/s] 110it [00:11, 9.72it/s] 112it [00:11, 9.85it/s] 114it [00:11, 9.48it/s] 115it [00:11, 9.59it/s] 116it [00:11, 9.67it/s] 118it [00:12, 9.82it/s] 120it [00:12, 9.90it/s] 122it [00:12, 9.95it/s] 123it [00:12, 9.96it/s] 124it [00:12, 9.49it/s] 126it [00:13, 9.69it/s] 128it [00:13, 9.81it/s] 130it [00:13, 9.89it/s] 132it [00:13, 9.94it/s] 133it [00:13, 9.94it/s] 134it [00:13, 9.93it/s] 136it [00:14, 9.97it/s] 138it [00:14, 10.00it/s] 140it [00:14, 9.72it/s] 142it [00:14, 9.82it/s] 144it [00:14, 9.87it/s] 146it [00:15, 9.92it/s] 148it [00:15, 9.95it/s] 150it [00:15, 9.98it/s]2025-05-26 05:48:16,137 - INFO - [Epoch 009 | Batch 0150] IWAE-loss 14599.3418 | mean log_px -0.1665 | KL -3540.62 + 151it [00:15, 9.72it/s] 152it [00:15, 9.77it/s] 154it [00:15, 9.87it/s] 156it [00:16, 9.92it/s] 158it [00:16, 9.96it/s] 160it [00:16, 9.98it/s] 162it [00:16, 10.00it/s] 164it [00:16, 10.02it/s] 166it [00:17, 10.04it/s] 168it [00:17, 10.03it/s] 170it [00:17, 10.03it/s] 172it [00:17, 10.04it/s] 174it [00:17, 10.03it/s] 176it [00:18, 10.02it/s] 178it [00:18, 10.02it/s] 180it [00:18, 10.02it/s] 182it [00:18, 10.01it/s] 184it [00:18, 10.01it/s] 186it [00:19, 10.01it/s] 188it [00:19, 10.02it/s] 190it [00:19, 9.68it/s] 191it [00:19, 9.69it/s] 192it [00:19, 9.67it/s] 194it [00:19, 9.47it/s] 195it [00:19, 9.28it/s] 196it [00:20, 9.73it/s] +2025-05-26 05:48:20,801 - INFO - Epoch: 9, Objective: tensor([12982.9697], device='cuda:0', grad_fn=), Loss: 0.14898112416267395, KL/n: 72.30970001220703 + 0it [00:00, ?it/s]2025-05-26 05:48:21,255 - INFO - [Epoch 010 | Batch 0000] IWAE-loss 13698.6484 | mean log_px -0.1451 | KL -3541.10 + 1it [00:00, 5.50it/s] 3it [00:00, 8.31it/s] 5it [00:00, 9.08it/s] 6it [00:00, 9.31it/s] 7it [00:00, 9.08it/s] 9it [00:00, 9.51it/s] 11it [00:01, 9.74it/s] 13it [00:01, 9.86it/s] 15it [00:01, 9.95it/s] 17it [00:01, 10.00it/s] 19it [00:01, 10.03it/s] 21it [00:02, 9.95it/s] 22it [00:02, 9.95it/s] 23it [00:02, 9.96it/s] 24it [00:02, 9.88it/s] 25it [00:02, 9.89it/s] 27it [00:02, 9.98it/s] 29it [00:02, 10.04it/s] 31it [00:03, 10.06it/s] 33it [00:03, 10.08it/s] 35it [00:03, 9.72it/s] 37it [00:03, 9.84it/s] 39it [00:04, 9.92it/s] 40it [00:04, 9.93it/s] 42it [00:04, 9.95it/s] 44it [00:04, 10.00it/s] 45it [00:04, 9.60it/s] 47it [00:04, 9.78it/s] 49it [00:05, 9.88it/s]2025-05-26 05:48:26,292 - INFO - [Epoch 010 | Batch 0050] IWAE-loss 15355.1699 | mean log_px -0.1796 | KL -3543.84 + 51it [00:05, 9.95it/s] 53it [00:05, 9.99it/s] 55it [00:05, 10.02it/s] 57it [00:05, 10.04it/s] 59it [00:06, 10.06it/s] 61it [00:06, 10.08it/s] 63it [00:06, 10.09it/s] 65it [00:06, 10.10it/s] 67it [00:06, 10.10it/s] 69it [00:06, 10.10it/s] 71it [00:07, 9.76it/s] 73it [00:07, 9.86it/s] 75it [00:07, 9.93it/s] 77it [00:07, 9.98it/s] 79it [00:08, 10.02it/s] 81it [00:08, 10.05it/s] 83it [00:08, 10.07it/s] 85it [00:08, 10.00it/s] 87it [00:08, 10.02it/s] 89it [00:09, 10.04it/s] 91it [00:09, 10.04it/s] 93it [00:09, 10.05it/s] 95it [00:09, 10.06it/s] 97it [00:09, 10.08it/s] 99it [00:09, 10.09it/s]2025-05-26 05:48:31,271 - INFO - [Epoch 010 | Batch 0100] IWAE-loss 10181.3457 | mean log_px -0.1026 | KL -3547.27 + 101it [00:10, 9.75it/s] 103it [00:10, 9.86it/s] 105it [00:10, 9.93it/s] 107it [00:10, 9.70it/s] 108it [00:10, 9.75it/s] 110it [00:11, 9.86it/s] 112it [00:11, 9.94it/s] 114it [00:11, 10.00it/s] 116it [00:11, 10.02it/s] 118it [00:11, 10.05it/s] 120it [00:12, 10.07it/s] 122it [00:12, 10.08it/s] 124it [00:12, 10.10it/s] 126it [00:12, 10.09it/s] 128it [00:12, 10.11it/s] 130it [00:13, 10.11it/s] 132it [00:13, 10.10it/s] 134it [00:13, 10.01it/s] 136it [00:13, 10.04it/s] 138it [00:13, 10.06it/s] 140it [00:14, 9.73it/s] 141it [00:14, 9.43it/s] 142it [00:14, 9.53it/s] 143it [00:14, 9.62it/s] 144it [00:14, 9.70it/s] 145it [00:14, 9.28it/s] 147it [00:14, 9.59it/s] 149it [00:15, 9.38it/s]2025-05-26 05:48:36,365 - INFO - [Epoch 010 | Batch 0150] IWAE-loss 12556.6738 | mean log_px -0.1344 | KL -3543.33 + 151it [00:15, 9.59it/s] 153it [00:15, 9.39it/s] 155it [00:15, 9.60it/s] 157it [00:15, 9.76it/s] 158it [00:16, 9.44it/s] 160it [00:16, 9.66it/s] 162it [00:16, 9.80it/s] 164it [00:16, 9.90it/s] 166it [00:16, 9.99it/s] 168it [00:17, 10.02it/s] 170it [00:17, 10.06it/s] 172it [00:17, 10.05it/s] 174it [00:17, 10.02it/s] 176it [00:17, 9.52it/s] 178it [00:18, 9.69it/s] 180it [00:18, 9.81it/s] 181it [00:18, 9.48it/s] 183it [00:18, 9.69it/s] 185it [00:18, 9.83it/s] 186it [00:18, 9.85it/s] 188it [00:19, 9.59it/s] 190it [00:19, 9.68it/s] 191it [00:19, 9.30it/s] 192it [00:19, 9.42it/s] 194it [00:19, 9.67it/s] 195it [00:19, 9.42it/s] 196it [00:19, 9.80it/s] +2025-05-26 05:48:41,104 - INFO - Epoch: 10, Objective: tensor([15107.3916], device='cuda:0', grad_fn=), Loss: 0.16303861141204834, KL/n: 72.43524169921875 + 0it [00:00, ?it/s]2025-05-26 05:48:41,393 - INFO - [Epoch 011 | Batch 0000] IWAE-loss 10246.0049 | mean log_px -0.1013 | KL -3548.55 + 1it [00:00, 4.67it/s] 2it [00:00, 6.74it/s] 3it [00:00, 7.90it/s] 4it [00:00, 8.58it/s] 6it [00:00, 9.28it/s] 7it [00:00, 9.02it/s] 8it [00:00, 9.27it/s] 10it [00:01, 9.14it/s] 12it [00:01, 9.42it/s] 13it [00:01, 9.54it/s] 14it [00:01, 9.59it/s] 16it [00:01, 9.75it/s] 18it [00:01, 9.83it/s] 19it [00:02, 9.85it/s] 20it [00:02, 9.86it/s] 21it [00:02, 9.87it/s] 22it [00:02, 9.88it/s] 24it [00:02, 9.92it/s] 26it [00:02, 9.95it/s] 27it [00:02, 9.95it/s] 28it [00:02, 9.93it/s] 29it [00:03, 9.94it/s] 30it [00:03, 9.94it/s] 32it [00:03, 9.96it/s] 33it [00:03, 9.56it/s] 34it [00:03, 9.64it/s] 35it [00:03, 9.73it/s] 36it [00:03, 9.79it/s] 37it [00:03, 9.85it/s] 38it [00:03, 9.86it/s] 40it [00:04, 9.93it/s] 41it [00:04, 9.94it/s] 42it [00:04, 9.38it/s] 43it [00:04, 9.53it/s] 44it [00:04, 9.52it/s] 45it [00:04, 9.55it/s] 46it [00:04, 9.19it/s] 47it [00:04, 9.40it/s] 48it [00:05, 9.53it/s] 49it [00:05, 9.66it/s] 50it [00:05, 9.23it/s]2025-05-26 05:48:46,577 - INFO - [Epoch 011 | Batch 0050] IWAE-loss 13919.8701 | mean log_px -0.1529 | KL -3551.17 + 51it [00:05, 9.40it/s] 52it [00:05, 9.54it/s] 53it [00:05, 9.65it/s] 54it [00:05, 9.74it/s] 55it [00:05, 9.81it/s] 56it [00:05, 9.85it/s] 57it [00:05, 9.88it/s] 58it [00:06, 9.89it/s] 59it [00:06, 9.92it/s] 60it [00:06, 9.92it/s] 61it [00:06, 9.94it/s] 62it [00:06, 9.93it/s] 63it [00:06, 9.93it/s] 64it [00:06, 9.89it/s] 66it [00:06, 9.95it/s] 67it [00:06, 9.96it/s] 68it [00:07, 9.95it/s] 69it [00:07, 9.50it/s] 70it [00:07, 9.61it/s] 71it [00:07, 9.71it/s] 72it [00:07, 9.77it/s] 73it [00:07, 9.84it/s] 74it [00:07, 9.86it/s] 75it [00:07, 9.88it/s] 76it [00:07, 9.90it/s] 77it [00:08, 9.93it/s] 78it [00:08, 9.39it/s] 80it [00:08, 9.66it/s] 81it [00:08, 9.74it/s] 82it [00:08, 9.79it/s] 83it [00:08, 9.83it/s] 84it [00:08, 9.86it/s] 85it [00:08, 9.86it/s] 86it [00:08, 9.33it/s] 87it [00:09, 9.51it/s] 88it [00:09, 9.23it/s] 89it [00:09, 9.43it/s] 90it [00:09, 9.55it/s] 91it [00:09, 9.66it/s] 92it [00:09, 9.72it/s] 93it [00:09, 9.78it/s] 94it [00:09, 9.81it/s] 96it [00:09, 9.89it/s] 97it [00:10, 9.38it/s] 98it [00:10, 9.52it/s] 100it [00:10, 9.73it/s]2025-05-26 05:48:51,702 - INFO - [Epoch 011 | Batch 0100] IWAE-loss 11395.6230 | mean log_px -0.1321 | KL -3551.43 + 101it [00:10, 9.28it/s] 102it [00:10, 9.43it/s] 104it [00:10, 9.67it/s] 105it [00:10, 9.74it/s] 106it [00:11, 9.79it/s] 107it [00:11, 9.84it/s] 108it [00:11, 9.86it/s] 109it [00:11, 9.89it/s] 110it [00:11, 9.91it/s] 111it [00:11, 9.93it/s] 112it [00:11, 9.31it/s] 113it [00:11, 9.50it/s] 114it [00:11, 9.61it/s] 115it [00:11, 9.72it/s] 116it [00:12, 9.79it/s] 117it [00:12, 9.85it/s] 118it [00:12, 9.87it/s] 120it [00:12, 9.93it/s] 121it [00:12, 9.94it/s] 122it [00:12, 9.92it/s] 123it [00:12, 9.93it/s] 124it [00:12, 9.93it/s] 125it [00:12, 9.95it/s] 126it [00:13, 9.95it/s] 127it [00:13, 9.55it/s] 128it [00:13, 9.66it/s] 129it [00:13, 9.63it/s] 130it [00:13, 9.68it/s] 131it [00:13, 9.76it/s] 132it [00:13, 9.80it/s] 133it [00:13, 9.85it/s] 134it [00:13, 9.37it/s] 135it [00:13, 9.53it/s] 136it [00:14, 9.64it/s] 137it [00:14, 9.74it/s] 138it [00:14, 9.80it/s] 140it [00:14, 9.88it/s] 141it [00:14, 9.91it/s] 142it [00:14, 9.35it/s] 144it [00:14, 9.62it/s] 145it [00:15, 9.70it/s] 146it [00:15, 9.76it/s] 147it [00:15, 9.81it/s] 148it [00:15, 9.84it/s] 150it [00:15, 9.91it/s]2025-05-26 05:48:56,830 - INFO - [Epoch 011 | Batch 0150] IWAE-loss 14350.5879 | mean log_px -0.1595 | KL -3548.78 + 151it [00:15, 9.42it/s] 152it [00:15, 9.54it/s] 153it [00:15, 9.65it/s] 154it [00:15, 9.72it/s] 155it [00:16, 9.17it/s] 156it [00:16, 9.34it/s] 157it [00:16, 9.43it/s] 158it [00:16, 9.02it/s] 159it [00:16, 9.23it/s] 160it [00:16, 9.36it/s] 161it [00:16, 9.46it/s] 162it [00:16, 9.59it/s] 163it [00:16, 9.71it/s] 164it [00:17, 9.76it/s] 165it [00:17, 9.82it/s] 166it [00:17, 9.85it/s] 167it [00:17, 9.87it/s] 168it [00:17, 9.25it/s] 169it [00:17, 9.46it/s] 170it [00:17, 9.59it/s] 171it [00:17, 9.68it/s] 172it [00:17, 9.69it/s] 173it [00:17, 9.77it/s] 174it [00:18, 9.18it/s] 175it [00:18, 9.37it/s] 176it [00:18, 9.48it/s] 177it [00:18, 9.57it/s] 178it [00:18, 9.60it/s] 179it [00:18, 9.69it/s] 180it [00:18, 9.78it/s] 181it [00:18, 9.83it/s] 182it [00:18, 9.88it/s] 183it [00:18, 9.88it/s] 184it [00:19, 9.88it/s] 185it [00:19, 9.89it/s] 186it [00:19, 9.89it/s] 187it [00:19, 9.91it/s] 188it [00:19, 9.92it/s] 189it [00:19, 9.92it/s] 190it [00:19, 9.91it/s] 191it [00:19, 9.92it/s] 192it [00:19, 9.90it/s] 193it [00:19, 9.92it/s] 194it [00:20, 9.91it/s] 195it [00:20, 9.46it/s] 196it [00:20, 9.63it/s] +2025-05-26 05:49:01,608 - INFO - Epoch: 11, Objective: tensor([10451.8135], device='cuda:0', grad_fn=), Loss: 0.1001165509223938, KL/n: 72.5517807006836 + 0it [00:00, ?it/s]2025-05-26 05:49:02,037 - INFO - [Epoch 012 | Batch 0000] IWAE-loss 8402.5049 | mean log_px -0.0712 | KL -3554.51 + 1it [00:00, 5.36it/s] 2it [00:00, 7.34it/s] 4it [00:00, 8.83it/s] 5it [00:00, 9.16it/s] 6it [00:00, 9.36it/s] 8it [00:00, 9.66it/s] 10it [00:01, 9.80it/s] 11it [00:01, 9.82it/s] 12it [00:01, 9.84it/s] 14it [00:01, 9.92it/s] 15it [00:01, 9.93it/s] 16it [00:01, 9.94it/s] 18it [00:01, 9.98it/s] 20it [00:02, 9.99it/s] 22it [00:02, 9.99it/s] 24it [00:02, 10.00it/s] 26it [00:02, 10.00it/s] 28it [00:02, 10.00it/s] 30it [00:03, 9.99it/s] 31it [00:03, 9.91it/s] 32it [00:03, 9.81it/s] 34it [00:03, 9.88it/s] 35it [00:03, 9.87it/s] 36it [00:03, 9.85it/s] 37it [00:03, 9.35it/s] 38it [00:03, 9.49it/s] 39it [00:04, 9.53it/s] 40it [00:04, 9.64it/s] 41it [00:04, 9.65it/s] 42it [00:04, 9.73it/s] 43it [00:04, 9.76it/s] 44it [00:04, 9.18it/s] 46it [00:04, 9.55it/s] 48it [00:04, 9.74it/s] 50it [00:05, 9.83it/s]2025-05-26 05:49:07,140 - INFO - [Epoch 012 | Batch 0050] IWAE-loss 10922.4316 | mean log_px -0.1087 | KL -3553.06 + 51it [00:05, 9.41it/s] 52it [00:05, 9.53it/s] 54it [00:05, 9.72it/s] 56it [00:05, 9.82it/s] 57it [00:05, 9.85it/s] 58it [00:05, 9.88it/s] 60it [00:06, 9.94it/s] 61it [00:06, 9.94it/s] 62it [00:06, 9.95it/s] 63it [00:06, 9.72it/s] 64it [00:06, 9.21it/s] 65it [00:06, 9.41it/s] 66it [00:06, 9.44it/s] 67it [00:06, 9.58it/s] 68it [00:07, 9.69it/s] 69it [00:07, 9.76it/s] 70it [00:07, 9.19it/s] 71it [00:07, 9.40it/s] 72it [00:07, 9.55it/s] 74it [00:07, 9.76it/s] 76it [00:07, 9.85it/s] 78it [00:08, 9.91it/s] 79it [00:08, 9.92it/s] 80it [00:08, 9.45it/s] 81it [00:08, 9.43it/s] 82it [00:08, 9.38it/s] 83it [00:08, 9.46it/s] 84it [00:08, 9.51it/s] 85it [00:08, 9.60it/s] 86it [00:08, 9.63it/s] 87it [00:09, 9.68it/s] 88it [00:09, 9.70it/s] 89it [00:09, 9.73it/s] 90it [00:09, 9.73it/s] 91it [00:09, 9.77it/s] 92it [00:09, 9.73it/s] 93it [00:09, 9.75it/s] 94it [00:09, 9.75it/s] 96it [00:09, 9.88it/s] 98it [00:10, 9.94it/s] 100it [00:10, 9.98it/s]2025-05-26 05:49:12,296 - INFO - [Epoch 012 | Batch 0100] IWAE-loss 11670.1055 | mean log_px -0.1183 | KL -3560.71 + 101it [00:10, 9.98it/s] 102it [00:10, 9.48it/s] 104it [00:10, 9.70it/s] 105it [00:10, 9.76it/s] 107it [00:11, 9.87it/s] 108it [00:11, 9.88it/s] 110it [00:11, 9.94it/s] 112it [00:11, 9.96it/s] 114it [00:11, 9.98it/s] 116it [00:11, 9.99it/s] 118it [00:12, 9.71it/s] 120it [00:12, 9.81it/s] 122it [00:12, 9.60it/s] 124it [00:12, 9.72it/s] 126it [00:12, 9.81it/s] 128it [00:13, 9.88it/s] 130it [00:13, 9.92it/s] 132it [00:13, 9.95it/s] 134it [00:13, 9.98it/s] 136it [00:13, 9.99it/s] 138it [00:14, 9.99it/s] 140it [00:14, 10.00it/s] 142it [00:14, 10.01it/s] 144it [00:14, 10.01it/s] 146it [00:14, 10.01it/s] 148it [00:15, 10.01it/s] 150it [00:15, 10.02it/s]2025-05-26 05:49:17,347 - INFO - [Epoch 012 | Batch 0150] IWAE-loss 9823.7705 | mean log_px -0.0984 | KL -3558.63 + 152it [00:15, 10.01it/s] 154it [00:15, 10.02it/s] 156it [00:15, 10.03it/s] 158it [00:16, 10.02it/s] 160it [00:16, 9.79it/s] 162it [00:16, 9.85it/s] 164it [00:16, 9.91it/s] 166it [00:16, 9.96it/s] 168it [00:17, 9.98it/s] 170it [00:17, 10.00it/s] 172it [00:17, 10.00it/s] 174it [00:17, 9.92it/s] 175it [00:17, 9.90it/s] 176it [00:17, 9.89it/s] 178it [00:18, 9.87it/s] 179it [00:18, 9.85it/s] 181it [00:18, 9.92it/s] 182it [00:18, 9.93it/s] 183it [00:18, 9.94it/s] 184it [00:18, 9.94it/s] 186it [00:19, 9.60it/s] 188it [00:19, 9.75it/s] 190it [00:19, 9.85it/s] 192it [00:19, 9.92it/s] 194it [00:19, 9.94it/s] 195it [00:19, 9.65it/s] 196it [00:20, 9.76it/s] +2025-05-26 05:49:22,007 - INFO - Epoch: 12, Objective: tensor([11959.2480], device='cuda:0', grad_fn=), Loss: 0.12528853118419647, KL/n: 72.63204193115234 + 0it [00:00, ?it/s]2025-05-26 05:49:22,294 - INFO - [Epoch 013 | Batch 0000] IWAE-loss 10673.3086 | mean log_px -0.1125 | KL -3559.28 + 1it [00:00, 4.45it/s] 2it [00:00, 6.54it/s] 3it [00:00, 7.76it/s] 4it [00:00, 8.49it/s] 6it [00:00, 9.25it/s] 8it [00:00, 9.57it/s] 9it [00:01, 9.67it/s] 10it [00:01, 9.74it/s] 11it [00:01, 9.80it/s] 12it [00:01, 9.83it/s] 13it [00:01, 9.87it/s] 14it [00:01, 9.89it/s] 15it [00:01, 9.92it/s] 16it [00:01, 9.93it/s] 18it [00:01, 9.57it/s] 19it [00:02, 9.55it/s] 20it [00:02, 9.64it/s] 21it [00:02, 9.72it/s] 22it [00:02, 9.78it/s] 23it [00:02, 9.84it/s] 24it [00:02, 9.87it/s] 25it [00:02, 9.89it/s] 26it [00:02, 9.36it/s] 27it [00:02, 9.52it/s] 28it [00:02, 9.63it/s] 30it [00:03, 9.79it/s] 32it [00:03, 9.85it/s] 34it [00:03, 9.90it/s] 36it [00:03, 9.94it/s] 38it [00:03, 9.96it/s] 40it [00:04, 9.97it/s] 42it [00:04, 9.97it/s] 44it [00:04, 9.98it/s] 46it [00:04, 9.98it/s] 48it [00:04, 9.99it/s] 49it [00:05, 9.99it/s] 50it [00:05, 9.97it/s]2025-05-26 05:49:27,382 - INFO - [Epoch 013 | Batch 0050] IWAE-loss 14811.1055 | mean log_px -0.1740 | KL -3564.73 + 51it [00:05, 9.95it/s] 52it [00:05, 9.95it/s] 53it [00:05, 9.96it/s] 54it [00:05, 9.94it/s] 56it [00:05, 9.96it/s] 58it [00:05, 9.98it/s] 59it [00:06, 9.96it/s] 60it [00:06, 9.93it/s] 61it [00:06, 9.95it/s] 62it [00:06, 9.94it/s] 63it [00:06, 9.93it/s] 64it [00:06, 9.91it/s] 65it [00:06, 9.92it/s] 66it [00:06, 9.90it/s] 67it [00:06, 9.91it/s] 68it [00:06, 9.92it/s] 69it [00:07, 9.93it/s] 70it [00:07, 9.94it/s] 71it [00:07, 9.79it/s] 72it [00:07, 9.84it/s] 74it [00:07, 9.43it/s] 75it [00:07, 9.56it/s] 76it [00:07, 9.65it/s] 78it [00:08, 9.77it/s] 79it [00:08, 9.43it/s] 80it [00:08, 9.55it/s] 81it [00:08, 9.64it/s] 82it [00:08, 9.72it/s] 83it [00:08, 9.20it/s] 84it [00:08, 9.39it/s] 85it [00:08, 9.53it/s] 86it [00:08, 9.56it/s] 87it [00:08, 9.66it/s] 88it [00:09, 9.73it/s] 90it [00:09, 9.80it/s] 91it [00:09, 9.76it/s] 92it [00:09, 9.79it/s] 93it [00:09, 9.84it/s] 94it [00:09, 9.85it/s] 96it [00:09, 9.91it/s] 97it [00:09, 9.93it/s] 98it [00:10, 9.92it/s] 99it [00:10, 9.94it/s] 100it [00:10, 9.93it/s]2025-05-26 05:49:32,488 - INFO - [Epoch 013 | Batch 0100] IWAE-loss 11084.1914 | mean log_px -0.1101 | KL -3557.34 + 101it [00:10, 9.93it/s] 102it [00:10, 9.92it/s] 104it [00:10, 9.95it/s] 105it [00:10, 9.95it/s] 106it [00:10, 9.88it/s] 107it [00:10, 9.91it/s] 108it [00:11, 9.91it/s] 109it [00:11, 9.93it/s] 110it [00:11, 9.93it/s] 111it [00:11, 9.87it/s] 112it [00:11, 9.87it/s] 113it [00:11, 9.90it/s] 114it [00:11, 9.81it/s] 116it [00:11, 9.90it/s] 117it [00:12, 9.92it/s] 118it [00:12, 9.92it/s] 119it [00:12, 9.92it/s] 120it [00:12, 9.91it/s] 121it [00:12, 9.93it/s] 122it [00:12, 9.34it/s] 124it [00:12, 9.62it/s] 125it [00:12, 9.70it/s] 126it [00:12, 9.76it/s] 127it [00:13, 9.43it/s] 128it [00:13, 9.55it/s] 129it [00:13, 9.64it/s] 130it [00:13, 9.72it/s] 131it [00:13, 9.78it/s] 132it [00:13, 9.20it/s] 133it [00:13, 9.40it/s] 134it [00:13, 9.54it/s] 135it [00:13, 9.65it/s] 136it [00:13, 9.73it/s] 138it [00:14, 9.84it/s] 139it [00:14, 9.87it/s] 140it [00:14, 9.86it/s] 141it [00:14, 9.90it/s] 142it [00:14, 9.90it/s] 143it [00:14, 9.90it/s] 144it [00:14, 9.91it/s] 145it [00:14, 9.91it/s] 146it [00:14, 9.92it/s] 147it [00:15, 9.94it/s] 148it [00:15, 9.94it/s] 149it [00:15, 9.95it/s] 150it [00:15, 9.92it/s]2025-05-26 05:49:37,589 - INFO - [Epoch 013 | Batch 0150] IWAE-loss 8056.9863 | mean log_px -0.0642 | KL -3562.25 + 151it [00:15, 9.27it/s] 152it [00:15, 9.32it/s] 153it [00:15, 9.27it/s] 154it [00:15, 9.27it/s] 155it [00:15, 8.98it/s] 156it [00:16, 9.18it/s] 157it [00:16, 9.35it/s] 158it [00:16, 9.45it/s] 159it [00:16, 9.57it/s] 160it [00:16, 9.64it/s] 161it [00:16, 9.70it/s] 162it [00:16, 9.72it/s] 163it [00:16, 9.77it/s] 164it [00:16, 9.74it/s] 165it [00:16, 9.75it/s] 166it [00:17, 9.81it/s] 167it [00:17, 9.85it/s] 168it [00:17, 9.88it/s] 169it [00:17, 9.91it/s] 170it [00:17, 9.92it/s] 172it [00:17, 9.95it/s] 173it [00:17, 9.96it/s] 174it [00:17, 9.93it/s] 175it [00:17, 9.93it/s] 176it [00:18, 9.91it/s] 177it [00:18, 9.92it/s] 178it [00:18, 9.93it/s] 179it [00:18, 9.94it/s] 180it [00:18, 9.94it/s] 181it [00:18, 9.94it/s] 182it [00:18, 9.94it/s] 184it [00:18, 9.97it/s] 185it [00:18, 9.98it/s] 186it [00:19, 9.95it/s] 188it [00:19, 9.97it/s] 189it [00:19, 9.92it/s] 190it [00:19, 9.27it/s] 191it [00:19, 9.15it/s] 192it [00:19, 9.27it/s] 193it [00:19, 9.43it/s] 194it [00:19, 9.53it/s] 195it [00:20, 9.20it/s] 196it [00:20, 9.00it/s] 196it [00:20, 9.68it/s] +2025-05-26 05:49:42,380 - INFO - Epoch: 13, Objective: tensor([13255.1807], device='cuda:0', grad_fn=), Loss: 0.15383651852607727, KL/n: 72.70011138916016 + 0it [00:00, ?it/s]2025-05-26 05:49:42,845 - INFO - [Epoch 014 | Batch 0000] IWAE-loss 11022.1055 | mean log_px -0.1185 | KL -3559.76 + 1it [00:00, 5.29it/s] 2it [00:00, 6.71it/s] 4it [00:00, 8.48it/s] 5it [00:00, 8.23it/s] 7it [00:00, 9.00it/s] 9it [00:01, 9.41it/s] 10it [00:01, 9.54it/s] 12it [00:01, 9.73it/s] 14it [00:01, 9.85it/s] 16it [00:01, 9.91it/s] 18it [00:01, 9.97it/s] 19it [00:02, 9.82it/s] 20it [00:02, 9.83it/s] 22it [00:02, 9.91it/s] 24it [00:02, 9.97it/s] 25it [00:02, 9.94it/s] 27it [00:02, 10.00it/s] 28it [00:02, 9.99it/s] 30it [00:03, 10.02it/s] 32it [00:03, 10.05it/s] 34it [00:03, 10.07it/s] 36it [00:03, 9.68it/s] 38it [00:03, 9.79it/s] 40it [00:04, 9.89it/s] 42it [00:04, 9.96it/s] 44it [00:04, 10.00it/s] 46it [00:04, 10.02it/s] 48it [00:04, 10.03it/s] 50it [00:05, 10.04it/s]2025-05-26 05:49:47,902 - INFO - [Epoch 014 | Batch 0050] IWAE-loss 8267.6357 | mean log_px -0.0700 | KL -3559.77 + 52it [00:05, 9.70it/s] 54it [00:05, 9.82it/s] 56it [00:05, 9.89it/s] 58it [00:05, 9.95it/s] 60it [00:06, 10.00it/s] 62it [00:06, 10.03it/s] 64it [00:06, 10.02it/s] 66it [00:06, 10.04it/s] 68it [00:06, 10.05it/s] 70it [00:07, 10.06it/s] 72it [00:07, 10.06it/s] 74it [00:07, 9.77it/s] 76it [00:07, 9.53it/s] 78it [00:07, 9.68it/s] 80it [00:08, 9.78it/s] 82it [00:08, 9.86it/s] 84it [00:08, 9.91it/s] 86it [00:08, 9.96it/s] 88it [00:08, 9.99it/s] 90it [00:09, 10.01it/s] 92it [00:09, 10.03it/s] 94it [00:09, 10.05it/s] 96it [00:09, 9.99it/s] 98it [00:09, 10.01it/s] 100it [00:10, 10.02it/s]2025-05-26 05:49:52,940 - INFO - [Epoch 014 | Batch 0100] IWAE-loss 13712.4199 | mean log_px -0.1565 | KL -3561.90 + 102it [00:10, 9.69it/s] 104it [00:10, 9.80it/s] 105it [00:10, 9.83it/s] 107it [00:10, 9.91it/s] 108it [00:11, 9.92it/s] 110it [00:11, 9.98it/s] 112it [00:11, 10.02it/s] 114it [00:11, 9.68it/s] 116it [00:11, 9.79it/s] 117it [00:11, 9.30it/s] 118it [00:12, 9.44it/s] 120it [00:12, 9.67it/s] 122it [00:12, 9.80it/s] 124it [00:12, 9.88it/s] 126it [00:12, 9.94it/s] 128it [00:13, 9.96it/s] 130it [00:13, 10.01it/s] 132it [00:13, 10.03it/s] 134it [00:13, 10.04it/s] 136it [00:13, 10.03it/s] 138it [00:14, 10.04it/s] 140it [00:14, 10.05it/s] 142it [00:14, 10.05it/s] 144it [00:14, 10.06it/s] 146it [00:14, 10.07it/s] 148it [00:15, 10.06it/s] 150it [00:15, 10.08it/s]2025-05-26 05:49:57,987 - INFO - [Epoch 014 | Batch 0150] IWAE-loss 13030.7373 | mean log_px -0.1424 | KL -3557.82 + 152it [00:15, 9.73it/s] 154it [00:15, 9.82it/s] 155it [00:15, 9.85it/s] 156it [00:15, 9.87it/s] 158it [00:16, 9.95it/s] 160it [00:16, 10.00it/s] 162it [00:16, 10.02it/s] 164it [00:16, 10.05it/s] 166it [00:16, 10.05it/s] 168it [00:17, 10.06it/s] 170it [00:17, 10.07it/s] 172it [00:17, 10.07it/s] 174it [00:17, 10.05it/s] 176it [00:17, 10.05it/s] 178it [00:18, 9.34it/s] 179it [00:18, 9.19it/s] 180it [00:18, 9.26it/s] 181it [00:18, 9.41it/s] 182it [00:18, 9.55it/s] 183it [00:18, 9.64it/s] 184it [00:18, 9.70it/s] 186it [00:18, 9.84it/s] 188it [00:19, 9.93it/s] 190it [00:19, 9.80it/s] 191it [00:19, 9.79it/s] 192it [00:19, 9.58it/s] 193it [00:19, 9.16it/s] 195it [00:19, 9.20it/s] 196it [00:19, 8.98it/s] 196it [00:20, 9.77it/s] +2025-05-26 05:50:02,758 - INFO - Epoch: 14, Objective: tensor([11565.9922], device='cuda:0', grad_fn=), Loss: 0.11370649188756943, KL/n: 72.74580383300781 + 0it [00:00, ?it/s]2025-05-26 05:50:03,025 - INFO - [Epoch 015 | Batch 0000] IWAE-loss 10721.7217 | mean log_px -0.1022 | KL -3567.32 + 1it [00:00, 5.63it/s] 2it [00:00, 7.26it/s] 3it [00:00, 8.10it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.29it/s] 6it [00:00, 8.67it/s] 7it [00:00, 8.91it/s] 8it [00:00, 9.05it/s] 9it [00:01, 9.18it/s] 10it [00:01, 9.27it/s] 11it [00:01, 9.37it/s] 12it [00:01, 9.41it/s] 13it [00:01, 9.49it/s] 14it [00:01, 9.47it/s] 15it [00:01, 9.29it/s] 16it [00:01, 9.31it/s] 17it [00:01, 9.40it/s] 18it [00:02, 9.43it/s] 19it [00:02, 9.46it/s] 20it [00:02, 9.42it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.44it/s] 23it [00:02, 8.96it/s] 24it [00:02, 9.08it/s] 25it [00:02, 9.14it/s] 26it [00:02, 9.25it/s] 27it [00:02, 9.34it/s] 28it [00:03, 8.82it/s] 29it [00:03, 8.98it/s] 30it [00:03, 9.15it/s] 31it [00:03, 9.37it/s] 32it [00:03, 9.54it/s] 33it [00:03, 9.03it/s] 34it [00:03, 9.29it/s] 35it [00:03, 9.47it/s] 36it [00:03, 9.60it/s] 37it [00:04, 9.71it/s] 38it [00:04, 9.26it/s] 39it [00:04, 9.46it/s] 40it [00:04, 9.57it/s] 42it [00:04, 9.40it/s] 43it [00:04, 9.54it/s] 44it [00:04, 9.63it/s] 45it [00:04, 9.26it/s] 46it [00:05, 9.44it/s] 47it [00:05, 9.50it/s] 48it [00:05, 8.93it/s] 49it [00:05, 9.19it/s] 50it [00:05, 9.41it/s]2025-05-26 05:50:08,388 - INFO - [Epoch 015 | Batch 0050] IWAE-loss 11714.7119 | mean log_px -0.1263 | KL -3566.29 + 51it [00:05, 9.52it/s] 52it [00:05, 9.64it/s] 53it [00:05, 9.14it/s] 54it [00:05, 9.35it/s] 55it [00:05, 9.54it/s] 56it [00:06, 9.06it/s] 57it [00:06, 9.31it/s] 58it [00:06, 9.49it/s] 60it [00:06, 9.71it/s] 61it [00:06, 9.33it/s] 62it [00:06, 9.49it/s] 63it [00:06, 9.45it/s] 64it [00:06, 9.58it/s] 65it [00:07, 9.69it/s] 66it [00:07, 9.76it/s] 68it [00:07, 9.37it/s] 69it [00:07, 9.51it/s] 70it [00:07, 9.57it/s] 71it [00:07, 9.67it/s] 72it [00:07, 9.74it/s] 73it [00:07, 9.32it/s] 74it [00:07, 9.48it/s] 75it [00:08, 9.61it/s] 76it [00:08, 9.71it/s] 77it [00:08, 9.16it/s] 78it [00:08, 9.38it/s] 79it [00:08, 9.55it/s] 80it [00:08, 9.66it/s] 81it [00:08, 9.25it/s] 82it [00:08, 9.43it/s] 83it [00:08, 9.59it/s] 84it [00:09, 9.07it/s] 86it [00:09, 9.47it/s] 87it [00:09, 9.60it/s] 88it [00:09, 9.68it/s] 89it [00:09, 9.30it/s] 90it [00:09, 9.47it/s] 91it [00:09, 9.60it/s] 92it [00:09, 9.69it/s] 93it [00:09, 9.24it/s] 94it [00:10, 9.22it/s] 95it [00:10, 9.01it/s] 96it [00:10, 9.10it/s] 97it [00:10, 9.34it/s] 98it [00:10, 8.92it/s] 99it [00:10, 9.22it/s] 100it [00:10, 9.40it/s]2025-05-26 05:50:13,688 - INFO - [Epoch 015 | Batch 0100] IWAE-loss 10056.2070 | mean log_px -0.1000 | KL -3566.32 + 101it [00:10, 9.53it/s] 102it [00:10, 9.64it/s] 104it [00:11, 9.81it/s] 105it [00:11, 9.30it/s] 106it [00:11, 9.45it/s] 107it [00:11, 9.57it/s] 108it [00:11, 9.68it/s] 109it [00:11, 9.74it/s] 110it [00:11, 9.79it/s] 112it [00:11, 9.89it/s] 113it [00:12, 9.90it/s] 114it [00:12, 9.91it/s] 116it [00:12, 9.69it/s] 117it [00:12, 9.75it/s] 118it [00:12, 9.79it/s] 119it [00:12, 9.83it/s] 120it [00:12, 9.27it/s] 121it [00:12, 9.46it/s] 122it [00:13, 9.59it/s] 124it [00:13, 9.77it/s] 125it [00:13, 9.81it/s] 126it [00:13, 9.83it/s] 128it [00:13, 9.90it/s] 129it [00:13, 9.90it/s] 130it [00:13, 9.90it/s] 131it [00:13, 9.91it/s] 132it [00:14, 9.90it/s] 133it [00:14, 9.92it/s] 134it [00:14, 9.92it/s] 135it [00:14, 9.93it/s] 136it [00:14, 9.91it/s] 137it [00:14, 9.77it/s] 138it [00:14, 9.21it/s] 139it [00:14, 9.37it/s] 140it [00:14, 9.52it/s] 141it [00:14, 9.65it/s] 142it [00:15, 9.74it/s] 143it [00:15, 9.80it/s] 144it [00:15, 9.82it/s] 145it [00:15, 9.87it/s] 146it [00:15, 9.88it/s] 147it [00:15, 9.90it/s] 148it [00:15, 9.91it/s] 149it [00:15, 9.29it/s] 150it [00:15, 9.48it/s]2025-05-26 05:50:18,830 - INFO - [Epoch 015 | Batch 0150] IWAE-loss 9198.8525 | mean log_px -0.0873 | KL -3561.38 + 151it [00:15, 9.56it/s] 152it [00:16, 9.65it/s] 153it [00:16, 9.75it/s] 154it [00:16, 9.80it/s] 155it [00:16, 9.86it/s] 156it [00:16, 9.87it/s] 157it [00:16, 9.88it/s] 158it [00:16, 9.89it/s] 159it [00:16, 9.92it/s] 160it [00:16, 9.91it/s] 161it [00:16, 9.88it/s] 162it [00:17, 9.89it/s] 163it [00:17, 9.89it/s] 164it [00:17, 9.87it/s] 165it [00:17, 9.89it/s] 166it [00:17, 9.86it/s] 167it [00:17, 9.37it/s] 168it [00:17, 9.51it/s] 169it [00:17, 9.63it/s] 170it [00:17, 9.08it/s] 171it [00:18, 9.29it/s] 172it [00:18, 9.48it/s] 173it [00:18, 9.62it/s] 174it [00:18, 9.72it/s] 176it [00:18, 9.84it/s] 177it [00:18, 9.86it/s] 178it [00:18, 9.87it/s] 179it [00:18, 9.89it/s] 180it [00:18, 9.91it/s] 181it [00:19, 9.41it/s] 182it [00:19, 9.53it/s] 184it [00:19, 9.74it/s] 185it [00:19, 9.80it/s] 186it [00:19, 9.83it/s] 187it [00:19, 9.87it/s] 188it [00:19, 9.88it/s] 189it [00:19, 9.90it/s] 190it [00:19, 9.90it/s] 192it [00:20, 9.94it/s] 193it [00:20, 9.95it/s] 194it [00:20, 9.94it/s] 195it [00:20, 9.47it/s] 196it [00:20, 9.21it/s] 196it [00:20, 9.48it/s] +2025-05-26 05:50:23,561 - INFO - Epoch: 15, Objective: tensor([12319.4551], device='cuda:0', grad_fn=), Loss: 0.13309964537620544, KL/n: 72.79181671142578 + 0it [00:00, ?it/s]2025-05-26 05:50:24,029 - INFO - [Epoch 016 | Batch 0000] IWAE-loss 7340.2905 | mean log_px -0.0581 | KL -3566.00 + 1it [00:00, 5.26it/s] 2it [00:00, 6.73it/s] 4it [00:00, 8.48it/s] 6it [00:00, 9.15it/s] 8it [00:00, 9.49it/s] 10it [00:01, 9.68it/s] 12it [00:01, 9.81it/s] 14it [00:01, 9.89it/s] 15it [00:01, 9.91it/s] 16it [00:01, 9.92it/s] 17it [00:01, 9.93it/s] 18it [00:01, 9.95it/s] 20it [00:02, 9.64it/s] 21it [00:02, 9.72it/s] 22it [00:02, 9.78it/s] 24it [00:02, 9.90it/s] 26it [00:02, 9.95it/s] 28it [00:02, 9.99it/s] 30it [00:03, 10.02it/s] 32it [00:03, 10.03it/s] 34it [00:03, 10.02it/s] 36it [00:03, 10.03it/s] 38it [00:03, 10.03it/s] 40it [00:04, 10.03it/s] 42it [00:04, 10.02it/s] 44it [00:04, 10.02it/s] 46it [00:04, 10.02it/s] 48it [00:04, 10.00it/s] 50it [00:05, 9.96it/s]2025-05-26 05:50:29,059 - INFO - [Epoch 016 | Batch 0050] IWAE-loss 9277.7939 | mean log_px -0.0837 | KL -3565.87 + 51it [00:05, 9.57it/s] 52it [00:05, 9.65it/s] 54it [00:05, 9.80it/s] 56it [00:05, 9.88it/s] 58it [00:05, 9.93it/s] 59it [00:06, 9.87it/s] 60it [00:06, 9.87it/s] 62it [00:06, 9.91it/s] 63it [00:06, 9.92it/s] 64it [00:06, 9.93it/s] 66it [00:06, 9.97it/s] 68it [00:06, 10.00it/s] 70it [00:07, 10.02it/s] 72it [00:07, 10.02it/s] 74it [00:07, 10.03it/s] 76it [00:07, 10.03it/s] 78it [00:07, 10.03it/s] 80it [00:08, 9.68it/s] 81it [00:08, 9.73it/s] 82it [00:08, 9.78it/s] 84it [00:08, 9.88it/s] 86it [00:08, 9.93it/s] 88it [00:08, 9.96it/s] 90it [00:09, 9.99it/s] 92it [00:09, 10.00it/s] 94it [00:09, 10.02it/s] 96it [00:09, 9.98it/s] 98it [00:09, 10.00it/s] 100it [00:10, 10.00it/s]2025-05-26 05:50:34,100 - INFO - [Epoch 016 | Batch 0100] IWAE-loss 11751.0801 | mean log_px -0.1212 | KL -3566.18 + 102it [00:10, 9.65it/s] 104it [00:10, 9.76it/s] 105it [00:10, 9.80it/s] 106it [00:10, 9.40it/s] 107it [00:10, 9.46it/s] 108it [00:11, 9.58it/s] 110it [00:11, 9.73it/s] 111it [00:11, 9.78it/s] 112it [00:11, 9.82it/s] 113it [00:11, 9.86it/s] 114it [00:11, 9.88it/s] 115it [00:11, 9.90it/s] 116it [00:11, 9.92it/s] 118it [00:12, 9.97it/s] 120it [00:12, 10.00it/s] 122it [00:12, 10.02it/s] 124it [00:12, 10.00it/s] 126it [00:12, 10.00it/s] 127it [00:12, 9.58it/s] 129it [00:13, 9.74it/s] 130it [00:13, 9.79it/s] 132it [00:13, 9.48it/s] 134it [00:13, 9.67it/s] 136it [00:13, 9.80it/s] 138it [00:14, 9.88it/s] 139it [00:14, 9.89it/s] 140it [00:14, 9.91it/s] 142it [00:14, 9.96it/s] 144it [00:14, 9.99it/s] 146it [00:14, 10.01it/s] 148it [00:15, 10.02it/s] 150it [00:15, 10.04it/s]2025-05-26 05:50:39,189 - INFO - [Epoch 016 | Batch 0150] IWAE-loss 10209.6055 | mean log_px -0.0996 | KL -3564.47 + 152it [00:15, 9.69it/s] 154it [00:15, 9.80it/s] 156it [00:15, 9.88it/s] 157it [00:15, 9.60it/s] 158it [00:16, 9.67it/s] 160it [00:16, 9.81it/s] 161it [00:16, 9.47it/s] 162it [00:16, 9.57it/s] 164it [00:16, 9.74it/s] 166it [00:16, 9.84it/s] 167it [00:17, 9.87it/s] 168it [00:17, 9.89it/s] 170it [00:17, 9.94it/s] 172it [00:17, 9.97it/s] 174it [00:17, 9.71it/s] 176it [00:17, 9.81it/s] 177it [00:18, 9.44it/s] 178it [00:18, 9.55it/s] 179it [00:18, 9.65it/s] 181it [00:18, 9.80it/s] 182it [00:18, 9.36it/s] 184it [00:18, 9.62it/s] 186it [00:18, 9.76it/s] 188it [00:19, 9.85it/s] 190it [00:19, 9.93it/s] 191it [00:19, 9.93it/s] 192it [00:19, 9.95it/s] 194it [00:19, 9.99it/s] 195it [00:19, 9.66it/s] 196it [00:19, 9.39it/s] 196it [00:20, 9.77it/s] +2025-05-26 05:50:43,942 - INFO - Epoch: 16, Objective: tensor([10027.8145], device='cuda:0', grad_fn=), Loss: 0.09540171176195145, KL/n: 72.8223648071289 + 0it [00:00, ?it/s]2025-05-26 05:50:44,223 - INFO - [Epoch 017 | Batch 0000] IWAE-loss 10231.7510 | mean log_px -0.0985 | KL -3565.85 + 1it [00:00, 5.31it/s] 2it [00:00, 7.13it/s] 3it [00:00, 8.02it/s] 4it [00:00, 8.12it/s] 6it [00:00, 9.05it/s] 7it [00:00, 8.80it/s] 8it [00:00, 9.09it/s] 10it [00:01, 9.47it/s] 11it [00:01, 9.23it/s] 12it [00:01, 9.41it/s] 13it [00:01, 9.54it/s] 15it [00:01, 9.74it/s] 16it [00:01, 9.79it/s] 18it [00:01, 9.90it/s] 20it [00:02, 9.94it/s] 22it [00:02, 9.97it/s] 24it [00:02, 9.98it/s] 26it [00:02, 10.00it/s] 28it [00:02, 10.02it/s] 30it [00:03, 10.04it/s] 32it [00:03, 10.03it/s] 34it [00:03, 10.04it/s] 36it [00:03, 10.05it/s] 38it [00:03, 10.05it/s] 40it [00:04, 10.05it/s] 42it [00:04, 10.05it/s] 44it [00:04, 10.03it/s] 46it [00:04, 10.03it/s] 48it [00:04, 10.04it/s] 50it [00:05, 10.05it/s]2025-05-26 05:50:49,288 - INFO - [Epoch 017 | Batch 0050] IWAE-loss 8144.4380 | mean log_px -0.0670 | KL -3562.43 + 52it [00:05, 9.70it/s] 53it [00:05, 9.74it/s] 54it [00:05, 9.78it/s] 56it [00:05, 9.88it/s] 58it [00:05, 9.56it/s] 59it [00:06, 9.29it/s] 60it [00:06, 9.44it/s] 61it [00:06, 9.56it/s] 62it [00:06, 9.67it/s] 63it [00:06, 9.75it/s] 64it [00:06, 9.23it/s] 66it [00:06, 9.55it/s] 68it [00:07, 9.74it/s] 70it [00:07, 9.85it/s] 72it [00:07, 9.91it/s] 73it [00:07, 9.51it/s] 74it [00:07, 9.54it/s] 75it [00:07, 9.49it/s] 76it [00:07, 9.56it/s] 77it [00:07, 9.58it/s] 78it [00:08, 9.69it/s] 80it [00:08, 9.83it/s] 82it [00:08, 9.91it/s] 84it [00:08, 9.95it/s] 85it [00:08, 9.95it/s] 87it [00:08, 10.01it/s] 89it [00:09, 10.03it/s] 91it [00:09, 10.02it/s] 93it [00:09, 10.03it/s] 95it [00:09, 10.03it/s] 97it [00:09, 10.04it/s] 99it [00:10, 10.04it/s]2025-05-26 05:50:54,404 - INFO - [Epoch 017 | Batch 0100] IWAE-loss 8396.8623 | mean log_px -0.0690 | KL -3563.99 + 101it [00:10, 9.70it/s] 103it [00:10, 9.81it/s] 105it [00:10, 9.88it/s] 106it [00:10, 9.90it/s] 107it [00:10, 9.91it/s] 109it [00:11, 9.56it/s] 110it [00:11, 9.64it/s] 112it [00:11, 9.77it/s] 114it [00:11, 9.86it/s] 116it [00:11, 9.92it/s] 118it [00:12, 9.96it/s] 120it [00:12, 9.98it/s] 121it [00:12, 9.98it/s] 122it [00:12, 9.98it/s] 124it [00:12, 10.00it/s] 126it [00:12, 10.02it/s] 128it [00:13, 10.03it/s] 130it [00:13, 10.04it/s] 132it [00:13, 10.04it/s] 134it [00:13, 10.04it/s] 136it [00:13, 10.05it/s] 138it [00:14, 10.05it/s] 140it [00:14, 10.06it/s] 142it [00:14, 10.06it/s] 144it [00:14, 10.06it/s] 146it [00:14, 10.07it/s] 148it [00:15, 10.08it/s] 150it [00:15, 10.07it/s]2025-05-26 05:50:59,428 - INFO - [Epoch 017 | Batch 0150] IWAE-loss 9258.7881 | mean log_px -0.0835 | KL -3569.38 + 152it [00:15, 9.73it/s] 153it [00:15, 9.71it/s] 154it [00:15, 9.73it/s] 156it [00:15, 9.84it/s] 158it [00:16, 9.91it/s] 160it [00:16, 9.95it/s] 162it [00:16, 9.97it/s] 164it [00:16, 9.81it/s] 165it [00:16, 9.54it/s] 166it [00:16, 9.63it/s] 168it [00:17, 9.78it/s] 169it [00:17, 9.80it/s] 170it [00:17, 9.84it/s] 172it [00:17, 9.91it/s] 174it [00:17, 9.97it/s] 175it [00:17, 9.52it/s] 176it [00:17, 9.62it/s] 178it [00:18, 9.78it/s] 180it [00:18, 9.87it/s] 182it [00:18, 9.93it/s] 184it [00:18, 9.97it/s] 185it [00:18, 9.52it/s] 186it [00:18, 9.61it/s] 187it [00:19, 9.69it/s] 188it [00:19, 9.77it/s] 190it [00:19, 9.88it/s] 192it [00:19, 9.54it/s] 194it [00:19, 9.71it/s] 195it [00:19, 9.47it/s] 196it [00:20, 9.25it/s] 196it [00:20, 9.75it/s] +2025-05-26 05:51:04,179 - INFO - Epoch: 17, Objective: tensor([9598.7822], device='cuda:0', grad_fn=), Loss: 0.08933060616254807, KL/n: 72.83203125 + 0it [00:00, ?it/s]2025-05-26 05:51:04,643 - INFO - [Epoch 018 | Batch 0000] IWAE-loss 12348.8164 | mean log_px -0.1254 | KL -3569.31 + 1it [00:00, 2.66it/s] 2it [00:00, 4.45it/s] 4it [00:00, 6.79it/s] 6it [00:00, 7.99it/s] 8it [00:01, 8.72it/s] 10it [00:01, 9.12it/s] 11it [00:01, 9.29it/s] 13it [00:01, 9.56it/s] 14it [00:01, 9.64it/s] 16it [00:01, 9.79it/s] 18it [00:02, 9.87it/s] 20it [00:02, 9.93it/s] 21it [00:02, 9.61it/s] 22it [00:02, 9.69it/s] 24it [00:02, 9.81it/s] 26it [00:02, 9.89it/s] 28it [00:03, 9.94it/s] 29it [00:03, 9.54it/s] 30it [00:03, 9.62it/s] 32it [00:03, 9.78it/s] 34it [00:03, 9.86it/s] 36it [00:03, 9.93it/s] 38it [00:04, 9.96it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.69it/s] 42it [00:04, 9.81it/s] 44it [00:04, 9.88it/s] 46it [00:04, 9.94it/s] 47it [00:05, 9.94it/s] 48it [00:05, 9.95it/s] 50it [00:05, 9.98it/s]2025-05-26 05:51:09,719 - INFO - [Epoch 018 | Batch 0050] IWAE-loss 8044.7241 | mean log_px -0.0678 | KL -3567.06 + 51it [00:05, 9.51it/s] 52it [00:05, 9.62it/s] 54it [00:05, 9.80it/s] 55it [00:05, 9.38it/s] 56it [00:05, 9.51it/s] 58it [00:06, 9.70it/s] 60it [00:06, 9.84it/s] 61it [00:06, 9.57it/s] 63it [00:06, 9.75it/s] 65it [00:06, 9.86it/s] 66it [00:07, 9.89it/s] 68it [00:07, 9.93it/s] 70it [00:07, 9.98it/s] 71it [00:07, 9.57it/s] 73it [00:07, 9.74it/s] 74it [00:07, 9.36it/s] 76it [00:08, 9.61it/s] 78it [00:08, 9.75it/s] 80it [00:08, 9.85it/s] 82it [00:08, 9.91it/s] 84it [00:08, 9.95it/s] 86it [00:09, 9.99it/s] 88it [00:09, 10.01it/s] 90it [00:09, 10.02it/s] 92it [00:09, 10.02it/s] 94it [00:09, 9.98it/s] 96it [00:10, 9.98it/s] 97it [00:10, 9.65it/s] 98it [00:10, 9.67it/s] 100it [00:10, 9.80it/s]2025-05-26 05:51:14,832 - INFO - [Epoch 018 | Batch 0100] IWAE-loss 8123.0947 | mean log_px -0.0684 | KL -3570.99 + 101it [00:10, 9.40it/s] 102it [00:10, 9.53it/s] 104it [00:10, 9.73it/s] 105it [00:11, 9.42it/s] 106it [00:11, 9.55it/s] 108it [00:11, 9.68it/s] 109it [00:11, 9.19it/s] 110it [00:11, 9.09it/s] 111it [00:11, 9.25it/s] 112it [00:11, 9.44it/s] 114it [00:11, 9.69it/s] 116it [00:12, 9.81it/s] 117it [00:12, 9.48it/s] 118it [00:12, 9.59it/s] 120it [00:12, 9.74it/s] 121it [00:12, 9.79it/s] 122it [00:12, 9.83it/s] 123it [00:12, 9.56it/s] 124it [00:12, 9.67it/s] 126it [00:13, 9.83it/s] 128it [00:13, 9.91it/s] 130it [00:13, 9.95it/s] 132it [00:13, 9.97it/s] 133it [00:13, 9.97it/s] 134it [00:13, 9.97it/s] 136it [00:14, 9.99it/s] 137it [00:14, 9.99it/s] 138it [00:14, 9.57it/s] 140it [00:14, 9.75it/s] 142it [00:14, 9.85it/s] 144it [00:14, 9.91it/s] 145it [00:15, 9.58it/s] 146it [00:15, 9.66it/s] 148it [00:15, 9.80it/s] 150it [00:15, 9.88it/s]2025-05-26 05:51:19,985 - INFO - [Epoch 018 | Batch 0150] IWAE-loss 6793.8252 | mean log_px -0.0610 | KL -3563.42 + 151it [00:15, 9.46it/s] 152it [00:15, 9.56it/s] 153it [00:15, 9.64it/s] 154it [00:16, 9.72it/s] 155it [00:16, 9.78it/s] 156it [00:16, 9.25it/s] 157it [00:16, 9.44it/s] 158it [00:16, 9.59it/s] 159it [00:16, 9.70it/s] 161it [00:16, 9.86it/s] 163it [00:16, 9.94it/s] 164it [00:17, 9.95it/s] 165it [00:17, 9.93it/s] 166it [00:17, 9.88it/s] 168it [00:17, 9.96it/s] 170it [00:17, 9.99it/s] 172it [00:17, 10.02it/s] 174it [00:18, 10.02it/s] 175it [00:18, 10.01it/s] 176it [00:18, 9.99it/s] 177it [00:18, 9.48it/s] 179it [00:18, 9.71it/s] 181it [00:18, 9.37it/s] 182it [00:18, 9.49it/s] 183it [00:19, 9.59it/s] 185it [00:19, 9.78it/s] 186it [00:19, 9.45it/s] 188it [00:19, 9.68it/s] 190it [00:19, 9.80it/s] 192it [00:19, 9.88it/s] 194it [00:20, 9.92it/s] 195it [00:20, 9.19it/s] 196it [00:20, 9.59it/s] +2025-05-26 05:51:24,744 - INFO - Epoch: 18, Objective: tensor([8188.5557], device='cuda:0', grad_fn=), Loss: 0.07669003307819366, KL/n: 72.82756805419922 + 0it [00:00, ?it/s]2025-05-26 05:51:25,021 - INFO - [Epoch 019 | Batch 0000] IWAE-loss 6962.9434 | mean log_px -0.0530 | KL -3566.80 + 1it [00:00, 5.32it/s] 2it [00:00, 6.69it/s] 3it [00:00, 7.88it/s] 4it [00:00, 8.56it/s] 5it [00:00, 9.01it/s] 6it [00:00, 9.31it/s] 7it [00:00, 8.89it/s] 8it [00:00, 9.07it/s] 9it [00:01, 9.33it/s] 10it [00:01, 9.49it/s] 12it [00:01, 9.72it/s] 14it [00:01, 9.60it/s] 15it [00:01, 9.33it/s] 16it [00:01, 9.46it/s] 18it [00:01, 9.67it/s] 19it [00:02, 9.74it/s] 20it [00:02, 9.78it/s] 22it [00:02, 9.87it/s] 24it [00:02, 9.92it/s] 26it [00:02, 9.95it/s] 28it [00:02, 9.98it/s] 29it [00:03, 9.98it/s] 30it [00:03, 9.97it/s] 31it [00:03, 9.97it/s] 32it [00:03, 9.97it/s] 33it [00:03, 9.96it/s] 34it [00:03, 9.37it/s] 36it [00:03, 9.65it/s] 38it [00:03, 9.78it/s] 40it [00:04, 9.87it/s] 42it [00:04, 9.92it/s] 43it [00:04, 9.93it/s] 44it [00:04, 9.93it/s] 45it [00:04, 9.44it/s] 46it [00:04, 9.57it/s] 47it [00:04, 9.68it/s] 48it [00:05, 9.75it/s] 50it [00:05, 9.86it/s]2025-05-26 05:51:30,161 - INFO - [Epoch 019 | Batch 0050] IWAE-loss 11381.5762 | mean log_px -0.1166 | KL -3569.48 + 51it [00:05, 9.33it/s] 52it [00:05, 9.47it/s] 54it [00:05, 9.25it/s] 56it [00:05, 9.52it/s] 58it [00:06, 9.67it/s] 60it [00:06, 9.78it/s] 62it [00:06, 9.84it/s] 64it [00:06, 9.90it/s] 65it [00:06, 9.92it/s] 66it [00:06, 9.93it/s] 67it [00:06, 9.95it/s] 68it [00:07, 9.93it/s] 69it [00:07, 9.94it/s] 70it [00:07, 9.94it/s] 72it [00:07, 9.97it/s] 73it [00:07, 9.56it/s] 74it [00:07, 9.67it/s] 76it [00:07, 9.82it/s] 77it [00:07, 9.86it/s] 78it [00:08, 9.87it/s] 80it [00:08, 9.94it/s] 82it [00:08, 9.97it/s] 83it [00:08, 9.98it/s] 84it [00:08, 9.96it/s] 86it [00:08, 9.98it/s] 88it [00:09, 9.98it/s] 89it [00:09, 9.98it/s] 90it [00:09, 9.48it/s] 92it [00:09, 9.68it/s] 93it [00:09, 9.74it/s] 94it [00:09, 9.79it/s] 96it [00:09, 9.88it/s] 98it [00:10, 9.92it/s] 99it [00:10, 9.93it/s] 100it [00:10, 9.93it/s]2025-05-26 05:51:35,256 - INFO - [Epoch 019 | Batch 0100] IWAE-loss 8565.3213 | mean log_px -0.0776 | KL -3569.59 + 101it [00:10, 9.39it/s] 102it [00:10, 9.53it/s] 104it [00:10, 9.63it/s] 105it [00:10, 9.32it/s] 106it [00:10, 9.46it/s] 108it [00:11, 9.69it/s] 110it [00:11, 9.80it/s] 112it [00:11, 9.51it/s] 114it [00:11, 9.68it/s] 115it [00:11, 9.74it/s] 116it [00:11, 9.79it/s] 118it [00:12, 9.87it/s] 120it [00:12, 9.48it/s] 121it [00:12, 9.53it/s] 122it [00:12, 9.54it/s] 124it [00:12, 9.74it/s] 125it [00:12, 9.32it/s] 126it [00:13, 9.46it/s] 128it [00:13, 9.68it/s] 130it [00:13, 9.82it/s] 132it [00:13, 9.52it/s] 133it [00:13, 9.60it/s] 134it [00:13, 9.67it/s] 136it [00:14, 9.82it/s] 138it [00:14, 9.90it/s] 140it [00:14, 9.94it/s] 141it [00:14, 9.95it/s] 142it [00:14, 9.47it/s] 143it [00:14, 9.59it/s] 144it [00:14, 9.68it/s] 146it [00:15, 9.82it/s] 148it [00:15, 9.76it/s] 149it [00:15, 9.37it/s] 150it [00:15, 9.45it/s]2025-05-26 05:51:40,460 - INFO - [Epoch 019 | Batch 0150] IWAE-loss 7441.7295 | mean log_px -0.0628 | KL -3567.16 + 151it [00:15, 9.50it/s] 152it [00:15, 9.62it/s] 153it [00:15, 9.68it/s] 154it [00:15, 9.29it/s] 155it [00:16, 9.47it/s] 156it [00:16, 9.61it/s] 157it [00:16, 9.71it/s] 158it [00:16, 9.78it/s] 160it [00:16, 9.92it/s] 162it [00:16, 9.97it/s] 164it [00:16, 10.01it/s] 165it [00:17, 9.96it/s] 166it [00:17, 9.96it/s] 168it [00:17, 10.00it/s] 170it [00:17, 10.01it/s] 172it [00:17, 10.03it/s] 174it [00:17, 10.04it/s] 176it [00:18, 10.04it/s] 178it [00:18, 10.04it/s] 180it [00:18, 10.04it/s] 182it [00:18, 10.05it/s] 184it [00:18, 10.05it/s] 186it [00:19, 10.02it/s] 188it [00:19, 10.02it/s] 190it [00:19, 10.03it/s] 192it [00:19, 10.04it/s] 194it [00:19, 9.71it/s] 195it [00:20, 9.49it/s] 196it [00:20, 9.30it/s] 196it [00:20, 9.68it/s] +2025-05-26 05:51:45,123 - INFO - Epoch: 19, Objective: tensor([7893.3765], device='cuda:0', grad_fn=), Loss: 0.061493679881095886, KL/n: 72.83820343017578 + 0it [00:00, ?it/s]2025-05-26 05:51:45,576 - INFO - [Epoch 020 | Batch 0000] IWAE-loss 6628.0117 | mean log_px -0.0495 | KL -3568.11 + 1it [00:00, 5.37it/s] 2it [00:00, 6.58it/s] 4it [00:00, 8.40it/s] 6it [00:00, 9.11it/s] 8it [00:00, 9.46it/s] 10it [00:01, 9.35it/s] 11it [00:01, 9.45it/s] 12it [00:01, 9.56it/s] 14it [00:01, 9.66it/s] 15it [00:01, 9.60it/s] 16it [00:01, 9.12it/s] 17it [00:01, 9.25it/s] 18it [00:01, 9.34it/s] 19it [00:02, 9.44it/s] 20it [00:02, 9.48it/s] 21it [00:02, 9.58it/s] 22it [00:02, 9.63it/s] 23it [00:02, 9.69it/s] 24it [00:02, 9.72it/s] 25it [00:02, 9.75it/s] 26it [00:02, 9.14it/s] 27it [00:02, 9.34it/s] 28it [00:03, 9.48it/s] 30it [00:03, 9.14it/s] 31it [00:03, 9.29it/s] 33it [00:03, 9.59it/s] 34it [00:03, 9.68it/s] 36it [00:03, 9.82it/s] 38it [00:04, 9.90it/s] 40it [00:04, 9.51it/s] 41it [00:04, 9.60it/s] 42it [00:04, 9.66it/s] 43it [00:04, 9.72it/s] 44it [00:04, 9.78it/s] 45it [00:04, 9.82it/s] 46it [00:04, 9.85it/s] 48it [00:05, 9.52it/s] 49it [00:05, 9.59it/s] 50it [00:05, 9.67it/s]2025-05-26 05:51:50,796 - INFO - [Epoch 020 | Batch 0050] IWAE-loss 7019.3750 | mean log_px -0.0534 | KL -3567.79 + 51it [00:05, 9.72it/s] 52it [00:05, 9.79it/s] 53it [00:05, 9.23it/s] 54it [00:05, 9.44it/s] 56it [00:05, 9.70it/s] 58it [00:06, 9.83it/s] 60it [00:06, 9.90it/s] 62it [00:06, 9.94it/s] 63it [00:06, 9.95it/s] 64it [00:06, 9.41it/s] 65it [00:06, 9.37it/s] 66it [00:06, 9.35it/s] 67it [00:07, 9.44it/s] 68it [00:07, 9.52it/s] 69it [00:07, 9.59it/s] 70it [00:07, 9.61it/s] 71it [00:07, 9.66it/s] 72it [00:07, 9.68it/s] 73it [00:07, 9.71it/s] 74it [00:07, 9.72it/s] 75it [00:07, 9.73it/s] 76it [00:07, 9.71it/s] 77it [00:08, 9.75it/s] 78it [00:08, 9.80it/s] 79it [00:08, 9.21it/s] 80it [00:08, 9.42it/s] 81it [00:08, 9.57it/s] 82it [00:08, 9.67it/s] 83it [00:08, 9.27it/s] 84it [00:08, 9.45it/s] 85it [00:08, 9.59it/s] 86it [00:09, 9.70it/s] 88it [00:09, 9.36it/s] 89it [00:09, 9.51it/s] 90it [00:09, 9.63it/s] 92it [00:09, 9.34it/s] 93it [00:09, 9.47it/s] 94it [00:09, 9.49it/s] 95it [00:09, 9.59it/s] 96it [00:10, 9.69it/s] 97it [00:10, 9.77it/s] 98it [00:10, 9.80it/s] 100it [00:10, 9.89it/s]2025-05-26 05:51:55,990 - INFO - [Epoch 020 | Batch 0100] IWAE-loss 9756.4814 | mean log_px -0.0918 | KL -3565.89 + 101it [00:10, 9.91it/s] 102it [00:10, 9.93it/s] 103it [00:10, 9.94it/s] 104it [00:10, 9.95it/s] 106it [00:11, 9.58it/s] 108it [00:11, 9.75it/s] 109it [00:11, 9.79it/s] 110it [00:11, 9.81it/s] 111it [00:11, 9.32it/s] 112it [00:11, 9.45it/s] 114it [00:11, 9.68it/s] 116it [00:12, 9.81it/s] 117it [00:12, 9.85it/s] 118it [00:12, 9.88it/s] 120it [00:12, 9.93it/s] 122it [00:12, 9.96it/s] 124it [00:12, 9.97it/s] 125it [00:13, 9.98it/s] 126it [00:13, 9.98it/s] 127it [00:13, 9.96it/s] 128it [00:13, 9.95it/s] 129it [00:13, 9.93it/s] 130it [00:13, 9.94it/s] 131it [00:13, 9.32it/s] 132it [00:13, 9.50it/s] 133it [00:13, 9.62it/s] 134it [00:13, 9.71it/s] 136it [00:14, 9.85it/s] 138it [00:14, 9.92it/s] 140it [00:14, 9.89it/s] 142it [00:14, 9.94it/s] 144it [00:14, 9.60it/s] 146it [00:15, 9.74it/s] 147it [00:15, 9.78it/s] 148it [00:15, 9.46it/s] 149it [00:15, 9.56it/s] 150it [00:15, 9.58it/s]2025-05-26 05:52:01,113 - INFO - [Epoch 020 | Batch 0150] IWAE-loss 6741.2627 | mean log_px -0.0465 | KL -3565.47 + 151it [00:15, 9.65it/s] 152it [00:15, 9.73it/s] 153it [00:15, 9.77it/s] 154it [00:16, 9.83it/s] 155it [00:16, 9.87it/s] 156it [00:16, 9.89it/s] 157it [00:16, 9.89it/s] 158it [00:16, 9.89it/s] 160it [00:16, 9.95it/s] 162it [00:16, 9.94it/s] 163it [00:16, 9.95it/s] 164it [00:17, 9.95it/s] 165it [00:17, 9.51it/s] 166it [00:17, 9.60it/s] 167it [00:17, 9.70it/s] 168it [00:17, 9.77it/s] 170it [00:17, 9.39it/s] 171it [00:17, 9.52it/s] 172it [00:17, 9.64it/s] 174it [00:18, 9.80it/s] 175it [00:18, 9.83it/s] 176it [00:18, 9.33it/s] 177it [00:18, 9.49it/s] 178it [00:18, 9.62it/s] 179it [00:18, 9.71it/s] 180it [00:18, 9.78it/s] 182it [00:18, 9.88it/s] 184it [00:19, 9.92it/s] 186it [00:19, 9.95it/s] 188it [00:19, 9.95it/s] 189it [00:19, 9.96it/s] 190it [00:19, 9.96it/s] 191it [00:19, 9.97it/s] 192it [00:19, 9.94it/s] 193it [00:20, 9.89it/s] 194it [00:20, 9.91it/s] 195it [00:20, 9.49it/s] 196it [00:20, 9.10it/s] 196it [00:20, 9.60it/s] +2025-05-26 05:52:05,840 - INFO - Epoch: 20, Objective: tensor([5954.1396], device='cuda:0', grad_fn=), Loss: 0.034850478172302246, KL/n: 72.82156372070312 + 0it [00:00, ?it/s]2025-05-26 05:52:06,129 - INFO - [Epoch 021 | Batch 0000] IWAE-loss 7638.6367 | mean log_px -0.0598 | KL -3567.85 + 1it [00:00, 5.34it/s] 2it [00:00, 7.31it/s] 4it [00:00, 8.85it/s] 5it [00:00, 9.16it/s] 7it [00:00, 9.58it/s] 9it [00:01, 9.43it/s] 10it [00:01, 9.54it/s] 12it [00:01, 9.75it/s] 14it [00:01, 9.86it/s] 16it [00:01, 9.92it/s] 17it [00:01, 9.51it/s] 18it [00:01, 9.61it/s] 20it [00:02, 9.79it/s] 22it [00:02, 9.90it/s] 24it [00:02, 9.95it/s] 26it [00:02, 10.00it/s] 28it [00:02, 10.01it/s] 30it [00:03, 10.01it/s] 31it [00:03, 9.62it/s] 33it [00:03, 9.77it/s] 35it [00:03, 9.86it/s] 36it [00:03, 9.32it/s] 37it [00:03, 9.44it/s] 38it [00:03, 9.52it/s] 39it [00:04, 9.60it/s] 40it [00:04, 9.58it/s] 41it [00:04, 9.22it/s] 42it [00:04, 9.40it/s] 43it [00:04, 9.48it/s] 44it [00:04, 9.59it/s] 45it [00:04, 9.70it/s] 47it [00:04, 9.88it/s] 49it [00:05, 9.97it/s] 50it [00:05, 9.95it/s]2025-05-26 05:52:11,244 - INFO - [Epoch 021 | Batch 0050] IWAE-loss 12824.7617 | mean log_px -0.1392 | KL -3568.71 + 51it [00:05, 9.39it/s] 52it [00:05, 9.30it/s] 53it [00:05, 9.45it/s] 55it [00:05, 9.71it/s] 57it [00:05, 9.84it/s] 59it [00:06, 9.92it/s] 61it [00:06, 9.98it/s] 63it [00:06, 10.02it/s] 65it [00:06, 10.05it/s] 67it [00:06, 10.05it/s] 69it [00:07, 10.07it/s] 71it [00:07, 10.08it/s] 73it [00:07, 10.09it/s] 75it [00:07, 9.75it/s] 77it [00:07, 9.85it/s] 79it [00:08, 9.93it/s] 81it [00:08, 9.99it/s] 83it [00:08, 10.01it/s] 85it [00:08, 9.63it/s] 86it [00:08, 9.66it/s] 88it [00:09, 9.81it/s] 89it [00:09, 9.45it/s] 91it [00:09, 9.68it/s] 93it [00:09, 9.81it/s] 95it [00:09, 9.56it/s] 96it [00:09, 9.63it/s] 98it [00:10, 9.79it/s] 100it [00:10, 9.88it/s]2025-05-26 05:52:16,335 - INFO - [Epoch 021 | Batch 0100] IWAE-loss 9816.6523 | mean log_px -0.1053 | KL -3570.17 + 101it [00:10, 9.51it/s] 102it [00:10, 9.59it/s] 104it [00:10, 9.78it/s] 106it [00:10, 9.88it/s] 107it [00:11, 9.88it/s] 109it [00:11, 9.63it/s] 111it [00:11, 9.78it/s] 113it [00:11, 9.88it/s] 115it [00:11, 9.95it/s] 117it [00:12, 10.00it/s] 119it [00:12, 10.03it/s] 121it [00:12, 9.63it/s] 122it [00:12, 9.58it/s] 124it [00:12, 9.73it/s] 126it [00:12, 9.84it/s] 128it [00:13, 9.91it/s] 130it [00:13, 9.96it/s] 131it [00:13, 9.66it/s] 132it [00:13, 9.70it/s] 134it [00:13, 9.83it/s] 136it [00:13, 9.82it/s] 138it [00:14, 9.88it/s] 139it [00:14, 9.53it/s] 141it [00:14, 9.73it/s] 142it [00:14, 9.39it/s] 144it [00:14, 9.62it/s] 146it [00:15, 9.77it/s] 148it [00:15, 9.88it/s] 150it [00:15, 9.96it/s]2025-05-26 05:52:21,446 - INFO - [Epoch 021 | Batch 0150] IWAE-loss 6365.2271 | mean log_px -0.0422 | KL -3569.45 + 151it [00:15, 9.58it/s] 153it [00:15, 9.74it/s] 155it [00:15, 9.86it/s] 157it [00:16, 9.93it/s] 158it [00:16, 9.94it/s] 160it [00:16, 9.99it/s] 162it [00:16, 10.03it/s] 164it [00:16, 9.97it/s] 166it [00:17, 9.98it/s] 168it [00:17, 10.02it/s] 170it [00:17, 10.04it/s] 172it [00:17, 10.06it/s] 174it [00:17, 9.73it/s] 176it [00:18, 9.84it/s] 178it [00:18, 9.92it/s] 180it [00:18, 9.97it/s] 182it [00:18, 9.67it/s] 184it [00:18, 9.79it/s] 186it [00:19, 9.88it/s] 188it [00:19, 9.94it/s] 190it [00:19, 9.99it/s] 192it [00:19, 9.98it/s] 194it [00:19, 9.99it/s] 195it [00:19, 9.71it/s] 196it [00:20, 9.46it/s] 196it [00:20, 9.74it/s] +2025-05-26 05:52:26,116 - INFO - Epoch: 21, Objective: tensor([6160.0498], device='cuda:0', grad_fn=), Loss: 0.040021877735853195, KL/n: 72.79065704345703 + 0it [00:00, ?it/s]2025-05-26 05:52:26,572 - INFO - [Epoch 022 | Batch 0000] IWAE-loss 9817.3037 | mean log_px -0.0940 | KL -3564.62 + 1it [00:00, 5.37it/s] 2it [00:00, 6.82it/s] 4it [00:00, 8.52it/s] 5it [00:00, 8.88it/s] 6it [00:00, 9.17it/s] 8it [00:00, 9.56it/s] 9it [00:01, 9.66it/s] 10it [00:01, 9.74it/s] 11it [00:01, 9.81it/s] 13it [00:01, 9.91it/s] 14it [00:01, 9.93it/s] 16it [00:01, 9.96it/s] 17it [00:01, 9.97it/s] 18it [00:01, 9.96it/s] 20it [00:02, 9.95it/s] 21it [00:02, 9.96it/s] 22it [00:02, 9.91it/s] 23it [00:02, 9.89it/s] 24it [00:02, 9.41it/s] 25it [00:02, 9.52it/s] 26it [00:02, 9.61it/s] 27it [00:02, 9.69it/s] 28it [00:02, 9.71it/s] 29it [00:03, 9.74it/s] 30it [00:03, 9.76it/s] 31it [00:03, 9.79it/s] 32it [00:03, 9.76it/s] 33it [00:03, 9.79it/s] 34it [00:03, 9.78it/s] 35it [00:03, 9.26it/s] 36it [00:03, 9.37it/s] 37it [00:03, 9.48it/s] 38it [00:03, 9.52it/s] 39it [00:04, 8.98it/s] 40it [00:04, 9.19it/s] 41it [00:04, 9.34it/s] 42it [00:04, 9.43it/s] 43it [00:04, 9.55it/s] 44it [00:04, 9.54it/s] 45it [00:04, 9.36it/s] 46it [00:04, 9.32it/s] 47it [00:04, 9.35it/s] 48it [00:05, 9.52it/s] 50it [00:05, 9.74it/s]2025-05-26 05:52:31,742 - INFO - [Epoch 022 | Batch 0050] IWAE-loss 8459.5879 | mean log_px -0.0763 | KL -3567.08 + 51it [00:05, 9.26it/s] 52it [00:05, 9.44it/s] 54it [00:05, 9.67it/s] 55it [00:05, 9.70it/s] 56it [00:05, 9.70it/s] 57it [00:05, 9.76it/s] 58it [00:06, 9.78it/s] 59it [00:06, 9.24it/s] 60it [00:06, 9.42it/s] 62it [00:06, 9.68it/s] 64it [00:06, 9.39it/s] 65it [00:06, 9.52it/s] 66it [00:06, 9.62it/s] 68it [00:07, 9.79it/s] 70it [00:07, 9.87it/s] 72it [00:07, 9.92it/s] 73it [00:07, 9.50it/s] 74it [00:07, 9.44it/s] 75it [00:07, 9.54it/s] 77it [00:08, 9.74it/s] 78it [00:08, 9.28it/s] 79it [00:08, 9.44it/s] 81it [00:08, 9.67it/s] 82it [00:08, 9.68it/s] 83it [00:08, 9.71it/s] 84it [00:08, 9.75it/s] 86it [00:08, 9.86it/s] 88it [00:09, 9.91it/s] 89it [00:09, 9.47it/s] 90it [00:09, 9.57it/s] 92it [00:09, 9.70it/s] 94it [00:09, 9.81it/s] 96it [00:10, 9.87it/s] 98it [00:10, 9.93it/s] 99it [00:10, 9.94it/s] 100it [00:10, 9.94it/s]2025-05-26 05:52:36,908 - INFO - [Epoch 022 | Batch 0100] IWAE-loss 9265.9893 | mean log_px -0.0819 | KL -3570.15 + 101it [00:10, 9.95it/s] 102it [00:10, 9.44it/s] 103it [00:10, 9.57it/s] 104it [00:10, 9.67it/s] 106it [00:11, 9.82it/s] 108it [00:11, 9.90it/s] 110it [00:11, 9.94it/s] 112it [00:11, 9.97it/s] 114it [00:11, 9.98it/s] 115it [00:11, 9.97it/s] 116it [00:12, 9.96it/s] 118it [00:12, 9.98it/s] 119it [00:12, 9.98it/s] 120it [00:12, 9.98it/s] 122it [00:12, 9.56it/s] 124it [00:12, 9.72it/s] 126it [00:13, 9.82it/s] 127it [00:13, 9.81it/s] 128it [00:13, 9.76it/s] 129it [00:13, 9.79it/s] 130it [00:13, 9.82it/s] 131it [00:13, 9.83it/s] 132it [00:13, 9.85it/s] 133it [00:13, 9.87it/s] 134it [00:13, 9.89it/s] 135it [00:13, 9.92it/s] 136it [00:14, 9.92it/s] 138it [00:14, 9.96it/s] 139it [00:14, 9.58it/s] 140it [00:14, 9.68it/s] 142it [00:14, 9.34it/s] 143it [00:14, 9.48it/s] 144it [00:14, 9.59it/s] 146it [00:15, 9.78it/s] 147it [00:15, 9.77it/s] 148it [00:15, 9.81it/s] 149it [00:15, 9.85it/s] 150it [00:15, 9.88it/s]2025-05-26 05:52:42,011 - INFO - [Epoch 022 | Batch 0150] IWAE-loss 8519.6299 | mean log_px -0.0768 | KL -3566.00 + 151it [00:15, 9.90it/s] 152it [00:15, 9.92it/s] 154it [00:15, 9.97it/s] 155it [00:16, 9.98it/s] 156it [00:16, 9.97it/s] 158it [00:16, 9.99it/s] 160it [00:16, 9.99it/s] 161it [00:16, 9.99it/s] 162it [00:16, 9.99it/s] 163it [00:16, 9.55it/s] 164it [00:16, 9.66it/s] 166it [00:17, 9.81it/s] 168it [00:17, 9.47it/s] 169it [00:17, 9.58it/s] 170it [00:17, 9.67it/s] 172it [00:17, 9.80it/s] 173it [00:17, 9.35it/s] 174it [00:17, 9.50it/s] 176it [00:18, 9.70it/s] 178it [00:18, 9.81it/s] 180it [00:18, 9.88it/s] 182it [00:18, 9.93it/s] 183it [00:18, 9.93it/s] 184it [00:18, 9.93it/s] 185it [00:19, 9.36it/s] 186it [00:19, 9.50it/s] 188it [00:19, 9.71it/s] 190it [00:19, 9.82it/s] 192it [00:19, 9.88it/s] 194it [00:20, 9.92it/s] 195it [00:20, 9.63it/s] 196it [00:20, 9.39it/s] 196it [00:20, 9.65it/s] +2025-05-26 05:52:46,742 - INFO - Epoch: 22, Objective: tensor([8000.1289], device='cuda:0', grad_fn=), Loss: 0.06485095620155334, KL/n: 72.75353240966797 + 0it [00:00, ?it/s]2025-05-26 05:52:46,998 - INFO - [Epoch 023 | Batch 0000] IWAE-loss 10706.0791 | mean log_px -0.1055 | KL -3565.08 + 1it [00:00, 6.14it/s] 3it [00:00, 8.66it/s] 5it [00:00, 8.85it/s] 7it [00:00, 9.34it/s] 8it [00:00, 9.48it/s] 10it [00:01, 9.72it/s] 12it [00:01, 9.85it/s] 14it [00:01, 9.92it/s] 16it [00:01, 9.97it/s] 18it [00:01, 10.00it/s] 20it [00:02, 10.03it/s] 22it [00:02, 10.04it/s] 24it [00:02, 10.05it/s] 26it [00:02, 10.05it/s] 28it [00:02, 9.69it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.34it/s] 31it [00:03, 9.44it/s] 32it [00:03, 9.49it/s] 33it [00:03, 9.17it/s] 34it [00:03, 9.23it/s] 35it [00:03, 9.36it/s] 36it [00:03, 9.45it/s] 37it [00:03, 9.56it/s] 38it [00:03, 9.63it/s] 39it [00:04, 9.63it/s] 40it [00:04, 9.67it/s] 41it [00:04, 9.71it/s] 42it [00:04, 9.31it/s] 44it [00:04, 9.65it/s] 46it [00:04, 9.80it/s] 48it [00:04, 9.89it/s] 49it [00:05, 9.47it/s]2025-05-26 05:52:52,144 - INFO - [Epoch 023 | Batch 0050] IWAE-loss 6445.8760 | mean log_px -0.0427 | KL -3562.69 + 51it [00:05, 9.66it/s] 53it [00:05, 9.80it/s] 54it [00:05, 9.83it/s] 56it [00:05, 9.91it/s] 58it [00:06, 9.95it/s] 60it [00:06, 9.99it/s] 62it [00:06, 10.01it/s] 64it [00:06, 10.02it/s] 66it [00:06, 10.03it/s] 68it [00:06, 10.05it/s] 70it [00:07, 10.05it/s] 72it [00:07, 10.06it/s] 74it [00:07, 10.05it/s] 76it [00:07, 10.03it/s] 78it [00:07, 10.04it/s] 80it [00:08, 10.03it/s] 82it [00:08, 10.05it/s] 84it [00:08, 10.05it/s] 86it [00:08, 10.04it/s] 88it [00:08, 10.04it/s] 90it [00:09, 10.04it/s] 92it [00:09, 10.04it/s] 94it [00:09, 10.04it/s] 96it [00:09, 10.04it/s] 98it [00:09, 10.04it/s] 100it [00:10, 9.68it/s]2025-05-26 05:52:57,147 - INFO - [Epoch 023 | Batch 0100] IWAE-loss 9278.5117 | mean log_px -0.0849 | KL -3567.39 + 102it [00:10, 9.78it/s] 104it [00:10, 9.86it/s] 105it [00:10, 9.87it/s] 106it [00:10, 9.49it/s] 108it [00:11, 9.69it/s] 110it [00:11, 9.82it/s] 112it [00:11, 9.90it/s] 114it [00:11, 9.94it/s] 116it [00:11, 9.61it/s] 118it [00:12, 9.75it/s] 120it [00:12, 9.79it/s] 121it [00:12, 9.39it/s] 123it [00:12, 9.60it/s] 125it [00:12, 9.40it/s] 126it [00:12, 9.51it/s] 128it [00:13, 9.71it/s] 130it [00:13, 9.83it/s] 132it [00:13, 9.90it/s] 133it [00:13, 9.52it/s] 135it [00:13, 9.70it/s] 136it [00:13, 9.75it/s] 138it [00:14, 9.86it/s] 139it [00:14, 9.86it/s] 140it [00:14, 9.89it/s] 142it [00:14, 9.96it/s] 144it [00:14, 10.01it/s] 145it [00:14, 9.57it/s] 146it [00:14, 9.66it/s] 148it [00:15, 9.82it/s] 149it [00:15, 9.41it/s] 150it [00:15, 9.53it/s]2025-05-26 05:53:02,292 - INFO - [Epoch 023 | Batch 0150] IWAE-loss 9398.9590 | mean log_px -0.0833 | KL -3566.49 + 151it [00:15, 9.65it/s] 152it [00:15, 9.74it/s] 153it [00:15, 9.24it/s] 154it [00:15, 9.43it/s] 156it [00:15, 9.72it/s] 158it [00:16, 9.86it/s] 160it [00:16, 9.93it/s] 162it [00:16, 9.98it/s] 164it [00:16, 9.62it/s] 165it [00:16, 9.66it/s] 166it [00:16, 9.69it/s] 168it [00:17, 9.84it/s] 170it [00:17, 9.92it/s] 172it [00:17, 9.98it/s] 174it [00:17, 9.97it/s] 175it [00:17, 9.52it/s] 176it [00:18, 9.59it/s] 178it [00:18, 9.76it/s] 180it [00:18, 9.86it/s] 182it [00:18, 9.55it/s] 184it [00:18, 9.70it/s] 186it [00:19, 9.81it/s] 188it [00:19, 9.63it/s] 190it [00:19, 9.77it/s] 192it [00:19, 9.86it/s] 194it [00:19, 9.93it/s] 195it [00:19, 9.67it/s] 196it [00:20, 9.74it/s] +2025-05-26 05:53:06,999 - INFO - Epoch: 23, Objective: tensor([7036.1016], device='cuda:0', grad_fn=), Loss: 0.05605386570096016, KL/n: 72.70604705810547 + 0it [00:00, ?it/s]2025-05-26 05:53:07,448 - INFO - [Epoch 024 | Batch 0000] IWAE-loss 10053.7881 | mean log_px -0.0965 | KL -3562.36 + 1it [00:00, 4.90it/s] 2it [00:00, 6.97it/s] 4it [00:00, 8.64it/s] 6it [00:00, 9.26it/s] 8it [00:00, 9.56it/s] 9it [00:01, 9.58it/s] 10it [00:01, 9.64it/s] 12it [00:01, 9.80it/s] 14it [00:01, 9.89it/s] 16it [00:01, 9.94it/s] 18it [00:01, 9.99it/s] 20it [00:02, 10.01it/s] 22it [00:02, 10.02it/s] 24it [00:02, 10.03it/s] 26it [00:02, 10.05it/s] 28it [00:02, 10.03it/s] 30it [00:03, 10.02it/s] 32it [00:03, 10.03it/s] 34it [00:03, 9.79it/s] 36it [00:03, 9.87it/s] 38it [00:03, 9.93it/s] 40it [00:04, 9.96it/s] 42it [00:04, 9.99it/s] 44it [00:04, 10.01it/s] 46it [00:04, 10.02it/s] 48it [00:04, 10.02it/s] 50it [00:05, 10.03it/s]2025-05-26 05:53:12,475 - INFO - [Epoch 024 | Batch 0050] IWAE-loss 7944.3613 | mean log_px -0.0672 | KL -3565.10 + 52it [00:05, 10.03it/s] 54it [00:05, 10.04it/s] 56it [00:05, 10.04it/s] 58it [00:05, 10.04it/s] 60it [00:06, 10.05it/s] 62it [00:06, 10.02it/s] 64it [00:06, 10.02it/s] 66it [00:06, 10.02it/s] 68it [00:06, 10.02it/s] 70it [00:07, 10.02it/s] 72it [00:07, 10.03it/s] 74it [00:07, 9.69it/s] 76it [00:07, 9.77it/s] 78it [00:07, 9.85it/s] 80it [00:08, 9.91it/s] 82it [00:08, 9.95it/s] 83it [00:08, 9.59it/s] 84it [00:08, 9.67it/s] 86it [00:08, 9.80it/s] 88it [00:08, 9.88it/s] 90it [00:09, 9.93it/s] 91it [00:09, 9.53it/s] 92it [00:09, 9.62it/s] 94it [00:09, 9.78it/s] 96it [00:09, 9.87it/s] 98it [00:09, 9.93it/s] 100it [00:10, 9.97it/s]2025-05-26 05:53:17,530 - INFO - [Epoch 024 | Batch 0100] IWAE-loss 6554.0537 | mean log_px -0.0452 | KL -3559.28 + 101it [00:10, 9.96it/s] 102it [00:10, 9.97it/s] 104it [00:10, 10.00it/s] 106it [00:10, 10.02it/s] 108it [00:10, 10.02it/s] 110it [00:11, 10.03it/s] 112it [00:11, 10.03it/s] 114it [00:11, 10.04it/s] 116it [00:11, 10.04it/s] 118it [00:11, 10.02it/s] 120it [00:12, 10.03it/s] 122it [00:12, 10.04it/s] 124it [00:12, 9.94it/s] 126it [00:12, 9.96it/s] 127it [00:12, 9.71it/s] 128it [00:12, 9.76it/s] 130it [00:13, 9.53it/s] 131it [00:13, 9.62it/s] 132it [00:13, 9.70it/s] 134it [00:13, 9.83it/s] 135it [00:13, 9.82it/s] 136it [00:13, 9.21it/s] 137it [00:13, 9.09it/s] 138it [00:14, 9.25it/s] 139it [00:14, 9.43it/s] 140it [00:14, 9.54it/s] 141it [00:14, 9.64it/s] 142it [00:14, 9.71it/s] 143it [00:14, 9.76it/s] 144it [00:14, 9.79it/s] 145it [00:14, 9.83it/s] 146it [00:14, 9.83it/s] 147it [00:14, 9.79it/s] 148it [00:15, 9.82it/s] 150it [00:15, 9.93it/s]2025-05-26 05:53:22,623 - INFO - [Epoch 024 | Batch 0150] IWAE-loss 11166.3877 | mean log_px -0.1161 | KL -3563.05 + 151it [00:15, 9.93it/s] 152it [00:15, 9.95it/s] 154it [00:15, 9.99it/s] 156it [00:15, 10.01it/s] 158it [00:16, 10.02it/s] 160it [00:16, 10.02it/s] 162it [00:16, 9.74it/s] 164it [00:16, 9.84it/s] 166it [00:16, 9.90it/s] 168it [00:17, 9.96it/s] 169it [00:17, 9.65it/s] 170it [00:17, 9.71it/s] 172it [00:17, 9.45it/s] 174it [00:17, 9.64it/s] 176it [00:17, 9.78it/s] 178it [00:18, 9.87it/s] 180it [00:18, 9.93it/s] 182it [00:18, 9.69it/s] 184it [00:18, 9.80it/s] 186it [00:18, 9.88it/s] 188it [00:19, 9.93it/s] 189it [00:19, 9.64it/s] 191it [00:19, 9.79it/s] 193it [00:19, 9.88it/s] 195it [00:19, 9.68it/s] 196it [00:20, 9.80it/s] +2025-05-26 05:53:27,317 - INFO - Epoch: 24, Objective: tensor([7781.2070], device='cuda:0', grad_fn=), Loss: 0.06895510107278824, KL/n: 72.64373779296875 + 0it [00:00, ?it/s]2025-05-26 05:53:27,592 - INFO - [Epoch 025 | Batch 0000] IWAE-loss 5908.9863 | mean log_px -0.0345 | KL -3553.46 + 1it [00:00, 4.75it/s] 2it [00:00, 6.79it/s] 4it [00:00, 8.55it/s] 6it [00:00, 9.23it/s] 8it [00:00, 9.56it/s] 10it [00:01, 9.77it/s] 12it [00:01, 9.87it/s] 14it [00:01, 9.94it/s] 16it [00:01, 10.00it/s] 18it [00:01, 10.04it/s] 20it [00:02, 10.01it/s] 22it [00:02, 9.93it/s] 24it [00:02, 9.96it/s] 26it [00:02, 10.00it/s] 28it [00:02, 10.01it/s] 30it [00:03, 9.62it/s] 32it [00:03, 9.75it/s] 34it [00:03, 9.83it/s] 35it [00:03, 9.79it/s] 36it [00:03, 9.37it/s] 38it [00:03, 9.61it/s] 40it [00:04, 9.76it/s] 42it [00:04, 9.87it/s] 43it [00:04, 9.49it/s] 44it [00:04, 9.59it/s] 46it [00:04, 9.77it/s] 47it [00:04, 9.39it/s] 48it [00:04, 9.52it/s] 50it [00:05, 9.71it/s]2025-05-26 05:53:32,700 - INFO - [Epoch 025 | Batch 0050] IWAE-loss 5141.8364 | mean log_px -0.0226 | KL -3558.55 + 52it [00:05, 9.82it/s] 54it [00:05, 9.89it/s] 56it [00:05, 9.94it/s] 58it [00:05, 9.98it/s] 60it [00:06, 9.66it/s] 62it [00:06, 9.78it/s] 64it [00:06, 9.88it/s] 66it [00:06, 9.95it/s] 68it [00:07, 9.99it/s] 70it [00:07, 10.01it/s] 72it [00:07, 10.03it/s] 74it [00:07, 10.04it/s] 76it [00:07, 10.04it/s] 78it [00:07, 10.03it/s] 80it [00:08, 9.76it/s] 82it [00:08, 9.86it/s] 84it [00:08, 9.91it/s] 86it [00:08, 9.97it/s] 88it [00:09, 10.00it/s] 90it [00:09, 10.02it/s] 92it [00:09, 10.03it/s] 94it [00:09, 10.05it/s] 96it [00:09, 10.06it/s] 98it [00:10, 10.07it/s] 100it [00:10, 10.07it/s]2025-05-26 05:53:37,708 - INFO - [Epoch 025 | Batch 0100] IWAE-loss 6209.9375 | mean log_px -0.0399 | KL -3555.98 + 102it [00:10, 9.86it/s] 103it [00:10, 9.55it/s] 104it [00:10, 9.06it/s] 105it [00:10, 9.24it/s] 107it [00:10, 9.56it/s] 109it [00:11, 9.74it/s] 111it [00:11, 9.84it/s] 113it [00:11, 9.92it/s] 115it [00:11, 9.97it/s] 117it [00:11, 9.66it/s] 119it [00:12, 9.78it/s] 121it [00:12, 9.88it/s] 123it [00:12, 9.95it/s] 125it [00:12, 9.98it/s] 127it [00:12, 10.01it/s] 129it [00:13, 10.04it/s] 131it [00:13, 10.05it/s] 133it [00:13, 10.04it/s] 135it [00:13, 10.04it/s] 137it [00:13, 10.05it/s] 139it [00:14, 9.64it/s] 141it [00:14, 9.77it/s] 143it [00:14, 9.86it/s] 145it [00:14, 9.92it/s] 146it [00:14, 9.93it/s] 148it [00:15, 9.57it/s] 150it [00:15, 9.71it/s]2025-05-26 05:53:42,820 - INFO - [Epoch 025 | Batch 0150] IWAE-loss 8218.2256 | mean log_px -0.0712 | KL -3553.84 + 151it [00:15, 9.76it/s] 152it [00:15, 9.81it/s] 154it [00:15, 9.49it/s] 156it [00:15, 9.68it/s] 158it [00:16, 9.82it/s] 160it [00:16, 9.62it/s] 162it [00:16, 9.75it/s] 164it [00:16, 9.85it/s] 166it [00:16, 9.93it/s] 168it [00:17, 9.98it/s] 169it [00:17, 9.67it/s] 170it [00:17, 9.74it/s] 172it [00:17, 9.87it/s] 173it [00:17, 9.89it/s] 175it [00:17, 9.96it/s] 176it [00:17, 9.90it/s] 178it [00:18, 9.97it/s] 180it [00:18, 10.01it/s] 182it [00:18, 10.03it/s] 184it [00:18, 10.06it/s] 186it [00:18, 10.07it/s] 188it [00:19, 9.73it/s] 190it [00:19, 9.84it/s] 192it [00:19, 9.92it/s] 194it [00:19, 9.97it/s] 195it [00:19, 9.69it/s] 196it [00:19, 9.70it/s] 196it [00:20, 9.78it/s] +2025-05-26 05:53:47,492 - INFO - Epoch: 25, Objective: tensor([8688.2051], device='cuda:0', grad_fn=), Loss: 0.08251015841960907, KL/n: 72.58772277832031 + 0it [00:00, ?it/s]2025-05-26 05:53:47,945 - INFO - [Epoch 026 | Batch 0000] IWAE-loss 7151.1875 | mean log_px -0.0637 | KL -3554.05 + 1it [00:00, 2.57it/s] 3it [00:00, 5.74it/s] 4it [00:00, 6.39it/s] 5it [00:00, 7.24it/s] 6it [00:00, 7.93it/s] 8it [00:01, 8.82it/s] 9it [00:01, 9.09it/s] 11it [00:01, 9.49it/s] 12it [00:01, 9.60it/s] 14it [00:01, 9.35it/s] 16it [00:01, 9.61it/s] 18it [00:02, 9.76it/s] 20it [00:02, 9.85it/s] 22it [00:02, 9.93it/s] 23it [00:02, 9.92it/s] 25it [00:02, 9.80it/s] 26it [00:02, 9.47it/s] 28it [00:03, 9.67it/s] 29it [00:03, 9.74it/s] 30it [00:03, 9.79it/s] 31it [00:03, 9.83it/s] 32it [00:03, 9.87it/s] 34it [00:03, 9.94it/s] 36it [00:03, 9.98it/s] 38it [00:04, 10.02it/s] 40it [00:04, 10.03it/s] 42it [00:04, 10.04it/s] 44it [00:04, 9.61it/s] 45it [00:04, 9.55it/s] 46it [00:04, 9.47it/s] 47it [00:05, 9.51it/s] 48it [00:05, 9.54it/s] 49it [00:05, 9.59it/s] 50it [00:05, 9.62it/s]2025-05-26 05:53:53,092 - INFO - [Epoch 026 | Batch 0050] IWAE-loss 8084.2090 | mean log_px -0.0655 | KL -3553.26 + 51it [00:05, 9.65it/s] 52it [00:05, 9.69it/s] 53it [00:05, 9.74it/s] 54it [00:05, 9.74it/s] 55it [00:05, 9.77it/s] 56it [00:06, 9.73it/s] 57it [00:06, 9.73it/s] 58it [00:06, 9.76it/s] 60it [00:06, 9.75it/s] 62it [00:06, 9.87it/s] 64it [00:06, 9.62it/s] 66it [00:07, 9.67it/s] 67it [00:07, 9.72it/s] 68it [00:07, 9.78it/s] 70it [00:07, 9.88it/s] 72it [00:07, 9.94it/s] 74it [00:07, 9.97it/s] 76it [00:08, 10.00it/s] 78it [00:08, 9.65it/s] 79it [00:08, 9.71it/s] 81it [00:08, 9.83it/s] 83it [00:08, 9.54it/s] 84it [00:08, 9.62it/s] 85it [00:08, 9.69it/s] 86it [00:09, 9.75it/s] 87it [00:09, 9.80it/s] 88it [00:09, 9.85it/s] 90it [00:09, 9.94it/s] 92it [00:09, 9.99it/s] 94it [00:09, 10.01it/s] 96it [00:10, 10.03it/s] 98it [00:10, 10.03it/s] 100it [00:10, 10.04it/s]2025-05-26 05:53:58,171 - INFO - [Epoch 026 | Batch 0100] IWAE-loss 6382.7183 | mean log_px -0.0501 | KL -3556.70 + 102it [00:10, 10.03it/s] 104it [00:10, 9.82it/s] 105it [00:11, 9.48it/s] 107it [00:11, 9.67it/s] 108it [00:11, 9.73it/s] 110it [00:11, 9.84it/s] 112it [00:11, 9.55it/s] 114it [00:11, 9.70it/s] 116it [00:12, 9.81it/s] 118it [00:12, 9.89it/s] 119it [00:12, 9.90it/s] 120it [00:12, 9.80it/s] 121it [00:12, 9.49it/s] 122it [00:12, 9.60it/s] 124it [00:12, 9.35it/s] 126it [00:13, 9.58it/s] 128it [00:13, 9.74it/s] 129it [00:13, 9.75it/s] 130it [00:13, 9.78it/s] 131it [00:13, 9.76it/s] 132it [00:13, 9.81it/s] 134it [00:13, 9.91it/s] 135it [00:14, 9.92it/s] 136it [00:14, 9.89it/s] 137it [00:14, 9.43it/s] 138it [00:14, 9.56it/s] 140it [00:14, 9.77it/s] 142it [00:14, 9.87it/s] 144it [00:15, 9.92it/s] 146it [00:15, 9.92it/s] 147it [00:15, 9.84it/s] 148it [00:15, 9.77it/s] 149it [00:15, 9.75it/s] 150it [00:15, 9.78it/s]2025-05-26 05:54:03,313 - INFO - [Epoch 026 | Batch 0150] IWAE-loss 8474.0977 | mean log_px -0.0783 | KL -3551.70 + 151it [00:15, 9.77it/s] 152it [00:15, 9.72it/s] 153it [00:15, 9.75it/s] 154it [00:16, 9.75it/s] 155it [00:16, 9.78it/s] 156it [00:16, 9.78it/s] 157it [00:16, 9.76it/s] 158it [00:16, 9.74it/s] 159it [00:16, 9.72it/s] 160it [00:16, 9.71it/s] 161it [00:16, 9.71it/s] 162it [00:16, 9.73it/s] 163it [00:16, 9.77it/s] 164it [00:17, 9.73it/s] 165it [00:17, 9.75it/s] 166it [00:17, 9.72it/s] 167it [00:17, 9.72it/s] 168it [00:17, 9.69it/s] 169it [00:17, 9.72it/s] 170it [00:17, 9.74it/s] 171it [00:17, 9.63it/s] 172it [00:17, 9.69it/s] 173it [00:17, 9.67it/s] 174it [00:18, 9.67it/s] 175it [00:18, 9.70it/s] 176it [00:18, 9.73it/s] 177it [00:18, 9.74it/s] 178it [00:18, 9.77it/s] 179it [00:18, 9.77it/s] 180it [00:18, 9.76it/s] 181it [00:18, 9.78it/s] 182it [00:18, 9.80it/s] 183it [00:19, 9.80it/s] 184it [00:19, 9.78it/s] 185it [00:19, 9.77it/s] 186it [00:19, 9.77it/s] 187it [00:19, 9.80it/s] 188it [00:19, 9.78it/s] 189it [00:19, 9.77it/s] 190it [00:19, 9.77it/s] 191it [00:19, 9.76it/s] 192it [00:19, 9.76it/s] 193it [00:20, 9.76it/s] 194it [00:20, 9.76it/s] 195it [00:20, 9.24it/s] 196it [00:20, 9.59it/s] +2025-05-26 05:54:08,053 - INFO - Epoch: 26, Objective: tensor([10124.8457], device='cuda:0', grad_fn=), Loss: 0.10262526571750641, KL/n: 72.52192687988281 + 0it [00:00, ?it/s]2025-05-26 05:54:08,341 - INFO - [Epoch 027 | Batch 0000] IWAE-loss 5660.2915 | mean log_px -0.0403 | KL -3550.19 + 1it [00:00, 5.05it/s] 2it [00:00, 6.96it/s] 3it [00:00, 7.43it/s] 4it [00:00, 8.19it/s] 5it [00:00, 8.71it/s] 6it [00:00, 9.05it/s] 7it [00:00, 9.29it/s] 8it [00:00, 9.41it/s] 9it [00:01, 9.52it/s] 10it [00:01, 9.56it/s] 11it [00:01, 9.63it/s] 12it [00:01, 9.65it/s] 13it [00:01, 9.71it/s] 14it [00:01, 9.70it/s] 15it [00:01, 9.72it/s] 16it [00:01, 9.71it/s] 17it [00:01, 9.74it/s] 18it [00:01, 9.77it/s] 19it [00:02, 9.75it/s] 20it [00:02, 9.71it/s] 21it [00:02, 9.31it/s] 22it [00:02, 9.42it/s] 23it [00:02, 9.55it/s] 24it [00:02, 9.63it/s] 25it [00:02, 9.71it/s] 26it [00:02, 9.73it/s] 27it [00:02, 9.78it/s] 28it [00:03, 9.77it/s] 29it [00:03, 9.78it/s] 30it [00:03, 9.77it/s] 31it [00:03, 9.81it/s] 32it [00:03, 9.79it/s] 33it [00:03, 9.82it/s] 34it [00:03, 9.78it/s] 35it [00:03, 9.77it/s] 36it [00:03, 9.79it/s] 37it [00:03, 9.82it/s] 38it [00:04, 9.76it/s] 39it [00:04, 9.78it/s] 40it [00:04, 9.70it/s] 41it [00:04, 9.70it/s] 42it [00:04, 9.08it/s] 43it [00:04, 9.28it/s] 44it [00:04, 9.37it/s] 45it [00:04, 9.49it/s] 46it [00:04, 9.53it/s] 47it [00:04, 9.58it/s] 48it [00:05, 9.62it/s] 49it [00:05, 9.67it/s] 50it [00:05, 9.69it/s]2025-05-26 05:54:13,530 - INFO - [Epoch 027 | Batch 0050] IWAE-loss 7041.8789 | mean log_px -0.0514 | KL -3547.65 + 51it [00:05, 9.74it/s] 52it [00:05, 9.72it/s] 53it [00:05, 9.73it/s] 54it [00:05, 9.73it/s] 55it [00:05, 9.72it/s] 56it [00:05, 9.69it/s] 57it [00:06, 9.71it/s] 58it [00:06, 9.73it/s] 59it [00:06, 9.77it/s] 60it [00:06, 9.76it/s] 61it [00:06, 9.18it/s] 62it [00:06, 9.34it/s] 63it [00:06, 9.48it/s] 64it [00:06, 9.57it/s] 65it [00:06, 9.63it/s] 66it [00:06, 9.69it/s] 67it [00:07, 9.73it/s] 68it [00:07, 9.74it/s] 69it [00:07, 9.74it/s] 70it [00:07, 9.75it/s] 71it [00:07, 9.18it/s] 72it [00:07, 9.34it/s] 73it [00:07, 9.46it/s] 74it [00:07, 9.54it/s] 75it [00:07, 9.60it/s] 76it [00:07, 9.62it/s] 77it [00:08, 9.67it/s] 78it [00:08, 9.71it/s] 79it [00:08, 9.73it/s] 80it [00:08, 9.12it/s] 81it [00:08, 9.30it/s] 82it [00:08, 9.27it/s] 83it [00:08, 9.38it/s] 84it [00:08, 9.45it/s] 85it [00:08, 9.54it/s] 86it [00:09, 9.49it/s] 87it [00:09, 9.60it/s] 88it [00:09, 9.65it/s] 89it [00:09, 9.69it/s] 90it [00:09, 9.69it/s] 91it [00:09, 9.71it/s] 92it [00:09, 9.73it/s] 93it [00:09, 9.74it/s] 94it [00:09, 9.73it/s] 95it [00:09, 9.72it/s] 96it [00:10, 9.72it/s] 97it [00:10, 9.77it/s] 98it [00:10, 9.77it/s] 99it [00:10, 9.14it/s] 100it [00:10, 9.32it/s]2025-05-26 05:54:18,756 - INFO - [Epoch 027 | Batch 0100] IWAE-loss 7957.1924 | mean log_px -0.0696 | KL -3551.78 + 101it [00:10, 9.46it/s] 102it [00:10, 9.54it/s] 103it [00:10, 9.63it/s] 104it [00:10, 9.59it/s] 105it [00:11, 9.65it/s] 106it [00:11, 9.66it/s] 107it [00:11, 9.70it/s] 108it [00:11, 9.57it/s] 109it [00:11, 9.54it/s] 110it [00:11, 9.55it/s] 111it [00:11, 9.14it/s] 112it [00:11, 9.30it/s] 113it [00:11, 9.45it/s] 114it [00:11, 9.52it/s] 115it [00:12, 9.62it/s] 116it [00:12, 9.66it/s] 117it [00:12, 9.17it/s] 118it [00:12, 9.32it/s] 119it [00:12, 9.48it/s] 120it [00:12, 9.56it/s] 121it [00:12, 9.63it/s] 122it [00:12, 9.66it/s] 123it [00:12, 9.71it/s] 124it [00:13, 9.72it/s] 125it [00:13, 9.71it/s] 126it [00:13, 9.68it/s] 127it [00:13, 9.75it/s] 128it [00:13, 9.72it/s] 129it [00:13, 9.77it/s] 130it [00:13, 9.77it/s] 131it [00:13, 9.76it/s] 132it [00:13, 9.75it/s] 133it [00:13, 9.76it/s] 134it [00:14, 9.72it/s] 135it [00:14, 9.15it/s] 136it [00:14, 9.31it/s] 137it [00:14, 9.44it/s] 138it [00:14, 9.53it/s] 139it [00:14, 9.62it/s] 140it [00:14, 9.65it/s] 141it [00:14, 9.66it/s] 142it [00:14, 9.68it/s] 143it [00:14, 9.74it/s] 144it [00:15, 9.74it/s] 145it [00:15, 9.77it/s] 146it [00:15, 9.73it/s] 147it [00:15, 9.76it/s] 148it [00:15, 9.76it/s] 149it [00:15, 9.64it/s] 150it [00:15, 9.59it/s]2025-05-26 05:54:23,965 - INFO - [Epoch 027 | Batch 0150] IWAE-loss 7002.5981 | mean log_px -0.0568 | KL -3547.20 + 151it [00:15, 8.90it/s] 152it [00:15, 9.05it/s] 153it [00:16, 9.22it/s] 154it [00:16, 9.32it/s] 155it [00:16, 9.39it/s] 156it [00:16, 9.44it/s] 157it [00:16, 9.49it/s] 158it [00:16, 9.52it/s] 159it [00:16, 9.55it/s] 160it [00:16, 9.55it/s] 161it [00:16, 9.44it/s] 162it [00:16, 9.49it/s] 163it [00:17, 9.59it/s] 164it [00:17, 9.64it/s] 165it [00:17, 9.19it/s] 166it [00:17, 9.35it/s] 167it [00:17, 9.49it/s] 168it [00:17, 9.53it/s] 169it [00:17, 9.62it/s] 170it [00:17, 9.65it/s] 171it [00:17, 9.65it/s] 172it [00:18, 9.67it/s] 173it [00:18, 9.69it/s] 174it [00:18, 9.70it/s] 175it [00:18, 9.72it/s] 176it [00:18, 9.12it/s] 177it [00:18, 9.32it/s] 178it [00:18, 9.45it/s] 179it [00:18, 9.56it/s] 180it [00:18, 9.62it/s] 181it [00:18, 9.68it/s] 182it [00:19, 9.71it/s] 183it [00:19, 9.75it/s] 184it [00:19, 9.29it/s] 185it [00:19, 9.44it/s] 186it [00:19, 9.50it/s] 187it [00:19, 9.58it/s] 188it [00:19, 9.64it/s] 189it [00:19, 9.69it/s] 190it [00:19, 9.70it/s] 191it [00:20, 9.73it/s] 192it [00:20, 9.42it/s] 193it [00:20, 9.53it/s] 194it [00:20, 8.97it/s] 195it [00:20, 8.70it/s] 196it [00:20, 9.49it/s] +2025-05-26 05:54:28,835 - INFO - Epoch: 27, Objective: tensor([5026.2368], device='cuda:0', grad_fn=), Loss: 0.021482713520526886, KL/n: 72.46076965332031 + 0it [00:00, ?it/s]2025-05-26 05:54:29,111 - INFO - [Epoch 028 | Batch 0000] IWAE-loss 6144.6147 | mean log_px -0.0405 | KL -3548.91 + 1it [00:00, 4.65it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.84it/s] 4it [00:00, 8.49it/s] 5it [00:00, 8.94it/s] 6it [00:00, 9.20it/s] 7it [00:00, 9.39it/s] 8it [00:00, 9.50it/s] 9it [00:01, 9.62it/s] 10it [00:01, 9.66it/s] 11it [00:01, 9.71it/s] 12it [00:01, 9.68it/s] 13it [00:01, 9.70it/s] 14it [00:01, 6.00it/s] 15it [00:01, 6.80it/s] 16it [00:01, 7.48it/s] 17it [00:02, 8.07it/s] 18it [00:02, 8.53it/s] 19it [00:02, 8.89it/s] 20it [00:02, 8.98it/s] 21it [00:02, 9.19it/s] 22it [00:02, 9.32it/s] 23it [00:02, 9.47it/s] 24it [00:02, 9.56it/s] 25it [00:02, 9.60it/s] 26it [00:02, 9.66it/s] 27it [00:03, 9.71it/s] 28it [00:03, 9.72it/s] 29it [00:03, 9.74it/s] 30it [00:03, 9.74it/s] 31it [00:03, 9.80it/s] 32it [00:03, 9.22it/s] 33it [00:03, 9.40it/s] 34it [00:03, 9.51it/s] 35it [00:03, 9.61it/s] 36it [00:04, 9.65it/s] 37it [00:04, 9.68it/s] 38it [00:04, 9.45it/s] 39it [00:04, 9.45it/s] 40it [00:04, 9.51it/s] 41it [00:04, 9.58it/s] 42it [00:04, 9.63it/s] 43it [00:04, 9.70it/s] 44it [00:04, 9.72it/s] 45it [00:04, 9.76it/s] 46it [00:05, 9.76it/s] 47it [00:05, 9.78it/s] 48it [00:05, 9.75it/s] 49it [00:05, 9.75it/s] 50it [00:05, 9.73it/s]2025-05-26 05:54:34,505 - INFO - [Epoch 028 | Batch 0050] IWAE-loss 7022.5996 | mean log_px -0.0538 | KL -3548.01 + 51it [00:05, 9.17it/s] 52it [00:05, 9.29it/s] 53it [00:05, 9.38it/s] 54it [00:05, 9.48it/s] 55it [00:06, 9.55it/s] 56it [00:06, 9.60it/s] 57it [00:06, 9.44it/s] 58it [00:06, 9.38it/s] 59it [00:06, 9.37it/s] 60it [00:06, 8.81it/s] 61it [00:06, 9.07it/s] 62it [00:06, 8.69it/s] 63it [00:06, 8.97it/s] 64it [00:07, 9.18it/s] 65it [00:07, 9.34it/s] 66it [00:07, 9.40it/s] 67it [00:07, 9.51it/s] 68it [00:07, 9.55it/s] 69it [00:07, 9.61it/s] 70it [00:07, 9.15it/s] 71it [00:07, 9.31it/s] 72it [00:07, 9.43it/s] 73it [00:07, 8.99it/s] 74it [00:08, 9.17it/s] 75it [00:08, 9.36it/s] 76it [00:08, 9.43it/s] 77it [00:08, 9.51it/s] 78it [00:08, 9.08it/s] 79it [00:08, 9.28it/s] 80it [00:08, 9.40it/s] 81it [00:08, 9.53it/s] 82it [00:08, 9.20it/s] 83it [00:09, 9.37it/s] 84it [00:09, 9.48it/s] 85it [00:09, 9.59it/s] 86it [00:09, 9.62it/s] 87it [00:09, 9.67it/s] 88it [00:09, 9.61it/s] 89it [00:09, 9.65it/s] 90it [00:09, 9.07it/s] 91it [00:09, 9.27it/s] 92it [00:09, 9.39it/s] 93it [00:10, 9.51it/s] 94it [00:10, 9.57it/s] 95it [00:10, 9.63it/s] 96it [00:10, 9.66it/s] 97it [00:10, 9.72it/s] 98it [00:10, 8.81it/s] 99it [00:10, 8.88it/s] 100it [00:10, 9.02it/s]2025-05-26 05:54:39,879 - INFO - [Epoch 028 | Batch 0100] IWAE-loss 7795.5220 | mean log_px -0.0668 | KL -3546.89 + 101it [00:10, 9.25it/s] 102it [00:11, 8.93it/s] 103it [00:11, 9.16it/s] 104it [00:11, 9.30it/s] 105it [00:11, 9.46it/s] 106it [00:11, 9.55it/s] 107it [00:11, 9.10it/s] 108it [00:11, 9.29it/s] 109it [00:11, 9.45it/s] 110it [00:11, 9.52it/s] 111it [00:12, 9.60it/s] 112it [00:12, 9.63it/s] 113it [00:12, 9.69it/s] 114it [00:12, 9.72it/s] 115it [00:12, 9.75it/s] 116it [00:12, 9.27it/s] 117it [00:12, 9.42it/s] 118it [00:12, 9.54it/s] 119it [00:12, 9.58it/s] 120it [00:12, 9.65it/s] 121it [00:13, 9.72it/s] 122it [00:13, 9.73it/s] 123it [00:13, 9.74it/s] 124it [00:13, 9.74it/s] 125it [00:13, 9.75it/s] 126it [00:13, 9.75it/s] 127it [00:13, 9.17it/s] 128it [00:13, 9.35it/s] 129it [00:13, 9.51it/s] 130it [00:13, 9.59it/s] 131it [00:14, 9.66it/s] 132it [00:14, 9.66it/s] 133it [00:14, 9.23it/s] 134it [00:14, 9.36it/s] 135it [00:14, 9.46it/s] 136it [00:14, 9.55it/s] 137it [00:14, 9.60it/s] 138it [00:14, 9.63it/s] 139it [00:14, 9.68it/s] 140it [00:15, 9.69it/s] 141it [00:15, 9.68it/s] 142it [00:15, 9.68it/s] 143it [00:15, 9.67it/s] 144it [00:15, 9.66it/s] 145it [00:15, 9.70it/s] 146it [00:15, 9.44it/s] 147it [00:15, 9.49it/s] 148it [00:15, 9.52it/s] 149it [00:15, 9.59it/s] 150it [00:16, 9.61it/s]2025-05-26 05:54:45,114 - INFO - [Epoch 028 | Batch 0150] IWAE-loss 6129.2549 | mean log_px -0.0445 | KL -3552.00 + 151it [00:16, 9.62it/s] 152it [00:16, 9.17it/s] 153it [00:16, 9.34it/s] 154it [00:16, 9.44it/s] 155it [00:16, 9.55it/s] 156it [00:16, 9.60it/s] 157it [00:16, 9.65it/s] 158it [00:16, 9.68it/s] 159it [00:17, 9.72it/s] 160it [00:17, 9.73it/s] 161it [00:17, 9.76it/s] 162it [00:17, 9.76it/s] 163it [00:17, 9.75it/s] 164it [00:17, 9.73it/s] 165it [00:17, 9.12it/s] 166it [00:17, 9.31it/s] 167it [00:17, 9.43it/s] 168it [00:17, 9.46it/s] 169it [00:18, 8.71it/s] 170it [00:18, 8.78it/s] 171it [00:18, 9.04it/s] 172it [00:18, 9.21it/s] 173it [00:18, 8.91it/s] 174it [00:18, 9.15it/s] 175it [00:18, 9.31it/s] 176it [00:18, 9.44it/s] 177it [00:18, 9.57it/s] 178it [00:19, 9.64it/s] 179it [00:19, 9.72it/s] 180it [00:19, 9.72it/s] 181it [00:19, 9.74it/s] 182it [00:19, 9.74it/s] 183it [00:19, 9.75it/s] 184it [00:19, 9.76it/s] 185it [00:19, 9.75it/s] 186it [00:19, 9.73it/s] 187it [00:19, 9.73it/s] 188it [00:20, 9.72it/s] 189it [00:20, 9.70it/s] 190it [00:20, 9.68it/s] 191it [00:20, 9.73it/s] 192it [00:20, 9.72it/s] 193it [00:20, 9.75it/s] 194it [00:20, 9.74it/s] 195it [00:20, 9.18it/s] 196it [00:20, 9.34it/s] +2025-05-26 05:54:49,943 - INFO - Epoch: 28, Objective: tensor([7316.0479], device='cuda:0', grad_fn=), Loss: 0.06041298806667328, KL/n: 72.37413787841797 + 0it [00:00, ?it/s]2025-05-26 05:54:50,235 - INFO - [Epoch 029 | Batch 0000] IWAE-loss 5790.9482 | mean log_px -0.0366 | KL -3544.11 + 1it [00:00, 4.90it/s] 2it [00:00, 6.95it/s] 3it [00:00, 8.01it/s] 4it [00:00, 8.62it/s] 5it [00:00, 9.02it/s] 6it [00:00, 9.26it/s] 7it [00:00, 9.33it/s] 8it [00:00, 9.48it/s] 9it [00:01, 9.58it/s] 10it [00:01, 9.65it/s] 11it [00:01, 9.70it/s] 12it [00:01, 9.71it/s] 13it [00:01, 9.73it/s] 14it [00:01, 9.75it/s] 15it [00:01, 9.77it/s] 16it [00:01, 9.76it/s] 17it [00:01, 9.79it/s] 18it [00:01, 9.76it/s] 19it [00:02, 9.80it/s] 20it [00:02, 9.79it/s] 21it [00:02, 9.77it/s] 22it [00:02, 9.77it/s] 23it [00:02, 9.79it/s] 24it [00:02, 9.77it/s] 25it [00:02, 9.78it/s] 26it [00:02, 9.76it/s] 27it [00:02, 9.77it/s] 28it [00:02, 9.74it/s] 29it [00:03, 9.74it/s] 30it [00:03, 9.75it/s] 31it [00:03, 9.80it/s] 32it [00:03, 9.80it/s] 33it [00:03, 9.82it/s] 34it [00:03, 9.80it/s] 35it [00:03, 9.79it/s] 36it [00:03, 9.78it/s] 37it [00:03, 9.76it/s] 38it [00:03, 9.76it/s] 39it [00:04, 9.78it/s] 40it [00:04, 9.78it/s] 41it [00:04, 9.77it/s] 42it [00:04, 9.76it/s] 43it [00:04, 9.76it/s] 44it [00:04, 9.73it/s] 45it [00:04, 9.77it/s] 46it [00:04, 9.78it/s] 47it [00:04, 9.80it/s] 48it [00:05, 9.76it/s] 49it [00:05, 9.67it/s] 50it [00:05, 9.35it/s]2025-05-26 05:54:55,373 - INFO - [Epoch 029 | Batch 0050] IWAE-loss 8045.6401 | mean log_px -0.0730 | KL -3546.79 + 51it [00:05, 9.34it/s] 52it [00:05, 9.45it/s] 53it [00:05, 9.58it/s] 54it [00:05, 9.64it/s] 55it [00:05, 9.69it/s] 56it [00:05, 9.68it/s] 57it [00:05, 9.70it/s] 58it [00:06, 9.70it/s] 59it [00:06, 9.72it/s] 60it [00:06, 9.71it/s] 61it [00:06, 9.66it/s] 62it [00:06, 9.69it/s] 63it [00:06, 9.75it/s] 64it [00:06, 9.75it/s] 65it [00:06, 9.73it/s] 66it [00:06, 9.73it/s] 67it [00:06, 9.72it/s] 68it [00:07, 9.75it/s] 69it [00:07, 9.76it/s] 70it [00:07, 9.77it/s] 71it [00:07, 9.77it/s] 72it [00:07, 9.76it/s] 73it [00:07, 9.80it/s] 74it [00:07, 9.81it/s] 75it [00:07, 9.83it/s] 76it [00:07, 9.83it/s] 77it [00:08, 9.85it/s] 78it [00:08, 9.82it/s] 79it [00:08, 9.81it/s] 80it [00:08, 9.82it/s] 81it [00:08, 9.81it/s] 82it [00:08, 9.82it/s] 83it [00:08, 9.82it/s] 84it [00:08, 9.80it/s] 85it [00:08, 9.78it/s] 86it [00:08, 9.77it/s] 87it [00:09, 9.77it/s] 88it [00:09, 9.74it/s] 89it [00:09, 9.78it/s] 90it [00:09, 9.75it/s] 91it [00:09, 9.79it/s] 92it [00:09, 9.76it/s] 93it [00:09, 9.77it/s] 94it [00:09, 9.77it/s] 95it [00:09, 9.80it/s] 96it [00:09, 9.81it/s] 97it [00:10, 9.83it/s] 98it [00:10, 9.79it/s] 99it [00:10, 9.81it/s] 100it [00:10, 9.82it/s]2025-05-26 05:55:00,488 - INFO - [Epoch 029 | Batch 0100] IWAE-loss 7717.3555 | mean log_px -0.0658 | KL -3546.15 + 101it [00:10, 9.75it/s] 102it [00:10, 9.74it/s] 103it [00:10, 9.76it/s] 104it [00:10, 9.77it/s] 105it [00:10, 9.79it/s] 106it [00:10, 9.80it/s] 107it [00:11, 9.79it/s] 108it [00:11, 9.78it/s] 109it [00:11, 9.77it/s] 110it [00:11, 9.67it/s] 111it [00:11, 9.71it/s] 112it [00:11, 9.55it/s] 113it [00:11, 9.58it/s] 114it [00:11, 9.59it/s] 115it [00:11, 9.65it/s] 116it [00:12, 9.68it/s] 117it [00:12, 9.61it/s] 118it [00:12, 9.54it/s] 119it [00:12, 9.44it/s] 120it [00:12, 9.34it/s] 121it [00:12, 9.44it/s] 122it [00:12, 9.47it/s] 123it [00:12, 9.52it/s] 124it [00:12, 9.53it/s] 125it [00:12, 9.60it/s] 126it [00:13, 9.59it/s] 127it [00:13, 9.66it/s] 128it [00:13, 9.66it/s] 129it [00:13, 9.65it/s] 130it [00:13, 9.68it/s] 131it [00:13, 9.69it/s] 132it [00:13, 9.71it/s] 133it [00:13, 9.75it/s] 134it [00:13, 9.72it/s] 135it [00:13, 9.76it/s] 136it [00:14, 9.70it/s] 137it [00:14, 9.72it/s] 138it [00:14, 9.70it/s] 139it [00:14, 9.70it/s] 140it [00:14, 9.47it/s] 141it [00:14, 9.55it/s] 142it [00:14, 9.58it/s] 143it [00:14, 9.66it/s] 144it [00:14, 9.66it/s] 145it [00:15, 9.63it/s] 146it [00:15, 9.64it/s] 147it [00:15, 9.69it/s] 148it [00:15, 9.70it/s] 149it [00:15, 9.73it/s] 150it [00:15, 9.69it/s]2025-05-26 05:55:05,672 - INFO - [Epoch 029 | Batch 0150] IWAE-loss 9115.5293 | mean log_px -0.0874 | KL -3541.34 + 151it [00:15, 9.33it/s] 152it [00:15, 9.46it/s] 153it [00:15, 9.55it/s] 154it [00:15, 9.60it/s] 155it [00:16, 9.61it/s] 156it [00:16, 9.60it/s] 157it [00:16, 9.66it/s] 158it [00:16, 9.66it/s] 159it [00:16, 9.47it/s] 160it [00:16, 9.52it/s] 161it [00:16, 9.62it/s] 162it [00:16, 9.66it/s] 163it [00:16, 9.67it/s] 164it [00:16, 9.68it/s] 165it [00:17, 9.71it/s] 166it [00:17, 9.68it/s] 167it [00:17, 9.70it/s] 168it [00:17, 9.71it/s] 169it [00:17, 9.73it/s] 170it [00:17, 9.68it/s] 171it [00:17, 9.69it/s] 172it [00:17, 9.62it/s] 173it [00:17, 9.65it/s] 174it [00:18, 9.63it/s] 175it [00:18, 9.65it/s] 176it [00:18, 9.64it/s] 177it [00:18, 9.67it/s] 178it [00:18, 9.65it/s] 179it [00:18, 9.07it/s] 180it [00:18, 9.25it/s] 181it [00:18, 9.36it/s] 182it [00:18, 9.45it/s] 183it [00:18, 9.53it/s] 184it [00:19, 9.57it/s] 185it [00:19, 9.60it/s] 186it [00:19, 9.64it/s] 187it [00:19, 9.65it/s] 188it [00:19, 9.69it/s] 189it [00:19, 9.66it/s] 190it [00:19, 9.64it/s] 191it [00:19, 9.70it/s] 192it [00:19, 9.73it/s] 193it [00:20, 9.75it/s] 194it [00:20, 9.73it/s] 195it [00:20, 9.17it/s] 196it [00:20, 9.40it/s] 196it [00:20, 9.61it/s] +2025-05-26 05:55:10,458 - INFO - Epoch: 29, Objective: tensor([7595.7744], device='cuda:0', grad_fn=), Loss: 0.06281988322734833, KL/n: 72.2783432006836 + 0it [00:00, ?it/s]2025-05-26 05:55:10,737 - INFO - [Epoch 030 | Batch 0000] IWAE-loss 7184.0381 | mean log_px -0.0520 | KL -3540.00 + 1it [00:00, 4.71it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.83it/s] 4it [00:00, 8.47it/s] 5it [00:00, 8.92it/s] 6it [00:00, 9.18it/s] 7it [00:00, 9.35it/s] 8it [00:00, 9.46it/s] 9it [00:01, 9.58it/s] 10it [00:01, 9.60it/s] 11it [00:01, 9.67it/s] 12it [00:01, 9.70it/s] 13it [00:01, 9.70it/s] 14it [00:01, 9.71it/s] 15it [00:01, 9.76it/s] 16it [00:01, 9.75it/s] 17it [00:01, 9.75it/s] 18it [00:01, 9.71it/s] 19it [00:02, 9.14it/s] 20it [00:02, 9.30it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.54it/s] 23it [00:02, 9.61it/s] 24it [00:02, 9.65it/s] 25it [00:02, 9.69it/s] 26it [00:02, 9.69it/s] 27it [00:02, 9.61it/s] 28it [00:03, 9.58it/s] 29it [00:03, 9.67it/s] 30it [00:03, 9.71it/s] 31it [00:03, 9.72it/s] 32it [00:03, 9.71it/s] 33it [00:03, 9.69it/s] 34it [00:03, 9.66it/s] 35it [00:03, 9.71it/s] 36it [00:03, 9.73it/s] 37it [00:03, 9.70it/s] 38it [00:04, 9.10it/s] 39it [00:04, 9.28it/s] 40it [00:04, 9.38it/s] 41it [00:04, 9.49it/s] 42it [00:04, 9.55it/s] 43it [00:04, 9.41it/s] 44it [00:04, 9.47it/s] 45it [00:04, 9.54it/s] 46it [00:04, 9.56it/s] 47it [00:04, 9.62it/s] 48it [00:05, 6.27it/s] 49it [00:05, 7.01it/s] 50it [00:05, 7.63it/s]2025-05-26 05:55:16,152 - INFO - [Epoch 030 | Batch 0050] IWAE-loss 5986.0142 | mean log_px -0.0354 | KL -3537.95 + 51it [00:05, 8.12it/s] 52it [00:05, 8.50it/s] 53it [00:05, 8.84it/s] 54it [00:05, 9.06it/s] 55it [00:06, 8.71it/s] 56it [00:06, 9.00it/s] 57it [00:06, 9.21it/s] 58it [00:06, 9.33it/s] 59it [00:06, 8.90it/s] 60it [00:06, 9.13it/s] 61it [00:06, 9.33it/s] 62it [00:06, 9.46it/s] 63it [00:06, 9.55it/s] 64it [00:06, 9.60it/s] 65it [00:07, 9.66it/s] 66it [00:07, 9.68it/s] 67it [00:07, 9.14it/s] 68it [00:07, 9.32it/s] 69it [00:07, 9.47it/s] 70it [00:07, 9.54it/s] 71it [00:07, 9.62it/s] 72it [00:07, 9.61it/s] 73it [00:07, 9.67it/s] 74it [00:08, 9.08it/s] 75it [00:08, 9.25it/s] 76it [00:08, 9.39it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.55it/s] 79it [00:08, 9.62it/s] 80it [00:08, 9.67it/s] 81it [00:08, 9.70it/s] 82it [00:08, 9.70it/s] 83it [00:08, 9.70it/s] 84it [00:09, 9.70it/s] 85it [00:09, 9.70it/s] 86it [00:09, 9.67it/s] 87it [00:09, 9.68it/s] 88it [00:09, 9.63it/s] 89it [00:09, 9.65it/s] 90it [00:09, 9.68it/s] 91it [00:09, 9.69it/s] 92it [00:09, 9.06it/s] 93it [00:10, 9.21it/s] 94it [00:10, 9.33it/s] 95it [00:10, 9.43it/s] 96it [00:10, 9.51it/s] 97it [00:10, 9.53it/s] 98it [00:10, 9.58it/s] 99it [00:10, 9.63it/s] 100it [00:10, 9.66it/s]2025-05-26 05:55:21,415 - INFO - [Epoch 030 | Batch 0100] IWAE-loss 5398.5059 | mean log_px -0.0280 | KL -3539.20 + 101it [00:10, 9.06it/s] 102it [00:10, 9.20it/s] 103it [00:11, 9.32it/s] 104it [00:11, 9.45it/s] 105it [00:11, 9.56it/s] 106it [00:11, 9.59it/s] 107it [00:11, 9.63it/s] 108it [00:11, 9.67it/s] 109it [00:11, 9.65it/s] 110it [00:11, 9.69it/s] 111it [00:11, 9.72it/s] 112it [00:12, 9.15it/s] 113it [00:12, 9.33it/s] 114it [00:12, 9.44it/s] 115it [00:12, 9.49it/s] 116it [00:12, 9.55it/s] 117it [00:12, 9.60it/s] 118it [00:12, 9.04it/s] 119it [00:12, 9.25it/s] 120it [00:12, 9.40it/s] 121it [00:12, 9.51it/s] 122it [00:13, 9.54it/s] 123it [00:13, 9.59it/s] 124it [00:13, 9.59it/s] 125it [00:13, 9.63it/s] 126it [00:13, 9.65it/s] 127it [00:13, 9.65it/s] 128it [00:13, 9.64it/s] 129it [00:13, 9.58it/s] 130it [00:13, 9.17it/s] 131it [00:14, 8.57it/s] 132it [00:14, 8.85it/s] 133it [00:14, 9.12it/s] 134it [00:14, 9.29it/s] 135it [00:14, 9.40it/s] 136it [00:14, 9.51it/s] 137it [00:14, 9.62it/s] 138it [00:14, 9.67it/s] 139it [00:14, 9.07it/s] 140it [00:15, 9.27it/s] 141it [00:15, 9.38it/s] 142it [00:15, 9.48it/s] 143it [00:15, 8.88it/s] 144it [00:15, 9.09it/s] 145it [00:15, 9.29it/s] 146it [00:15, 9.43it/s] 147it [00:15, 9.54it/s] 148it [00:15, 9.61it/s] 149it [00:15, 9.47it/s] 150it [00:16, 8.75it/s]2025-05-26 05:55:26,777 - INFO - [Epoch 030 | Batch 0150] IWAE-loss 8095.3145 | mean log_px -0.0698 | KL -3535.73 + 151it [00:16, 8.75it/s] 152it [00:16, 8.97it/s] 153it [00:16, 9.15it/s] 154it [00:16, 9.20it/s] 155it [00:16, 9.30it/s] 156it [00:16, 9.37it/s] 157it [00:16, 9.44it/s] 158it [00:16, 9.48it/s] 159it [00:17, 9.52it/s] 160it [00:17, 9.53it/s] 161it [00:17, 9.04it/s] 162it [00:17, 9.19it/s] 163it [00:17, 9.37it/s] 164it [00:17, 9.44it/s] 165it [00:17, 9.49it/s] 166it [00:17, 9.53it/s] 167it [00:17, 9.63it/s] 168it [00:18, 9.04it/s] 169it [00:18, 9.22it/s] 170it [00:18, 9.36it/s] 171it [00:18, 9.50it/s] 172it [00:18, 9.52it/s] 173it [00:18, 9.56it/s] 174it [00:18, 9.59it/s] 175it [00:18, 9.65it/s] 176it [00:18, 9.69it/s] 177it [00:18, 9.68it/s] 178it [00:19, 9.68it/s] 179it [00:19, 9.72it/s] 180it [00:19, 9.68it/s] 181it [00:19, 9.70it/s] 182it [00:19, 9.70it/s] 183it [00:19, 9.37it/s] 184it [00:19, 9.49it/s] 185it [00:19, 9.53it/s] 186it [00:19, 9.09it/s] 187it [00:20, 9.26it/s] 188it [00:20, 9.42it/s] 189it [00:20, 9.50it/s] 190it [00:20, 9.55it/s] 191it [00:20, 9.59it/s] 192it [00:20, 9.61it/s] 193it [00:20, 9.65it/s] 194it [00:20, 9.65it/s] 195it [00:20, 9.13it/s] 196it [00:21, 9.32it/s] +2025-05-26 05:55:31,632 - INFO - Epoch: 30, Objective: tensor([8346.3223], device='cuda:0', grad_fn=), Loss: 0.08652433753013611, KL/n: 72.18109130859375 + 0it [00:00, ?it/s]2025-05-26 05:55:31,881 - INFO - [Epoch 031 | Batch 0000] IWAE-loss 7981.7705 | mean log_px -0.0697 | KL -3537.61 + 1it [00:00, 5.40it/s] 2it [00:00, 7.31it/s] 3it [00:00, 8.22it/s] 4it [00:00, 8.74it/s] 5it [00:00, 9.05it/s] 6it [00:00, 8.77it/s] 7it [00:00, 9.12it/s] 8it [00:00, 9.33it/s] 9it [00:01, 9.41it/s] 10it [00:01, 9.45it/s] 11it [00:01, 9.05it/s] 12it [00:01, 9.25it/s] 13it [00:01, 9.41it/s] 14it [00:01, 9.46it/s] 15it [00:01, 9.56it/s] 16it [00:01, 9.14it/s] 17it [00:01, 9.27it/s] 18it [00:01, 9.37it/s] 19it [00:02, 9.50it/s] 20it [00:02, 9.56it/s] 21it [00:02, 9.66it/s] 22it [00:02, 9.70it/s] 23it [00:02, 9.70it/s] 24it [00:02, 9.72it/s] 25it [00:02, 9.75it/s] 26it [00:02, 9.60it/s] 27it [00:02, 9.61it/s] 28it [00:03, 9.63it/s] 29it [00:03, 9.71it/s] 30it [00:03, 9.71it/s] 31it [00:03, 9.69it/s] 32it [00:03, 9.64it/s] 33it [00:03, 9.69it/s] 34it [00:03, 9.39it/s] 35it [00:03, 9.05it/s] 36it [00:03, 9.21it/s] 37it [00:03, 9.38it/s] 38it [00:04, 9.48it/s] 39it [00:04, 9.57it/s] 40it [00:04, 9.59it/s] 41it [00:04, 9.66it/s] 42it [00:04, 9.69it/s] 43it [00:04, 9.75it/s] 44it [00:04, 9.72it/s] 45it [00:04, 9.72it/s] 46it [00:04, 9.68it/s] 47it [00:05, 9.73it/s] 48it [00:05, 9.71it/s] 49it [00:05, 9.62it/s] 50it [00:05, 9.16it/s]2025-05-26 05:55:37,161 - INFO - [Epoch 031 | Batch 0050] IWAE-loss 7131.4248 | mean log_px -0.0549 | KL -3539.47 + 51it [00:05, 9.21it/s] 52it [00:05, 9.37it/s] 53it [00:05, 9.48it/s] 54it [00:05, 9.51it/s] 55it [00:05, 9.59it/s] 56it [00:05, 9.59it/s] 57it [00:06, 9.63it/s] 58it [00:06, 9.63it/s] 59it [00:06, 9.65it/s] 60it [00:06, 9.64it/s] 61it [00:06, 9.66it/s] 62it [00:06, 9.66it/s] 63it [00:06, 9.68it/s] 64it [00:06, 9.71it/s] 65it [00:06, 9.05it/s] 66it [00:07, 9.23it/s] 67it [00:07, 9.36it/s] 68it [00:07, 9.43it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.55it/s] 71it [00:07, 9.60it/s] 72it [00:07, 9.63it/s] 73it [00:07, 9.69it/s] 74it [00:07, 9.70it/s] 75it [00:07, 9.21it/s] 76it [00:08, 9.34it/s] 77it [00:08, 9.45it/s] 78it [00:08, 9.52it/s] 79it [00:08, 9.59it/s] 80it [00:08, 9.58it/s] 81it [00:08, 9.62it/s] 82it [00:08, 9.61it/s] 83it [00:08, 9.65it/s] 84it [00:08, 9.64it/s] 85it [00:08, 9.64it/s] 86it [00:09, 9.67it/s] 87it [00:09, 9.71it/s] 88it [00:09, 9.71it/s] 89it [00:09, 9.71it/s] 90it [00:09, 9.69it/s] 91it [00:09, 9.71it/s] 92it [00:09, 9.70it/s] 93it [00:09, 9.72it/s] 94it [00:09, 9.70it/s] 95it [00:10, 9.72it/s] 96it [00:10, 9.07it/s] 97it [00:10, 9.27it/s] 98it [00:10, 9.34it/s] 99it [00:10, 9.47it/s] 100it [00:10, 9.56it/s]2025-05-26 05:55:42,388 - INFO - [Epoch 031 | Batch 0100] IWAE-loss 6414.5449 | mean log_px -0.0424 | KL -3538.34 + 101it [00:10, 9.62it/s] 102it [00:10, 9.63it/s] 103it [00:10, 9.65it/s] 104it [00:10, 9.67it/s] 105it [00:11, 9.71it/s] 106it [00:11, 9.71it/s] 107it [00:11, 9.74it/s] 108it [00:11, 9.72it/s] 109it [00:11, 9.74it/s] 110it [00:11, 9.74it/s] 111it [00:11, 9.73it/s] 112it [00:11, 9.70it/s] 113it [00:11, 9.71it/s] 114it [00:12, 9.67it/s] 115it [00:12, 9.69it/s] 116it [00:12, 9.66it/s] 117it [00:12, 9.68it/s] 118it [00:12, 9.70it/s] 119it [00:12, 9.73it/s] 120it [00:12, 9.75it/s] 121it [00:12, 9.71it/s] 122it [00:12, 9.69it/s] 123it [00:12, 9.10it/s] 124it [00:13, 9.27it/s] 125it [00:13, 9.41it/s] 126it [00:13, 9.50it/s] 127it [00:13, 9.59it/s] 128it [00:13, 9.64it/s] 129it [00:13, 9.68it/s] 130it [00:13, 9.70it/s] 131it [00:13, 9.73it/s] 132it [00:13, 9.72it/s] 133it [00:13, 9.70it/s] 134it [00:14, 9.06it/s] 135it [00:14, 9.27it/s] 136it [00:14, 9.39it/s] 137it [00:14, 9.50it/s] 138it [00:14, 9.58it/s] 139it [00:14, 9.62it/s] 140it [00:14, 9.64it/s] 141it [00:14, 9.63it/s] 142it [00:14, 9.65it/s] 143it [00:15, 9.70it/s] 144it [00:15, 9.72it/s] 145it [00:15, 9.72it/s] 146it [00:15, 9.70it/s] 147it [00:15, 9.70it/s] 148it [00:15, 9.70it/s] 149it [00:15, 9.68it/s] 150it [00:15, 9.68it/s]2025-05-26 05:55:47,580 - INFO - [Epoch 031 | Batch 0150] IWAE-loss 7563.3599 | mean log_px -0.0640 | KL -3531.75 + 151it [00:15, 9.70it/s] 152it [00:15, 9.73it/s] 153it [00:16, 9.71it/s] 154it [00:16, 9.68it/s] 155it [00:16, 9.69it/s] 156it [00:16, 9.68it/s] 157it [00:16, 9.69it/s] 158it [00:16, 9.19it/s] 159it [00:16, 9.33it/s] 160it [00:16, 9.41it/s] 161it [00:16, 9.31it/s] 162it [00:17, 8.94it/s] 163it [00:17, 9.17it/s] 164it [00:17, 9.34it/s] 165it [00:17, 9.48it/s] 166it [00:17, 9.55it/s] 167it [00:17, 9.61it/s] 168it [00:17, 9.63it/s] 169it [00:17, 9.63it/s] 170it [00:17, 9.18it/s] 171it [00:17, 9.35it/s] 172it [00:18, 9.47it/s] 173it [00:18, 9.54it/s] 174it [00:18, 9.09it/s] 175it [00:18, 8.84it/s] 176it [00:18, 9.10it/s] 177it [00:18, 9.26it/s] 178it [00:18, 9.28it/s] 179it [00:18, 9.37it/s] 180it [00:18, 9.44it/s] 181it [00:19, 9.52it/s] 182it [00:19, 9.56it/s] 183it [00:19, 9.15it/s] 184it [00:19, 9.29it/s] 185it [00:19, 9.43it/s] 186it [00:19, 9.49it/s] 187it [00:19, 9.11it/s] 188it [00:19, 9.28it/s] 189it [00:19, 9.44it/s] 190it [00:20, 9.49it/s] 191it [00:20, 9.56it/s] 192it [00:20, 9.12it/s] 193it [00:20, 9.29it/s] 194it [00:20, 9.44it/s] 195it [00:20, 8.97it/s] 196it [00:20, 9.26it/s] 196it [00:20, 9.46it/s] +2025-05-26 05:55:52,477 - INFO - Epoch: 31, Objective: tensor([6049.7988], device='cuda:0', grad_fn=), Loss: 0.03925026208162308, KL/n: 72.08685302734375 + 0it [00:00, ?it/s]2025-05-26 05:55:52,758 - INFO - [Epoch 032 | Batch 0000] IWAE-loss 5750.3301 | mean log_px -0.0349 | KL -3535.57 + 1it [00:00, 5.32it/s] 2it [00:00, 7.10it/s] 3it [00:00, 8.10it/s] 4it [00:00, 8.64it/s] 5it [00:00, 9.05it/s] 6it [00:00, 9.28it/s] 7it [00:00, 9.42it/s] 8it [00:00, 9.51it/s] 9it [00:01, 9.58it/s] 10it [00:01, 9.62it/s] 11it [00:01, 9.64it/s] 12it [00:01, 9.64it/s] 13it [00:01, 9.71it/s] 14it [00:01, 9.72it/s] 15it [00:01, 9.74it/s] 16it [00:01, 9.70it/s] 17it [00:01, 9.72it/s] 18it [00:01, 9.70it/s] 19it [00:02, 9.71it/s] 20it [00:02, 9.71it/s] 21it [00:02, 9.71it/s] 22it [00:02, 9.70it/s] 23it [00:02, 9.72it/s] 24it [00:02, 9.68it/s] 25it [00:02, 9.71it/s] 26it [00:02, 9.69it/s] 27it [00:02, 9.73it/s] 28it [00:02, 9.75it/s] 29it [00:03, 9.73it/s] 30it [00:03, 9.74it/s] 31it [00:03, 9.78it/s] 32it [00:03, 9.78it/s] 33it [00:03, 9.81it/s] 34it [00:03, 9.80it/s] 35it [00:03, 9.80it/s] 36it [00:03, 9.77it/s] 37it [00:03, 9.77it/s] 38it [00:03, 9.73it/s] 39it [00:04, 9.72it/s] 40it [00:04, 9.67it/s] 41it [00:04, 9.69it/s] 42it [00:04, 9.69it/s] 43it [00:04, 9.68it/s] 44it [00:04, 9.70it/s] 45it [00:04, 9.70it/s] 46it [00:04, 9.68it/s] 47it [00:04, 9.70it/s] 48it [00:05, 9.69it/s] 49it [00:05, 9.69it/s] 50it [00:05, 9.69it/s]2025-05-26 05:55:58,117 - INFO - [Epoch 032 | Batch 0050] IWAE-loss 5072.8218 | mean log_px -0.0260 | KL -3529.07 + 51it [00:05, 5.80it/s] 52it [00:05, 6.60it/s] 53it [00:05, 7.30it/s] 54it [00:05, 7.88it/s] 55it [00:05, 7.95it/s] 56it [00:06, 8.38it/s] 57it [00:06, 8.69it/s] 58it [00:06, 8.97it/s] 59it [00:06, 9.19it/s] 60it [00:06, 8.79it/s] 61it [00:06, 9.07it/s] 62it [00:06, 9.24it/s] 63it [00:06, 9.36it/s] 64it [00:06, 9.27it/s] 65it [00:07, 9.38it/s] 66it [00:07, 9.32it/s] 67it [00:07, 9.47it/s] 68it [00:07, 9.56it/s] 69it [00:07, 9.62it/s] 70it [00:07, 9.46it/s] 71it [00:07, 9.50it/s] 72it [00:07, 9.52it/s] 73it [00:07, 9.55it/s] 74it [00:08, 9.55it/s] 75it [00:08, 9.58it/s] 76it [00:08, 9.63it/s] 77it [00:08, 9.68it/s] 78it [00:08, 9.68it/s] 79it [00:08, 9.71it/s] 80it [00:08, 9.70it/s] 81it [00:08, 9.68it/s] 82it [00:08, 9.68it/s] 83it [00:08, 9.66it/s] 84it [00:09, 9.68it/s] 85it [00:09, 9.63it/s] 86it [00:09, 9.65it/s] 87it [00:09, 9.66it/s] 88it [00:09, 9.65it/s] 89it [00:09, 9.66it/s] 90it [00:09, 9.65it/s] 91it [00:09, 9.69it/s] 92it [00:09, 9.67it/s] 93it [00:09, 9.70it/s] 94it [00:10, 9.73it/s] 95it [00:10, 9.75it/s] 96it [00:10, 9.73it/s] 97it [00:10, 9.75it/s] 98it [00:10, 9.74it/s] 99it [00:10, 9.75it/s] 100it [00:10, 9.72it/s]2025-05-26 05:56:03,359 - INFO - [Epoch 032 | Batch 0100] IWAE-loss 6324.5918 | mean log_px -0.0521 | KL -3526.06 + 101it [00:10, 9.69it/s] 102it [00:10, 9.45it/s] 103it [00:11, 8.67it/s] 104it [00:11, 8.91it/s] 105it [00:11, 9.13it/s] 106it [00:11, 9.31it/s] 107it [00:11, 9.46it/s] 108it [00:11, 9.53it/s] 109it [00:11, 9.62it/s] 110it [00:11, 9.64it/s] 111it [00:11, 9.70it/s] 112it [00:11, 9.72it/s] 113it [00:12, 9.73it/s] 114it [00:12, 9.71it/s] 115it [00:12, 9.75it/s] 116it [00:12, 9.75it/s] 117it [00:12, 9.74it/s] 118it [00:12, 9.74it/s] 119it [00:12, 9.76it/s] 120it [00:12, 9.78it/s] 121it [00:12, 9.78it/s] 122it [00:12, 9.76it/s] 123it [00:13, 9.16it/s] 124it [00:13, 9.30it/s] 125it [00:13, 9.41it/s] 126it [00:13, 9.47it/s] 127it [00:13, 9.54it/s] 128it [00:13, 9.60it/s] 129it [00:13, 9.65it/s] 130it [00:13, 9.64it/s] 131it [00:13, 9.68it/s] 132it [00:14, 9.11it/s] 133it [00:14, 9.08it/s] 134it [00:14, 9.28it/s] 135it [00:14, 9.40it/s] 136it [00:14, 9.51it/s] 137it [00:14, 9.59it/s] 138it [00:14, 9.60it/s] 139it [00:14, 9.65it/s] 140it [00:14, 9.66it/s] 141it [00:14, 9.67it/s] 142it [00:15, 9.68it/s] 143it [00:15, 9.67it/s] 144it [00:15, 9.43it/s] 145it [00:15, 9.51it/s] 146it [00:15, 9.56it/s] 147it [00:15, 9.59it/s] 148it [00:15, 9.60it/s] 149it [00:15, 9.65it/s] 150it [00:15, 9.67it/s]2025-05-26 05:56:08,608 - INFO - [Epoch 032 | Batch 0150] IWAE-loss 7815.7627 | mean log_px -0.0678 | KL -3526.52 + 151it [00:16, 9.68it/s] 152it [00:16, 9.71it/s] 153it [00:16, 9.74it/s] 154it [00:16, 9.73it/s] 155it [00:16, 9.40it/s] 156it [00:16, 9.49it/s] 157it [00:16, 9.57it/s] 158it [00:16, 9.62it/s] 159it [00:16, 9.63it/s] 160it [00:16, 9.65it/s] 161it [00:17, 9.66it/s] 162it [00:17, 9.68it/s] 163it [00:17, 9.72it/s] 164it [00:17, 9.74it/s] 165it [00:17, 9.72it/s] 166it [00:17, 9.15it/s] 167it [00:17, 9.31it/s] 168it [00:17, 9.42it/s] 169it [00:17, 9.55it/s] 170it [00:18, 9.02it/s] 171it [00:18, 9.26it/s] 172it [00:18, 9.38it/s] 173it [00:18, 9.50it/s] 174it [00:18, 9.57it/s] 175it [00:18, 9.23it/s] 176it [00:18, 9.35it/s] 177it [00:18, 9.48it/s] 178it [00:18, 9.52it/s] 179it [00:18, 9.48it/s] 180it [00:19, 9.50it/s] 181it [00:19, 9.54it/s] 182it [00:19, 9.57it/s] 183it [00:19, 9.65it/s] 184it [00:19, 9.67it/s] 185it [00:19, 9.72it/s] 186it [00:19, 9.73it/s] 187it [00:19, 9.73it/s] 188it [00:19, 9.72it/s] 189it [00:20, 9.70it/s] 190it [00:20, 9.16it/s] 191it [00:20, 9.32it/s] 192it [00:20, 9.46it/s] 193it [00:20, 9.54it/s] 194it [00:20, 9.58it/s] 195it [00:20, 9.09it/s] 196it [00:20, 9.33it/s] 196it [00:20, 9.40it/s] +2025-05-26 05:56:13,453 - INFO - Epoch: 32, Objective: tensor([5291.6196], device='cuda:0', grad_fn=), Loss: 0.03124961443245411, KL/n: 71.98877716064453 + 0it [00:00, ?it/s]2025-05-26 05:56:13,732 - INFO - [Epoch 033 | Batch 0000] IWAE-loss 5486.5654 | mean log_px -0.0308 | KL -3528.38 + 1it [00:00, 5.42it/s] 2it [00:00, 7.37it/s] 3it [00:00, 8.34it/s] 4it [00:00, 8.81it/s] 5it [00:00, 9.07it/s] 6it [00:00, 9.29it/s] 7it [00:00, 9.44it/s] 8it [00:00, 9.53it/s] 9it [00:01, 9.61it/s] 10it [00:01, 9.62it/s] 11it [00:01, 9.66it/s] 12it [00:01, 9.66it/s] 13it [00:01, 9.65it/s] 14it [00:01, 9.66it/s] 15it [00:01, 9.65it/s] 16it [00:01, 9.10it/s] 17it [00:01, 9.29it/s] 18it [00:01, 9.38it/s] 19it [00:02, 9.49it/s] 20it [00:02, 9.59it/s] 21it [00:02, 9.67it/s] 22it [00:02, 9.67it/s] 23it [00:02, 9.71it/s] 24it [00:02, 9.71it/s] 25it [00:02, 9.70it/s] 26it [00:02, 9.68it/s] 27it [00:02, 9.71it/s] 28it [00:02, 9.72it/s] 29it [00:03, 9.71it/s] 30it [00:03, 9.69it/s] 31it [00:03, 9.72it/s] 32it [00:03, 9.72it/s] 33it [00:03, 9.70it/s] 34it [00:03, 9.69it/s] 35it [00:03, 9.69it/s] 36it [00:03, 9.68it/s] 37it [00:03, 9.70it/s] 38it [00:04, 9.65it/s] 39it [00:04, 9.68it/s] 40it [00:04, 9.69it/s] 41it [00:04, 9.68it/s] 42it [00:04, 9.71it/s] 43it [00:04, 9.71it/s] 44it [00:04, 9.68it/s] 45it [00:04, 9.72it/s] 46it [00:04, 9.67it/s] 47it [00:04, 9.69it/s] 48it [00:05, 9.20it/s] 49it [00:05, 9.37it/s] 50it [00:05, 9.49it/s]2025-05-26 05:56:18,921 - INFO - [Epoch 033 | Batch 0050] IWAE-loss 5826.6826 | mean log_px -0.0356 | KL -3525.49 + 51it [00:05, 9.57it/s] 52it [00:05, 9.62it/s] 53it [00:05, 9.63it/s] 54it [00:05, 9.65it/s] 55it [00:05, 9.68it/s] 56it [00:05, 9.72it/s] 57it [00:05, 9.74it/s] 58it [00:06, 9.76it/s] 59it [00:06, 9.78it/s] 60it [00:06, 9.79it/s] 61it [00:06, 9.78it/s] 62it [00:06, 9.69it/s] 63it [00:06, 9.65it/s] 64it [00:06, 9.65it/s] 65it [00:06, 9.66it/s] 66it [00:06, 9.66it/s] 67it [00:07, 9.62it/s] 68it [00:07, 9.62it/s] 69it [00:07, 9.63it/s] 70it [00:07, 9.57it/s] 71it [00:07, 9.62it/s] 72it [00:07, 9.64it/s] 73it [00:07, 9.66it/s] 74it [00:07, 9.68it/s] 75it [00:07, 9.68it/s] 76it [00:07, 9.66it/s] 77it [00:08, 9.66it/s] 78it [00:08, 9.65it/s] 79it [00:08, 9.68it/s] 80it [00:08, 9.69it/s] 81it [00:08, 9.70it/s] 82it [00:08, 9.64it/s] 83it [00:08, 9.67it/s] 84it [00:08, 9.67it/s] 85it [00:08, 9.70it/s] 86it [00:08, 9.71it/s] 87it [00:09, 9.68it/s] 88it [00:09, 9.71it/s] 89it [00:09, 9.76it/s] 90it [00:09, 9.77it/s] 91it [00:09, 9.65it/s] 92it [00:09, 9.61it/s] 93it [00:09, 9.63it/s] 94it [00:09, 9.62it/s] 95it [00:09, 9.67it/s] 96it [00:10, 9.69it/s] 97it [00:10, 9.73it/s] 98it [00:10, 9.72it/s] 99it [00:10, 9.72it/s] 100it [00:10, 9.71it/s]2025-05-26 05:56:24,083 - INFO - [Epoch 033 | Batch 0100] IWAE-loss 7603.5825 | mean log_px -0.0618 | KL -3521.97 + 101it [00:10, 9.72it/s] 102it [00:10, 9.72it/s] 103it [00:10, 9.73it/s] 104it [00:10, 9.72it/s] 105it [00:10, 9.58it/s] 106it [00:11, 9.58it/s] 107it [00:11, 9.61it/s] 108it [00:11, 9.62it/s] 109it [00:11, 9.67it/s] 110it [00:11, 9.67it/s] 111it [00:11, 9.66it/s] 112it [00:11, 9.66it/s] 113it [00:11, 9.69it/s] 114it [00:11, 9.47it/s] 115it [00:11, 9.56it/s] 116it [00:12, 9.61it/s] 117it [00:12, 9.65it/s] 118it [00:12, 9.66it/s] 119it [00:12, 9.69it/s] 120it [00:12, 9.68it/s] 121it [00:12, 9.68it/s] 122it [00:12, 9.71it/s] 123it [00:12, 9.74it/s] 124it [00:12, 9.75it/s] 125it [00:13, 9.76it/s] 126it [00:13, 9.77it/s] 127it [00:13, 9.77it/s] 128it [00:13, 9.74it/s] 129it [00:13, 9.74it/s] 130it [00:13, 9.74it/s] 131it [00:13, 9.77it/s] 132it [00:13, 9.74it/s] 133it [00:13, 9.73it/s] 134it [00:13, 9.71it/s] 135it [00:14, 9.73it/s] 136it [00:14, 9.69it/s] 137it [00:14, 9.68it/s] 138it [00:14, 9.67it/s] 139it [00:14, 9.68it/s] 140it [00:14, 9.69it/s] 141it [00:14, 9.72it/s] 142it [00:14, 9.70it/s] 143it [00:14, 9.25it/s] 144it [00:14, 9.40it/s] 145it [00:15, 9.50it/s] 146it [00:15, 9.55it/s] 147it [00:15, 9.58it/s] 148it [00:15, 9.61it/s] 149it [00:15, 9.64it/s] 150it [00:15, 9.65it/s]2025-05-26 05:56:29,262 - INFO - [Epoch 033 | Batch 0150] IWAE-loss 5245.3364 | mean log_px -0.0273 | KL -3525.40 + 151it [00:15, 9.65it/s] 152it [00:15, 9.03it/s] 153it [00:15, 9.08it/s] 154it [00:16, 9.08it/s] 155it [00:16, 9.19it/s] 156it [00:16, 8.73it/s] 157it [00:16, 8.96it/s] 158it [00:16, 9.11it/s] 159it [00:16, 9.23it/s] 160it [00:16, 9.33it/s] 161it [00:16, 9.40it/s] 162it [00:16, 9.45it/s] 163it [00:17, 9.47it/s] 164it [00:17, 9.48it/s] 165it [00:17, 9.54it/s] 166it [00:17, 9.59it/s] 167it [00:17, 9.65it/s] 168it [00:17, 9.67it/s] 169it [00:17, 9.69it/s] 170it [00:17, 9.67it/s] 171it [00:17, 9.68it/s] 172it [00:17, 9.69it/s] 173it [00:18, 9.41it/s] 174it [00:18, 9.49it/s] 175it [00:18, 9.56it/s] 176it [00:18, 9.61it/s] 177it [00:18, 9.65it/s] 178it [00:18, 9.64it/s] 179it [00:18, 9.69it/s] 180it [00:18, 9.71it/s] 181it [00:18, 9.71it/s] 182it [00:18, 9.71it/s] 183it [00:19, 9.73it/s] 184it [00:19, 9.74it/s] 185it [00:19, 9.75it/s] 186it [00:19, 9.73it/s] 187it [00:19, 9.73it/s] 188it [00:19, 9.73it/s] 189it [00:19, 9.73it/s] 190it [00:19, 9.73it/s] 191it [00:19, 9.27it/s] 192it [00:20, 9.39it/s] 193it [00:20, 9.47it/s] 194it [00:20, 9.54it/s] 195it [00:20, 9.05it/s] 196it [00:20, 9.55it/s] +2025-05-26 05:56:34,117 - INFO - Epoch: 33, Objective: tensor([9180.2832], device='cuda:0', grad_fn=), Loss: 0.08810441941022873, KL/n: 71.89595794677734 + 0it [00:00, ?it/s]2025-05-26 05:56:34,390 - INFO - [Epoch 034 | Batch 0000] IWAE-loss 7107.1201 | mean log_px -0.0598 | KL -3525.40 + 1it [00:00, 5.38it/s] 2it [00:00, 7.21it/s] 3it [00:00, 8.17it/s] 4it [00:00, 8.72it/s] 5it [00:00, 9.10it/s] 6it [00:00, 9.31it/s] 7it [00:00, 9.42it/s] 8it [00:00, 9.46it/s] 9it [00:01, 9.58it/s] 10it [00:01, 9.63it/s] 11it [00:01, 9.66it/s] 12it [00:01, 9.66it/s] 13it [00:01, 9.67it/s] 14it [00:01, 9.66it/s] 15it [00:01, 9.68it/s] 16it [00:01, 9.71it/s] 17it [00:01, 9.73it/s] 18it [00:01, 9.70it/s] 19it [00:02, 9.71it/s] 20it [00:02, 9.71it/s] 21it [00:02, 9.74it/s] 22it [00:02, 9.74it/s] 23it [00:02, 9.75it/s] 24it [00:02, 9.71it/s] 25it [00:02, 9.76it/s] 26it [00:02, 9.77it/s] 27it [00:02, 9.76it/s] 28it [00:02, 9.75it/s] 29it [00:03, 9.75it/s] 30it [00:03, 9.74it/s] 31it [00:03, 9.76it/s] 32it [00:03, 9.53it/s] 33it [00:03, 9.53it/s] 34it [00:03, 9.51it/s] 35it [00:03, 9.48it/s] 36it [00:03, 9.49it/s] 37it [00:03, 9.49it/s] 38it [00:04, 9.48it/s] 39it [00:04, 9.47it/s] 40it [00:04, 9.45it/s] 41it [00:04, 9.47it/s] 42it [00:04, 9.41it/s] 43it [00:04, 9.45it/s] 44it [00:04, 9.38it/s] 45it [00:04, 9.42it/s] 46it [00:04, 9.34it/s] 47it [00:04, 9.40it/s] 48it [00:05, 9.40it/s] 49it [00:05, 9.40it/s] 50it [00:05, 9.47it/s]2025-05-26 05:56:39,602 - INFO - [Epoch 034 | Batch 0050] IWAE-loss 5209.7563 | mean log_px -0.0287 | KL -3518.90 + 51it [00:05, 9.46it/s] 52it [00:05, 9.47it/s] 53it [00:05, 9.46it/s] 54it [00:05, 9.44it/s] 55it [00:05, 9.46it/s] 56it [00:05, 9.49it/s] 57it [00:06, 9.54it/s] 58it [00:06, 9.51it/s] 59it [00:06, 9.52it/s] 60it [00:06, 9.51it/s] 61it [00:06, 9.57it/s] 62it [00:06, 9.31it/s] 63it [00:06, 9.37it/s] 64it [00:06, 9.37it/s] 65it [00:06, 9.44it/s] 66it [00:06, 9.43it/s] 67it [00:07, 9.49it/s] 68it [00:07, 6.24it/s] 69it [00:07, 6.97it/s] 70it [00:07, 7.53it/s] 71it [00:07, 8.05it/s] 72it [00:07, 8.47it/s] 73it [00:07, 8.76it/s] 74it [00:08, 8.93it/s] 75it [00:08, 9.04it/s] 76it [00:08, 9.11it/s] 77it [00:08, 9.21it/s] 78it [00:08, 9.25it/s] 79it [00:08, 9.33it/s] 80it [00:08, 9.33it/s] 81it [00:08, 9.44it/s] 82it [00:08, 9.49it/s] 83it [00:08, 9.54it/s] 84it [00:09, 9.55it/s] 85it [00:09, 9.46it/s] 86it [00:09, 9.43it/s] 87it [00:09, 9.35it/s] 88it [00:09, 9.42it/s] 89it [00:09, 9.46it/s] 90it [00:09, 9.47it/s] 91it [00:09, 9.50it/s] 92it [00:09, 9.46it/s] 93it [00:10, 9.48it/s] 94it [00:10, 9.44it/s] 95it [00:10, 9.45it/s] 96it [00:10, 9.46it/s] 97it [00:10, 9.42it/s] 98it [00:10, 9.46it/s] 99it [00:10, 9.45it/s] 100it [00:10, 9.51it/s]2025-05-26 05:56:45,068 - INFO - [Epoch 034 | Batch 0100] IWAE-loss 6808.0835 | mean log_px -0.0500 | KL -3514.93 + 101it [00:10, 9.43it/s] 102it [00:10, 9.45it/s] 103it [00:11, 9.47it/s] 104it [00:11, 9.50it/s] 105it [00:11, 9.45it/s] 106it [00:11, 9.43it/s] 107it [00:11, 9.40it/s] 108it [00:11, 9.23it/s] 109it [00:11, 9.33it/s] 110it [00:11, 9.39it/s] 111it [00:11, 9.36it/s] 112it [00:12, 9.39it/s] 113it [00:12, 9.42it/s] 114it [00:12, 9.44it/s] 115it [00:12, 9.50it/s] 116it [00:12, 9.08it/s] 117it [00:12, 9.19it/s] 118it [00:12, 9.24it/s] 119it [00:12, 9.33it/s] 120it [00:12, 9.36it/s] 121it [00:12, 9.41it/s] 122it [00:13, 9.40it/s] 123it [00:13, 9.37it/s] 124it [00:13, 8.90it/s] 125it [00:13, 9.00it/s] 126it [00:13, 9.07it/s] 127it [00:13, 9.20it/s] 128it [00:13, 9.29it/s] 129it [00:13, 9.39it/s] 130it [00:13, 9.42it/s] 131it [00:14, 9.45it/s] 132it [00:14, 9.45it/s] 133it [00:14, 9.50it/s] 134it [00:14, 8.94it/s] 135it [00:14, 9.06it/s] 136it [00:14, 9.15it/s] 137it [00:14, 9.30it/s] 138it [00:14, 8.94it/s] 139it [00:14, 9.08it/s] 140it [00:15, 9.18it/s] 141it [00:15, 9.26it/s] 142it [00:15, 8.79it/s] 143it [00:15, 8.95it/s] 144it [00:15, 9.11it/s] 145it [00:15, 9.26it/s] 146it [00:15, 9.31it/s] 147it [00:15, 8.70it/s] 148it [00:15, 8.89it/s] 149it [00:16, 9.06it/s] 150it [00:16, 9.14it/s]2025-05-26 05:56:50,487 - INFO - [Epoch 034 | Batch 0150] IWAE-loss 7905.4756 | mean log_px -0.0700 | KL -3521.38 + 151it [00:16, 9.27it/s] 152it [00:16, 9.40it/s] 153it [00:16, 9.02it/s] 154it [00:16, 9.23it/s] 155it [00:16, 9.41it/s] 156it [00:16, 9.53it/s] 157it [00:16, 9.63it/s] 158it [00:17, 9.67it/s] 159it [00:17, 9.71it/s] 160it [00:17, 9.73it/s] 161it [00:17, 9.75it/s] 162it [00:17, 9.28it/s] 163it [00:17, 9.43it/s] 164it [00:17, 9.54it/s] 165it [00:17, 9.62it/s] 166it [00:17, 9.64it/s] 167it [00:17, 9.66it/s] 168it [00:18, 9.68it/s] 169it [00:18, 9.71it/s] 170it [00:18, 9.74it/s] 171it [00:18, 9.74it/s] 172it [00:18, 9.14it/s] 173it [00:18, 9.29it/s] 174it [00:18, 9.44it/s] 175it [00:18, 9.57it/s] 176it [00:18, 9.65it/s] 177it [00:18, 9.72it/s] 178it [00:19, 9.68it/s] 179it [00:19, 9.72it/s] 180it [00:19, 9.74it/s] 181it [00:19, 9.76it/s] 182it [00:19, 9.78it/s] 183it [00:19, 9.79it/s] 184it [00:19, 9.75it/s] 185it [00:19, 9.78it/s] 186it [00:19, 9.79it/s] 187it [00:20, 9.82it/s] 188it [00:20, 9.75it/s] 189it [00:20, 9.74it/s] 190it [00:20, 9.78it/s] 191it [00:20, 9.14it/s] 192it [00:20, 9.32it/s] 193it [00:20, 9.44it/s] 194it [00:20, 9.53it/s] 195it [00:20, 9.02it/s] 196it [00:21, 8.86it/s] 196it [00:21, 9.30it/s] +2025-05-26 05:56:55,316 - INFO - Epoch: 34, Objective: tensor([7032.6973], device='cuda:0', grad_fn=), Loss: 0.05743390694260597, KL/n: 71.76044464111328 + 0it [00:00, ?it/s]2025-05-26 05:56:55,592 - INFO - [Epoch 035 | Batch 0000] IWAE-loss 5518.7554 | mean log_px -0.0321 | KL -3518.21 + 1it [00:00, 5.39it/s] 2it [00:00, 7.23it/s] 3it [00:00, 8.20it/s] 4it [00:00, 8.75it/s] 5it [00:00, 9.08it/s] 6it [00:00, 9.28it/s] 7it [00:00, 9.43it/s] 8it [00:00, 9.52it/s] 9it [00:01, 9.61it/s] 10it [00:01, 9.65it/s] 11it [00:01, 9.65it/s] 12it [00:01, 9.68it/s] 13it [00:01, 9.69it/s] 14it [00:01, 9.71it/s] 15it [00:01, 9.75it/s] 16it [00:01, 9.60it/s] 17it [00:01, 9.62it/s] 18it [00:01, 9.66it/s] 19it [00:02, 9.70it/s] 20it [00:02, 9.71it/s] 21it [00:02, 9.73it/s] 22it [00:02, 9.72it/s] 23it [00:02, 9.77it/s] 24it [00:02, 9.76it/s] 25it [00:02, 9.75it/s] 26it [00:02, 9.76it/s] 27it [00:02, 9.77it/s] 28it [00:02, 9.73it/s] 29it [00:03, 9.74it/s] 30it [00:03, 9.73it/s] 31it [00:03, 9.72it/s] 32it [00:03, 9.72it/s] 33it [00:03, 9.74it/s] 34it [00:03, 9.74it/s] 35it [00:03, 9.77it/s] 36it [00:03, 9.75it/s] 37it [00:03, 9.76it/s] 38it [00:03, 9.71it/s] 39it [00:04, 9.73it/s] 40it [00:04, 9.72it/s] 41it [00:04, 9.72it/s] 42it [00:04, 9.71it/s] 43it [00:04, 9.71it/s] 44it [00:04, 9.71it/s] 45it [00:04, 9.71it/s] 46it [00:04, 9.43it/s] 47it [00:04, 9.55it/s] 48it [00:05, 9.56it/s] 49it [00:05, 9.61it/s] 50it [00:05, 9.61it/s]2025-05-26 05:57:00,751 - INFO - [Epoch 035 | Batch 0050] IWAE-loss 10205.3838 | mean log_px -0.0955 | KL -3515.78 + 51it [00:05, 9.35it/s] 52it [00:05, 9.26it/s] 53it [00:05, 9.27it/s] 54it [00:05, 9.46it/s] 56it [00:05, 9.72it/s] 58it [00:06, 9.86it/s] 60it [00:06, 9.89it/s] 61it [00:06, 9.91it/s] 62it [00:06, 9.92it/s] 63it [00:06, 9.87it/s] 64it [00:06, 9.87it/s] 65it [00:06, 9.86it/s] 66it [00:06, 9.87it/s] 67it [00:06, 9.89it/s] 68it [00:07, 9.87it/s] 69it [00:07, 9.88it/s] 70it [00:07, 9.89it/s] 71it [00:07, 9.90it/s] 72it [00:07, 9.87it/s] 73it [00:07, 9.89it/s] 74it [00:07, 9.91it/s] 75it [00:07, 9.93it/s] 76it [00:07, 9.94it/s] 77it [00:07, 9.93it/s] 78it [00:08, 9.91it/s] 79it [00:08, 9.92it/s] 80it [00:08, 9.93it/s] 81it [00:08, 9.92it/s] 82it [00:08, 9.92it/s] 83it [00:08, 9.93it/s] 84it [00:08, 9.31it/s] 86it [00:08, 9.62it/s] 87it [00:09, 9.70it/s] 88it [00:09, 9.74it/s] 89it [00:09, 9.68it/s] 90it [00:09, 9.68it/s] 91it [00:09, 9.69it/s] 92it [00:09, 9.69it/s] 93it [00:09, 9.62it/s] 94it [00:09, 9.62it/s] 95it [00:09, 9.68it/s] 96it [00:09, 9.69it/s] 97it [00:10, 9.69it/s] 98it [00:10, 9.66it/s] 99it [00:10, 9.05it/s] 100it [00:10, 9.23it/s]2025-05-26 05:57:05,894 - INFO - [Epoch 035 | Batch 0100] IWAE-loss 7475.6548 | mean log_px -0.0570 | KL -3514.94 + 101it [00:10, 9.39it/s] 102it [00:10, 9.54it/s] 103it [00:10, 9.63it/s] 104it [00:10, 9.70it/s] 105it [00:10, 9.77it/s] 106it [00:10, 9.83it/s] 107it [00:11, 9.88it/s] 108it [00:11, 9.87it/s] 110it [00:11, 9.95it/s] 111it [00:11, 9.42it/s] 112it [00:11, 9.55it/s] 113it [00:11, 9.66it/s] 114it [00:11, 9.73it/s] 115it [00:11, 9.76it/s] 116it [00:12, 9.80it/s] 117it [00:12, 9.84it/s] 118it [00:12, 9.87it/s] 119it [00:12, 9.89it/s] 120it [00:12, 9.90it/s] 121it [00:12, 9.93it/s] 122it [00:12, 9.93it/s] 123it [00:12, 9.31it/s] 124it [00:12, 9.45it/s] 125it [00:12, 9.57it/s] 126it [00:13, 8.89it/s] 127it [00:13, 9.15it/s] 128it [00:13, 9.36it/s] 129it [00:13, 8.91it/s] 130it [00:13, 9.21it/s] 131it [00:13, 9.42it/s] 132it [00:13, 9.57it/s] 134it [00:13, 9.74it/s] 136it [00:14, 9.84it/s] 138it [00:14, 9.90it/s] 139it [00:14, 9.44it/s] 140it [00:14, 9.54it/s] 141it [00:14, 9.64it/s] 142it [00:14, 9.27it/s] 144it [00:14, 9.57it/s] 145it [00:15, 9.63it/s] 146it [00:15, 9.69it/s] 147it [00:15, 9.74it/s] 148it [00:15, 9.43it/s] 150it [00:15, 9.67it/s]2025-05-26 05:57:11,084 - INFO - [Epoch 035 | Batch 0150] IWAE-loss 5995.6523 | mean log_px -0.0361 | KL -3514.44 + 151it [00:15, 9.74it/s] 152it [00:15, 9.76it/s] 153it [00:15, 9.81it/s] 154it [00:15, 9.85it/s] 155it [00:16, 9.86it/s] 156it [00:16, 9.88it/s] 157it [00:16, 9.89it/s] 158it [00:16, 9.88it/s] 160it [00:16, 9.95it/s] 161it [00:16, 9.41it/s] 162it [00:16, 9.51it/s] 163it [00:16, 9.53it/s] 164it [00:17, 9.62it/s] 165it [00:17, 9.67it/s] 166it [00:17, 9.66it/s] 167it [00:17, 9.74it/s] 168it [00:17, 9.78it/s] 170it [00:17, 9.90it/s] 172it [00:17, 9.96it/s] 173it [00:17, 9.95it/s] 174it [00:18, 9.93it/s] 176it [00:18, 9.97it/s] 178it [00:18, 9.96it/s] 179it [00:18, 9.95it/s] 180it [00:18, 9.96it/s] 181it [00:18, 9.43it/s] 183it [00:18, 9.68it/s] 184it [00:19, 9.74it/s] 185it [00:19, 9.79it/s] 186it [00:19, 9.72it/s] 188it [00:19, 9.61it/s] 189it [00:19, 8.93it/s] 190it [00:19, 8.78it/s] 191it [00:19, 8.98it/s] 192it [00:19, 9.23it/s] 193it [00:20, 9.04it/s] 195it [00:20, 9.10it/s] 196it [00:20, 8.89it/s] 196it [00:20, 9.59it/s] +2025-05-26 05:57:15,887 - INFO - Epoch: 35, Objective: tensor([5837.2930], device='cuda:0', grad_fn=), Loss: 0.03758452087640762, KL/n: 71.64217376708984 + 0it [00:00, ?it/s]2025-05-26 05:57:16,170 - INFO - [Epoch 036 | Batch 0000] IWAE-loss 5874.6455 | mean log_px -0.0372 | KL -3509.21 + 1it [00:00, 5.40it/s] 2it [00:00, 7.30it/s] 3it [00:00, 8.32it/s] 4it [00:00, 8.88it/s] 6it [00:00, 9.45it/s] 8it [00:00, 9.66it/s] 10it [00:01, 9.81it/s] 12it [00:01, 9.91it/s] 13it [00:01, 9.91it/s] 14it [00:01, 9.93it/s] 16it [00:01, 9.99it/s] 18it [00:01, 10.02it/s] 20it [00:02, 9.95it/s] 21it [00:02, 9.91it/s] 22it [00:02, 9.92it/s] 24it [00:02, 9.48it/s] 26it [00:02, 9.66it/s] 27it [00:02, 9.71it/s] 28it [00:02, 9.73it/s] 30it [00:03, 9.84it/s] 31it [00:03, 9.86it/s] 32it [00:03, 9.86it/s] 34it [00:03, 9.93it/s] 36it [00:03, 9.96it/s] 37it [00:03, 9.83it/s] 38it [00:03, 9.82it/s] 39it [00:04, 9.84it/s] 40it [00:04, 9.26it/s] 41it [00:04, 9.43it/s] 43it [00:04, 9.67it/s] 44it [00:04, 9.72it/s] 45it [00:04, 9.77it/s] 46it [00:04, 9.78it/s] 48it [00:04, 9.88it/s] 49it [00:05, 9.90it/s] 50it [00:05, 9.91it/s]2025-05-26 05:57:21,250 - INFO - [Epoch 036 | Batch 0050] IWAE-loss 5224.4829 | mean log_px -0.0283 | KL -3501.39 + 51it [00:05, 9.92it/s] 52it [00:05, 9.93it/s] 54it [00:05, 9.96it/s] 55it [00:05, 9.96it/s] 56it [00:05, 9.96it/s] 58it [00:05, 9.98it/s] 59it [00:06, 9.97it/s] 60it [00:06, 9.39it/s] 61it [00:06, 9.54it/s] 62it [00:06, 6.49it/s] 63it [00:06, 7.18it/s] 64it [00:06, 7.79it/s] 65it [00:06, 8.31it/s] 66it [00:06, 8.70it/s] 67it [00:07, 9.02it/s] 68it [00:07, 9.29it/s] 70it [00:07, 9.61it/s] 71it [00:07, 9.70it/s] 72it [00:07, 9.75it/s] 73it [00:07, 9.80it/s] 74it [00:07, 9.83it/s] 75it [00:07, 9.88it/s] 76it [00:07, 9.89it/s] 77it [00:08, 9.91it/s] 78it [00:08, 9.91it/s] 80it [00:08, 9.95it/s] 82it [00:08, 9.95it/s] 84it [00:08, 9.98it/s] 86it [00:08, 9.99it/s] 87it [00:09, 9.98it/s] 88it [00:09, 9.98it/s] 89it [00:09, 9.98it/s] 90it [00:09, 9.96it/s] 92it [00:09, 9.98it/s] 93it [00:09, 9.98it/s] 94it [00:09, 9.98it/s] 95it [00:09, 9.96it/s] 96it [00:09, 9.95it/s] 98it [00:10, 9.99it/s] 99it [00:10, 9.98it/s] 100it [00:10, 9.98it/s]2025-05-26 05:57:26,478 - INFO - [Epoch 036 | Batch 0100] IWAE-loss 8589.2041 | mean log_px -0.0804 | KL -3509.35 + 101it [00:10, 9.98it/s] 102it [00:10, 9.97it/s] 103it [00:10, 9.95it/s] 104it [00:10, 9.96it/s] 105it [00:10, 9.97it/s] 106it [00:10, 9.95it/s] 107it [00:11, 9.95it/s] 108it [00:11, 9.92it/s] 109it [00:11, 9.82it/s] 110it [00:11, 9.79it/s] 111it [00:11, 9.66it/s] 112it [00:11, 9.66it/s] 113it [00:11, 9.70it/s] 114it [00:11, 9.74it/s] 115it [00:11, 9.79it/s] 116it [00:12, 9.80it/s] 117it [00:12, 9.18it/s] 118it [00:12, 9.37it/s] 119it [00:12, 9.51it/s] 120it [00:12, 9.58it/s] 121it [00:12, 8.98it/s] 122it [00:12, 9.22it/s] 123it [00:12, 9.41it/s] 124it [00:12, 9.54it/s] 125it [00:12, 9.65it/s] 126it [00:13, 9.70it/s] 127it [00:13, 9.75it/s] 128it [00:13, 9.78it/s] 129it [00:13, 9.82it/s] 130it [00:13, 9.84it/s] 131it [00:13, 9.33it/s] 132it [00:13, 9.47it/s] 133it [00:13, 9.60it/s] 134it [00:13, 9.68it/s] 135it [00:14, 9.74it/s] 136it [00:14, 9.65it/s] 137it [00:14, 9.61it/s] 138it [00:14, 9.61it/s] 139it [00:14, 9.67it/s] 140it [00:14, 9.73it/s] 141it [00:14, 9.77it/s] 142it [00:14, 9.12it/s] 143it [00:14, 9.35it/s] 144it [00:14, 9.50it/s] 145it [00:15, 9.62it/s] 146it [00:15, 9.54it/s] 147it [00:15, 9.65it/s] 148it [00:15, 9.63it/s] 149it [00:15, 9.69it/s] 150it [00:15, 9.72it/s]2025-05-26 05:57:31,668 - INFO - [Epoch 036 | Batch 0150] IWAE-loss 5136.7231 | mean log_px -0.0261 | KL -3499.86 + 151it [00:15, 9.13it/s] 152it [00:15, 9.32it/s] 153it [00:15, 9.47it/s] 154it [00:16, 9.56it/s] 155it [00:16, 9.04it/s] 156it [00:16, 8.81it/s] 157it [00:16, 8.67it/s] 158it [00:16, 8.83it/s] 159it [00:16, 9.01it/s] 160it [00:16, 8.73it/s] 161it [00:16, 8.93it/s] 162it [00:16, 9.03it/s] 163it [00:17, 9.14it/s] 164it [00:17, 9.25it/s] 165it [00:17, 9.26it/s] 166it [00:17, 9.29it/s] 167it [00:17, 9.30it/s] 168it [00:17, 9.32it/s] 169it [00:17, 9.35it/s] 170it [00:17, 9.34it/s] 171it [00:17, 9.27it/s] 172it [00:17, 9.26it/s] 173it [00:18, 9.33it/s] 174it [00:18, 9.40it/s] 175it [00:18, 9.39it/s] 176it [00:18, 9.35it/s] 177it [00:18, 9.38it/s] 178it [00:18, 8.88it/s] 179it [00:18, 9.01it/s] 180it [00:18, 9.15it/s] 181it [00:18, 9.16it/s] 182it [00:19, 9.21it/s] 183it [00:19, 9.27it/s] 184it [00:19, 9.27it/s] 185it [00:19, 9.33it/s] 186it [00:19, 9.37it/s] 187it [00:19, 9.37it/s] 188it [00:19, 9.38it/s] 189it [00:19, 9.48it/s] 190it [00:19, 8.96it/s] 191it [00:20, 9.08it/s] 192it [00:20, 9.18it/s] 193it [00:20, 9.25it/s] 194it [00:20, 9.30it/s] 195it [00:20, 8.78it/s] 196it [00:20, 8.59it/s] 196it [00:20, 9.47it/s] +2025-05-26 05:57:36,718 - INFO - Epoch: 36, Objective: tensor([6148.1465], device='cuda:0', grad_fn=), Loss: 0.04331137239933014, KL/n: 71.53656005859375 + 0it [00:00, ?it/s]2025-05-26 05:57:36,998 - INFO - [Epoch 037 | Batch 0000] IWAE-loss 5157.5024 | mean log_px -0.0263 | KL -3506.90 + 1it [00:00, 5.41it/s] 2it [00:00, 7.28it/s] 3it [00:00, 8.21it/s] 4it [00:00, 8.71it/s] 5it [00:00, 9.05it/s] 6it [00:00, 9.25it/s] 7it [00:00, 9.37it/s] 8it [00:00, 9.40it/s] 9it [00:01, 9.50it/s] 10it [00:01, 9.46it/s] 11it [00:01, 9.50it/s] 12it [00:01, 9.49it/s] 13it [00:01, 9.52it/s] 14it [00:01, 9.51it/s] 15it [00:01, 9.51it/s] 16it [00:01, 9.49it/s] 17it [00:01, 9.45it/s] 18it [00:01, 9.48it/s] 19it [00:02, 9.50it/s] 20it [00:02, 9.49it/s] 21it [00:02, 9.49it/s] 22it [00:02, 9.48it/s] 23it [00:02, 9.53it/s] 24it [00:02, 9.51it/s] 25it [00:02, 9.51it/s] 26it [00:02, 9.30it/s] 27it [00:02, 9.42it/s] 28it [00:03, 9.46it/s] 29it [00:03, 9.47it/s] 30it [00:03, 8.99it/s] 31it [00:03, 9.11it/s] 32it [00:03, 9.19it/s] 33it [00:03, 9.27it/s] 34it [00:03, 9.35it/s] 35it [00:03, 9.45it/s] 36it [00:03, 9.47it/s] 37it [00:03, 9.50it/s] 38it [00:04, 9.52it/s] 39it [00:04, 9.43it/s] 40it [00:04, 9.46it/s] 41it [00:04, 9.00it/s] 42it [00:04, 9.15it/s] 43it [00:04, 9.26it/s] 44it [00:04, 9.30it/s] 45it [00:04, 9.36it/s] 46it [00:04, 9.41it/s] 47it [00:05, 9.48it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.47it/s] 50it [00:05, 9.48it/s]2025-05-26 05:57:42,294 - INFO - [Epoch 037 | Batch 0050] IWAE-loss 6418.6987 | mean log_px -0.0469 | KL -3502.43 + 51it [00:05, 9.46it/s] 52it [00:05, 9.48it/s] 53it [00:05, 9.51it/s] 54it [00:05, 8.95it/s] 55it [00:05, 9.13it/s] 56it [00:06, 9.27it/s] 57it [00:06, 9.39it/s] 58it [00:06, 9.42it/s] 59it [00:06, 9.45it/s] 60it [00:06, 9.46it/s] 61it [00:06, 9.49it/s] 62it [00:06, 9.49it/s] 63it [00:06, 9.52it/s] 64it [00:06, 9.53it/s] 65it [00:06, 9.51it/s] 66it [00:07, 9.51it/s] 67it [00:07, 9.52it/s] 68it [00:07, 9.56it/s] 69it [00:07, 9.58it/s] 70it [00:07, 9.56it/s] 71it [00:07, 9.54it/s] 72it [00:07, 9.41it/s] 73it [00:07, 9.45it/s] 74it [00:07, 9.48it/s] 75it [00:08, 9.47it/s] 76it [00:08, 9.47it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.51it/s] 79it [00:08, 9.56it/s] 80it [00:08, 9.52it/s] 81it [00:08, 9.49it/s] 82it [00:08, 9.13it/s] 83it [00:08, 9.24it/s] 84it [00:08, 9.27it/s] 85it [00:09, 9.36it/s] 86it [00:09, 9.35it/s] 87it [00:09, 9.38it/s] 88it [00:09, 9.39it/s] 89it [00:09, 9.44it/s] 90it [00:09, 9.47it/s] 91it [00:09, 9.51it/s] 92it [00:09, 9.01it/s] 93it [00:09, 9.19it/s] 94it [00:10, 9.26it/s] 95it [00:10, 9.33it/s] 96it [00:10, 9.38it/s] 97it [00:10, 9.45it/s] 98it [00:10, 9.46it/s] 99it [00:10, 9.49it/s] 100it [00:10, 9.51it/s]2025-05-26 05:57:47,604 - INFO - [Epoch 037 | Batch 0100] IWAE-loss 5038.2764 | mean log_px -0.0247 | KL -3498.83 + 101it [00:10, 9.53it/s] 102it [00:10, 9.53it/s] 103it [00:11, 9.52it/s] 104it [00:11, 9.47it/s] 105it [00:11, 9.48it/s] 106it [00:11, 8.98it/s] 107it [00:11, 9.19it/s] 108it [00:11, 9.29it/s] 109it [00:11, 9.36it/s] 110it [00:11, 9.40it/s] 111it [00:11, 9.08it/s] 112it [00:11, 9.18it/s] 113it [00:12, 9.33it/s] 114it [00:12, 9.37it/s] 115it [00:12, 9.46it/s] 116it [00:12, 9.46it/s] 117it [00:12, 9.48it/s] 118it [00:12, 9.49it/s] 119it [00:12, 9.47it/s] 120it [00:12, 9.44it/s] 121it [00:12, 9.47it/s] 122it [00:13, 9.49it/s] 123it [00:13, 9.50it/s] 124it [00:13, 9.31it/s] 125it [00:13, 9.35it/s] 126it [00:13, 9.36it/s] 127it [00:13, 9.41it/s] 128it [00:13, 9.38it/s] 129it [00:13, 9.44it/s] 130it [00:13, 9.44it/s] 131it [00:13, 9.49it/s] 132it [00:14, 9.46it/s] 133it [00:14, 9.49it/s] 134it [00:14, 9.51it/s] 135it [00:14, 9.52it/s] 136it [00:14, 9.54it/s] 137it [00:14, 9.02it/s] 138it [00:14, 9.15it/s] 139it [00:14, 9.27it/s] 140it [00:14, 9.33it/s] 141it [00:15, 9.39it/s] 142it [00:15, 9.44it/s] 143it [00:15, 9.46it/s] 144it [00:15, 9.10it/s] 145it [00:15, 9.23it/s] 146it [00:15, 9.29it/s] 147it [00:15, 9.37it/s] 148it [00:15, 9.08it/s] 149it [00:15, 9.24it/s] 150it [00:16, 9.36it/s]2025-05-26 05:57:52,946 - INFO - [Epoch 037 | Batch 0150] IWAE-loss 6093.8408 | mean log_px -0.0371 | KL -3496.12 + 151it [00:16, 9.44it/s] 152it [00:16, 9.52it/s] 153it [00:16, 9.52it/s] 154it [00:16, 9.50it/s] 155it [00:16, 9.55it/s] 156it [00:16, 9.54it/s] 157it [00:16, 9.58it/s] 158it [00:16, 9.54it/s] 159it [00:16, 9.59it/s] 160it [00:17, 9.57it/s] 161it [00:17, 9.50it/s] 162it [00:17, 9.41it/s] 163it [00:17, 9.41it/s] 164it [00:17, 9.37it/s] 165it [00:17, 9.41it/s] 166it [00:17, 9.46it/s] 167it [00:17, 9.54it/s] 168it [00:17, 9.59it/s] 169it [00:18, 9.64it/s] 170it [00:18, 9.59it/s] 171it [00:18, 9.57it/s] 172it [00:18, 9.56it/s] 173it [00:18, 9.57it/s] 174it [00:18, 9.55it/s] 175it [00:18, 9.59it/s] 176it [00:18, 9.56it/s] 177it [00:18, 9.52it/s] 178it [00:18, 9.53it/s] 179it [00:19, 9.52it/s] 180it [00:19, 9.53it/s] 181it [00:19, 9.54it/s] 182it [00:19, 9.54it/s] 183it [00:19, 9.57it/s] 184it [00:19, 9.53it/s] 185it [00:19, 9.54it/s] 186it [00:19, 9.56it/s] 187it [00:19, 9.59it/s] 188it [00:20, 9.58it/s] 189it [00:20, 9.56it/s] 190it [00:20, 9.59it/s] 191it [00:20, 9.55it/s] 192it [00:20, 9.51it/s] 193it [00:20, 9.48it/s] 194it [00:20, 9.49it/s] 195it [00:20, 8.84it/s] 196it [00:20, 9.11it/s] 196it [00:20, 9.36it/s] +2025-05-26 05:57:57,790 - INFO - Epoch: 37, Objective: tensor([7495.4062], device='cuda:0', grad_fn=), Loss: 0.06337570399045944, KL/n: 71.414794921875 + 0it [00:00, ?it/s]2025-05-26 05:57:58,045 - INFO - [Epoch 038 | Batch 0000] IWAE-loss 8049.1758 | mean log_px -0.0730 | KL -3499.70 + 1it [00:00, 6.12it/s] 2it [00:00, 7.80it/s] 3it [00:00, 8.62it/s] 4it [00:00, 8.96it/s] 5it [00:00, 9.24it/s] 6it [00:00, 9.31it/s] 7it [00:00, 9.39it/s] 8it [00:00, 9.46it/s] 9it [00:00, 9.54it/s] 10it [00:01, 9.56it/s] 11it [00:01, 9.60it/s] 12it [00:01, 9.60it/s] 13it [00:01, 9.65it/s] 14it [00:01, 9.61it/s] 15it [00:01, 9.62it/s] 16it [00:01, 9.58it/s] 17it [00:01, 9.53it/s] 18it [00:01, 9.56it/s] 19it [00:02, 9.61it/s] 20it [00:02, 9.39it/s] 21it [00:02, 9.39it/s] 22it [00:02, 9.47it/s] 23it [00:02, 9.48it/s] 24it [00:02, 9.50it/s] 25it [00:02, 9.42it/s] 26it [00:02, 9.38it/s] 27it [00:02, 9.43it/s] 28it [00:02, 9.48it/s] 29it [00:03, 9.51it/s] 30it [00:03, 9.51it/s] 31it [00:03, 9.53it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.54it/s] 34it [00:03, 9.55it/s] 35it [00:03, 9.46it/s] 36it [00:03, 9.43it/s] 37it [00:03, 9.46it/s] 38it [00:04, 9.48it/s] 39it [00:04, 9.48it/s] 40it [00:04, 9.40it/s] 41it [00:04, 9.46it/s] 42it [00:04, 9.52it/s] 43it [00:04, 9.54it/s] 44it [00:04, 9.55it/s] 45it [00:04, 9.54it/s] 46it [00:04, 9.54it/s] 47it [00:04, 9.54it/s] 48it [00:05, 9.56it/s] 49it [00:05, 9.52it/s] 50it [00:05, 9.50it/s]2025-05-26 05:58:03,290 - INFO - [Epoch 038 | Batch 0050] IWAE-loss 5952.2158 | mean log_px -0.0410 | KL -3503.08 + 51it [00:05, 5.96it/s] 52it [00:05, 6.62it/s] 53it [00:05, 7.16it/s] 54it [00:05, 7.46it/s] 55it [00:06, 7.98it/s] 56it [00:06, 8.37it/s] 57it [00:06, 8.68it/s] 58it [00:06, 8.89it/s] 59it [00:06, 9.02it/s] 60it [00:06, 9.15it/s] 61it [00:06, 9.22it/s] 62it [00:06, 9.29it/s] 63it [00:06, 9.26it/s] 64it [00:07, 9.08it/s] 65it [00:07, 9.10it/s] 66it [00:07, 9.17it/s] 67it [00:07, 8.68it/s] 68it [00:07, 8.84it/s] 69it [00:07, 8.94it/s] 70it [00:07, 8.97it/s] 71it [00:07, 9.13it/s] 72it [00:07, 9.17it/s] 73it [00:08, 9.28it/s] 74it [00:08, 9.38it/s] 75it [00:08, 9.45it/s] 76it [00:08, 9.46it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.48it/s] 79it [00:08, 9.51it/s] 80it [00:08, 9.52it/s] 81it [00:08, 9.50it/s] 82it [00:08, 9.06it/s] 83it [00:09, 9.23it/s] 84it [00:09, 9.34it/s] 85it [00:09, 9.37it/s] 86it [00:09, 9.41it/s] 87it [00:09, 9.45it/s] 88it [00:09, 9.48it/s] 89it [00:09, 9.49it/s] 90it [00:09, 9.46it/s] 91it [00:09, 9.49it/s] 92it [00:10, 9.47it/s] 93it [00:10, 9.48it/s] 94it [00:10, 9.43it/s] 95it [00:10, 9.45it/s] 96it [00:10, 9.48it/s] 97it [00:10, 9.47it/s] 98it [00:10, 9.49it/s] 99it [00:10, 9.46it/s] 100it [00:10, 9.44it/s]2025-05-26 05:58:08,872 - INFO - [Epoch 038 | Batch 0100] IWAE-loss 7382.7646 | mean log_px -0.0584 | KL -3494.08 + 101it [00:10, 9.48it/s] 102it [00:11, 9.46it/s] 103it [00:11, 9.50it/s] 104it [00:11, 9.48it/s] 105it [00:11, 9.51it/s] 106it [00:11, 9.55it/s] 107it [00:11, 9.53it/s] 108it [00:11, 9.48it/s] 109it [00:11, 9.46it/s] 110it [00:11, 9.47it/s] 111it [00:12, 9.45it/s] 112it [00:12, 9.47it/s] 113it [00:12, 9.12it/s] 114it [00:12, 9.20it/s] 115it [00:12, 9.26it/s] 116it [00:12, 9.32it/s] 117it [00:12, 9.35it/s] 118it [00:12, 9.37it/s] 119it [00:12, 9.47it/s] 120it [00:13, 9.45it/s] 121it [00:13, 9.47it/s] 122it [00:13, 9.50it/s] 123it [00:13, 9.49it/s] 124it [00:13, 9.40it/s] 125it [00:13, 8.98it/s] 126it [00:13, 9.11it/s] 127it [00:13, 9.24it/s] 128it [00:13, 9.28it/s] 129it [00:13, 9.36it/s] 130it [00:14, 8.83it/s] 131it [00:14, 9.03it/s] 132it [00:14, 9.16it/s] 133it [00:14, 9.30it/s] 134it [00:14, 9.34it/s] 135it [00:14, 9.43it/s] 136it [00:14, 8.95it/s] 137it [00:14, 9.13it/s] 138it [00:14, 9.26it/s] 139it [00:15, 9.38it/s] 140it [00:15, 9.46it/s] 141it [00:15, 9.47it/s] 142it [00:15, 9.45it/s] 143it [00:15, 9.48it/s] 144it [00:15, 9.50it/s] 145it [00:15, 9.51it/s] 146it [00:15, 9.48it/s] 147it [00:15, 9.47it/s] 148it [00:16, 9.46it/s] 149it [00:16, 9.50it/s] 150it [00:16, 9.49it/s]2025-05-26 05:58:14,210 - INFO - [Epoch 038 | Batch 0150] IWAE-loss 5241.9893 | mean log_px -0.0268 | KL -3495.52 + 151it [00:16, 9.54it/s] 152it [00:16, 9.51it/s] 153it [00:16, 9.54it/s] 154it [00:16, 9.55it/s] 155it [00:16, 9.51it/s] 156it [00:16, 9.56it/s] 157it [00:16, 9.58it/s] 158it [00:17, 9.53it/s] 159it [00:17, 9.54it/s] 160it [00:17, 9.52it/s] 161it [00:17, 9.48it/s] 162it [00:17, 9.51it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.47it/s] 165it [00:17, 9.16it/s] 166it [00:17, 9.27it/s] 167it [00:18, 9.35it/s] 168it [00:18, 9.37it/s] 169it [00:18, 9.41it/s] 170it [00:18, 9.44it/s] 171it [00:18, 9.46it/s] 172it [00:18, 9.52it/s] 173it [00:18, 9.39it/s] 174it [00:18, 9.39it/s] 175it [00:18, 9.41it/s] 176it [00:18, 9.33it/s] 177it [00:19, 9.43it/s] 178it [00:19, 9.42it/s] 179it [00:19, 9.47it/s] 180it [00:19, 9.46it/s] 181it [00:19, 9.55it/s] 182it [00:19, 9.53it/s] 183it [00:19, 9.53it/s] 184it [00:19, 9.55it/s] 185it [00:19, 9.51it/s] 186it [00:20, 9.22it/s] 187it [00:20, 8.62it/s] 188it [00:20, 8.72it/s] 189it [00:20, 8.95it/s] 190it [00:20, 9.13it/s] 191it [00:20, 9.24it/s] 192it [00:20, 9.29it/s] 193it [00:20, 9.36it/s] 194it [00:20, 9.40it/s] 195it [00:21, 8.85it/s] 196it [00:21, 8.76it/s] 196it [00:21, 9.23it/s] +2025-05-26 05:58:19,151 - INFO - Epoch: 38, Objective: tensor([6876.5137], device='cuda:0', grad_fn=), Loss: 0.05297667905688286, KL/n: 71.28185272216797 + 0it [00:00, ?it/s]2025-05-26 05:58:19,444 - INFO - [Epoch 039 | Batch 0000] IWAE-loss 6343.7041 | mean log_px -0.0524 | KL -3491.50 + 1it [00:00, 5.02it/s] 2it [00:00, 6.35it/s] 3it [00:00, 7.51it/s] 4it [00:00, 8.21it/s] 5it [00:00, 8.65it/s] 6it [00:00, 8.33it/s] 7it [00:00, 8.70it/s] 8it [00:00, 8.94it/s] 9it [00:01, 9.16it/s] 10it [00:01, 8.86it/s] 11it [00:01, 9.11it/s] 12it [00:01, 9.13it/s] 13it [00:01, 8.75it/s] 14it [00:01, 8.98it/s] 15it [00:01, 9.15it/s] 16it [00:01, 9.23it/s] 17it [00:01, 9.33it/s] 18it [00:02, 9.40it/s] 19it [00:02, 9.45it/s] 20it [00:02, 9.43it/s] 21it [00:02, 9.45it/s] 22it [00:02, 9.44it/s] 23it [00:02, 9.49it/s] 24it [00:02, 9.50it/s] 25it [00:02, 9.54it/s] 26it [00:02, 9.50it/s] 27it [00:03, 9.51it/s] 28it [00:03, 9.48it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.44it/s] 31it [00:03, 8.96it/s] 32it [00:03, 9.07it/s] 33it [00:03, 9.17it/s] 34it [00:03, 9.25it/s] 35it [00:03, 9.31it/s] 36it [00:03, 9.36it/s] 37it [00:04, 9.38it/s] 38it [00:04, 9.42it/s] 39it [00:04, 9.44it/s] 40it [00:04, 9.44it/s] 41it [00:04, 9.40it/s] 42it [00:04, 9.38it/s] 43it [00:04, 9.44it/s] 44it [00:04, 9.46it/s] 45it [00:04, 8.92it/s] 46it [00:05, 9.05it/s] 47it [00:05, 9.14it/s] 48it [00:05, 9.24it/s] 49it [00:05, 9.29it/s] 50it [00:05, 9.31it/s]2025-05-26 05:58:24,842 - INFO - [Epoch 039 | Batch 0050] IWAE-loss 5679.2578 | mean log_px -0.0351 | KL -3490.73 + 51it [00:05, 9.34it/s] 52it [00:05, 9.36it/s] 53it [00:05, 9.39it/s] 54it [00:05, 9.39it/s] 55it [00:06, 9.40it/s] 56it [00:06, 9.42it/s] 57it [00:06, 9.45it/s] 58it [00:06, 9.44it/s] 59it [00:06, 9.45it/s] 60it [00:06, 9.44it/s] 61it [00:06, 9.48it/s] 62it [00:06, 9.58it/s] 63it [00:06, 9.66it/s] 64it [00:06, 9.71it/s] 65it [00:07, 9.27it/s] 66it [00:07, 9.43it/s] 67it [00:07, 9.55it/s] 68it [00:07, 9.04it/s] 69it [00:07, 9.27it/s] 70it [00:07, 9.44it/s] 71it [00:07, 9.58it/s] 72it [00:07, 9.66it/s] 73it [00:07, 9.73it/s] 74it [00:08, 9.76it/s] 75it [00:08, 9.79it/s] 76it [00:08, 9.81it/s] 77it [00:08, 9.82it/s] 78it [00:08, 9.83it/s] 79it [00:08, 9.22it/s] 80it [00:08, 9.40it/s] 81it [00:08, 9.56it/s] 82it [00:08, 9.54it/s] 83it [00:08, 9.56it/s] 84it [00:09, 9.57it/s] 85it [00:09, 9.67it/s] 86it [00:09, 9.72it/s] 87it [00:09, 9.15it/s] 88it [00:09, 9.35it/s] 89it [00:09, 9.51it/s] 90it [00:09, 9.60it/s] 91it [00:09, 9.69it/s] 92it [00:09, 9.74it/s] 93it [00:09, 9.78it/s] 94it [00:10, 9.80it/s] 95it [00:10, 9.83it/s] 96it [00:10, 9.70it/s] 97it [00:10, 9.72it/s] 98it [00:10, 9.74it/s] 99it [00:10, 9.76it/s] 100it [00:10, 9.79it/s]2025-05-26 05:58:30,062 - INFO - [Epoch 039 | Batch 0100] IWAE-loss 5635.9746 | mean log_px -0.0364 | KL -3484.96 + 101it [00:10, 9.81it/s] 102it [00:10, 9.79it/s] 103it [00:11, 9.83it/s] 104it [00:11, 9.83it/s] 105it [00:11, 9.85it/s] 106it [00:11, 9.85it/s] 107it [00:11, 9.23it/s] 108it [00:11, 9.39it/s] 109it [00:11, 9.53it/s] 110it [00:11, 9.61it/s] 111it [00:11, 9.70it/s] 112it [00:11, 9.73it/s] 113it [00:12, 9.77it/s] 114it [00:12, 9.79it/s] 115it [00:12, 9.82it/s] 116it [00:12, 9.82it/s] 117it [00:12, 9.84it/s] 118it [00:12, 9.83it/s] 119it [00:12, 9.83it/s] 120it [00:12, 9.83it/s] 121it [00:12, 9.85it/s] 122it [00:12, 9.85it/s] 123it [00:13, 9.85it/s] 124it [00:13, 9.85it/s] 125it [00:13, 9.87it/s] 126it [00:13, 9.79it/s] 127it [00:13, 9.18it/s] 128it [00:13, 9.37it/s] 129it [00:13, 9.53it/s] 130it [00:13, 9.62it/s] 131it [00:13, 9.70it/s] 132it [00:14, 9.75it/s] 133it [00:14, 9.80it/s] 134it [00:14, 9.81it/s] 135it [00:14, 9.84it/s] 136it [00:14, 9.84it/s] 137it [00:14, 9.21it/s] 138it [00:14, 9.38it/s] 139it [00:14, 9.54it/s] 140it [00:14, 9.63it/s] 141it [00:14, 9.07it/s] 142it [00:15, 9.29it/s] 143it [00:15, 9.46it/s] 144it [00:15, 9.57it/s] 145it [00:15, 9.65it/s] 146it [00:15, 9.71it/s] 147it [00:15, 9.78it/s] 148it [00:15, 9.80it/s] 149it [00:15, 9.73it/s] 150it [00:15, 9.02it/s]2025-05-26 05:58:35,269 - INFO - [Epoch 039 | Batch 0150] IWAE-loss 6551.1885 | mean log_px -0.0438 | KL -3480.69 + 151it [00:16, 9.03it/s] 152it [00:16, 9.17it/s] 153it [00:16, 9.22it/s] 154it [00:16, 9.32it/s] 155it [00:16, 9.02it/s] 156it [00:16, 9.16it/s] 157it [00:16, 9.32it/s] 158it [00:16, 9.41it/s] 159it [00:16, 9.45it/s] 160it [00:16, 9.49it/s] 161it [00:17, 8.87it/s] 162it [00:17, 9.05it/s] 163it [00:17, 9.21it/s] 164it [00:17, 9.31it/s] 165it [00:17, 9.32it/s] 166it [00:17, 9.38it/s] 167it [00:17, 9.48it/s] 168it [00:17, 9.44it/s] 169it [00:17, 9.50it/s] 170it [00:18, 9.51it/s] 171it [00:18, 9.52it/s] 172it [00:18, 9.48it/s] 173it [00:18, 9.49it/s] 174it [00:18, 9.53it/s] 175it [00:18, 9.47it/s] 176it [00:18, 9.45it/s] 177it [00:18, 9.47it/s] 178it [00:18, 9.40it/s] 179it [00:19, 9.41it/s] 180it [00:19, 9.41it/s] 181it [00:19, 9.49it/s] 182it [00:19, 9.46it/s] 183it [00:19, 8.95it/s] 184it [00:19, 9.11it/s] 185it [00:19, 9.24it/s] 186it [00:19, 9.32it/s] 187it [00:19, 9.38it/s] 188it [00:19, 9.43it/s] 189it [00:20, 9.43it/s] 190it [00:20, 9.33it/s] 191it [00:20, 9.33it/s] 192it [00:20, 9.43it/s] 193it [00:20, 9.52it/s] 194it [00:20, 9.55it/s] 195it [00:20, 8.95it/s] 196it [00:20, 9.15it/s] 196it [00:20, 9.38it/s] +2025-05-26 05:58:40,187 - INFO - Epoch: 39, Objective: tensor([6474.6235], device='cuda:0', grad_fn=), Loss: 0.045537568628787994, KL/n: 71.1382827758789 + 0it [00:00, ?it/s]2025-05-26 05:58:40,463 - INFO - [Epoch 040 | Batch 0000] IWAE-loss 7672.9946 | mean log_px -0.0628 | KL -3483.29 + 1it [00:00, 4.79it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.80it/s] 4it [00:00, 8.38it/s] 5it [00:00, 8.82it/s] 6it [00:00, 8.98it/s] 7it [00:00, 9.13it/s] 8it [00:00, 9.23it/s] 9it [00:01, 8.75it/s] 10it [00:01, 8.98it/s] 11it [00:01, 9.14it/s] 12it [00:01, 9.21it/s] 13it [00:01, 8.90it/s] 14it [00:01, 9.02it/s] 15it [00:01, 9.15it/s] 16it [00:01, 9.19it/s] 17it [00:01, 9.30it/s] 18it [00:02, 9.33it/s] 19it [00:02, 9.40it/s] 20it [00:02, 9.39it/s] 21it [00:02, 8.93it/s] 22it [00:02, 9.13it/s] 23it [00:02, 9.26it/s] 24it [00:02, 9.35it/s] 25it [00:02, 9.47it/s] 26it [00:02, 9.51it/s] 27it [00:03, 9.57it/s] 28it [00:03, 9.57it/s] 29it [00:03, 6.24it/s] 30it [00:03, 6.96it/s] 31it [00:03, 7.57it/s] 32it [00:03, 8.06it/s] 33it [00:03, 8.42it/s] 34it [00:03, 8.75it/s] 35it [00:04, 9.00it/s] 36it [00:04, 9.14it/s] 37it [00:04, 9.27it/s] 38it [00:04, 8.78it/s] 39it [00:04, 9.03it/s] 40it [00:04, 9.16it/s] 41it [00:04, 9.29it/s] 42it [00:04, 9.35it/s] 43it [00:04, 9.41it/s] 44it [00:04, 9.42it/s] 45it [00:05, 9.47it/s] 46it [00:05, 9.48it/s] 47it [00:05, 9.51it/s] 48it [00:05, 9.47it/s] 49it [00:05, 9.51it/s] 50it [00:05, 9.48it/s]2025-05-26 05:58:46,009 - INFO - [Epoch 040 | Batch 0050] IWAE-loss 5287.8018 | mean log_px -0.0307 | KL -3482.75 + 51it [00:05, 9.53it/s] 52it [00:05, 9.57it/s] 53it [00:05, 9.60it/s] 54it [00:06, 9.61it/s] 55it [00:06, 9.57it/s] 56it [00:06, 9.54it/s] 57it [00:06, 9.54it/s] 58it [00:06, 9.55it/s] 59it [00:06, 9.62it/s] 60it [00:06, 9.59it/s] 61it [00:06, 9.59it/s] 62it [00:06, 9.58it/s] 63it [00:06, 9.54it/s] 64it [00:07, 9.54it/s] 65it [00:07, 9.61it/s] 66it [00:07, 9.64it/s] 67it [00:07, 9.59it/s] 68it [00:07, 9.59it/s] 69it [00:07, 9.59it/s] 70it [00:07, 9.58it/s] 71it [00:07, 9.60it/s] 72it [00:07, 9.59it/s] 73it [00:08, 9.58it/s] 74it [00:08, 9.58it/s] 75it [00:08, 9.54it/s] 76it [00:08, 9.44it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.48it/s] 79it [00:08, 9.49it/s] 80it [00:08, 9.45it/s] 81it [00:08, 9.46it/s] 82it [00:08, 9.47it/s] 83it [00:09, 9.53it/s] 84it [00:09, 9.48it/s] 85it [00:09, 9.54it/s] 86it [00:09, 9.51it/s] 87it [00:09, 9.55it/s] 88it [00:09, 9.50it/s] 89it [00:09, 9.56it/s] 90it [00:09, 9.50it/s] 91it [00:09, 9.40it/s] 92it [00:10, 9.41it/s] 93it [00:10, 9.46it/s] 94it [00:10, 9.49it/s] 95it [00:10, 9.49it/s] 96it [00:10, 9.40it/s] 97it [00:10, 9.36it/s] 98it [00:10, 9.43it/s] 99it [00:10, 9.47it/s] 100it [00:10, 9.40it/s]2025-05-26 05:58:51,262 - INFO - [Epoch 040 | Batch 0100] IWAE-loss 6247.6255 | mean log_px -0.0492 | KL -3478.28 + 101it [00:10, 9.40it/s] 102it [00:11, 9.44it/s] 103it [00:11, 9.45it/s] 104it [00:11, 9.43it/s] 105it [00:11, 9.43it/s] 106it [00:11, 9.44it/s] 107it [00:11, 9.46it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.47it/s] 110it [00:11, 9.46it/s] 111it [00:12, 9.45it/s] 112it [00:12, 9.45it/s] 113it [00:12, 9.47it/s] 114it [00:12, 9.41it/s] 115it [00:12, 9.43it/s] 116it [00:12, 9.39it/s] 117it [00:12, 9.40it/s] 118it [00:12, 9.42it/s] 119it [00:12, 9.51it/s] 120it [00:12, 9.48it/s] 121it [00:13, 9.48it/s] 122it [00:13, 9.48it/s] 123it [00:13, 9.43it/s] 124it [00:13, 9.43it/s] 125it [00:13, 9.46it/s] 126it [00:13, 9.48it/s] 127it [00:13, 9.46it/s] 128it [00:13, 9.50it/s] 129it [00:13, 9.51it/s] 130it [00:14, 9.51it/s] 131it [00:14, 9.48it/s] 132it [00:14, 9.32it/s] 133it [00:14, 9.38it/s] 134it [00:14, 9.35it/s] 135it [00:14, 9.35it/s] 136it [00:14, 9.39it/s] 137it [00:14, 9.45it/s] 138it [00:14, 9.28it/s] 139it [00:15, 9.38it/s] 140it [00:15, 9.36it/s] 141it [00:15, 9.38it/s] 142it [00:15, 9.38it/s] 143it [00:15, 9.43it/s] 144it [00:15, 9.41it/s] 145it [00:15, 9.43it/s] 146it [00:15, 9.43it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.45it/s] 149it [00:16, 9.41it/s] 150it [00:16, 9.37it/s]2025-05-26 05:58:56,566 - INFO - [Epoch 040 | Batch 0150] IWAE-loss 6392.1655 | mean log_px -0.0420 | KL -3472.99 + 151it [00:16, 9.41it/s] 152it [00:16, 8.92it/s] 153it [00:16, 9.07it/s] 154it [00:16, 9.15it/s] 155it [00:16, 9.20it/s] 156it [00:16, 9.25it/s] 157it [00:16, 9.31it/s] 158it [00:17, 9.34it/s] 159it [00:17, 9.37it/s] 160it [00:17, 9.43it/s] 161it [00:17, 9.41it/s] 162it [00:17, 8.90it/s] 163it [00:17, 8.99it/s] 164it [00:17, 9.10it/s] 165it [00:17, 9.20it/s] 166it [00:17, 9.25it/s] 167it [00:18, 9.29it/s] 168it [00:18, 9.00it/s] 169it [00:18, 9.17it/s] 170it [00:18, 9.24it/s] 171it [00:18, 9.31it/s] 172it [00:18, 9.32it/s] 173it [00:18, 9.36it/s] 174it [00:18, 9.34it/s] 175it [00:18, 9.41it/s] 176it [00:18, 9.43it/s] 177it [00:19, 9.42it/s] 178it [00:19, 9.44it/s] 179it [00:19, 9.44it/s] 180it [00:19, 9.44it/s] 181it [00:19, 9.51it/s] 182it [00:19, 9.47it/s] 183it [00:19, 9.44it/s] 184it [00:19, 9.34it/s] 185it [00:19, 9.01it/s] 186it [00:20, 9.12it/s] 187it [00:20, 9.22it/s] 188it [00:20, 9.27it/s] 189it [00:20, 9.33it/s] 190it [00:20, 9.02it/s] 191it [00:20, 9.13it/s] 192it [00:20, 9.20it/s] 193it [00:20, 8.80it/s] 194it [00:20, 8.96it/s] 195it [00:21, 8.53it/s] 196it [00:21, 8.81it/s] 196it [00:21, 9.22it/s] +2025-05-26 05:59:01,577 - INFO - Epoch: 40, Objective: tensor([5746.3809], device='cuda:0', grad_fn=), Loss: 0.034290388226509094, KL/n: 70.98202514648438 + 0it [00:00, ?it/s]2025-05-26 05:59:01,871 - INFO - [Epoch 041 | Batch 0000] IWAE-loss 5749.5537 | mean log_px -0.0346 | KL -3479.12 + 1it [00:00, 4.42it/s] 2it [00:00, 6.39it/s] 3it [00:00, 7.53it/s] 4it [00:00, 8.09it/s] 5it [00:00, 8.47it/s] 6it [00:00, 8.80it/s] 7it [00:00, 8.99it/s] 8it [00:00, 9.15it/s] 9it [00:01, 9.24it/s] 10it [00:01, 9.29it/s] 11it [00:01, 9.31it/s] 12it [00:01, 9.29it/s] 13it [00:01, 8.88it/s] 14it [00:01, 9.01it/s] 15it [00:01, 9.13it/s] 16it [00:01, 9.26it/s] 17it [00:01, 9.30it/s] 18it [00:02, 8.90it/s] 19it [00:02, 9.06it/s] 20it [00:02, 9.18it/s] 21it [00:02, 9.27it/s] 22it [00:02, 9.31it/s] 23it [00:02, 9.34it/s] 24it [00:02, 9.29it/s] 25it [00:02, 9.30it/s] 26it [00:02, 9.32it/s] 27it [00:03, 9.38it/s] 28it [00:03, 9.38it/s] 29it [00:03, 9.41it/s] 30it [00:03, 8.82it/s] 31it [00:03, 9.01it/s] 32it [00:03, 9.15it/s] 33it [00:03, 9.20it/s] 34it [00:03, 8.71it/s] 35it [00:03, 8.94it/s] 36it [00:04, 9.09it/s] 37it [00:04, 9.21it/s] 38it [00:04, 9.29it/s] 39it [00:04, 9.36it/s] 40it [00:04, 9.41it/s] 41it [00:04, 9.42it/s] 42it [00:04, 9.42it/s] 43it [00:04, 9.42it/s] 44it [00:04, 9.21it/s] 45it [00:04, 9.13it/s] 46it [00:05, 8.64it/s] 47it [00:05, 8.92it/s] 48it [00:05, 9.12it/s] 49it [00:05, 9.29it/s] 50it [00:05, 9.39it/s]2025-05-26 05:59:07,316 - INFO - [Epoch 041 | Batch 0050] IWAE-loss 5837.0518 | mean log_px -0.0380 | KL -3473.68 + 51it [00:05, 9.45it/s] 52it [00:05, 9.47it/s] 53it [00:05, 8.94it/s] 54it [00:05, 9.11it/s] 55it [00:06, 9.24it/s] 56it [00:06, 9.36it/s] 57it [00:06, 8.98it/s] 58it [00:06, 9.11it/s] 59it [00:06, 9.23it/s] 60it [00:06, 9.29it/s] 61it [00:06, 9.35it/s] 62it [00:06, 9.42it/s] 63it [00:06, 9.46it/s] 64it [00:07, 9.41it/s] 65it [00:07, 9.42it/s] 66it [00:07, 9.40it/s] 67it [00:07, 9.40it/s] 68it [00:07, 9.42it/s] 69it [00:07, 9.45it/s] 70it [00:07, 9.49it/s] 71it [00:07, 9.46it/s] 72it [00:07, 9.47it/s] 73it [00:08, 9.45it/s] 74it [00:08, 9.50it/s] 75it [00:08, 9.48it/s] 76it [00:08, 9.46it/s] 77it [00:08, 9.53it/s] 78it [00:08, 9.47it/s] 79it [00:08, 9.45it/s] 80it [00:08, 9.47it/s] 81it [00:08, 9.48it/s] 82it [00:08, 9.52it/s] 83it [00:09, 9.09it/s] 84it [00:09, 9.19it/s] 85it [00:09, 9.25it/s] 86it [00:09, 9.32it/s] 87it [00:09, 9.39it/s] 88it [00:09, 9.39it/s] 89it [00:09, 9.43it/s] 90it [00:09, 9.44it/s] 91it [00:09, 9.43it/s] 92it [00:10, 9.42it/s] 93it [00:10, 9.46it/s] 94it [00:10, 9.44it/s] 95it [00:10, 9.45it/s] 96it [00:10, 9.45it/s] 97it [00:10, 9.46it/s] 98it [00:10, 9.46it/s] 99it [00:10, 9.46it/s] 100it [00:10, 9.42it/s]2025-05-26 05:59:12,646 - INFO - [Epoch 041 | Batch 0100] IWAE-loss 5281.2070 | mean log_px -0.0259 | KL -3478.21 + 101it [00:10, 9.44it/s] 102it [00:11, 9.47it/s] 103it [00:11, 9.44it/s] 104it [00:11, 9.50it/s] 105it [00:11, 9.49it/s] 106it [00:11, 8.95it/s] 107it [00:11, 9.12it/s] 108it [00:11, 9.16it/s] 109it [00:11, 9.32it/s] 110it [00:11, 9.34it/s] 111it [00:12, 8.95it/s] 112it [00:12, 9.09it/s] 113it [00:12, 9.19it/s] 114it [00:12, 9.23it/s] 115it [00:12, 9.26it/s] 116it [00:12, 9.36it/s] 117it [00:12, 9.35it/s] 118it [00:12, 9.29it/s] 119it [00:12, 9.29it/s] 120it [00:13, 9.33it/s] 121it [00:13, 9.38it/s] 122it [00:13, 9.40it/s] 123it [00:13, 9.42it/s] 124it [00:13, 9.43it/s] 125it [00:13, 9.45it/s] 126it [00:13, 9.46it/s] 127it [00:13, 9.53it/s] 128it [00:13, 9.52it/s] 129it [00:13, 9.48it/s] 130it [00:14, 9.47it/s] 131it [00:14, 9.47it/s] 132it [00:14, 9.48it/s] 133it [00:14, 9.45it/s] 134it [00:14, 9.40it/s] 135it [00:14, 9.41it/s] 136it [00:14, 9.45it/s] 137it [00:14, 9.42it/s] 138it [00:14, 8.90it/s] 139it [00:15, 9.06it/s] 140it [00:15, 9.17it/s] 141it [00:15, 9.24it/s] 142it [00:15, 9.31it/s] 143it [00:15, 9.36it/s] 144it [00:15, 9.40it/s] 145it [00:15, 9.42it/s] 146it [00:15, 9.45it/s] 147it [00:15, 9.43it/s] 148it [00:16, 9.44it/s] 149it [00:16, 9.45it/s] 150it [00:16, 9.42it/s]2025-05-26 05:59:17,998 - INFO - [Epoch 041 | Batch 0150] IWAE-loss 5604.3018 | mean log_px -0.0409 | KL -3472.15 + 151it [00:16, 9.45it/s] 152it [00:16, 9.49it/s] 153it [00:16, 9.53it/s] 154it [00:16, 9.05it/s] 155it [00:16, 9.19it/s] 156it [00:16, 9.29it/s] 157it [00:16, 9.36it/s] 158it [00:17, 8.97it/s] 159it [00:17, 9.16it/s] 160it [00:17, 9.29it/s] 161it [00:17, 9.34it/s] 162it [00:17, 9.37it/s] 163it [00:17, 9.44it/s] 164it [00:17, 9.41it/s] 165it [00:17, 9.45it/s] 166it [00:17, 9.27it/s] 167it [00:18, 8.93it/s] 168it [00:18, 9.10it/s] 169it [00:18, 9.19it/s] 170it [00:18, 9.21it/s] 171it [00:18, 9.24it/s] 172it [00:18, 9.30it/s] 173it [00:18, 9.29it/s] 174it [00:18, 9.31it/s] 175it [00:18, 9.36it/s] 176it [00:19, 9.41it/s] 177it [00:19, 9.44it/s] 178it [00:19, 9.42it/s] 179it [00:19, 9.44it/s] 180it [00:19, 9.46it/s] 181it [00:19, 9.41it/s] 182it [00:19, 9.43it/s] 183it [00:19, 9.45it/s] 184it [00:19, 9.44it/s] 185it [00:19, 9.47it/s] 186it [00:20, 9.46it/s] 187it [00:20, 9.43it/s] 188it [00:20, 9.06it/s] 189it [00:20, 9.26it/s] 190it [00:20, 9.41it/s] 191it [00:20, 9.55it/s] 192it [00:20, 9.53it/s] 193it [00:20, 9.57it/s] 194it [00:20, 9.64it/s] 195it [00:21, 8.57it/s] 196it [00:21, 9.23it/s] +2025-05-26 05:59:22,943 - INFO - Epoch: 41, Objective: tensor([4431.4009], device='cuda:0', grad_fn=), Loss: 0.017086666077375412, KL/n: 70.84024810791016 + 0it [00:00, ?it/s]2025-05-26 05:59:23,399 - INFO - [Epoch 042 | Batch 0000] IWAE-loss 7730.5332 | mean log_px -0.0675 | KL -3471.14 + 1it [00:00, 5.47it/s] 2it [00:00, 7.38it/s] 3it [00:00, 7.74it/s] 4it [00:00, 8.45it/s] 5it [00:00, 8.93it/s] 6it [00:00, 9.21it/s] 7it [00:00, 9.43it/s] 8it [00:00, 9.53it/s] 9it [00:01, 9.64it/s] 10it [00:01, 9.70it/s] 11it [00:01, 9.77it/s] 12it [00:01, 9.78it/s] 13it [00:01, 9.82it/s] 14it [00:01, 9.41it/s] 15it [00:01, 9.56it/s] 16it [00:01, 9.64it/s] 17it [00:01, 9.01it/s] 18it [00:01, 9.21it/s] 19it [00:02, 9.38it/s] 20it [00:02, 9.52it/s] 21it [00:02, 9.15it/s] 22it [00:02, 9.35it/s] 23it [00:02, 9.51it/s] 24it [00:02, 9.61it/s] 25it [00:02, 9.69it/s] 26it [00:02, 9.74it/s] 27it [00:02, 9.78it/s] 28it [00:03, 9.79it/s] 29it [00:03, 9.83it/s] 30it [00:03, 9.83it/s] 31it [00:03, 9.86it/s] 32it [00:03, 9.84it/s] 33it [00:03, 9.44it/s] 34it [00:03, 9.55it/s] 35it [00:03, 9.64it/s] 36it [00:03, 9.69it/s] 37it [00:03, 9.76it/s] 38it [00:04, 9.38it/s] 39it [00:04, 9.53it/s] 40it [00:04, 9.62it/s] 41it [00:04, 9.70it/s] 42it [00:04, 9.73it/s] 43it [00:04, 9.78it/s] 44it [00:04, 9.78it/s] 45it [00:04, 9.82it/s] 46it [00:04, 9.81it/s] 47it [00:04, 9.85it/s] 48it [00:05, 9.84it/s] 49it [00:05, 9.85it/s] 50it [00:05, 9.84it/s]2025-05-26 05:59:28,583 - INFO - [Epoch 042 | Batch 0050] IWAE-loss 6543.3037 | mean log_px -0.0493 | KL -3464.77 + 51it [00:05, 9.85it/s] 52it [00:05, 9.84it/s] 53it [00:05, 9.85it/s] 54it [00:05, 9.83it/s] 55it [00:05, 9.85it/s] 56it [00:05, 9.84it/s] 57it [00:05, 9.85it/s] 58it [00:06, 9.83it/s] 59it [00:06, 9.86it/s] 60it [00:06, 9.86it/s] 61it [00:06, 9.86it/s] 62it [00:06, 9.85it/s] 63it [00:06, 9.87it/s] 64it [00:06, 9.85it/s] 65it [00:06, 9.86it/s] 66it [00:06, 9.83it/s] 67it [00:06, 9.83it/s] 68it [00:07, 9.83it/s] 69it [00:07, 9.84it/s] 70it [00:07, 9.84it/s] 71it [00:07, 9.85it/s] 72it [00:07, 9.83it/s] 73it [00:07, 9.84it/s] 74it [00:07, 9.83it/s] 75it [00:07, 9.83it/s] 76it [00:07, 9.82it/s] 77it [00:08, 9.85it/s] 78it [00:08, 9.84it/s] 79it [00:08, 9.86it/s] 80it [00:08, 9.84it/s] 81it [00:08, 9.86it/s] 82it [00:08, 9.84it/s] 83it [00:08, 9.84it/s] 84it [00:08, 9.83it/s] 85it [00:08, 9.84it/s] 86it [00:08, 9.57it/s] 87it [00:09, 9.26it/s] 88it [00:09, 9.40it/s] 89it [00:09, 9.54it/s] 90it [00:09, 9.62it/s] 91it [00:09, 9.69it/s] 92it [00:09, 9.72it/s] 93it [00:09, 9.76it/s] 94it [00:09, 9.78it/s] 95it [00:09, 9.79it/s] 96it [00:09, 9.79it/s] 97it [00:10, 9.81it/s] 98it [00:10, 9.81it/s] 99it [00:10, 9.83it/s] 100it [00:10, 9.82it/s]2025-05-26 05:59:33,690 - INFO - [Epoch 042 | Batch 0100] IWAE-loss 4768.8535 | mean log_px -0.0224 | KL -3467.10 + 101it [00:10, 9.81it/s] 102it [00:10, 9.81it/s] 103it [00:10, 9.42it/s] 104it [00:10, 9.52it/s] 105it [00:10, 9.38it/s] 106it [00:11, 9.34it/s] 107it [00:11, 9.34it/s] 108it [00:11, 9.49it/s] 109it [00:11, 9.60it/s] 110it [00:11, 9.10it/s] 111it [00:11, 9.34it/s] 112it [00:11, 9.49it/s] 113it [00:11, 9.60it/s] 114it [00:11, 9.65it/s] 115it [00:11, 9.71it/s] 116it [00:12, 9.75it/s] 117it [00:12, 9.77it/s] 118it [00:12, 9.40it/s] 119it [00:12, 9.51it/s] 120it [00:12, 9.59it/s] 121it [00:12, 9.66it/s] 122it [00:12, 9.69it/s] 123it [00:12, 9.17it/s] 124it [00:12, 9.35it/s] 125it [00:13, 9.50it/s] 126it [00:13, 9.59it/s] 127it [00:13, 9.10it/s] 128it [00:13, 9.12it/s] 129it [00:13, 9.27it/s] 130it [00:13, 8.72it/s] 131it [00:13, 8.98it/s] 132it [00:13, 9.03it/s] 133it [00:13, 9.21it/s] 134it [00:13, 9.29it/s] 135it [00:14, 9.28it/s] 136it [00:14, 9.33it/s] 137it [00:14, 9.35it/s] 138it [00:14, 9.39it/s] 139it [00:14, 9.38it/s] 140it [00:14, 9.38it/s] 141it [00:14, 9.29it/s] 142it [00:14, 8.86it/s] 143it [00:14, 8.83it/s] 144it [00:15, 8.96it/s] 145it [00:15, 9.04it/s] 146it [00:15, 9.09it/s] 147it [00:15, 9.18it/s] 148it [00:15, 9.20it/s] 149it [00:15, 9.23it/s] 150it [00:15, 9.25it/s]2025-05-26 05:59:39,062 - INFO - [Epoch 042 | Batch 0150] IWAE-loss 5339.9580 | mean log_px -0.0337 | KL -3464.08 + 151it [00:15, 8.77it/s] 152it [00:15, 8.90it/s] 153it [00:16, 9.00it/s] 154it [00:16, 9.09it/s] 155it [00:16, 9.14it/s] 156it [00:16, 9.13it/s] 157it [00:16, 9.29it/s] 158it [00:16, 9.28it/s] 159it [00:16, 9.34it/s] 160it [00:16, 9.42it/s] 161it [00:16, 8.93it/s] 162it [00:17, 9.09it/s] 163it [00:17, 9.22it/s] 164it [00:17, 9.34it/s] 165it [00:17, 9.32it/s] 166it [00:17, 9.35it/s] 167it [00:17, 9.38it/s] 168it [00:17, 9.33it/s] 169it [00:17, 9.37it/s] 170it [00:17, 9.41it/s] 171it [00:18, 9.41it/s] 172it [00:18, 9.41it/s] 173it [00:18, 9.44it/s] 174it [00:18, 9.45it/s] 175it [00:18, 9.48it/s] 176it [00:18, 9.45it/s] 177it [00:18, 9.43it/s] 178it [00:18, 9.42it/s] 179it [00:18, 9.42it/s] 180it [00:18, 9.45it/s] 181it [00:19, 9.43it/s] 182it [00:19, 9.45it/s] 183it [00:19, 9.48it/s] 184it [00:19, 9.39it/s] 185it [00:19, 9.42it/s] 186it [00:19, 9.44it/s] 187it [00:19, 9.43it/s] 188it [00:19, 9.40it/s] 189it [00:19, 9.47it/s] 190it [00:20, 9.46it/s] 191it [00:20, 9.45it/s] 192it [00:20, 9.46it/s] 193it [00:20, 9.49it/s] 194it [00:20, 9.48it/s] 195it [00:20, 8.89it/s] 196it [00:20, 8.82it/s] 196it [00:20, 9.44it/s] +2025-05-26 05:59:44,016 - INFO - Epoch: 42, Objective: tensor([5298.1240], device='cuda:0', grad_fn=), Loss: 0.0280563123524189, KL/n: 70.67806243896484 + 0it [00:00, ?it/s]2025-05-26 05:59:44,293 - INFO - [Epoch 043 | Batch 0000] IWAE-loss 4510.7559 | mean log_px -0.0216 | KL -3460.82 + 1it [00:00, 5.43it/s] 2it [00:00, 7.21it/s] 3it [00:00, 8.15it/s] 4it [00:00, 8.61it/s] 5it [00:00, 8.94it/s] 6it [00:00, 9.10it/s] 7it [00:00, 9.26it/s] 8it [00:00, 9.34it/s] 9it [00:01, 9.42it/s] 10it [00:01, 9.43it/s] 11it [00:01, 9.45it/s] 12it [00:01, 9.39it/s] 13it [00:01, 9.46it/s] 14it [00:01, 9.44it/s] 15it [00:01, 9.48it/s] 16it [00:01, 9.47it/s] 17it [00:01, 9.46it/s] 18it [00:01, 9.45it/s] 19it [00:02, 8.96it/s] 20it [00:02, 9.11it/s] 21it [00:02, 9.25it/s] 22it [00:02, 9.34it/s] 23it [00:02, 9.41it/s] 24it [00:02, 9.40it/s] 25it [00:02, 9.46it/s] 26it [00:02, 9.47it/s] 27it [00:02, 9.51it/s] 28it [00:03, 9.51it/s] 29it [00:03, 9.54it/s] 30it [00:03, 9.57it/s] 31it [00:03, 9.53it/s] 32it [00:03, 9.54it/s] 33it [00:03, 9.52it/s] 34it [00:03, 9.51it/s] 35it [00:03, 8.88it/s] 36it [00:03, 9.10it/s] 37it [00:04, 9.25it/s] 38it [00:04, 9.34it/s] 39it [00:04, 9.39it/s] 40it [00:04, 9.44it/s] 41it [00:04, 9.46it/s] 42it [00:04, 9.41it/s] 43it [00:04, 9.42it/s] 44it [00:04, 9.50it/s] 45it [00:04, 9.53it/s] 46it [00:04, 9.49it/s] 47it [00:05, 9.52it/s] 48it [00:05, 9.45it/s] 49it [00:05, 9.45it/s] 50it [00:05, 9.45it/s]2025-05-26 05:59:49,596 - INFO - [Epoch 043 | Batch 0050] IWAE-loss 4645.6123 | mean log_px -0.0196 | KL -3460.41 + 51it [00:05, 8.99it/s] 52it [00:05, 9.11it/s] 53it [00:05, 9.25it/s] 54it [00:05, 9.35it/s] 55it [00:05, 9.29it/s] 56it [00:06, 8.83it/s] 57it [00:06, 9.01it/s] 58it [00:06, 9.13it/s] 59it [00:06, 9.18it/s] 60it [00:06, 9.24it/s] 61it [00:06, 9.31it/s] 62it [00:06, 9.36it/s] 63it [00:06, 9.39it/s] 64it [00:06, 9.44it/s] 65it [00:07, 9.48it/s] 66it [00:07, 9.51it/s] 67it [00:07, 9.59it/s] 68it [00:07, 9.52it/s] 69it [00:07, 9.52it/s] 70it [00:07, 9.52it/s] 71it [00:07, 9.49it/s] 72it [00:07, 9.49it/s] 73it [00:07, 9.49it/s] 74it [00:07, 9.42it/s] 75it [00:08, 9.42it/s] 76it [00:08, 9.44it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.47it/s] 79it [00:08, 9.51it/s] 80it [00:08, 9.49it/s] 81it [00:08, 9.49it/s] 82it [00:08, 9.48it/s] 83it [00:08, 9.49it/s] 84it [00:09, 9.49it/s] 85it [00:09, 9.55it/s] 86it [00:09, 9.56it/s] 87it [00:09, 9.55it/s] 88it [00:09, 9.54it/s] 89it [00:09, 9.55it/s] 90it [00:09, 9.47it/s] 91it [00:09, 9.43it/s] 92it [00:09, 9.42it/s] 93it [00:09, 8.99it/s] 94it [00:10, 9.18it/s] 95it [00:10, 9.26it/s] 96it [00:10, 9.33it/s] 97it [00:10, 9.39it/s] 98it [00:10, 9.41it/s] 99it [00:10, 9.44it/s] 100it [00:10, 9.46it/s]2025-05-26 05:59:54,928 - INFO - [Epoch 043 | Batch 0100] IWAE-loss 7542.3433 | mean log_px -0.0583 | KL -3461.22 + 101it [00:10, 8.94it/s] 102it [00:10, 9.10it/s] 103it [00:11, 9.23it/s] 104it [00:11, 9.32it/s] 105it [00:11, 9.37it/s] 106it [00:11, 9.44it/s] 107it [00:11, 9.44it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.48it/s] 110it [00:11, 9.46it/s] 111it [00:11, 9.01it/s] 112it [00:12, 9.15it/s] 113it [00:12, 9.25it/s] 114it [00:12, 9.30it/s] 115it [00:12, 9.36it/s] 116it [00:12, 9.41it/s] 117it [00:12, 9.40it/s] 118it [00:12, 9.37it/s] 119it [00:12, 9.41it/s] 120it [00:12, 9.43it/s] 121it [00:12, 9.47it/s] 122it [00:13, 9.46it/s] 123it [00:13, 9.51it/s] 124it [00:13, 9.51it/s] 125it [00:13, 9.55it/s] 126it [00:13, 9.47it/s] 127it [00:13, 9.49it/s] 128it [00:13, 9.49it/s] 129it [00:13, 9.49it/s] 130it [00:13, 9.48it/s] 131it [00:14, 9.21it/s] 132it [00:14, 9.26it/s] 133it [00:14, 9.36it/s] 134it [00:14, 9.41it/s] 135it [00:14, 9.46it/s] 136it [00:14, 9.48it/s] 137it [00:14, 9.47it/s] 138it [00:14, 9.46it/s] 139it [00:14, 9.51it/s] 140it [00:14, 9.48it/s] 141it [00:15, 9.51it/s] 142it [00:15, 9.45it/s] 143it [00:15, 9.38it/s] 144it [00:15, 9.42it/s] 145it [00:15, 9.44it/s] 146it [00:15, 9.46it/s] 147it [00:15, 9.48it/s] 148it [00:15, 9.50it/s] 149it [00:15, 9.55it/s] 150it [00:16, 9.49it/s]2025-05-26 06:00:00,247 - INFO - [Epoch 043 | Batch 0150] IWAE-loss 4443.6572 | mean log_px -0.0191 | KL -3451.98 + 151it [00:16, 9.26it/s] 152it [00:16, 9.34it/s] 153it [00:16, 9.40it/s] 154it [00:16, 9.41it/s] 155it [00:16, 9.47it/s] 156it [00:16, 9.25it/s] 157it [00:16, 9.35it/s] 158it [00:16, 9.32it/s] 159it [00:16, 9.36it/s] 160it [00:17, 9.42it/s] 161it [00:17, 9.45it/s] 162it [00:17, 9.45it/s] 163it [00:17, 9.45it/s] 164it [00:17, 9.44it/s] 165it [00:17, 9.43it/s] 166it [00:17, 9.39it/s] 167it [00:17, 9.32it/s] 168it [00:17, 9.24it/s] 169it [00:18, 9.33it/s] 170it [00:18, 9.40it/s] 171it [00:18, 9.40it/s] 172it [00:18, 9.44it/s] 173it [00:18, 9.46it/s] 174it [00:18, 9.33it/s] 175it [00:18, 9.25it/s] 176it [00:18, 9.28it/s] 177it [00:18, 8.77it/s] 178it [00:19, 8.97it/s] 179it [00:19, 9.11it/s] 180it [00:19, 9.18it/s] 181it [00:19, 8.78it/s] 182it [00:19, 8.98it/s] 183it [00:19, 9.14it/s] 184it [00:19, 9.23it/s] 185it [00:19, 8.79it/s] 186it [00:19, 8.97it/s] 187it [00:20, 9.06it/s] 188it [00:20, 9.16it/s] 189it [00:20, 8.74it/s] 190it [00:20, 8.92it/s] 191it [00:20, 9.03it/s] 192it [00:20, 9.18it/s] 193it [00:20, 8.72it/s] 194it [00:20, 8.89it/s] 195it [00:20, 8.47it/s] 196it [00:21, 8.79it/s] 196it [00:21, 9.28it/s] +2025-05-26 06:00:05,262 - INFO - Epoch: 43, Objective: tensor([4990.5254], device='cuda:0', grad_fn=), Loss: 0.022801268845796585, KL/n: 70.53202056884766 + 0it [00:00, ?it/s]2025-05-26 06:00:05,726 - INFO - [Epoch 044 | Batch 0000] IWAE-loss 8241.9609 | mean log_px -0.0746 | KL -3451.67 + 1it [00:00, 4.61it/s] 2it [00:00, 6.61it/s] 3it [00:00, 7.63it/s] 4it [00:00, 8.26it/s] 5it [00:00, 8.71it/s] 6it [00:00, 8.97it/s] 7it [00:00, 9.19it/s] 8it [00:00, 9.22it/s] 9it [00:01, 9.33it/s] 10it [00:01, 9.39it/s] 11it [00:01, 9.43it/s] 12it [00:01, 9.48it/s] 13it [00:01, 9.51it/s] 14it [00:01, 9.50it/s] 15it [00:01, 9.50it/s] 16it [00:01, 9.48it/s] 17it [00:01, 9.48it/s] 18it [00:02, 9.49it/s] 19it [00:02, 9.50it/s] 20it [00:02, 9.46it/s] 21it [00:02, 9.50it/s] 22it [00:02, 9.46it/s] 23it [00:02, 9.55it/s] 24it [00:02, 9.58it/s] 25it [00:02, 9.03it/s] 26it [00:02, 9.12it/s] 27it [00:02, 9.25it/s] 28it [00:03, 9.32it/s] 29it [00:03, 9.42it/s] 30it [00:03, 9.41it/s] 31it [00:03, 9.46it/s] 32it [00:03, 9.51it/s] 33it [00:03, 9.49it/s] 34it [00:03, 9.53it/s] 35it [00:03, 9.57it/s] 36it [00:03, 9.44it/s] 37it [00:04, 9.19it/s] 38it [00:04, 9.04it/s] 39it [00:04, 9.17it/s] 40it [00:04, 9.25it/s] 41it [00:04, 9.35it/s] 42it [00:04, 9.35it/s] 43it [00:04, 9.33it/s] 44it [00:04, 9.30it/s] 45it [00:04, 9.37it/s] 46it [00:04, 9.40it/s] 47it [00:05, 9.35it/s] 48it [00:05, 9.40it/s] 49it [00:05, 9.43it/s] 50it [00:05, 9.47it/s]2025-05-26 06:00:11,064 - INFO - [Epoch 044 | Batch 0050] IWAE-loss 8636.9531 | mean log_px -0.0781 | KL -3454.60 + 51it [00:05, 9.34it/s] 52it [00:05, 9.32it/s] 53it [00:05, 9.28it/s] 54it [00:05, 9.28it/s] 55it [00:05, 9.31it/s] 56it [00:06, 9.35it/s] 57it [00:06, 9.39it/s] 58it [00:06, 9.43it/s] 59it [00:06, 9.40it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.40it/s] 62it [00:06, 9.43it/s] 63it [00:06, 9.44it/s] 64it [00:06, 9.44it/s] 65it [00:07, 9.48it/s] 66it [00:07, 9.39it/s] 67it [00:07, 9.43it/s] 68it [00:07, 9.46it/s] 69it [00:07, 9.49it/s] 70it [00:07, 9.47it/s] 71it [00:07, 9.50it/s] 72it [00:07, 9.44it/s] 73it [00:07, 9.47it/s] 74it [00:07, 9.47it/s] 75it [00:08, 9.48it/s] 76it [00:08, 9.50it/s] 77it [00:08, 9.52it/s] 78it [00:08, 9.48it/s] 79it [00:08, 9.47it/s] 80it [00:08, 9.44it/s] 81it [00:08, 9.46it/s] 82it [00:08, 9.42it/s] 83it [00:08, 9.46it/s] 84it [00:09, 9.45it/s] 85it [00:09, 9.46it/s] 86it [00:09, 8.96it/s] 87it [00:09, 8.98it/s] 88it [00:09, 9.06it/s] 89it [00:09, 9.09it/s] 90it [00:09, 9.14it/s] 91it [00:09, 9.15it/s] 92it [00:09, 9.22it/s] 93it [00:10, 9.20it/s] 94it [00:10, 9.14it/s] 95it [00:10, 9.00it/s] 96it [00:10, 8.91it/s] 97it [00:10, 8.82it/s] 98it [00:10, 8.80it/s] 99it [00:10, 8.57it/s] 100it [00:10, 8.81it/s]2025-05-26 06:00:16,461 - INFO - [Epoch 044 | Batch 0100] IWAE-loss 4468.0703 | mean log_px -0.0182 | KL -3448.35 + 101it [00:10, 9.04it/s] 102it [00:11, 9.18it/s] 103it [00:11, 9.28it/s] 104it [00:11, 9.34it/s] 105it [00:11, 9.41it/s] 106it [00:11, 9.44it/s] 107it [00:11, 9.48it/s] 108it [00:11, 9.48it/s] 109it [00:11, 9.48it/s] 110it [00:11, 9.48it/s] 111it [00:11, 9.51it/s] 112it [00:12, 9.56it/s] 113it [00:12, 9.58it/s] 114it [00:12, 9.62it/s] 115it [00:12, 9.57it/s] 116it [00:12, 9.53it/s] 117it [00:12, 9.53it/s] 118it [00:12, 9.10it/s] 119it [00:12, 9.24it/s] 120it [00:12, 9.31it/s] 121it [00:13, 9.38it/s] 122it [00:13, 9.42it/s] 123it [00:13, 9.47it/s] 124it [00:13, 9.50it/s] 125it [00:13, 9.53it/s] 126it [00:13, 9.55it/s] 127it [00:13, 9.55it/s] 128it [00:13, 9.49it/s] 129it [00:13, 9.48it/s] 130it [00:13, 9.48it/s] 131it [00:14, 9.51it/s] 132it [00:14, 9.52it/s] 133it [00:14, 9.51it/s] 134it [00:14, 9.48it/s] 135it [00:14, 9.44it/s] 136it [00:14, 9.50it/s] 137it [00:14, 9.51it/s] 138it [00:14, 9.45it/s] 139it [00:14, 8.88it/s] 140it [00:15, 9.06it/s] 141it [00:15, 9.18it/s] 142it [00:15, 9.27it/s] 143it [00:15, 9.37it/s] 144it [00:15, 9.37it/s] 145it [00:15, 9.46it/s] 146it [00:15, 9.52it/s] 147it [00:15, 9.51it/s] 148it [00:15, 9.51it/s] 149it [00:16, 9.53it/s] 150it [00:16, 9.53it/s]2025-05-26 06:00:21,750 - INFO - [Epoch 044 | Batch 0150] IWAE-loss 5638.1201 | mean log_px -0.0363 | KL -3448.95 + 151it [00:16, 9.55it/s] 152it [00:16, 9.53it/s] 153it [00:16, 9.48it/s] 154it [00:16, 9.43it/s] 155it [00:16, 9.48it/s] 156it [00:16, 9.08it/s] 157it [00:16, 9.26it/s] 158it [00:16, 9.38it/s] 159it [00:17, 9.38it/s] 160it [00:17, 9.39it/s] 161it [00:17, 9.28it/s] 162it [00:17, 9.36it/s] 163it [00:17, 9.44it/s] 164it [00:17, 9.43it/s] 165it [00:17, 9.45it/s] 166it [00:17, 9.46it/s] 167it [00:17, 9.36it/s] 168it [00:18, 9.44it/s] 169it [00:18, 9.51it/s] 170it [00:18, 9.53it/s] 171it [00:18, 9.53it/s] 172it [00:18, 9.57it/s] 173it [00:18, 9.54it/s] 174it [00:18, 9.51it/s] 175it [00:18, 9.49it/s] 176it [00:18, 9.47it/s] 177it [00:18, 9.50it/s] 178it [00:19, 9.50it/s] 179it [00:19, 9.55it/s] 180it [00:19, 9.50it/s] 181it [00:19, 9.52it/s] 182it [00:19, 9.55it/s] 183it [00:19, 9.60it/s] 184it [00:19, 9.54it/s] 185it [00:19, 9.55it/s] 186it [00:19, 9.49it/s] 187it [00:20, 9.15it/s] 188it [00:20, 9.24it/s] 189it [00:20, 9.30it/s] 190it [00:20, 9.37it/s] 191it [00:20, 9.40it/s] 192it [00:20, 9.41it/s] 193it [00:20, 8.92it/s] 194it [00:20, 9.14it/s] 195it [00:20, 8.69it/s] 196it [00:21, 9.01it/s] 196it [00:21, 9.30it/s] +2025-05-26 06:00:26,664 - INFO - Epoch: 44, Objective: tensor([5709.1240], device='cuda:0', grad_fn=), Loss: 0.03686925023794174, KL/n: 70.38143920898438 + 0it [00:00, ?it/s]2025-05-26 06:00:26,939 - INFO - [Epoch 045 | Batch 0000] IWAE-loss 6154.7354 | mean log_px -0.0426 | KL -3452.68 + 1it [00:00, 4.80it/s] 2it [00:00, 6.71it/s] 3it [00:00, 7.77it/s] 4it [00:00, 8.40it/s] 5it [00:00, 8.84it/s] 6it [00:00, 9.04it/s] 7it [00:00, 9.21it/s] 8it [00:00, 9.36it/s] 9it [00:01, 8.94it/s] 10it [00:01, 9.11it/s] 11it [00:01, 9.20it/s] 12it [00:01, 8.76it/s] 13it [00:01, 8.98it/s] 14it [00:01, 9.09it/s] 15it [00:01, 9.26it/s] 16it [00:01, 9.29it/s] 17it [00:01, 9.39it/s] 18it [00:02, 9.42it/s] 19it [00:02, 9.48it/s] 20it [00:02, 9.46it/s] 21it [00:02, 9.52it/s] 22it [00:02, 9.50it/s] 23it [00:02, 9.49it/s] 24it [00:02, 9.53it/s] 25it [00:02, 9.51it/s] 26it [00:02, 9.52it/s] 27it [00:02, 9.48it/s] 28it [00:03, 9.47it/s] 29it [00:03, 9.50it/s] 30it [00:03, 9.48it/s] 31it [00:03, 9.45it/s] 32it [00:03, 8.95it/s] 33it [00:03, 9.13it/s] 34it [00:03, 9.22it/s] 35it [00:03, 9.32it/s] 36it [00:03, 9.35it/s] 37it [00:04, 9.41it/s] 38it [00:04, 9.49it/s] 39it [00:04, 9.52it/s] 40it [00:04, 9.10it/s] 41it [00:04, 9.26it/s] 42it [00:04, 9.33it/s] 43it [00:04, 9.40it/s] 44it [00:04, 9.44it/s] 45it [00:04, 9.51it/s] 46it [00:05, 9.48it/s] 47it [00:05, 9.48it/s] 48it [00:05, 9.50it/s] 49it [00:05, 9.51it/s] 50it [00:05, 9.49it/s]2025-05-26 06:00:32,293 - INFO - [Epoch 045 | Batch 0050] IWAE-loss 4413.5903 | mean log_px -0.0159 | KL -3443.76 + 51it [00:05, 9.51it/s] 52it [00:05, 9.50it/s] 53it [00:05, 9.48it/s] 54it [00:05, 9.48it/s] 55it [00:05, 9.51it/s] 56it [00:06, 8.94it/s] 57it [00:06, 9.15it/s] 58it [00:06, 9.24it/s] 59it [00:06, 9.34it/s] 60it [00:06, 9.36it/s] 61it [00:06, 9.43it/s] 62it [00:06, 9.44it/s] 63it [00:06, 9.46it/s] 64it [00:06, 9.47it/s] 65it [00:07, 9.52it/s] 66it [00:07, 9.46it/s] 67it [00:07, 9.54it/s] 68it [00:07, 9.49it/s] 69it [00:07, 9.40it/s] 70it [00:07, 8.89it/s] 71it [00:07, 9.08it/s] 72it [00:07, 9.20it/s] 73it [00:07, 9.15it/s] 74it [00:08, 9.28it/s] 75it [00:08, 9.37it/s] 76it [00:08, 9.39it/s] 77it [00:08, 9.45it/s] 78it [00:08, 9.43it/s] 79it [00:08, 9.47it/s] 80it [00:08, 9.45it/s] 81it [00:08, 9.51it/s] 82it [00:08, 9.48it/s] 83it [00:08, 9.55it/s] 84it [00:09, 9.54it/s] 85it [00:09, 9.60it/s] 86it [00:09, 9.59it/s] 87it [00:09, 9.62it/s] 88it [00:09, 9.60it/s] 89it [00:09, 9.62it/s] 90it [00:09, 9.58it/s] 91it [00:09, 9.59it/s] 92it [00:09, 9.53it/s] 93it [00:09, 9.36it/s] 94it [00:10, 9.42it/s] 95it [00:10, 9.43it/s] 96it [00:10, 9.42it/s] 97it [00:10, 9.46it/s] 98it [00:10, 9.46it/s] 99it [00:10, 9.50it/s] 100it [00:10, 9.50it/s]2025-05-26 06:00:37,599 - INFO - [Epoch 045 | Batch 0100] IWAE-loss 5534.2393 | mean log_px -0.0361 | KL -3439.78 + 101it [00:10, 9.52it/s] 102it [00:10, 9.55it/s] 103it [00:11, 9.56it/s] 104it [00:11, 9.52it/s] 105it [00:11, 9.53it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.33it/s] 108it [00:11, 9.33it/s] 109it [00:11, 9.45it/s] 110it [00:11, 9.45it/s] 111it [00:11, 9.46it/s] 112it [00:12, 9.44it/s] 113it [00:12, 9.43it/s] 114it [00:12, 9.46it/s] 115it [00:12, 9.47it/s] 116it [00:12, 9.47it/s] 117it [00:12, 9.47it/s] 118it [00:12, 9.48it/s] 119it [00:12, 9.49it/s] 120it [00:12, 9.50it/s] 121it [00:12, 9.52it/s] 122it [00:13, 9.50it/s] 123it [00:13, 9.54it/s] 124it [00:13, 9.50it/s] 125it [00:13, 9.52it/s] 126it [00:13, 9.48it/s] 127it [00:13, 9.50it/s] 128it [00:13, 9.46it/s] 129it [00:13, 9.49it/s] 130it [00:13, 9.52it/s] 131it [00:14, 9.51it/s] 132it [00:14, 9.43it/s] 133it [00:14, 9.36it/s] 134it [00:14, 9.21it/s] 135it [00:14, 9.18it/s] 136it [00:14, 9.30it/s] 137it [00:14, 9.40it/s] 138it [00:14, 9.47it/s] 139it [00:14, 9.52it/s] 140it [00:14, 9.55it/s] 141it [00:15, 9.59it/s] 142it [00:15, 9.60it/s] 143it [00:15, 9.61it/s] 144it [00:15, 9.57it/s] 145it [00:15, 9.57it/s] 146it [00:15, 9.52it/s] 147it [00:15, 9.52it/s] 148it [00:15, 9.48it/s] 149it [00:15, 9.49it/s] 150it [00:16, 9.49it/s]2025-05-26 06:00:42,875 - INFO - [Epoch 045 | Batch 0150] IWAE-loss 5436.4814 | mean log_px -0.0340 | KL -3438.98 + 151it [00:16, 9.52it/s] 152it [00:16, 9.54it/s] 153it [00:16, 9.53it/s] 154it [00:16, 9.52it/s] 155it [00:16, 9.51it/s] 156it [00:16, 9.51it/s] 157it [00:16, 9.48it/s] 158it [00:16, 9.48it/s] 159it [00:16, 9.44it/s] 160it [00:17, 9.47it/s] 161it [00:17, 9.53it/s] 162it [00:17, 9.50it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.51it/s] 165it [00:17, 9.45it/s] 166it [00:17, 9.46it/s] 167it [00:17, 9.49it/s] 168it [00:17, 9.44it/s] 169it [00:18, 9.42it/s] 170it [00:18, 9.45it/s] 171it [00:18, 9.45it/s] 172it [00:18, 9.44it/s] 173it [00:18, 9.49it/s] 174it [00:18, 9.50it/s] 175it [00:18, 9.51it/s] 176it [00:18, 9.51it/s] 177it [00:18, 9.39it/s] 178it [00:18, 9.47it/s] 179it [00:19, 9.48it/s] 180it [00:19, 9.49it/s] 181it [00:19, 9.51it/s] 182it [00:19, 9.50it/s] 183it [00:19, 9.52it/s] 184it [00:19, 9.53it/s] 185it [00:19, 9.53it/s] 186it [00:19, 9.53it/s] 187it [00:19, 9.55it/s] 188it [00:20, 9.54it/s] 189it [00:20, 9.54it/s] 190it [00:20, 9.46it/s] 191it [00:20, 9.48it/s] 192it [00:20, 9.51it/s] 193it [00:20, 9.53it/s] 194it [00:20, 9.51it/s] 195it [00:20, 8.92it/s] 196it [00:20, 9.12it/s] 196it [00:20, 9.36it/s] +2025-05-26 06:00:47,737 - INFO - Epoch: 45, Objective: tensor([5079.6650], device='cuda:0', grad_fn=), Loss: 0.031979966908693314, KL/n: 70.21158599853516 + 0it [00:00, ?it/s]2025-05-26 06:00:48,196 - INFO - [Epoch 046 | Batch 0000] IWAE-loss 4801.6733 | mean log_px -0.0225 | KL -3436.86 + 1it [00:00, 5.42it/s] 2it [00:00, 7.23it/s] 3it [00:00, 8.11it/s] 4it [00:00, 8.63it/s] 5it [00:00, 8.93it/s] 6it [00:00, 9.10it/s] 7it [00:00, 9.21it/s] 8it [00:00, 9.31it/s] 9it [00:01, 9.44it/s] 10it [00:01, 9.51it/s] 11it [00:01, 9.52it/s] 12it [00:01, 9.49it/s] 13it [00:01, 9.47it/s] 14it [00:01, 9.45it/s] 15it [00:01, 9.50it/s] 16it [00:01, 9.45it/s] 17it [00:01, 9.45it/s] 18it [00:01, 9.17it/s] 19it [00:02, 9.28it/s] 20it [00:02, 8.83it/s] 21it [00:02, 9.04it/s] 22it [00:02, 9.18it/s] 23it [00:02, 9.25it/s] 24it [00:02, 9.28it/s] 25it [00:02, 9.37it/s] 26it [00:02, 9.41it/s] 27it [00:02, 9.45it/s] 28it [00:03, 9.45it/s] 29it [00:03, 9.48it/s] 30it [00:03, 9.53it/s] 31it [00:03, 9.60it/s] 32it [00:03, 9.56it/s] 33it [00:03, 9.06it/s] 34it [00:03, 9.23it/s] 35it [00:03, 9.27it/s] 36it [00:03, 9.13it/s] 37it [00:04, 8.64it/s] 38it [00:04, 8.67it/s] 39it [00:04, 8.52it/s] 40it [00:04, 8.85it/s] 41it [00:04, 9.11it/s] 42it [00:04, 9.27it/s] 43it [00:04, 9.40it/s] 44it [00:04, 9.49it/s] 45it [00:04, 9.56it/s] 46it [00:05, 9.59it/s] 47it [00:05, 9.64it/s] 48it [00:05, 9.66it/s] 49it [00:05, 9.68it/s] 50it [00:05, 9.67it/s]2025-05-26 06:00:53,538 - INFO - [Epoch 046 | Batch 0050] IWAE-loss 4658.3813 | mean log_px -0.0175 | KL -3431.65 + 51it [00:05, 9.69it/s] 52it [00:05, 9.70it/s] 53it [00:05, 9.71it/s] 54it [00:05, 9.69it/s] 55it [00:05, 9.71it/s] 56it [00:06, 9.69it/s] 57it [00:06, 9.71it/s] 58it [00:06, 9.69it/s] 59it [00:06, 9.71it/s] 60it [00:06, 9.70it/s] 61it [00:06, 9.73it/s] 62it [00:06, 9.71it/s] 63it [00:06, 9.71it/s] 64it [00:06, 9.70it/s] 65it [00:06, 9.72it/s] 66it [00:07, 9.70it/s] 67it [00:07, 9.72it/s] 68it [00:07, 9.72it/s] 69it [00:07, 9.73it/s] 70it [00:07, 9.41it/s] 71it [00:07, 9.49it/s] 72it [00:07, 9.55it/s] 73it [00:07, 9.12it/s] 74it [00:07, 9.29it/s] 75it [00:08, 9.40it/s] 76it [00:08, 9.49it/s] 77it [00:08, 8.98it/s] 78it [00:08, 9.17it/s] 79it [00:08, 9.33it/s] 80it [00:08, 9.45it/s] 81it [00:08, 9.55it/s] 82it [00:08, 9.44it/s] 83it [00:08, 9.54it/s] 84it [00:08, 9.54it/s] 85it [00:09, 9.44it/s] 86it [00:09, 9.47it/s] 87it [00:09, 8.99it/s] 88it [00:09, 9.19it/s] 89it [00:09, 9.35it/s] 90it [00:09, 9.46it/s] 91it [00:09, 9.55it/s] 92it [00:09, 9.55it/s] 93it [00:09, 9.61it/s] 94it [00:10, 9.23it/s] 95it [00:10, 9.36it/s] 96it [00:10, 9.46it/s] 97it [00:10, 9.54it/s] 98it [00:10, 9.60it/s] 99it [00:10, 9.64it/s] 100it [00:10, 9.65it/s]2025-05-26 06:00:58,790 - INFO - [Epoch 046 | Batch 0100] IWAE-loss 5551.6338 | mean log_px -0.0332 | KL -3436.21 + 101it [00:10, 9.65it/s] 102it [00:10, 9.66it/s] 103it [00:10, 9.70it/s] 104it [00:11, 9.70it/s] 105it [00:11, 9.71it/s] 106it [00:11, 9.72it/s] 107it [00:11, 9.73it/s] 108it [00:11, 9.43it/s] 109it [00:11, 9.51it/s] 110it [00:11, 9.53it/s] 111it [00:11, 9.21it/s] 112it [00:11, 9.36it/s] 113it [00:12, 9.47it/s] 114it [00:12, 9.52it/s] 115it [00:12, 9.58it/s] 116it [00:12, 9.06it/s] 117it [00:12, 9.26it/s] 118it [00:12, 9.36it/s] 119it [00:12, 9.46it/s] 120it [00:12, 9.08it/s] 121it [00:12, 9.27it/s] 122it [00:13, 9.38it/s] 123it [00:13, 8.95it/s] 124it [00:13, 9.16it/s] 125it [00:13, 9.32it/s] 126it [00:13, 8.89it/s] 127it [00:13, 9.02it/s] 128it [00:13, 9.21it/s] 129it [00:13, 9.37it/s] 130it [00:13, 9.46it/s] 131it [00:13, 9.01it/s] 132it [00:14, 9.19it/s] 133it [00:14, 9.34it/s] 134it [00:14, 9.43it/s] 135it [00:14, 9.51it/s] 136it [00:14, 9.58it/s] 137it [00:14, 9.62it/s] 138it [00:14, 9.64it/s] 139it [00:14, 9.65it/s] 140it [00:14, 9.67it/s] 141it [00:15, 9.70it/s] 142it [00:15, 9.69it/s] 143it [00:15, 9.71it/s] 144it [00:15, 9.70it/s] 145it [00:15, 9.72it/s] 146it [00:15, 9.70it/s] 147it [00:15, 9.72it/s] 148it [00:15, 9.70it/s] 149it [00:15, 9.71it/s] 150it [00:15, 9.14it/s]2025-05-26 06:01:04,094 - INFO - [Epoch 046 | Batch 0150] IWAE-loss 5915.6621 | mean log_px -0.0405 | KL -3435.87 + 151it [00:16, 9.30it/s] 152it [00:16, 9.43it/s] 153it [00:16, 9.52it/s] 154it [00:16, 9.58it/s] 155it [00:16, 9.64it/s] 156it [00:16, 9.67it/s] 157it [00:16, 9.69it/s] 158it [00:16, 9.69it/s] 159it [00:16, 9.71it/s] 160it [00:17, 9.66it/s] 161it [00:17, 9.59it/s] 162it [00:17, 9.23it/s] 163it [00:17, 9.37it/s] 164it [00:17, 9.44it/s] 165it [00:17, 9.51it/s] 166it [00:17, 9.55it/s] 167it [00:17, 9.60it/s] 168it [00:17, 9.63it/s] 169it [00:17, 9.67it/s] 170it [00:18, 9.68it/s] 171it [00:18, 9.69it/s] 172it [00:18, 9.68it/s] 173it [00:18, 9.70it/s] 174it [00:18, 9.70it/s] 175it [00:18, 9.72it/s] 176it [00:18, 9.72it/s] 177it [00:18, 9.73it/s] 178it [00:18, 9.72it/s] 179it [00:18, 9.73it/s] 180it [00:19, 9.72it/s] 181it [00:19, 9.56it/s] 182it [00:19, 9.48it/s] 183it [00:19, 9.49it/s] 184it [00:19, 9.00it/s] 185it [00:19, 9.21it/s] 186it [00:19, 9.36it/s] 187it [00:19, 9.47it/s] 188it [00:19, 9.53it/s] 189it [00:20, 9.60it/s] 190it [00:20, 9.62it/s] 191it [00:20, 9.65it/s] 192it [00:20, 9.64it/s] 193it [00:20, 9.50it/s] 194it [00:20, 9.56it/s] 195it [00:20, 9.01it/s] 196it [00:20, 9.26it/s] 196it [00:20, 9.40it/s] +2025-05-26 06:01:08,913 - INFO - Epoch: 46, Objective: tensor([5599.3286], device='cuda:0', grad_fn=), Loss: 0.028604112565517426, KL/n: 70.04393768310547 + 0it [00:00, ?it/s]2025-05-26 06:01:09,198 - INFO - [Epoch 047 | Batch 0000] IWAE-loss 6606.0967 | mean log_px -0.0507 | KL -3426.96 + 1it [00:00, 4.64it/s] 2it [00:00, 6.62it/s] 3it [00:00, 7.71it/s] 4it [00:00, 7.79it/s] 5it [00:00, 8.40it/s] 6it [00:00, 8.79it/s] 7it [00:00, 9.09it/s] 8it [00:00, 8.71it/s] 9it [00:01, 8.99it/s] 10it [00:01, 9.15it/s] 11it [00:01, 9.32it/s] 12it [00:01, 9.43it/s] 13it [00:01, 9.53it/s] 14it [00:01, 9.57it/s] 15it [00:01, 9.62it/s] 16it [00:01, 9.64it/s] 17it [00:01, 9.67it/s] 18it [00:02, 9.67it/s] 19it [00:02, 9.14it/s] 20it [00:02, 9.14it/s] 21it [00:02, 9.12it/s] 22it [00:02, 8.98it/s] 23it [00:02, 9.12it/s] 24it [00:02, 9.22it/s] 25it [00:02, 9.30it/s] 26it [00:02, 9.34it/s] 27it [00:03, 9.40it/s] 28it [00:03, 9.42it/s] 29it [00:03, 9.46it/s] 30it [00:03, 9.47it/s] 31it [00:03, 9.49it/s] 32it [00:03, 9.48it/s] 33it [00:03, 9.49it/s] 34it [00:03, 9.34it/s] 35it [00:03, 9.25it/s] 36it [00:03, 9.12it/s] 37it [00:04, 9.28it/s] 38it [00:04, 9.38it/s] 39it [00:04, 9.08it/s] 40it [00:04, 9.25it/s] 41it [00:04, 9.38it/s] 42it [00:04, 9.47it/s] 43it [00:04, 9.53it/s] 44it [00:04, 9.57it/s] 45it [00:04, 9.61it/s] 46it [00:05, 9.05it/s] 47it [00:05, 9.24it/s] 48it [00:05, 9.21it/s] 49it [00:05, 9.02it/s] 50it [00:05, 9.20it/s]2025-05-26 06:01:14,585 - INFO - [Epoch 047 | Batch 0050] IWAE-loss 5071.6953 | mean log_px -0.0309 | KL -3429.48 + 51it [00:05, 9.35it/s] 52it [00:05, 9.45it/s] 53it [00:05, 9.53it/s] 54it [00:05, 9.58it/s] 55it [00:05, 9.64it/s] 56it [00:06, 9.65it/s] 57it [00:06, 9.69it/s] 58it [00:06, 9.69it/s] 59it [00:06, 9.70it/s] 60it [00:06, 9.70it/s] 61it [00:06, 9.71it/s] 62it [00:06, 9.70it/s] 63it [00:06, 9.72it/s] 64it [00:06, 9.72it/s] 65it [00:07, 9.73it/s] 66it [00:07, 9.71it/s] 67it [00:07, 9.20it/s] 68it [00:07, 9.33it/s] 69it [00:07, 9.45it/s] 70it [00:07, 9.52it/s] 71it [00:07, 9.59it/s] 72it [00:07, 9.52it/s] 73it [00:07, 9.59it/s] 74it [00:07, 9.62it/s] 75it [00:08, 9.66it/s] 76it [00:08, 9.68it/s] 77it [00:08, 9.70it/s] 78it [00:08, 9.70it/s] 79it [00:08, 9.71it/s] 80it [00:08, 9.70it/s] 81it [00:08, 9.71it/s] 82it [00:08, 9.70it/s] 83it [00:08, 9.71it/s] 84it [00:09, 9.14it/s] 85it [00:09, 9.30it/s] 86it [00:09, 9.38it/s] 87it [00:09, 9.48it/s] 88it [00:09, 9.53it/s] 89it [00:09, 9.59it/s] 90it [00:09, 9.62it/s] 91it [00:09, 9.65it/s] 92it [00:09, 9.65it/s] 93it [00:09, 9.67it/s] 94it [00:10, 9.67it/s] 95it [00:10, 9.68it/s] 96it [00:10, 9.68it/s] 97it [00:10, 9.69it/s] 98it [00:10, 9.68it/s] 99it [00:10, 9.69it/s] 100it [00:10, 9.70it/s]2025-05-26 06:01:19,780 - INFO - [Epoch 047 | Batch 0100] IWAE-loss 4540.6260 | mean log_px -0.0246 | KL -3428.07 + 101it [00:10, 9.69it/s] 102it [00:10, 9.49it/s] 103it [00:10, 9.52it/s] 104it [00:11, 9.55it/s] 105it [00:11, 9.57it/s] 106it [00:11, 9.60it/s] 107it [00:11, 9.07it/s] 108it [00:11, 9.24it/s] 109it [00:11, 9.36it/s] 110it [00:11, 8.90it/s] 111it [00:11, 9.13it/s] 112it [00:11, 9.29it/s] 113it [00:12, 9.42it/s] 114it [00:12, 9.50it/s] 115it [00:12, 9.56it/s] 116it [00:12, 9.60it/s] 117it [00:12, 9.64it/s] 118it [00:12, 9.65it/s] 119it [00:12, 9.27it/s] 120it [00:12, 9.39it/s] 121it [00:12, 9.49it/s] 122it [00:13, 9.01it/s] 123it [00:13, 9.22it/s] 124it [00:13, 9.35it/s] 125it [00:13, 9.46it/s] 126it [00:13, 9.53it/s] 127it [00:13, 9.59it/s] 128it [00:13, 9.62it/s] 129it [00:13, 9.65it/s] 130it [00:13, 9.66it/s] 131it [00:13, 9.67it/s] 132it [00:14, 9.67it/s] 133it [00:14, 9.69it/s] 134it [00:14, 9.28it/s] 135it [00:14, 9.40it/s] 136it [00:14, 9.49it/s] 137it [00:14, 9.56it/s] 138it [00:14, 9.60it/s] 139it [00:14, 9.63it/s] 140it [00:14, 9.65it/s] 141it [00:14, 9.67it/s] 142it [00:15, 9.67it/s] 143it [00:15, 9.68it/s] 144it [00:15, 9.67it/s] 145it [00:15, 9.69it/s] 146it [00:15, 9.68it/s] 147it [00:15, 9.58it/s] 148it [00:15, 9.60it/s] 149it [00:15, 9.62it/s] 150it [00:15, 9.63it/s]2025-05-26 06:01:25,045 - INFO - [Epoch 047 | Batch 0150] IWAE-loss 4956.0400 | mean log_px -0.0260 | KL -3420.03 + 151it [00:16, 9.63it/s] 152it [00:16, 9.65it/s] 153it [00:16, 9.67it/s] 154it [00:16, 9.68it/s] 155it [00:16, 9.70it/s] 156it [00:16, 9.38it/s] 157it [00:16, 9.49it/s] 158it [00:16, 9.55it/s] 159it [00:16, 9.60it/s] 160it [00:16, 9.23it/s] 161it [00:17, 9.39it/s] 162it [00:17, 9.49it/s] 163it [00:17, 9.17it/s] 164it [00:17, 9.32it/s] 165it [00:17, 9.44it/s] 166it [00:17, 9.51it/s] 167it [00:17, 9.58it/s] 168it [00:17, 9.60it/s] 169it [00:17, 9.65it/s] 170it [00:18, 9.65it/s] 171it [00:18, 9.28it/s] 172it [00:18, 9.39it/s] 173it [00:18, 9.49it/s] 174it [00:18, 9.54it/s] 175it [00:18, 9.59it/s] 176it [00:18, 9.62it/s] 177it [00:18, 9.67it/s] 178it [00:18, 9.67it/s] 179it [00:18, 9.68it/s] 180it [00:19, 9.69it/s] 181it [00:19, 9.70it/s] 182it [00:19, 9.70it/s] 183it [00:19, 9.65it/s] 184it [00:19, 9.66it/s] 185it [00:19, 9.70it/s] 186it [00:19, 9.69it/s] 187it [00:19, 9.65it/s] 188it [00:19, 9.67it/s] 189it [00:20, 9.69it/s] 190it [00:20, 9.69it/s] 191it [00:20, 9.72it/s] 192it [00:20, 9.69it/s] 193it [00:20, 9.70it/s] 194it [00:20, 9.70it/s] 195it [00:20, 9.13it/s] 196it [00:20, 9.35it/s] 196it [00:20, 9.42it/s] +2025-05-26 06:01:29,859 - INFO - Epoch: 47, Objective: tensor([5860.7812], device='cuda:0', grad_fn=), Loss: 0.03282099589705467, KL/n: 69.88233184814453 + 0it [00:00, ?it/s]2025-05-26 06:01:30,299 - INFO - [Epoch 048 | Batch 0000] IWAE-loss 4398.5654 | mean log_px -0.0148 | KL -3425.91 + 1it [00:00, 6.12it/s] 2it [00:00, 7.74it/s] 3it [00:00, 8.56it/s] 4it [00:00, 8.98it/s] 5it [00:00, 9.25it/s] 6it [00:00, 9.39it/s] 7it [00:00, 9.47it/s] 8it [00:00, 9.54it/s] 9it [00:00, 9.61it/s] 10it [00:01, 9.40it/s] 11it [00:01, 9.47it/s] 12it [00:01, 9.53it/s] 13it [00:01, 9.59it/s] 14it [00:01, 9.63it/s] 15it [00:01, 9.66it/s] 16it [00:01, 9.66it/s] 17it [00:01, 9.69it/s] 18it [00:01, 9.69it/s] 19it [00:02, 9.70it/s] 20it [00:02, 9.68it/s] 21it [00:02, 9.71it/s] 22it [00:02, 9.69it/s] 23it [00:02, 9.71it/s] 24it [00:02, 9.70it/s] 25it [00:02, 9.71it/s] 26it [00:02, 9.70it/s] 27it [00:02, 9.72it/s] 28it [00:02, 9.71it/s] 29it [00:03, 9.72it/s] 30it [00:03, 9.72it/s] 31it [00:03, 9.73it/s] 32it [00:03, 9.71it/s] 33it [00:03, 9.72it/s] 34it [00:03, 9.72it/s] 35it [00:03, 9.72it/s] 36it [00:03, 9.71it/s] 37it [00:03, 9.72it/s] 38it [00:03, 9.70it/s] 39it [00:04, 9.72it/s] 40it [00:04, 9.70it/s] 41it [00:04, 9.73it/s] 42it [00:04, 9.72it/s] 43it [00:04, 9.73it/s] 44it [00:04, 9.72it/s] 45it [00:04, 9.74it/s] 46it [00:04, 9.73it/s] 47it [00:04, 9.59it/s] 48it [00:05, 9.60it/s] 49it [00:05, 9.65it/s] 50it [00:05, 9.65it/s]2025-05-26 06:01:35,466 - INFO - [Epoch 048 | Batch 0050] IWAE-loss 5411.3506 | mean log_px -0.0329 | KL -3426.38 + 51it [00:05, 9.66it/s] 52it [00:05, 9.65it/s] 53it [00:05, 9.29it/s] 54it [00:05, 9.39it/s] 55it [00:05, 9.49it/s] 56it [00:05, 9.55it/s] 57it [00:05, 9.06it/s] 58it [00:06, 9.25it/s] 59it [00:06, 9.39it/s] 60it [00:06, 9.48it/s] 61it [00:06, 9.56it/s] 62it [00:06, 9.59it/s] 63it [00:06, 9.05it/s] 64it [00:06, 9.21it/s] 65it [00:06, 9.36it/s] 66it [00:06, 9.46it/s] 67it [00:07, 9.55it/s] 68it [00:07, 9.59it/s] 69it [00:07, 9.63it/s] 70it [00:07, 9.64it/s] 71it [00:07, 9.68it/s] 72it [00:07, 9.68it/s] 73it [00:07, 9.70it/s] 74it [00:07, 9.69it/s] 75it [00:07, 9.14it/s] 76it [00:07, 9.29it/s] 77it [00:08, 9.43it/s] 78it [00:08, 9.51it/s] 79it [00:08, 9.59it/s] 80it [00:08, 9.63it/s] 81it [00:08, 9.67it/s] 82it [00:08, 9.68it/s] 83it [00:08, 9.69it/s] 84it [00:08, 9.71it/s] 85it [00:08, 9.73it/s] 86it [00:09, 9.72it/s] 87it [00:09, 9.74it/s] 88it [00:09, 9.74it/s] 89it [00:09, 9.74it/s] 90it [00:09, 9.74it/s] 91it [00:09, 9.74it/s] 92it [00:09, 9.72it/s] 93it [00:09, 9.74it/s] 94it [00:09, 9.72it/s] 95it [00:09, 9.15it/s] 96it [00:10, 9.29it/s] 97it [00:10, 9.42it/s] 98it [00:10, 9.49it/s] 99it [00:10, 9.57it/s] 100it [00:10, 9.60it/s]2025-05-26 06:01:40,713 - INFO - [Epoch 048 | Batch 0100] IWAE-loss 5481.2749 | mean log_px -0.0403 | KL -3417.41 + 101it [00:10, 9.63it/s] 102it [00:10, 9.64it/s] 103it [00:10, 9.68it/s] 104it [00:10, 9.68it/s] 105it [00:10, 9.71it/s] 106it [00:11, 9.71it/s] 107it [00:11, 9.72it/s] 108it [00:11, 9.71it/s] 109it [00:11, 9.73it/s] 110it [00:11, 9.71it/s] 111it [00:11, 9.72it/s] 112it [00:11, 9.71it/s] 113it [00:11, 9.73it/s] 114it [00:11, 9.16it/s] 115it [00:12, 9.33it/s] 116it [00:12, 9.42it/s] 117it [00:12, 9.52it/s] 118it [00:12, 9.58it/s] 119it [00:12, 9.63it/s] 120it [00:12, 9.51it/s] 121it [00:12, 9.56it/s] 122it [00:12, 9.59it/s] 123it [00:12, 9.64it/s] 124it [00:12, 9.64it/s] 125it [00:13, 9.66it/s] 126it [00:13, 9.67it/s] 127it [00:13, 9.67it/s] 128it [00:13, 9.66it/s] 129it [00:13, 9.27it/s] 130it [00:13, 9.39it/s] 131it [00:13, 9.49it/s] 132it [00:13, 9.56it/s] 133it [00:13, 9.21it/s] 134it [00:14, 9.24it/s] 135it [00:14, 9.17it/s] 136it [00:14, 8.60it/s] 137it [00:14, 8.82it/s] 138it [00:14, 8.99it/s] 139it [00:14, 9.11it/s] 140it [00:14, 9.19it/s] 141it [00:14, 9.25it/s] 142it [00:14, 9.29it/s] 143it [00:15, 9.33it/s] 144it [00:15, 9.33it/s] 145it [00:15, 8.84it/s] 146it [00:15, 8.98it/s] 147it [00:15, 9.13it/s] 148it [00:15, 9.29it/s] 149it [00:15, 9.38it/s] 150it [00:15, 9.46it/s]2025-05-26 06:01:46,022 - INFO - [Epoch 048 | Batch 0150] IWAE-loss 4167.0127 | mean log_px -0.0108 | KL -3420.06 + 151it [00:15, 8.97it/s] 152it [00:16, 9.18it/s] 153it [00:16, 9.34it/s] 154it [00:16, 9.43it/s] 155it [00:16, 9.53it/s] 156it [00:16, 9.58it/s] 157it [00:16, 9.62it/s] 158it [00:16, 9.64it/s] 159it [00:16, 9.67it/s] 160it [00:16, 9.09it/s] 161it [00:16, 9.28it/s] 162it [00:17, 9.40it/s] 163it [00:17, 9.50it/s] 164it [00:17, 9.56it/s] 165it [00:17, 9.61it/s] 166it [00:17, 9.63it/s] 167it [00:17, 9.66it/s] 168it [00:17, 9.66it/s] 169it [00:17, 9.70it/s] 170it [00:17, 9.12it/s] 171it [00:18, 9.29it/s] 172it [00:18, 9.40it/s] 173it [00:18, 9.49it/s] 174it [00:18, 9.53it/s] 175it [00:18, 9.60it/s] 176it [00:18, 9.62it/s] 177it [00:18, 9.65it/s] 178it [00:18, 9.65it/s] 179it [00:18, 9.68it/s] 180it [00:18, 9.67it/s] 181it [00:19, 9.68it/s] 182it [00:19, 9.67it/s] 183it [00:19, 9.70it/s] 184it [00:19, 9.69it/s] 185it [00:19, 9.70it/s] 186it [00:19, 9.54it/s] 187it [00:19, 9.58it/s] 188it [00:19, 9.60it/s] 189it [00:19, 9.57it/s] 190it [00:19, 9.57it/s] 191it [00:20, 9.59it/s] 192it [00:20, 9.61it/s] 193it [00:20, 9.08it/s] 194it [00:20, 9.23it/s] 195it [00:20, 8.83it/s] 196it [00:20, 8.90it/s] 196it [00:20, 9.46it/s] +2025-05-26 06:01:50,895 - INFO - Epoch: 48, Objective: tensor([5577.5146], device='cuda:0', grad_fn=), Loss: 0.034665796905756, KL/n: 69.71744537353516 + 0it [00:00, ?it/s]2025-05-26 06:01:51,206 - INFO - [Epoch 049 | Batch 0000] IWAE-loss 4387.7876 | mean log_px -0.0154 | KL -3415.77 + 1it [00:00, 4.49it/s] 2it [00:00, 6.43it/s] 3it [00:00, 7.61it/s] 4it [00:00, 8.32it/s] 5it [00:00, 8.77it/s] 6it [00:00, 9.03it/s] 7it [00:00, 9.23it/s] 8it [00:00, 9.36it/s] 9it [00:01, 9.48it/s] 10it [00:01, 9.51it/s] 11it [00:01, 9.57it/s] 12it [00:01, 9.62it/s] 13it [00:01, 9.65it/s] 14it [00:01, 9.66it/s] 15it [00:01, 9.65it/s] 16it [00:01, 9.63it/s] 17it [00:01, 9.66it/s] 18it [00:01, 9.67it/s] 19it [00:02, 9.70it/s] 20it [00:02, 9.70it/s] 21it [00:02, 9.71it/s] 22it [00:02, 9.71it/s] 23it [00:02, 9.72it/s] 24it [00:02, 9.72it/s] 25it [00:02, 9.72it/s] 26it [00:02, 9.71it/s] 27it [00:02, 9.71it/s] 28it [00:03, 9.71it/s] 29it [00:03, 9.63it/s] 30it [00:03, 9.56it/s] 31it [00:03, 9.61it/s] 32it [00:03, 9.64it/s] 33it [00:03, 9.67it/s] 34it [00:03, 9.24it/s] 35it [00:03, 9.38it/s] 36it [00:03, 9.46it/s] 37it [00:03, 9.54it/s] 38it [00:04, 9.59it/s] 39it [00:04, 9.62it/s] 40it [00:04, 9.62it/s] 41it [00:04, 9.65it/s] 42it [00:04, 9.66it/s] 43it [00:04, 9.69it/s] 44it [00:04, 9.70it/s] 45it [00:04, 9.72it/s] 46it [00:04, 9.71it/s] 47it [00:05, 9.18it/s] 48it [00:05, 9.33it/s] 49it [00:05, 9.45it/s] 50it [00:05, 9.52it/s]2025-05-26 06:01:56,409 - INFO - [Epoch 049 | Batch 0050] IWAE-loss 6286.7646 | mean log_px -0.0480 | KL -3411.50 + 51it [00:05, 9.57it/s] 52it [00:05, 9.61it/s] 53it [00:05, 9.65it/s] 54it [00:05, 9.65it/s] 55it [00:05, 9.68it/s] 56it [00:05, 9.69it/s] 57it [00:06, 9.70it/s] 58it [00:06, 9.71it/s] 59it [00:06, 9.69it/s] 60it [00:06, 9.61it/s] 61it [00:06, 9.63it/s] 62it [00:06, 9.64it/s] 63it [00:06, 9.66it/s] 64it [00:06, 9.65it/s] 65it [00:06, 9.07it/s] 66it [00:06, 9.22it/s] 67it [00:07, 9.37it/s] 68it [00:07, 9.47it/s] 69it [00:07, 9.56it/s] 70it [00:07, 9.60it/s] 71it [00:07, 9.65it/s] 72it [00:07, 9.68it/s] 73it [00:07, 9.66it/s] 74it [00:07, 9.68it/s] 75it [00:07, 9.70it/s] 76it [00:08, 9.72it/s] 77it [00:08, 9.73it/s] 78it [00:08, 9.73it/s] 79it [00:08, 9.72it/s] 80it [00:08, 9.69it/s] 81it [00:08, 9.71it/s] 82it [00:08, 9.71it/s] 83it [00:08, 9.73it/s] 84it [00:08, 9.72it/s] 85it [00:08, 9.73it/s] 86it [00:09, 9.71it/s] 87it [00:09, 9.68it/s] 88it [00:09, 9.67it/s] 89it [00:09, 9.69it/s] 90it [00:09, 9.69it/s] 91it [00:09, 9.69it/s] 92it [00:09, 9.68it/s] 93it [00:09, 9.68it/s] 94it [00:09, 9.68it/s] 95it [00:09, 9.70it/s] 96it [00:10, 9.69it/s] 97it [00:10, 9.71it/s] 98it [00:10, 9.69it/s] 99it [00:10, 9.71it/s] 100it [00:10, 9.70it/s]2025-05-26 06:02:01,589 - INFO - [Epoch 049 | Batch 0100] IWAE-loss 6288.9609 | mean log_px -0.0417 | KL -3411.01 + 101it [00:10, 9.71it/s] 102it [00:10, 9.70it/s] 103it [00:10, 9.65it/s] 104it [00:10, 9.67it/s] 105it [00:11, 9.70it/s] 106it [00:11, 9.69it/s] 107it [00:11, 9.71it/s] 108it [00:11, 9.69it/s] 109it [00:11, 9.71it/s] 110it [00:11, 9.71it/s] 111it [00:11, 9.73it/s] 112it [00:11, 9.70it/s] 113it [00:11, 9.71it/s] 114it [00:11, 9.70it/s] 115it [00:12, 9.72it/s] 116it [00:12, 9.73it/s] 117it [00:12, 9.73it/s] 118it [00:12, 9.72it/s] 119it [00:12, 9.74it/s] 120it [00:12, 9.72it/s] 121it [00:12, 9.73it/s] 122it [00:12, 9.73it/s] 123it [00:12, 9.72it/s] 124it [00:12, 9.72it/s] 125it [00:13, 9.73it/s] 126it [00:13, 9.72it/s] 127it [00:13, 9.72it/s] 128it [00:13, 9.68it/s] 129it [00:13, 9.69it/s] 130it [00:13, 9.69it/s] 131it [00:13, 9.70it/s] 132it [00:13, 9.67it/s] 133it [00:13, 9.70it/s] 134it [00:14, 9.63it/s] 135it [00:14, 9.22it/s] 136it [00:14, 9.29it/s] 137it [00:14, 8.84it/s] 138it [00:14, 9.04it/s] 139it [00:14, 9.13it/s] 140it [00:14, 9.22it/s] 141it [00:14, 9.35it/s] 142it [00:14, 8.81it/s] 143it [00:15, 9.06it/s] 144it [00:15, 9.18it/s] 145it [00:15, 9.34it/s] 146it [00:15, 9.43it/s] 147it [00:15, 9.49it/s] 148it [00:15, 9.50it/s] 149it [00:15, 8.96it/s] 150it [00:15, 9.15it/s]2025-05-26 06:02:06,850 - INFO - [Epoch 049 | Batch 0150] IWAE-loss 5174.5752 | mean log_px -0.0317 | KL -3409.79 + 151it [00:15, 9.29it/s] 152it [00:15, 9.39it/s] 153it [00:16, 9.44it/s] 154it [00:16, 8.94it/s] 155it [00:16, 9.14it/s] 156it [00:16, 9.28it/s] 157it [00:16, 8.92it/s] 158it [00:16, 9.08it/s] 159it [00:16, 9.22it/s] 160it [00:16, 8.80it/s] 161it [00:16, 9.02it/s] 162it [00:17, 9.18it/s] 163it [00:17, 9.33it/s] 164it [00:17, 8.82it/s] 165it [00:17, 9.03it/s] 166it [00:17, 9.22it/s] 167it [00:17, 9.38it/s] 168it [00:17, 9.40it/s] 169it [00:17, 9.49it/s] 170it [00:17, 9.54it/s] 171it [00:18, 9.58it/s] 172it [00:18, 9.59it/s] 173it [00:18, 9.60it/s] 174it [00:18, 9.06it/s] 175it [00:18, 9.26it/s] 176it [00:18, 9.40it/s] 177it [00:18, 9.51it/s] 178it [00:18, 9.56it/s] 179it [00:18, 9.62it/s] 180it [00:18, 9.65it/s] 181it [00:19, 9.07it/s] 182it [00:19, 9.24it/s] 183it [00:19, 9.38it/s] 184it [00:19, 9.48it/s] 185it [00:19, 9.56it/s] 186it [00:19, 9.60it/s] 187it [00:19, 9.64it/s] 188it [00:19, 9.64it/s] 189it [00:19, 9.68it/s] 190it [00:20, 9.68it/s] 191it [00:20, 9.70it/s] 192it [00:20, 9.69it/s] 193it [00:20, 9.71it/s] 194it [00:20, 9.72it/s] 195it [00:20, 9.16it/s] 196it [00:20, 9.38it/s] 196it [00:20, 9.46it/s] +2025-05-26 06:02:11,752 - INFO - Epoch: 49, Objective: tensor([5592.1567], device='cuda:0', grad_fn=), Loss: 0.03624124079942703, KL/n: 69.54737854003906 + 0it [00:00, ?it/s]2025-05-26 06:02:12,216 - INFO - [Epoch 050 | Batch 0000] IWAE-loss 4820.5073 | mean log_px -0.0246 | KL -3407.40 + 1it [00:00, 4.71it/s] 2it [00:00, 6.75it/s] 3it [00:00, 7.89it/s] 4it [00:00, 8.52it/s] 5it [00:00, 8.43it/s] 6it [00:00, 8.80it/s] 7it [00:00, 9.09it/s] 8it [00:00, 9.28it/s] 9it [00:01, 9.43it/s] 10it [00:01, 9.51it/s] 11it [00:01, 9.60it/s] 12it [00:01, 9.63it/s] 13it [00:01, 9.20it/s] 14it [00:01, 9.35it/s] 15it [00:01, 9.47it/s] 16it [00:01, 9.53it/s] 17it [00:01, 9.59it/s] 18it [00:01, 9.57it/s] 19it [00:02, 9.00it/s] 20it [00:02, 9.20it/s] 21it [00:02, 9.36it/s] 22it [00:02, 9.45it/s] 23it [00:02, 9.23it/s] 24it [00:02, 8.80it/s] 25it [00:02, 9.07it/s] 26it [00:02, 9.24it/s] 27it [00:02, 9.39it/s] 28it [00:03, 9.48it/s] 29it [00:03, 9.56it/s] 30it [00:03, 9.61it/s] 31it [00:03, 9.07it/s] 32it [00:03, 9.17it/s] 33it [00:03, 8.75it/s] 34it [00:03, 8.74it/s] 35it [00:03, 8.91it/s] 36it [00:03, 8.54it/s] 37it [00:04, 8.76it/s] 38it [00:04, 8.89it/s] 39it [00:04, 9.04it/s] 40it [00:04, 8.62it/s] 41it [00:04, 8.84it/s] 42it [00:04, 8.97it/s] 43it [00:04, 9.04it/s] 44it [00:04, 8.62it/s] 45it [00:05, 8.88it/s] 46it [00:05, 9.08it/s] 47it [00:05, 9.08it/s] 48it [00:05, 9.20it/s] 49it [00:05, 8.80it/s] 50it [00:05, 9.01it/s]2025-05-26 06:02:17,689 - INFO - [Epoch 050 | Batch 0050] IWAE-loss 6266.3530 | mean log_px -0.0450 | KL -3405.55 + 51it [00:05, 9.15it/s] 52it [00:05, 9.28it/s] 53it [00:05, 8.72it/s] 54it [00:05, 8.95it/s] 55it [00:06, 9.10it/s] 56it [00:06, 9.23it/s] 57it [00:06, 8.81it/s] 58it [00:06, 9.03it/s] 59it [00:06, 9.21it/s] 60it [00:06, 9.31it/s] 61it [00:06, 8.87it/s] 62it [00:06, 9.01it/s] 63it [00:06, 9.16it/s] 64it [00:07, 9.27it/s] 65it [00:07, 8.84it/s] 66it [00:07, 9.04it/s] 67it [00:07, 9.04it/s] 68it [00:07, 9.18it/s] 69it [00:07, 8.74it/s] 70it [00:07, 8.98it/s] 71it [00:07, 9.16it/s] 72it [00:07, 9.25it/s] 73it [00:08, 8.91it/s] 74it [00:08, 9.06it/s] 75it [00:08, 9.24it/s] 76it [00:08, 8.91it/s] 77it [00:08, 9.12it/s] 78it [00:08, 9.26it/s] 79it [00:08, 9.36it/s] 80it [00:08, 9.44it/s] 81it [00:08, 9.52it/s] 82it [00:09, 9.55it/s] 83it [00:09, 9.60it/s] 84it [00:09, 9.61it/s] 85it [00:09, 9.63it/s] 86it [00:09, 9.63it/s] 87it [00:09, 9.63it/s] 88it [00:09, 9.63it/s] 89it [00:09, 9.65it/s] 90it [00:09, 9.64it/s] 91it [00:09, 9.63it/s] 92it [00:10, 9.65it/s] 93it [00:10, 9.65it/s] 94it [00:10, 9.64it/s] 95it [00:10, 9.64it/s] 96it [00:10, 9.63it/s] 97it [00:10, 9.06it/s] 98it [00:10, 9.18it/s] 99it [00:10, 9.32it/s] 100it [00:10, 9.40it/s]2025-05-26 06:02:23,076 - INFO - [Epoch 050 | Batch 0100] IWAE-loss 5081.3320 | mean log_px -0.0248 | KL -3404.80 + 101it [00:11, 9.47it/s] 102it [00:11, 9.53it/s] 103it [00:11, 9.57it/s] 104it [00:11, 9.57it/s] 105it [00:11, 9.60it/s] 106it [00:11, 9.59it/s] 107it [00:11, 9.62it/s] 108it [00:11, 9.61it/s] 109it [00:11, 9.63it/s] 110it [00:12, 9.03it/s] 111it [00:12, 9.20it/s] 112it [00:12, 9.34it/s] 113it [00:12, 9.42it/s] 114it [00:12, 9.48it/s] 115it [00:12, 9.54it/s] 116it [00:12, 9.56it/s] 117it [00:12, 9.59it/s] 118it [00:12, 9.58it/s] 119it [00:12, 9.60it/s] 120it [00:13, 9.60it/s] 121it [00:13, 9.61it/s] 122it [00:13, 9.62it/s] 123it [00:13, 9.64it/s] 124it [00:13, 9.65it/s] 125it [00:13, 9.66it/s] 126it [00:13, 9.66it/s] 127it [00:13, 9.65it/s] 128it [00:13, 9.66it/s] 129it [00:13, 9.10it/s] 130it [00:14, 9.25it/s] 131it [00:14, 9.38it/s] 132it [00:14, 9.45it/s] 133it [00:14, 9.52it/s] 134it [00:14, 9.55it/s] 135it [00:14, 9.60it/s] 136it [00:14, 9.60it/s] 137it [00:14, 9.62it/s] 138it [00:14, 9.61it/s] 139it [00:15, 9.63it/s] 140it [00:15, 9.61it/s] 141it [00:15, 9.63it/s] 142it [00:15, 9.63it/s] 143it [00:15, 9.65it/s] 144it [00:15, 9.64it/s] 145it [00:15, 9.66it/s] 146it [00:15, 9.64it/s] 147it [00:15, 9.64it/s] 148it [00:15, 9.63it/s] 149it [00:16, 9.17it/s] 150it [00:16, 9.29it/s]2025-05-26 06:02:28,323 - INFO - [Epoch 050 | Batch 0150] IWAE-loss 5562.5117 | mean log_px -0.0343 | KL -3396.77 + 151it [00:16, 9.37it/s] 152it [00:16, 9.46it/s] 153it [00:16, 9.52it/s] 154it [00:16, 9.56it/s] 155it [00:16, 8.88it/s] 156it [00:16, 9.08it/s] 157it [00:16, 9.22it/s] 158it [00:17, 9.32it/s] 159it [00:17, 9.41it/s] 160it [00:17, 9.48it/s] 161it [00:17, 9.54it/s] 162it [00:17, 9.56it/s] 163it [00:17, 9.60it/s] 164it [00:17, 9.61it/s] 165it [00:17, 9.64it/s] 166it [00:17, 9.04it/s] 167it [00:18, 9.19it/s] 168it [00:18, 9.29it/s] 169it [00:18, 9.40it/s] 170it [00:18, 9.45it/s] 171it [00:18, 9.51it/s] 172it [00:18, 9.53it/s] 173it [00:18, 9.56it/s] 174it [00:18, 9.54it/s] 175it [00:18, 9.58it/s] 176it [00:18, 9.60it/s] 177it [00:19, 9.61it/s] 178it [00:19, 9.61it/s] 179it [00:19, 9.62it/s] 180it [00:19, 9.63it/s] 181it [00:19, 9.64it/s] 182it [00:19, 9.64it/s] 183it [00:19, 9.63it/s] 184it [00:19, 9.64it/s] 185it [00:19, 9.65it/s] 186it [00:20, 9.03it/s] 187it [00:20, 9.20it/s] 188it [00:20, 9.33it/s] 189it [00:20, 9.43it/s] 190it [00:20, 9.48it/s] 191it [00:20, 9.55it/s] 192it [00:20, 9.11it/s] 193it [00:20, 9.25it/s] 194it [00:20, 9.37it/s] 195it [00:20, 8.92it/s] 196it [00:21, 9.20it/s] 196it [00:21, 9.27it/s] +2025-05-26 06:02:33,214 - INFO - Epoch: 50, Objective: tensor([5149.9160], device='cuda:0', grad_fn=), Loss: 0.02591179683804512, KL/n: 69.36389923095703 + 0it [00:00, ?it/s]2025-05-26 06:02:33,489 - INFO - [Epoch 051 | Batch 0000] IWAE-loss 4607.3794 | mean log_px -0.0298 | KL -3396.73 + 1it [00:00, 5.53it/s] 2it [00:00, 7.41it/s] 3it [00:00, 8.35it/s] 4it [00:00, 8.61it/s] 5it [00:00, 8.98it/s] 6it [00:00, 9.12it/s] 7it [00:00, 9.34it/s] 8it [00:00, 9.45it/s] 9it [00:01, 9.53it/s] 10it [00:01, 9.59it/s] 11it [00:01, 9.66it/s] 12it [00:01, 9.66it/s] 13it [00:01, 9.70it/s] 14it [00:01, 9.70it/s] 15it [00:01, 9.67it/s] 16it [00:01, 9.57it/s] 17it [00:01, 9.40it/s] 18it [00:01, 9.47it/s] 19it [00:02, 9.54it/s] 20it [00:02, 9.31it/s] 21it [00:02, 9.37it/s] 22it [00:02, 9.44it/s] 23it [00:02, 9.49it/s] 24it [00:02, 9.54it/s] 25it [00:02, 9.60it/s] 26it [00:02, 9.63it/s] 27it [00:02, 9.66it/s] 28it [00:02, 9.67it/s] 29it [00:03, 9.69it/s] 30it [00:03, 9.70it/s] 31it [00:03, 9.71it/s] 32it [00:03, 9.70it/s] 33it [00:03, 9.72it/s] 34it [00:03, 9.71it/s] 35it [00:03, 9.72it/s] 36it [00:03, 9.70it/s] 37it [00:03, 9.71it/s] 38it [00:04, 9.70it/s] 39it [00:04, 9.71it/s] 40it [00:04, 9.70it/s] 41it [00:04, 9.72it/s] 42it [00:04, 9.71it/s] 43it [00:04, 9.72it/s] 44it [00:04, 9.70it/s] 45it [00:04, 9.71it/s] 46it [00:04, 9.44it/s] 47it [00:04, 9.52it/s] 48it [00:05, 9.57it/s] 49it [00:05, 9.63it/s] 50it [00:05, 9.64it/s]2025-05-26 06:02:38,685 - INFO - [Epoch 051 | Batch 0050] IWAE-loss 4357.4595 | mean log_px -0.0165 | KL -3393.12 + 51it [00:05, 9.64it/s] 52it [00:05, 9.64it/s] 53it [00:05, 9.67it/s] 54it [00:05, 9.68it/s] 55it [00:05, 9.71it/s] 56it [00:05, 9.71it/s] 57it [00:05, 9.71it/s] 58it [00:06, 9.70it/s] 59it [00:06, 9.71it/s] 60it [00:06, 9.53it/s] 61it [00:06, 9.58it/s] 62it [00:06, 9.60it/s] 63it [00:06, 9.65it/s] 64it [00:06, 9.57it/s] 65it [00:06, 9.53it/s] 66it [00:06, 9.52it/s] 67it [00:07, 9.60it/s] 68it [00:07, 9.62it/s] 69it [00:07, 9.67it/s] 70it [00:07, 9.69it/s] 71it [00:07, 9.70it/s] 72it [00:07, 9.69it/s] 73it [00:07, 9.66it/s] 74it [00:07, 9.68it/s] 75it [00:07, 9.72it/s] 76it [00:07, 9.71it/s] 77it [00:08, 9.72it/s] 78it [00:08, 9.71it/s] 79it [00:08, 9.73it/s] 80it [00:08, 9.73it/s] 81it [00:08, 9.73it/s] 82it [00:08, 9.72it/s] 83it [00:08, 9.40it/s] 84it [00:08, 9.49it/s] 85it [00:08, 9.58it/s] 86it [00:09, 9.61it/s] 87it [00:09, 9.65it/s] 88it [00:09, 9.54it/s] 89it [00:09, 9.58it/s] 90it [00:09, 9.51it/s] 91it [00:09, 9.52it/s] 92it [00:09, 9.53it/s] 93it [00:09, 9.56it/s] 94it [00:09, 9.56it/s] 95it [00:09, 9.53it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.59it/s] 98it [00:10, 9.59it/s] 99it [00:10, 9.57it/s] 100it [00:10, 9.52it/s]2025-05-26 06:02:43,884 - INFO - [Epoch 051 | Batch 0100] IWAE-loss 4766.6494 | mean log_px -0.0259 | KL -3393.81 + 101it [00:10, 9.55it/s] 102it [00:10, 9.58it/s] 103it [00:10, 9.57it/s] 104it [00:10, 9.48it/s] 105it [00:11, 9.31it/s] 106it [00:11, 9.38it/s] 107it [00:11, 9.40it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.44it/s] 110it [00:11, 9.45it/s] 111it [00:11, 9.49it/s] 112it [00:11, 9.43it/s] 113it [00:11, 9.50it/s] 114it [00:11, 9.49it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.54it/s] 117it [00:12, 9.36it/s] 118it [00:12, 9.35it/s] 119it [00:12, 9.43it/s] 120it [00:12, 9.46it/s] 121it [00:12, 9.51it/s] 122it [00:12, 9.55it/s] 123it [00:12, 9.58it/s] 124it [00:13, 9.55it/s] 125it [00:13, 9.55it/s] 126it [00:13, 9.55it/s] 127it [00:13, 9.56it/s] 128it [00:13, 9.51it/s] 129it [00:13, 9.47it/s] 130it [00:13, 9.38it/s] 131it [00:13, 9.09it/s] 132it [00:13, 9.09it/s] 133it [00:13, 9.25it/s] 134it [00:14, 9.31it/s] 135it [00:14, 9.33it/s] 136it [00:14, 9.34it/s] 137it [00:14, 9.39it/s] 138it [00:14, 9.43it/s] 139it [00:14, 9.45it/s] 140it [00:14, 9.24it/s] 141it [00:14, 9.32it/s] 142it [00:14, 9.37it/s] 143it [00:15, 9.44it/s] 144it [00:15, 9.39it/s] 145it [00:15, 9.45it/s] 146it [00:15, 9.46it/s] 147it [00:15, 9.48it/s] 148it [00:15, 9.46it/s] 149it [00:15, 9.48it/s] 150it [00:15, 9.45it/s]2025-05-26 06:02:49,187 - INFO - [Epoch 051 | Batch 0150] IWAE-loss 5195.3750 | mean log_px -0.0258 | KL -3389.90 + 151it [00:15, 9.51it/s] 152it [00:15, 9.52it/s] 153it [00:16, 9.50it/s] 154it [00:16, 9.49it/s] 155it [00:16, 9.47it/s] 156it [00:16, 9.48it/s] 157it [00:16, 9.49it/s] 158it [00:16, 9.45it/s] 159it [00:16, 9.46it/s] 160it [00:16, 9.47it/s] 161it [00:16, 9.50it/s] 162it [00:17, 9.50it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.55it/s] 165it [00:17, 9.49it/s] 166it [00:17, 9.26it/s] 167it [00:17, 9.29it/s] 168it [00:17, 9.36it/s] 169it [00:17, 9.37it/s] 170it [00:17, 9.42it/s] 171it [00:17, 9.42it/s] 172it [00:18, 9.08it/s] 173it [00:18, 9.24it/s] 174it [00:18, 9.33it/s] 175it [00:18, 9.36it/s] 176it [00:18, 9.42it/s] 177it [00:18, 9.41it/s] 178it [00:18, 9.43it/s] 179it [00:18, 9.46it/s] 180it [00:18, 9.45it/s] 181it [00:19, 9.33it/s] 182it [00:19, 9.37it/s] 183it [00:19, 9.40it/s] 184it [00:19, 9.22it/s] 185it [00:19, 9.34it/s] 186it [00:19, 9.40it/s] 187it [00:19, 9.43it/s] 188it [00:19, 9.46it/s] 189it [00:19, 9.49it/s] 190it [00:20, 9.54it/s] 191it [00:20, 9.50it/s] 192it [00:20, 9.49it/s] 193it [00:20, 9.50it/s] 194it [00:20, 9.44it/s] 195it [00:20, 8.88it/s] 196it [00:20, 9.06it/s] 196it [00:20, 9.45it/s] +2025-05-26 06:02:54,088 - INFO - Epoch: 51, Objective: tensor([5151.0229], device='cuda:0', grad_fn=), Loss: 0.03177899122238159, KL/n: 69.16956329345703 + 0it [00:00, ?it/s]2025-05-26 06:02:54,545 - INFO - [Epoch 052 | Batch 0000] IWAE-loss 4369.1685 | mean log_px -0.0140 | KL -3385.86 + 1it [00:00, 5.53it/s] 2it [00:00, 7.33it/s] 3it [00:00, 8.22it/s] 4it [00:00, 8.71it/s] 5it [00:00, 9.01it/s] 6it [00:00, 9.07it/s] 7it [00:00, 9.23it/s] 8it [00:00, 9.32it/s] 9it [00:01, 9.36it/s] 10it [00:01, 9.36it/s] 11it [00:01, 9.40it/s] 12it [00:01, 9.43it/s] 13it [00:01, 9.53it/s] 14it [00:01, 9.49it/s] 15it [00:01, 9.46it/s] 16it [00:01, 9.47it/s] 17it [00:01, 9.53it/s] 18it [00:01, 9.50it/s] 19it [00:02, 9.53it/s] 20it [00:02, 9.51it/s] 21it [00:02, 9.55it/s] 22it [00:02, 9.45it/s] 23it [00:02, 9.50it/s] 24it [00:02, 9.49it/s] 25it [00:02, 9.53it/s] 26it [00:02, 9.55it/s] 27it [00:02, 9.57it/s] 28it [00:03, 9.52it/s] 29it [00:03, 9.55it/s] 30it [00:03, 9.56it/s] 31it [00:03, 9.57it/s] 32it [00:03, 9.49it/s] 33it [00:03, 9.52it/s] 34it [00:03, 9.50it/s] 35it [00:03, 9.52it/s] 36it [00:03, 9.50it/s] 37it [00:03, 9.54it/s] 38it [00:04, 9.50it/s] 39it [00:04, 9.53it/s] 40it [00:04, 8.97it/s] 41it [00:04, 9.09it/s] 42it [00:04, 9.19it/s] 43it [00:04, 9.29it/s] 44it [00:04, 9.37it/s] 45it [00:04, 9.44it/s] 46it [00:04, 9.44it/s] 47it [00:05, 9.45it/s] 48it [00:05, 9.46it/s] 49it [00:05, 9.50it/s] 50it [00:05, 9.43it/s]2025-05-26 06:02:59,827 - INFO - [Epoch 052 | Batch 0050] IWAE-loss 4918.5332 | mean log_px -0.0245 | KL -3388.32 + 51it [00:05, 9.40it/s] 52it [00:05, 9.43it/s] 53it [00:05, 9.45it/s] 54it [00:05, 9.45it/s] 55it [00:05, 9.48it/s] 56it [00:05, 9.50it/s] 57it [00:06, 9.54it/s] 58it [00:06, 9.50it/s] 59it [00:06, 9.55it/s] 60it [00:06, 9.49it/s] 61it [00:06, 9.48it/s] 62it [00:06, 9.47it/s] 63it [00:06, 9.45it/s] 64it [00:06, 9.49it/s] 65it [00:06, 9.48it/s] 66it [00:07, 9.48it/s] 67it [00:07, 9.49it/s] 68it [00:07, 9.35it/s] 69it [00:07, 9.36it/s] 70it [00:07, 9.38it/s] 71it [00:07, 9.44it/s] 72it [00:07, 9.45it/s] 73it [00:07, 9.47it/s] 74it [00:07, 9.48it/s] 75it [00:07, 9.52it/s] 76it [00:08, 9.51it/s] 77it [00:08, 9.47it/s] 78it [00:08, 9.49it/s] 79it [00:08, 9.48it/s] 80it [00:08, 9.34it/s] 81it [00:08, 9.44it/s] 82it [00:08, 9.50it/s] 83it [00:08, 9.56it/s] 84it [00:08, 9.53it/s] 85it [00:09, 9.51it/s] 86it [00:09, 9.52it/s] 87it [00:09, 9.52it/s] 88it [00:09, 9.49it/s] 89it [00:09, 9.49it/s] 90it [00:09, 9.48it/s] 91it [00:09, 9.48it/s] 92it [00:09, 9.48it/s] 93it [00:09, 9.03it/s] 94it [00:10, 9.18it/s] 95it [00:10, 9.30it/s] 96it [00:10, 9.35it/s] 97it [00:10, 9.32it/s] 98it [00:10, 9.35it/s] 99it [00:10, 9.42it/s] 100it [00:10, 9.41it/s]2025-05-26 06:03:05,122 - INFO - [Epoch 052 | Batch 0100] IWAE-loss 4805.5391 | mean log_px -0.0203 | KL -3385.52 + 101it [00:10, 9.45it/s] 102it [00:10, 9.46it/s] 103it [00:10, 9.47it/s] 104it [00:11, 9.48it/s] 105it [00:11, 9.49it/s] 106it [00:11, 9.44it/s] 107it [00:11, 9.47it/s] 108it [00:11, 9.42it/s] 109it [00:11, 9.47it/s] 110it [00:11, 9.50it/s] 111it [00:11, 9.49it/s] 112it [00:11, 9.49it/s] 113it [00:12, 9.51it/s] 114it [00:12, 9.53it/s] 115it [00:12, 9.53it/s] 116it [00:12, 9.57it/s] 117it [00:12, 9.39it/s] 118it [00:12, 9.41it/s] 119it [00:12, 9.49it/s] 120it [00:12, 9.50it/s] 121it [00:12, 9.51it/s] 122it [00:12, 9.52it/s] 123it [00:13, 9.51it/s] 124it [00:13, 9.54it/s] 125it [00:13, 9.56it/s] 126it [00:13, 9.55it/s] 127it [00:13, 9.61it/s] 128it [00:13, 9.60it/s] 129it [00:13, 9.59it/s] 130it [00:13, 9.58it/s] 131it [00:13, 9.62it/s] 132it [00:14, 9.60it/s] 133it [00:14, 9.60it/s] 134it [00:14, 9.58it/s] 135it [00:14, 9.56it/s] 136it [00:14, 9.47it/s] 137it [00:14, 9.14it/s] 138it [00:14, 9.20it/s] 139it [00:14, 9.27it/s] 140it [00:14, 9.34it/s] 141it [00:14, 9.38it/s] 142it [00:15, 9.43it/s] 143it [00:15, 9.46it/s] 144it [00:15, 9.46it/s] 145it [00:15, 9.49it/s] 146it [00:15, 9.46it/s] 147it [00:15, 9.47it/s] 148it [00:15, 9.11it/s] 149it [00:15, 9.20it/s] 150it [00:15, 9.28it/s]2025-05-26 06:03:10,408 - INFO - [Epoch 052 | Batch 0150] IWAE-loss 5867.5352 | mean log_px -0.0419 | KL -3378.72 + 151it [00:16, 9.39it/s] 152it [00:16, 9.45it/s] 153it [00:16, 9.47it/s] 154it [00:16, 9.45it/s] 155it [00:16, 9.52it/s] 156it [00:16, 9.44it/s] 157it [00:16, 9.50it/s] 158it [00:16, 9.47it/s] 159it [00:16, 9.47it/s] 160it [00:16, 9.51it/s] 161it [00:17, 9.56it/s] 162it [00:17, 9.56it/s] 163it [00:17, 9.51it/s] 164it [00:17, 9.51it/s] 165it [00:17, 9.53it/s] 166it [00:17, 9.49it/s] 167it [00:17, 9.52it/s] 168it [00:17, 9.55it/s] 169it [00:17, 9.54it/s] 170it [00:18, 9.53it/s] 171it [00:18, 9.52it/s] 172it [00:18, 9.52it/s] 173it [00:18, 9.59it/s] 174it [00:18, 9.56it/s] 175it [00:18, 9.59it/s] 176it [00:18, 9.56it/s] 177it [00:18, 9.51it/s] 178it [00:18, 9.51it/s] 179it [00:18, 9.52it/s] 180it [00:19, 9.49it/s] 181it [00:19, 9.52it/s] 182it [00:19, 9.50it/s] 183it [00:19, 9.52it/s] 184it [00:19, 9.55it/s] 185it [00:19, 9.56it/s] 186it [00:19, 9.57it/s] 187it [00:19, 9.59it/s] 188it [00:19, 9.49it/s] 189it [00:20, 9.43it/s] 190it [00:20, 8.93it/s] 191it [00:20, 9.12it/s] 192it [00:20, 9.17it/s] 193it [00:20, 9.30it/s] 194it [00:20, 9.26it/s] 195it [00:20, 8.78it/s] 196it [00:20, 9.08it/s] 196it [00:20, 9.39it/s] +2025-05-26 06:03:15,288 - INFO - Epoch: 52, Objective: tensor([5528.3022], device='cuda:0', grad_fn=), Loss: 0.03874513879418373, KL/n: 69.0050048828125 + 0it [00:00, ?it/s]2025-05-26 06:03:15,543 - INFO - [Epoch 053 | Batch 0000] IWAE-loss 5155.4536 | mean log_px -0.0254 | KL -3377.25 + 1it [00:00, 6.14it/s] 2it [00:00, 7.71it/s] 3it [00:00, 8.47it/s] 4it [00:00, 8.84it/s] 5it [00:00, 9.14it/s] 6it [00:00, 8.72it/s] 7it [00:00, 8.97it/s] 8it [00:00, 9.10it/s] 9it [00:01, 9.19it/s] 10it [00:01, 9.26it/s] 11it [00:01, 9.33it/s] 12it [00:01, 9.34it/s] 13it [00:01, 9.36it/s] 14it [00:01, 9.37it/s] 15it [00:01, 9.44it/s] 16it [00:01, 9.10it/s] 17it [00:01, 9.27it/s] 18it [00:01, 9.27it/s] 19it [00:02, 9.35it/s] 20it [00:02, 9.33it/s] 21it [00:02, 9.40it/s] 22it [00:02, 9.43it/s] 23it [00:02, 9.45it/s] 24it [00:02, 9.46it/s] 25it [00:02, 9.52it/s] 26it [00:02, 9.49it/s] 27it [00:02, 9.50it/s] 28it [00:03, 9.02it/s] 29it [00:03, 8.99it/s] 30it [00:03, 9.02it/s] 31it [00:03, 8.69it/s] 32it [00:03, 8.94it/s] 33it [00:03, 9.14it/s] 34it [00:03, 9.26it/s] 35it [00:03, 9.39it/s] 36it [00:03, 9.40it/s] 37it [00:04, 9.43it/s] 38it [00:04, 8.93it/s] 39it [00:04, 9.09it/s] 40it [00:04, 9.23it/s] 41it [00:04, 9.01it/s] 42it [00:04, 9.15it/s] 43it [00:04, 9.12it/s] 44it [00:04, 9.22it/s] 45it [00:04, 9.37it/s] 46it [00:05, 9.21it/s] 47it [00:05, 8.96it/s] 48it [00:05, 9.07it/s] 49it [00:05, 9.20it/s] 50it [00:05, 9.26it/s]2025-05-26 06:03:20,951 - INFO - [Epoch 053 | Batch 0050] IWAE-loss 4669.8696 | mean log_px -0.0194 | KL -3377.31 + 51it [00:05, 9.30it/s] 52it [00:05, 9.30it/s] 53it [00:05, 9.34it/s] 54it [00:05, 9.36it/s] 55it [00:05, 9.44it/s] 56it [00:06, 9.44it/s] 57it [00:06, 9.48it/s] 58it [00:06, 9.48it/s] 59it [00:06, 9.44it/s] 60it [00:06, 9.43it/s] 61it [00:06, 9.48it/s] 62it [00:06, 9.14it/s] 63it [00:06, 9.25it/s] 64it [00:06, 9.31it/s] 65it [00:07, 9.39it/s] 66it [00:07, 9.39it/s] 67it [00:07, 9.38it/s] 68it [00:07, 9.41it/s] 69it [00:07, 9.47it/s] 70it [00:07, 9.43it/s] 71it [00:07, 9.49it/s] 72it [00:07, 9.43it/s] 73it [00:07, 9.49it/s] 74it [00:08, 9.46it/s] 75it [00:08, 9.50it/s] 76it [00:08, 9.53it/s] 77it [00:08, 9.57it/s] 78it [00:08, 9.56it/s] 79it [00:08, 9.53it/s] 80it [00:08, 9.54it/s] 81it [00:08, 9.57it/s] 82it [00:08, 9.59it/s] 83it [00:08, 9.54it/s] 84it [00:09, 9.49it/s] 85it [00:09, 9.47it/s] 86it [00:09, 9.48it/s] 87it [00:09, 9.47it/s] 88it [00:09, 9.45it/s] 89it [00:09, 9.48it/s] 90it [00:09, 9.48it/s] 91it [00:09, 9.48it/s] 92it [00:09, 9.44it/s] 93it [00:10, 9.45it/s] 94it [00:10, 9.46it/s] 95it [00:10, 9.50it/s] 96it [00:10, 9.42it/s] 97it [00:10, 9.35it/s] 98it [00:10, 9.17it/s] 99it [00:10, 8.75it/s] 100it [00:10, 8.94it/s]2025-05-26 06:03:26,270 - INFO - [Epoch 053 | Batch 0100] IWAE-loss 5013.9473 | mean log_px -0.0243 | KL -3370.79 + 101it [00:10, 9.15it/s] 102it [00:10, 9.23it/s] 103it [00:11, 9.27it/s] 104it [00:11, 9.30it/s] 105it [00:11, 9.36it/s] 106it [00:11, 9.33it/s] 107it [00:11, 9.37it/s] 108it [00:11, 9.34it/s] 109it [00:11, 9.36it/s] 110it [00:11, 9.22it/s] 111it [00:11, 9.32it/s] 112it [00:12, 9.36it/s] 113it [00:12, 9.42it/s] 114it [00:12, 8.92it/s] 115it [00:12, 9.11it/s] 116it [00:12, 9.21it/s] 117it [00:12, 9.28it/s] 118it [00:12, 9.36it/s] 119it [00:12, 9.40it/s] 120it [00:12, 9.39it/s] 121it [00:13, 9.41it/s] 122it [00:13, 9.44it/s] 123it [00:13, 9.46it/s] 124it [00:13, 9.45it/s] 125it [00:13, 9.49it/s] 126it [00:13, 9.42it/s] 127it [00:13, 9.45it/s] 128it [00:13, 9.43it/s] 129it [00:13, 9.46it/s] 130it [00:13, 9.42it/s] 131it [00:14, 9.50it/s] 132it [00:14, 9.38it/s] 133it [00:14, 9.35it/s] 134it [00:14, 9.38it/s] 135it [00:14, 9.36it/s] 136it [00:14, 9.42it/s] 137it [00:14, 8.95it/s] 138it [00:14, 9.09it/s] 139it [00:14, 9.19it/s] 140it [00:15, 9.32it/s] 141it [00:15, 9.38it/s] 142it [00:15, 9.42it/s] 143it [00:15, 9.42it/s] 144it [00:15, 9.40it/s] 145it [00:15, 9.46it/s] 146it [00:15, 9.40it/s] 147it [00:15, 9.42it/s] 148it [00:15, 9.41it/s] 149it [00:16, 9.40it/s] 150it [00:16, 9.43it/s]2025-05-26 06:03:31,610 - INFO - [Epoch 053 | Batch 0150] IWAE-loss 5491.2100 | mean log_px -0.0358 | KL -3374.70 + 151it [00:16, 9.45it/s] 152it [00:16, 9.44it/s] 153it [00:16, 9.45it/s] 154it [00:16, 9.46it/s] 155it [00:16, 9.49it/s] 156it [00:16, 9.47it/s] 157it [00:16, 9.43it/s] 158it [00:16, 9.46it/s] 159it [00:17, 9.49it/s] 160it [00:17, 9.53it/s] 161it [00:17, 9.51it/s] 162it [00:17, 9.49it/s] 163it [00:17, 9.49it/s] 164it [00:17, 9.47it/s] 165it [00:17, 9.48it/s] 166it [00:17, 9.46it/s] 167it [00:17, 9.48it/s] 168it [00:18, 9.45it/s] 169it [00:18, 9.42it/s] 170it [00:18, 9.38it/s] 171it [00:18, 9.42it/s] 172it [00:18, 8.89it/s] 173it [00:18, 9.08it/s] 174it [00:18, 9.18it/s] 175it [00:18, 9.26it/s] 176it [00:18, 9.29it/s] 177it [00:18, 9.36it/s] 178it [00:19, 9.41it/s] 179it [00:19, 9.40it/s] 180it [00:19, 9.42it/s] 181it [00:19, 9.43it/s] 182it [00:19, 9.43it/s] 183it [00:19, 9.48it/s] 184it [00:19, 8.94it/s] 185it [00:19, 9.14it/s] 186it [00:19, 9.19it/s] 187it [00:20, 9.23it/s] 188it [00:20, 9.25it/s] 189it [00:20, 9.37it/s] 190it [00:20, 9.42it/s] 191it [00:20, 9.47it/s] 192it [00:20, 9.47it/s] 193it [00:20, 8.94it/s] 194it [00:20, 9.06it/s] 195it [00:20, 8.62it/s] 196it [00:21, 8.97it/s] 196it [00:21, 9.28it/s] +2025-05-26 06:03:36,546 - INFO - Epoch: 53, Objective: tensor([5285.0635], device='cuda:0', grad_fn=), Loss: 0.031190963461995125, KL/n: 68.80663299560547 + 0it [00:00, ?it/s]2025-05-26 06:03:37,008 - INFO - [Epoch 054 | Batch 0000] IWAE-loss 4559.8145 | mean log_px -0.0225 | KL -3372.25 + 1it [00:00, 5.43it/s] 2it [00:00, 7.05it/s] 3it [00:00, 8.04it/s] 4it [00:00, 8.60it/s] 5it [00:00, 8.86it/s] 6it [00:00, 9.07it/s] 7it [00:00, 9.24it/s] 8it [00:00, 9.31it/s] 9it [00:01, 9.40it/s] 10it [00:01, 9.35it/s] 11it [00:01, 9.21it/s] 12it [00:01, 9.29it/s] 13it [00:01, 9.42it/s] 14it [00:01, 9.48it/s] 15it [00:01, 9.56it/s] 16it [00:01, 9.58it/s] 17it [00:01, 9.59it/s] 18it [00:01, 9.57it/s] 19it [00:02, 9.63it/s] 20it [00:02, 9.58it/s] 21it [00:02, 9.60it/s] 22it [00:02, 9.57it/s] 23it [00:02, 9.61it/s] 24it [00:02, 9.60it/s] 25it [00:02, 9.64it/s] 26it [00:02, 9.58it/s] 27it [00:02, 9.61it/s] 28it [00:03, 9.62it/s] 29it [00:03, 9.65it/s] 30it [00:03, 9.43it/s] 31it [00:03, 9.47it/s] 32it [00:03, 9.54it/s] 33it [00:03, 9.60it/s] 34it [00:03, 9.59it/s] 35it [00:03, 9.60it/s] 36it [00:03, 9.60it/s] 37it [00:03, 9.39it/s] 38it [00:04, 9.42it/s] 39it [00:04, 9.53it/s] 40it [00:04, 9.57it/s] 41it [00:04, 9.58it/s] 42it [00:04, 9.61it/s] 43it [00:04, 9.60it/s] 44it [00:04, 9.59it/s] 45it [00:04, 9.61it/s] 46it [00:04, 9.61it/s] 47it [00:05, 9.60it/s] 48it [00:05, 9.60it/s] 49it [00:05, 9.59it/s] 50it [00:05, 9.56it/s]2025-05-26 06:03:42,248 - INFO - [Epoch 054 | Batch 0050] IWAE-loss 4990.6138 | mean log_px -0.0290 | KL -3365.03 + 51it [00:05, 9.62it/s] 52it [00:05, 9.61it/s] 53it [00:05, 9.61it/s] 54it [00:05, 9.60it/s] 55it [00:05, 9.62it/s] 56it [00:05, 9.61it/s] 57it [00:06, 9.61it/s] 58it [00:06, 9.61it/s] 59it [00:06, 9.58it/s] 60it [00:06, 9.56it/s] 61it [00:06, 9.62it/s] 62it [00:06, 9.65it/s] 63it [00:06, 9.66it/s] 64it [00:06, 9.63it/s] 65it [00:06, 9.65it/s] 66it [00:06, 9.60it/s] 67it [00:07, 9.61it/s] 68it [00:07, 9.63it/s] 69it [00:07, 9.63it/s] 70it [00:07, 9.62it/s] 71it [00:07, 9.59it/s] 72it [00:07, 9.56it/s] 73it [00:07, 9.60it/s] 74it [00:07, 9.59it/s] 75it [00:07, 9.65it/s] 76it [00:08, 9.59it/s] 77it [00:08, 9.62it/s] 78it [00:08, 9.60it/s] 79it [00:08, 9.63it/s] 80it [00:08, 9.60it/s] 81it [00:08, 9.63it/s] 82it [00:08, 9.59it/s] 83it [00:08, 9.63it/s] 84it [00:08, 9.60it/s] 85it [00:08, 9.61it/s] 86it [00:09, 9.59it/s] 87it [00:09, 9.60it/s] 88it [00:09, 9.62it/s] 89it [00:09, 9.61it/s] 90it [00:09, 9.61it/s] 91it [00:09, 9.63it/s] 92it [00:09, 9.57it/s] 93it [00:09, 9.61it/s] 94it [00:09, 9.63it/s] 95it [00:10, 9.65it/s] 96it [00:10, 9.65it/s] 97it [00:10, 9.65it/s] 98it [00:10, 9.64it/s] 99it [00:10, 9.64it/s] 100it [00:10, 9.59it/s]2025-05-26 06:03:47,449 - INFO - [Epoch 054 | Batch 0100] IWAE-loss 5274.8164 | mean log_px -0.0305 | KL -3364.53 + 101it [00:10, 9.60it/s] 102it [00:10, 9.62it/s] 103it [00:10, 9.64it/s] 104it [00:10, 9.56it/s] 105it [00:11, 9.58it/s] 106it [00:11, 9.61it/s] 107it [00:11, 9.62it/s] 108it [00:11, 9.62it/s] 109it [00:11, 9.65it/s] 110it [00:11, 9.66it/s] 111it [00:11, 9.65it/s] 112it [00:11, 9.38it/s] 113it [00:11, 9.43it/s] 114it [00:11, 9.48it/s] 115it [00:12, 9.54it/s] 116it [00:12, 9.54it/s] 117it [00:12, 9.49it/s] 118it [00:12, 9.58it/s] 119it [00:12, 9.60it/s] 120it [00:12, 9.58it/s] 121it [00:12, 9.62it/s] 122it [00:12, 9.62it/s] 123it [00:12, 9.59it/s] 124it [00:13, 9.23it/s] 125it [00:13, 9.21it/s] 126it [00:13, 9.22it/s] 127it [00:13, 9.30it/s] 128it [00:13, 9.44it/s] 129it [00:13, 9.52it/s] 130it [00:13, 9.57it/s] 131it [00:13, 9.55it/s] 132it [00:13, 9.05it/s] 133it [00:14, 9.20it/s] 134it [00:14, 9.28it/s] 135it [00:14, 9.39it/s] 136it [00:14, 8.96it/s] 137it [00:14, 9.11it/s] 138it [00:14, 9.26it/s] 139it [00:14, 9.36it/s] 140it [00:14, 9.46it/s] 141it [00:14, 9.52it/s] 142it [00:14, 9.52it/s] 143it [00:15, 9.54it/s] 144it [00:15, 9.53it/s] 145it [00:15, 9.57it/s] 146it [00:15, 9.59it/s] 147it [00:15, 9.60it/s] 148it [00:15, 9.60it/s] 149it [00:15, 9.22it/s] 150it [00:15, 9.27it/s]2025-05-26 06:03:52,742 - INFO - [Epoch 054 | Batch 0150] IWAE-loss 4747.6250 | mean log_px -0.0197 | KL -3364.11 + 151it [00:15, 9.34it/s] 152it [00:16, 9.07it/s] 153it [00:16, 9.25it/s] 154it [00:16, 9.31it/s] 155it [00:16, 9.05it/s] 156it [00:16, 9.15it/s] 157it [00:16, 9.23it/s] 158it [00:16, 8.97it/s] 159it [00:16, 9.14it/s] 160it [00:16, 9.22it/s] 161it [00:17, 8.97it/s] 162it [00:17, 9.08it/s] 163it [00:17, 9.24it/s] 164it [00:17, 9.00it/s] 165it [00:17, 9.20it/s] 166it [00:17, 9.32it/s] 167it [00:17, 9.05it/s] 168it [00:17, 9.23it/s] 169it [00:17, 9.30it/s] 170it [00:18, 9.02it/s] 171it [00:18, 9.17it/s] 172it [00:18, 9.25it/s] 173it [00:18, 9.02it/s] 174it [00:18, 9.18it/s] 175it [00:18, 9.33it/s] 176it [00:18, 8.92it/s] 177it [00:18, 9.15it/s] 178it [00:18, 8.90it/s] 179it [00:18, 9.10it/s] 180it [00:19, 9.24it/s] 181it [00:19, 8.90it/s] 182it [00:19, 9.10it/s] 183it [00:19, 9.24it/s] 184it [00:19, 8.82it/s] 185it [00:19, 9.06it/s] 186it [00:19, 9.19it/s] 187it [00:19, 9.32it/s] 188it [00:19, 9.40it/s] 189it [00:20, 9.47it/s] 190it [00:20, 9.53it/s] 191it [00:20, 9.54it/s] 192it [00:20, 9.49it/s] 193it [00:20, 9.47it/s] 194it [00:20, 9.51it/s] 195it [00:20, 8.93it/s] 196it [00:20, 9.13it/s] 196it [00:20, 9.38it/s] +2025-05-26 06:03:57,761 - INFO - Epoch: 54, Objective: tensor([5742.4844], device='cuda:0', grad_fn=), Loss: 0.04035816341638565, KL/n: 68.60377502441406 + 0it [00:00, ?it/s]2025-05-26 06:03:58,018 - INFO - [Epoch 055 | Batch 0000] IWAE-loss 4954.8682 | mean log_px -0.0264 | KL -3363.76 + 1it [00:00, 6.12it/s] 2it [00:00, 7.68it/s] 3it [00:00, 8.43it/s] 4it [00:00, 8.76it/s] 5it [00:00, 9.05it/s] 6it [00:00, 9.17it/s] 7it [00:00, 9.32it/s] 8it [00:00, 9.31it/s] 9it [00:01, 9.40it/s] 10it [00:01, 9.43it/s] 11it [00:01, 9.45it/s] 12it [00:01, 9.39it/s] 13it [00:01, 9.39it/s] 14it [00:01, 9.41it/s] 15it [00:01, 9.47it/s] 16it [00:01, 9.50it/s] 17it [00:01, 9.54it/s] 18it [00:01, 9.48it/s] 19it [00:02, 9.43it/s] 20it [00:02, 9.39it/s] 21it [00:02, 9.30it/s] 22it [00:02, 9.23it/s] 23it [00:02, 9.27it/s] 24it [00:02, 9.30it/s] 25it [00:02, 9.27it/s] 26it [00:02, 9.34it/s] 27it [00:02, 9.29it/s] 28it [00:03, 9.35it/s] 29it [00:03, 9.42it/s] 30it [00:03, 9.48it/s] 31it [00:03, 9.49it/s] 32it [00:03, 9.47it/s] 33it [00:03, 9.43it/s] 34it [00:03, 9.37it/s] 35it [00:03, 9.36it/s] 36it [00:03, 9.39it/s] 37it [00:03, 9.30it/s] 38it [00:04, 9.32it/s] 39it [00:04, 9.12it/s] 40it [00:04, 9.12it/s] 41it [00:04, 9.21it/s] 42it [00:04, 9.23it/s] 43it [00:04, 9.32it/s] 44it [00:04, 9.35it/s] 45it [00:04, 9.40it/s] 46it [00:04, 9.39it/s] 47it [00:05, 9.40it/s] 48it [00:05, 9.43it/s] 49it [00:05, 9.44it/s] 50it [00:05, 9.38it/s]2025-05-26 06:04:03,351 - INFO - [Epoch 055 | Batch 0050] IWAE-loss 5218.8096 | mean log_px -0.0286 | KL -3357.67 + 51it [00:05, 9.33it/s] 52it [00:05, 9.36it/s] 53it [00:05, 9.37it/s] 54it [00:05, 9.39it/s] 55it [00:05, 9.40it/s] 56it [00:06, 9.28it/s] 57it [00:06, 9.32it/s] 58it [00:06, 9.34it/s] 59it [00:06, 9.39it/s] 60it [00:06, 9.42it/s] 61it [00:06, 9.49it/s] 62it [00:06, 9.47it/s] 63it [00:06, 9.40it/s] 64it [00:06, 9.26it/s] 65it [00:06, 9.16it/s] 66it [00:07, 8.72it/s] 67it [00:07, 8.96it/s] 68it [00:07, 9.09it/s] 69it [00:07, 9.27it/s] 70it [00:07, 9.37it/s] 71it [00:07, 9.47it/s] 72it [00:07, 9.50it/s] 73it [00:07, 9.33it/s] 74it [00:07, 9.37it/s] 75it [00:08, 9.46it/s] 76it [00:08, 9.46it/s] 77it [00:08, 9.53it/s] 78it [00:08, 9.51it/s] 79it [00:08, 9.58it/s] 80it [00:08, 9.59it/s] 81it [00:08, 9.63it/s] 82it [00:08, 9.61it/s] 83it [00:08, 9.56it/s] 84it [00:09, 9.53it/s] 85it [00:09, 9.56it/s] 86it [00:09, 9.56it/s] 87it [00:09, 9.59it/s] 88it [00:09, 9.51it/s] 89it [00:09, 9.55it/s] 90it [00:09, 9.56it/s] 91it [00:09, 9.53it/s] 92it [00:09, 9.56it/s] 93it [00:09, 9.56it/s] 94it [00:10, 9.59it/s] 95it [00:10, 9.59it/s] 96it [00:10, 9.57it/s] 97it [00:10, 9.60it/s] 98it [00:10, 9.62it/s] 99it [00:10, 9.59it/s] 100it [00:10, 9.60it/s]2025-05-26 06:04:08,638 - INFO - [Epoch 055 | Batch 0100] IWAE-loss 5689.7671 | mean log_px -0.0453 | KL -3352.47 + 101it [00:10, 9.64it/s] 102it [00:10, 9.42it/s] 103it [00:10, 9.47it/s] 104it [00:11, 9.52it/s] 105it [00:11, 9.49it/s] 106it [00:11, 9.52it/s] 107it [00:11, 9.58it/s] 108it [00:11, 9.60it/s] 109it [00:11, 9.55it/s] 110it [00:11, 9.52it/s] 111it [00:11, 9.54it/s] 112it [00:11, 9.53it/s] 113it [00:12, 9.55it/s] 114it [00:12, 9.51it/s] 115it [00:12, 9.55it/s] 116it [00:12, 9.57it/s] 117it [00:12, 9.32it/s] 118it [00:12, 9.41it/s] 119it [00:12, 9.45it/s] 120it [00:12, 9.50it/s] 121it [00:12, 9.55it/s] 122it [00:12, 9.53it/s] 123it [00:13, 9.54it/s] 124it [00:13, 9.54it/s] 125it [00:13, 9.59it/s] 126it [00:13, 9.59it/s] 127it [00:13, 9.59it/s] 128it [00:13, 9.50it/s] 129it [00:13, 9.57it/s] 130it [00:13, 9.61it/s] 131it [00:13, 9.61it/s] 132it [00:14, 9.57it/s] 133it [00:14, 9.57it/s] 134it [00:14, 9.57it/s] 135it [00:14, 9.57it/s] 136it [00:14, 9.60it/s] 137it [00:14, 9.63it/s] 138it [00:14, 9.63it/s] 139it [00:14, 9.61it/s] 140it [00:14, 9.55it/s] 141it [00:14, 9.54it/s] 142it [00:15, 9.53it/s] 143it [00:15, 9.52it/s] 144it [00:15, 9.54it/s] 145it [00:15, 9.52it/s] 146it [00:15, 9.55it/s] 147it [00:15, 9.54it/s] 148it [00:15, 9.52it/s] 149it [00:15, 9.53it/s] 150it [00:15, 9.55it/s]2025-05-26 06:04:13,880 - INFO - [Epoch 055 | Batch 0150] IWAE-loss 5461.5342 | mean log_px -0.0355 | KL -3352.60 + 151it [00:16, 9.52it/s] 152it [00:16, 9.56it/s] 153it [00:16, 9.60it/s] 154it [00:16, 9.58it/s] 155it [00:16, 9.54it/s] 156it [00:16, 9.57it/s] 157it [00:16, 9.53it/s] 158it [00:16, 9.51it/s] 159it [00:16, 9.57it/s] 160it [00:16, 9.55it/s] 161it [00:17, 9.58it/s] 162it [00:17, 9.51it/s] 163it [00:17, 9.51it/s] 164it [00:17, 8.94it/s] 165it [00:17, 9.05it/s] 166it [00:17, 8.94it/s] 167it [00:17, 8.77it/s] 168it [00:17, 8.50it/s] 169it [00:17, 8.73it/s] 170it [00:18, 8.87it/s] 171it [00:18, 8.52it/s] 172it [00:18, 8.75it/s] 173it [00:18, 8.88it/s] 174it [00:18, 8.95it/s] 175it [00:18, 8.57it/s] 176it [00:18, 8.75it/s] 177it [00:18, 8.88it/s] 178it [00:19, 8.96it/s] 179it [00:19, 8.61it/s] 180it [00:19, 8.77it/s] 181it [00:19, 8.91it/s] 182it [00:19, 9.02it/s] 183it [00:19, 8.62it/s] 184it [00:19, 8.82it/s] 185it [00:19, 8.91it/s] 186it [00:19, 8.98it/s] 187it [00:20, 8.78it/s] 188it [00:20, 8.94it/s] 189it [00:20, 9.13it/s] 190it [00:20, 8.75it/s] 191it [00:20, 9.01it/s] 192it [00:20, 9.14it/s] 193it [00:20, 9.20it/s] 194it [00:20, 8.78it/s] 195it [00:20, 8.48it/s] 196it [00:21, 8.81it/s] 196it [00:21, 9.29it/s] +2025-05-26 06:04:18,994 - INFO - Epoch: 55, Objective: tensor([5165.6812], device='cuda:0', grad_fn=), Loss: 0.03494435176253319, KL/n: 68.38105010986328 + 0it [00:00, ?it/s]2025-05-26 06:04:19,434 - INFO - [Epoch 056 | Batch 0000] IWAE-loss 4359.5181 | mean log_px -0.0144 | KL -3346.51 + 1it [00:00, 5.97it/s] 2it [00:00, 7.45it/s] 3it [00:00, 8.07it/s] 4it [00:00, 8.34it/s] 5it [00:00, 8.74it/s] 6it [00:00, 8.93it/s] 7it [00:00, 9.12it/s] 8it [00:00, 9.20it/s] 9it [00:01, 9.33it/s] 10it [00:01, 9.36it/s] 11it [00:01, 9.00it/s] 12it [00:01, 9.16it/s] 13it [00:01, 9.22it/s] 14it [00:01, 9.26it/s] 15it [00:01, 9.34it/s] 16it [00:01, 9.35it/s] 17it [00:01, 9.38it/s] 18it [00:02, 9.32it/s] 19it [00:02, 8.78it/s] 20it [00:02, 8.64it/s] 21it [00:02, 8.86it/s] 22it [00:02, 9.00it/s] 23it [00:02, 9.15it/s] 24it [00:02, 9.21it/s] 25it [00:02, 9.29it/s] 26it [00:02, 9.32it/s] 27it [00:02, 9.36it/s] 28it [00:03, 9.37it/s] 29it [00:03, 9.39it/s] 30it [00:03, 9.33it/s] 31it [00:03, 9.40it/s] 32it [00:03, 9.39it/s] 33it [00:03, 9.40it/s] 34it [00:03, 9.39it/s] 35it [00:03, 9.41it/s] 36it [00:03, 9.42it/s] 37it [00:04, 9.43it/s] 38it [00:04, 9.45it/s] 39it [00:04, 9.46it/s] 40it [00:04, 9.44it/s] 41it [00:04, 9.43it/s] 42it [00:04, 9.41it/s] 43it [00:04, 9.44it/s] 44it [00:04, 9.40it/s] 45it [00:04, 9.40it/s] 46it [00:05, 9.41it/s] 47it [00:05, 9.44it/s] 48it [00:05, 9.43it/s] 49it [00:05, 9.43it/s] 50it [00:05, 9.07it/s]2025-05-26 06:04:24,829 - INFO - [Epoch 056 | Batch 0050] IWAE-loss 7072.4180 | mean log_px -0.0646 | KL -3344.14 + 51it [00:05, 9.17it/s] 52it [00:05, 9.27it/s] 53it [00:05, 9.34it/s] 54it [00:05, 9.29it/s] 55it [00:05, 9.35it/s] 56it [00:06, 9.32it/s] 57it [00:06, 9.35it/s] 58it [00:06, 9.32it/s] 59it [00:06, 9.36it/s] 60it [00:06, 9.14it/s] 61it [00:06, 9.16it/s] 62it [00:06, 9.25it/s] 63it [00:06, 9.33it/s] 64it [00:06, 9.25it/s] 65it [00:07, 9.18it/s] 66it [00:07, 9.15it/s] 67it [00:07, 9.21it/s] 68it [00:07, 9.16it/s] 69it [00:07, 9.20it/s] 70it [00:07, 8.69it/s] 71it [00:07, 8.83it/s] 72it [00:07, 8.88it/s] 73it [00:07, 8.99it/s] 74it [00:08, 9.00it/s] 75it [00:08, 8.42it/s] 76it [00:08, 8.51it/s] 77it [00:08, 8.72it/s] 78it [00:08, 8.82it/s] 79it [00:08, 9.12it/s] 80it [00:08, 9.33it/s] 81it [00:08, 9.50it/s] 82it [00:08, 9.61it/s] 83it [00:09, 9.70it/s] 84it [00:09, 9.75it/s] 85it [00:09, 9.80it/s] 86it [00:09, 9.81it/s] 87it [00:09, 9.83it/s] 88it [00:09, 9.68it/s] 89it [00:09, 9.52it/s] 90it [00:09, 9.00it/s] 91it [00:09, 8.97it/s] 92it [00:10, 8.65it/s] 93it [00:10, 9.01it/s] 94it [00:10, 9.25it/s] 95it [00:10, 9.43it/s] 96it [00:10, 9.55it/s] 97it [00:10, 9.68it/s] 98it [00:10, 9.71it/s] 99it [00:10, 9.78it/s] 100it [00:10, 9.81it/s]2025-05-26 06:04:30,213 - INFO - [Epoch 056 | Batch 0100] IWAE-loss 4897.2031 | mean log_px -0.0227 | KL -3343.42 + 101it [00:10, 9.81it/s] 102it [00:11, 9.83it/s] 103it [00:11, 9.87it/s] 104it [00:11, 9.89it/s] 105it [00:11, 9.90it/s] 106it [00:11, 9.89it/s] 107it [00:11, 9.28it/s] 108it [00:11, 9.45it/s] 109it [00:11, 9.60it/s] 110it [00:11, 9.69it/s] 111it [00:11, 9.76it/s] 112it [00:12, 9.79it/s] 113it [00:12, 9.84it/s] 114it [00:12, 9.85it/s] 115it [00:12, 9.88it/s] 116it [00:12, 9.89it/s] 117it [00:12, 9.90it/s] 118it [00:12, 9.90it/s] 119it [00:12, 9.92it/s] 120it [00:12, 9.87it/s] 121it [00:12, 9.80it/s] 122it [00:13, 9.81it/s] 123it [00:13, 9.64it/s] 124it [00:13, 9.68it/s] 125it [00:13, 9.75it/s] 126it [00:13, 9.76it/s] 127it [00:13, 9.78it/s] 128it [00:13, 9.80it/s] 129it [00:13, 9.82it/s] 130it [00:13, 9.82it/s] 131it [00:14, 9.85it/s] 132it [00:14, 9.81it/s] 133it [00:14, 9.83it/s] 134it [00:14, 9.83it/s] 135it [00:14, 9.85it/s] 136it [00:14, 9.84it/s] 137it [00:14, 9.85it/s] 138it [00:14, 9.85it/s] 139it [00:14, 9.85it/s] 140it [00:14, 9.84it/s] 141it [00:15, 9.86it/s] 142it [00:15, 9.65it/s] 143it [00:15, 9.08it/s] 144it [00:15, 9.29it/s] 145it [00:15, 9.46it/s] 146it [00:15, 9.57it/s] 147it [00:15, 9.66it/s] 148it [00:15, 9.68it/s] 149it [00:15, 9.45it/s] 150it [00:15, 9.20it/s]2025-05-26 06:04:35,367 - INFO - [Epoch 056 | Batch 0150] IWAE-loss 4315.8975 | mean log_px -0.0143 | KL -3342.45 + 151it [00:16, 9.37it/s] 152it [00:16, 9.50it/s] 153it [00:16, 9.57it/s] 154it [00:16, 9.64it/s] 155it [00:16, 9.71it/s] 156it [00:16, 9.74it/s] 157it [00:16, 9.77it/s] 158it [00:16, 9.77it/s] 159it [00:16, 9.79it/s] 160it [00:17, 9.24it/s] 161it [00:17, 9.42it/s] 162it [00:17, 9.54it/s] 163it [00:17, 9.64it/s] 164it [00:17, 9.70it/s] 165it [00:17, 9.19it/s] 166it [00:17, 9.38it/s] 167it [00:17, 9.53it/s] 168it [00:17, 9.61it/s] 169it [00:17, 9.70it/s] 170it [00:18, 9.74it/s] 171it [00:18, 9.79it/s] 172it [00:18, 9.81it/s] 173it [00:18, 9.84it/s] 174it [00:18, 9.84it/s] 175it [00:18, 9.86it/s] 176it [00:18, 9.85it/s] 177it [00:18, 9.87it/s] 178it [00:18, 9.85it/s] 179it [00:18, 9.87it/s] 180it [00:19, 9.84it/s] 181it [00:19, 9.84it/s] 182it [00:19, 9.84it/s] 183it [00:19, 9.86it/s] 184it [00:19, 9.85it/s] 185it [00:19, 9.86it/s] 186it [00:19, 9.86it/s] 187it [00:19, 9.87it/s] 188it [00:19, 9.86it/s] 189it [00:19, 9.88it/s] 190it [00:20, 9.86it/s] 191it [00:20, 9.88it/s] 192it [00:20, 9.47it/s] 193it [00:20, 9.59it/s] 194it [00:20, 9.67it/s] 195it [00:20, 9.11it/s] 196it [00:20, 9.42it/s] +2025-05-26 06:04:40,116 - INFO - Epoch: 56, Objective: tensor([5050.2954], device='cuda:0', grad_fn=), Loss: 0.02728617750108242, KL/n: 68.18730926513672 + 0it [00:00, ?it/s]2025-05-26 06:04:40,397 - INFO - [Epoch 057 | Batch 0000] IWAE-loss 4560.9824 | mean log_px -0.0185 | KL -3340.02 + 1it [00:00, 5.25it/s] 2it [00:00, 7.19it/s] 3it [00:00, 8.20it/s] 4it [00:00, 8.73it/s] 5it [00:00, 9.04it/s] 6it [00:00, 9.27it/s] 7it [00:00, 9.42it/s] 8it [00:00, 8.86it/s] 9it [00:01, 9.12it/s] 10it [00:01, 9.31it/s] 11it [00:01, 9.46it/s] 12it [00:01, 9.53it/s] 13it [00:01, 9.63it/s] 14it [00:01, 9.67it/s] 15it [00:01, 9.62it/s] 16it [00:01, 9.65it/s] 17it [00:01, 9.72it/s] 18it [00:01, 9.72it/s] 19it [00:02, 9.77it/s] 20it [00:02, 9.76it/s] 21it [00:02, 9.77it/s] 22it [00:02, 9.77it/s] 23it [00:02, 9.80it/s] 24it [00:02, 9.80it/s] 25it [00:02, 9.81it/s] 26it [00:02, 9.79it/s] 27it [00:02, 9.76it/s] 28it [00:02, 9.71it/s] 29it [00:03, 9.73it/s] 30it [00:03, 9.71it/s] 31it [00:03, 9.76it/s] 32it [00:03, 9.77it/s] 33it [00:03, 9.76it/s] 34it [00:03, 9.75it/s] 35it [00:03, 9.72it/s] 36it [00:03, 9.74it/s] 37it [00:03, 9.73it/s] 38it [00:04, 9.73it/s] 39it [00:04, 9.73it/s] 40it [00:04, 9.73it/s] 41it [00:04, 9.75it/s] 42it [00:04, 9.11it/s] 43it [00:04, 9.29it/s] 44it [00:04, 9.43it/s] 45it [00:04, 9.55it/s] 46it [00:04, 9.62it/s] 47it [00:04, 9.68it/s] 48it [00:05, 9.73it/s] 49it [00:05, 9.77it/s] 50it [00:05, 9.29it/s]2025-05-26 06:04:45,587 - INFO - [Epoch 057 | Batch 0050] IWAE-loss 4015.7031 | mean log_px -0.0109 | KL -3334.84 + 51it [00:05, 9.46it/s] 52it [00:05, 9.52it/s] 53it [00:05, 9.64it/s] 54it [00:05, 9.60it/s] 55it [00:05, 9.58it/s] 56it [00:05, 9.62it/s] 57it [00:05, 9.65it/s] 58it [00:06, 9.07it/s] 59it [00:06, 9.30it/s] 60it [00:06, 9.42it/s] 61it [00:06, 9.54it/s] 62it [00:06, 9.62it/s] 63it [00:06, 9.70it/s] 64it [00:06, 9.09it/s] 65it [00:06, 9.28it/s] 66it [00:06, 9.41it/s] 67it [00:07, 9.52it/s] 68it [00:07, 9.56it/s] 69it [00:07, 9.63it/s] 70it [00:07, 9.68it/s] 71it [00:07, 9.71it/s] 72it [00:07, 9.56it/s] 73it [00:07, 9.62it/s] 74it [00:07, 9.64it/s] 75it [00:07, 9.68it/s] 76it [00:07, 9.71it/s] 77it [00:08, 9.74it/s] 78it [00:08, 9.73it/s] 79it [00:08, 9.74it/s] 80it [00:08, 9.74it/s] 81it [00:08, 9.74it/s] 82it [00:08, 9.77it/s] 83it [00:08, 9.80it/s] 84it [00:08, 9.79it/s] 85it [00:08, 9.79it/s] 86it [00:09, 9.80it/s] 87it [00:09, 9.76it/s] 88it [00:09, 9.75it/s] 89it [00:09, 9.77it/s] 90it [00:09, 9.72it/s] 91it [00:09, 9.74it/s] 92it [00:09, 9.72it/s] 93it [00:09, 9.75it/s] 94it [00:09, 9.74it/s] 95it [00:09, 9.45it/s] 96it [00:10, 8.98it/s] 97it [00:10, 9.21it/s] 98it [00:10, 9.35it/s] 99it [00:10, 9.47it/s] 100it [00:10, 9.56it/s]2025-05-26 06:04:50,798 - INFO - [Epoch 057 | Batch 0100] IWAE-loss 4555.8833 | mean log_px -0.0193 | KL -3332.19 + 101it [00:10, 9.61it/s] 102it [00:10, 9.63it/s] 103it [00:10, 9.70it/s] 104it [00:10, 9.71it/s] 105it [00:11, 9.72it/s] 106it [00:11, 9.13it/s] 107it [00:11, 9.33it/s] 108it [00:11, 9.48it/s] 109it [00:11, 9.61it/s] 110it [00:11, 9.68it/s] 111it [00:11, 9.73it/s] 112it [00:11, 9.74it/s] 113it [00:11, 9.79it/s] 114it [00:11, 9.78it/s] 115it [00:12, 9.79it/s] 116it [00:12, 9.77it/s] 117it [00:12, 9.81it/s] 118it [00:12, 9.81it/s] 119it [00:12, 9.83it/s] 120it [00:12, 9.11it/s] 121it [00:12, 8.99it/s] 122it [00:12, 8.87it/s] 123it [00:12, 9.07it/s] 124it [00:13, 9.21it/s] 125it [00:13, 9.32it/s] 126it [00:13, 9.38it/s] 127it [00:13, 9.44it/s] 128it [00:13, 9.49it/s] 129it [00:13, 9.51it/s] 130it [00:13, 9.53it/s] 131it [00:13, 9.56it/s] 132it [00:13, 9.53it/s] 133it [00:13, 9.55it/s] 134it [00:14, 9.63it/s] 135it [00:14, 9.35it/s] 136it [00:14, 9.46it/s] 137it [00:14, 9.55it/s] 138it [00:14, 9.59it/s] 139it [00:14, 9.66it/s] 140it [00:14, 9.70it/s] 141it [00:14, 9.75it/s] 142it [00:14, 9.76it/s] 143it [00:14, 9.79it/s] 144it [00:15, 9.79it/s] 145it [00:15, 9.81it/s] 146it [00:15, 9.76it/s] 147it [00:15, 9.77it/s] 148it [00:15, 9.75it/s] 149it [00:15, 9.79it/s] 150it [00:15, 9.76it/s]2025-05-26 06:04:56,016 - INFO - [Epoch 057 | Batch 0150] IWAE-loss 4984.7964 | mean log_px -0.0261 | KL -3333.72 + 151it [00:15, 9.75it/s] 152it [00:15, 9.75it/s] 153it [00:16, 9.78it/s] 154it [00:16, 9.75it/s] 155it [00:16, 9.76it/s] 156it [00:16, 9.78it/s] 157it [00:16, 9.76it/s] 158it [00:16, 9.74it/s] 159it [00:16, 9.73it/s] 160it [00:16, 9.12it/s] 161it [00:16, 9.33it/s] 162it [00:16, 9.45it/s] 163it [00:17, 9.33it/s] 164it [00:17, 9.41it/s] 165it [00:17, 9.53it/s] 166it [00:17, 9.60it/s] 167it [00:17, 9.66it/s] 168it [00:17, 9.71it/s] 169it [00:17, 9.66it/s] 170it [00:17, 9.67it/s] 171it [00:17, 9.73it/s] 172it [00:17, 9.73it/s] 173it [00:18, 9.77it/s] 174it [00:18, 9.78it/s] 175it [00:18, 9.83it/s] 176it [00:18, 9.83it/s] 177it [00:18, 9.82it/s] 178it [00:18, 9.80it/s] 179it [00:18, 9.79it/s] 180it [00:18, 9.76it/s] 181it [00:18, 9.76it/s] 182it [00:19, 9.74it/s] 183it [00:19, 9.76it/s] 184it [00:19, 9.72it/s] 185it [00:19, 9.76it/s] 186it [00:19, 9.76it/s] 187it [00:19, 9.77it/s] 188it [00:19, 9.74it/s] 189it [00:19, 9.76it/s] 190it [00:19, 9.78it/s] 191it [00:19, 9.78it/s] 192it [00:20, 9.78it/s] 193it [00:20, 9.79it/s] 194it [00:20, 9.79it/s] 195it [00:20, 8.76it/s] 196it [00:20, 9.54it/s] +2025-05-26 06:05:00,791 - INFO - Epoch: 57, Objective: tensor([5603.3149], device='cuda:0', grad_fn=), Loss: 0.03557281568646431, KL/n: 67.98454284667969 + 0it [00:00, ?it/s]2025-05-26 06:05:01,234 - INFO - [Epoch 058 | Batch 0000] IWAE-loss 4603.7197 | mean log_px -0.0217 | KL -3329.28 + 1it [00:00, 2.83it/s] 2it [00:00, 4.87it/s] 3it [00:00, 6.35it/s] 4it [00:00, 6.90it/s] 5it [00:00, 7.64it/s] 6it [00:00, 8.22it/s] 7it [00:00, 8.52it/s] 8it [00:01, 8.89it/s] 9it [00:01, 9.19it/s] 10it [00:01, 9.37it/s] 11it [00:01, 9.50it/s] 12it [00:01, 9.58it/s] 13it [00:01, 9.65it/s] 14it [00:01, 9.38it/s] 15it [00:01, 9.30it/s] 16it [00:01, 9.40it/s] 17it [00:02, 9.40it/s] 18it [00:02, 9.49it/s] 19it [00:02, 9.59it/s] 20it [00:02, 9.63it/s] 21it [00:02, 9.67it/s] 22it [00:02, 9.70it/s] 23it [00:02, 9.08it/s] 24it [00:02, 9.23it/s] 25it [00:02, 9.41it/s] 26it [00:02, 9.49it/s] 27it [00:03, 9.57it/s] 28it [00:03, 9.04it/s] 29it [00:03, 9.26it/s] 30it [00:03, 9.39it/s] 31it [00:03, 9.52it/s] 32it [00:03, 9.59it/s] 33it [00:03, 9.09it/s] 34it [00:03, 9.25it/s] 35it [00:03, 9.39it/s] 36it [00:04, 9.44it/s] 37it [00:04, 8.97it/s] 38it [00:04, 9.12it/s] 39it [00:04, 9.30it/s] 40it [00:04, 9.39it/s] 41it [00:04, 8.92it/s] 42it [00:04, 9.13it/s] 43it [00:04, 9.31it/s] 44it [00:04, 9.40it/s] 45it [00:05, 8.92it/s] 46it [00:05, 9.12it/s] 47it [00:05, 9.29it/s] 48it [00:05, 9.36it/s] 49it [00:05, 8.93it/s] 50it [00:05, 9.13it/s]2025-05-26 06:05:06,584 - INFO - [Epoch 058 | Batch 0050] IWAE-loss 4924.8784 | mean log_px -0.0293 | KL -3323.80 + 51it [00:05, 9.24it/s] 52it [00:05, 9.27it/s] 53it [00:05, 8.91it/s] 54it [00:06, 9.10it/s] 55it [00:06, 9.24it/s] 56it [00:06, 8.83it/s] 57it [00:06, 9.05it/s] 58it [00:06, 9.22it/s] 59it [00:06, 9.37it/s] 60it [00:06, 8.86it/s] 61it [00:06, 9.06it/s] 62it [00:06, 9.21it/s] 63it [00:07, 9.35it/s] 64it [00:07, 8.86it/s] 65it [00:07, 9.12it/s] 66it [00:07, 9.29it/s] 67it [00:07, 9.39it/s] 68it [00:07, 8.90it/s] 69it [00:07, 9.11it/s] 70it [00:07, 9.08it/s] 71it [00:07, 9.18it/s] 72it [00:08, 8.81it/s] 73it [00:08, 9.06it/s] 74it [00:08, 9.19it/s] 75it [00:08, 9.35it/s] 76it [00:08, 8.86it/s] 77it [00:08, 9.11it/s] 78it [00:08, 9.03it/s] 79it [00:08, 9.04it/s] 80it [00:08, 8.64it/s] 81it [00:09, 8.91it/s] 82it [00:09, 9.13it/s] 83it [00:09, 9.26it/s] 84it [00:09, 8.83it/s] 85it [00:09, 9.08it/s] 86it [00:09, 9.25it/s] 87it [00:09, 9.39it/s] 88it [00:09, 8.91it/s] 89it [00:09, 9.15it/s] 90it [00:09, 9.30it/s] 91it [00:10, 9.41it/s] 92it [00:10, 8.95it/s] 93it [00:10, 9.14it/s] 94it [00:10, 9.31it/s] 95it [00:10, 9.41it/s] 96it [00:10, 9.00it/s] 97it [00:10, 9.20it/s] 98it [00:10, 9.37it/s] 99it [00:10, 9.45it/s] 100it [00:11, 9.00it/s]2025-05-26 06:05:12,070 - INFO - [Epoch 058 | Batch 0100] IWAE-loss 4599.8813 | mean log_px -0.0212 | KL -3328.67 + 101it [00:11, 9.16it/s] 102it [00:11, 9.27it/s] 103it [00:11, 9.39it/s] 104it [00:11, 8.89it/s] 105it [00:11, 9.13it/s] 106it [00:11, 9.25it/s] 107it [00:11, 9.38it/s] 108it [00:11, 8.93it/s] 109it [00:12, 9.17it/s] 110it [00:12, 9.29it/s] 111it [00:12, 9.42it/s] 112it [00:12, 8.92it/s] 113it [00:12, 9.12it/s] 114it [00:12, 9.28it/s] 115it [00:12, 9.40it/s] 116it [00:12, 8.96it/s] 117it [00:12, 9.11it/s] 118it [00:13, 9.27it/s] 119it [00:13, 9.40it/s] 120it [00:13, 8.95it/s] 121it [00:13, 9.15it/s] 122it [00:13, 9.30it/s] 123it [00:13, 9.42it/s] 124it [00:13, 8.90it/s] 125it [00:13, 9.15it/s] 126it [00:13, 9.30it/s] 127it [00:14, 9.40it/s] 128it [00:14, 8.94it/s] 129it [00:14, 9.13it/s] 130it [00:14, 9.28it/s] 131it [00:14, 9.38it/s] 132it [00:14, 8.92it/s] 133it [00:14, 9.12it/s] 134it [00:14, 8.78it/s] 135it [00:14, 9.03it/s] 136it [00:15, 9.19it/s] 137it [00:15, 9.33it/s] 138it [00:15, 8.92it/s] 139it [00:15, 9.16it/s] 140it [00:15, 9.27it/s] 141it [00:15, 9.30it/s] 142it [00:15, 8.82it/s] 143it [00:15, 9.07it/s] 144it [00:15, 9.22it/s] 145it [00:15, 9.36it/s] 146it [00:16, 8.78it/s] 147it [00:16, 9.05it/s] 148it [00:16, 9.11it/s] 149it [00:16, 9.27it/s] 150it [00:16, 8.78it/s]2025-05-26 06:05:17,544 - INFO - [Epoch 058 | Batch 0150] IWAE-loss 4261.2881 | mean log_px -0.0143 | KL -3324.48 + 151it [00:16, 8.97it/s] 152it [00:16, 9.17it/s] 153it [00:16, 9.30it/s] 154it [00:16, 8.87it/s] 155it [00:17, 9.08it/s] 156it [00:17, 9.23it/s] 157it [00:17, 9.37it/s] 158it [00:17, 8.83it/s] 159it [00:17, 9.04it/s] 160it [00:17, 9.19it/s] 161it [00:17, 8.78it/s] 162it [00:17, 9.02it/s] 163it [00:17, 9.19it/s] 164it [00:18, 9.33it/s] 165it [00:18, 8.91it/s] 166it [00:18, 9.11it/s] 167it [00:18, 9.24it/s] 168it [00:18, 9.34it/s] 169it [00:18, 8.87it/s] 170it [00:18, 9.05it/s] 171it [00:18, 9.25it/s] 172it [00:18, 9.33it/s] 173it [00:19, 8.86it/s] 174it [00:19, 9.02it/s] 175it [00:19, 9.18it/s] 176it [00:19, 9.31it/s] 177it [00:19, 8.87it/s] 178it [00:19, 9.11it/s] 179it [00:19, 9.29it/s] 180it [00:19, 9.35it/s] 181it [00:19, 8.94it/s] 182it [00:20, 9.14it/s] 183it [00:20, 9.29it/s] 184it [00:20, 9.41it/s] 185it [00:20, 8.91it/s] 186it [00:20, 9.13it/s] 187it [00:20, 9.31it/s] 188it [00:20, 9.40it/s] 189it [00:20, 8.98it/s] 190it [00:20, 9.17it/s] 191it [00:21, 9.22it/s] 192it [00:21, 8.83it/s] 193it [00:21, 9.08it/s] 194it [00:21, 9.22it/s] 195it [00:21, 8.84it/s] 196it [00:21, 9.06it/s] +2025-05-26 06:05:22,564 - INFO - Epoch: 58, Objective: tensor([4525.3076], device='cuda:0', grad_fn=), Loss: 0.021634532138705254, KL/n: 67.80258178710938 + 0it [00:00, ?it/s]2025-05-26 06:05:22,841 - INFO - [Epoch 059 | Batch 0000] IWAE-loss 4513.4170 | mean log_px -0.0270 | KL -3325.71 + 1it [00:00, 4.76it/s] 2it [00:00, 6.78it/s] 3it [00:00, 7.95it/s] 4it [00:00, 8.59it/s] 6it [00:00, 8.94it/s] 7it [00:00, 9.20it/s] 8it [00:00, 9.37it/s] 9it [00:01, 9.52it/s] 10it [00:01, 9.62it/s] 11it [00:01, 9.70it/s] 12it [00:01, 9.19it/s] 13it [00:01, 9.39it/s] 14it [00:01, 9.44it/s] 15it [00:01, 8.90it/s] 16it [00:01, 8.85it/s] 17it [00:01, 9.09it/s] 18it [00:02, 9.25it/s] 19it [00:02, 9.37it/s] 20it [00:02, 9.47it/s] 21it [00:02, 9.54it/s] 22it [00:02, 9.59it/s] 23it [00:02, 9.63it/s] 24it [00:02, 9.65it/s] 25it [00:02, 9.13it/s] 26it [00:02, 9.18it/s] 27it [00:02, 9.27it/s] 28it [00:03, 9.38it/s] 29it [00:03, 9.51it/s] 30it [00:03, 9.60it/s] 31it [00:03, 9.66it/s] 32it [00:03, 9.71it/s] 33it [00:03, 9.77it/s] 34it [00:03, 9.78it/s] 35it [00:03, 9.78it/s] 36it [00:03, 9.74it/s] 37it [00:03, 9.72it/s] 38it [00:04, 9.68it/s] 39it [00:04, 9.69it/s] 40it [00:04, 9.67it/s] 41it [00:04, 9.71it/s] 42it [00:04, 9.66it/s] 43it [00:04, 9.68it/s] 44it [00:04, 9.08it/s] 45it [00:04, 9.25it/s] 46it [00:04, 9.33it/s] 47it [00:05, 9.45it/s] 48it [00:05, 9.48it/s] 49it [00:05, 9.51it/s] 50it [00:05, 9.56it/s]2025-05-26 06:05:28,121 - INFO - [Epoch 059 | Batch 0050] IWAE-loss 4204.3833 | mean log_px -0.0140 | KL -3318.27 + 51it [00:05, 9.57it/s] 52it [00:05, 9.65it/s] 53it [00:05, 9.72it/s] 54it [00:05, 9.75it/s] 55it [00:05, 9.79it/s] 56it [00:05, 9.79it/s] 57it [00:06, 9.81it/s] 58it [00:06, 9.80it/s] 59it [00:06, 9.83it/s] 60it [00:06, 9.84it/s] 61it [00:06, 9.26it/s] 62it [00:06, 9.36it/s] 63it [00:06, 9.50it/s] 64it [00:06, 8.95it/s] 65it [00:06, 9.19it/s] 66it [00:07, 9.18it/s] 67it [00:07, 9.37it/s] 68it [00:07, 9.50it/s] 69it [00:07, 9.62it/s] 70it [00:07, 9.67it/s] 71it [00:07, 9.69it/s] 72it [00:07, 9.73it/s] 73it [00:07, 9.78it/s] 74it [00:07, 9.79it/s] 75it [00:07, 9.82it/s] 76it [00:08, 9.81it/s] 77it [00:08, 9.82it/s] 78it [00:08, 9.25it/s] 79it [00:08, 9.42it/s] 80it [00:08, 9.55it/s] 81it [00:08, 9.65it/s] 82it [00:08, 9.44it/s] 83it [00:08, 9.16it/s] 84it [00:08, 9.20it/s] 85it [00:09, 9.35it/s] 86it [00:09, 9.45it/s] 87it [00:09, 9.59it/s] 88it [00:09, 9.65it/s] 89it [00:09, 9.72it/s] 90it [00:09, 9.76it/s] 91it [00:09, 9.40it/s] 92it [00:09, 9.52it/s] 93it [00:09, 9.62it/s] 94it [00:09, 9.10it/s] 95it [00:10, 9.30it/s] 96it [00:10, 9.45it/s] 97it [00:10, 9.58it/s] 98it [00:10, 9.66it/s] 99it [00:10, 9.73it/s] 100it [00:10, 9.76it/s]2025-05-26 06:05:33,348 - INFO - [Epoch 059 | Batch 0100] IWAE-loss 4880.2090 | mean log_px -0.0276 | KL -3318.33 + 101it [00:10, 9.78it/s] 102it [00:10, 9.80it/s] 103it [00:10, 9.82it/s] 104it [00:10, 9.83it/s] 105it [00:11, 9.85it/s] 106it [00:11, 9.84it/s] 107it [00:11, 9.86it/s] 108it [00:11, 9.86it/s] 109it [00:11, 9.87it/s] 110it [00:11, 9.87it/s] 111it [00:11, 9.88it/s] 112it [00:11, 9.86it/s] 113it [00:11, 9.86it/s] 114it [00:12, 9.67it/s] 115it [00:12, 9.10it/s] 116it [00:12, 9.31it/s] 117it [00:12, 9.45it/s] 118it [00:12, 9.57it/s] 119it [00:12, 9.60it/s] 120it [00:12, 9.65it/s] 121it [00:12, 9.69it/s] 122it [00:12, 9.13it/s] 123it [00:12, 9.35it/s] 124it [00:13, 9.50it/s] 125it [00:13, 9.62it/s] 126it [00:13, 9.30it/s] 127it [00:13, 9.47it/s] 128it [00:13, 9.58it/s] 129it [00:13, 9.27it/s] 130it [00:13, 9.42it/s] 131it [00:13, 9.56it/s] 132it [00:13, 9.64it/s] 133it [00:14, 9.70it/s] 134it [00:14, 9.12it/s] 135it [00:14, 9.34it/s] 136it [00:14, 9.49it/s] 137it [00:14, 9.61it/s] 138it [00:14, 9.67it/s] 139it [00:14, 9.74it/s] 140it [00:14, 9.75it/s] 141it [00:14, 9.16it/s] 142it [00:14, 9.37it/s] 144it [00:15, 9.69it/s] 146it [00:15, 9.85it/s] 148it [00:15, 9.92it/s] 149it [00:15, 9.93it/s] 150it [00:15, 9.94it/s]2025-05-26 06:05:38,534 - INFO - [Epoch 059 | Batch 0150] IWAE-loss 4119.4390 | mean log_px -0.0125 | KL -3316.20 + 151it [00:15, 9.44it/s] 153it [00:16, 9.69it/s] 155it [00:16, 9.83it/s] 157it [00:16, 9.91it/s] 159it [00:16, 9.98it/s] 160it [00:16, 9.97it/s] 162it [00:16, 10.02it/s] 164it [00:17, 10.05it/s] 166it [00:17, 10.04it/s] 168it [00:17, 9.74it/s] 170it [00:17, 9.85it/s] 172it [00:18, 9.92it/s] 173it [00:18, 9.56it/s] 174it [00:18, 9.63it/s] 176it [00:18, 9.80it/s] 178it [00:18, 9.90it/s] 180it [00:18, 9.97it/s] 182it [00:19, 10.03it/s] 184it [00:19, 10.05it/s] 186it [00:19, 9.72it/s] 188it [00:19, 9.83it/s] 189it [00:19, 9.86it/s] 190it [00:19, 9.46it/s] 192it [00:20, 9.68it/s] 193it [00:20, 9.26it/s] 194it [00:20, 9.41it/s] 195it [00:20, 9.10it/s] 196it [00:20, 8.96it/s] 196it [00:20, 9.52it/s] +2025-05-26 06:05:43,275 - INFO - Epoch: 59, Objective: tensor([5065.8369], device='cuda:0', grad_fn=), Loss: 0.029969044029712677, KL/n: 67.60353088378906 + 0it [00:00, ?it/s]2025-05-26 06:05:43,550 - INFO - [Epoch 060 | Batch 0000] IWAE-loss 5187.5234 | mean log_px -0.0315 | KL -3310.47 + 1it [00:00, 5.40it/s] 2it [00:00, 6.78it/s] 4it [00:00, 8.46it/s] 6it [00:00, 9.14it/s] 7it [00:00, 8.97it/s] 8it [00:00, 9.22it/s] 10it [00:01, 9.56it/s] 11it [00:01, 9.66it/s] 12it [00:01, 9.72it/s] 13it [00:01, 9.22it/s] 14it [00:01, 6.31it/s] 15it [00:01, 7.04it/s] 16it [00:01, 7.39it/s] 17it [00:02, 7.99it/s] 18it [00:02, 8.49it/s] 19it [00:02, 8.37it/s] 20it [00:02, 8.78it/s] 22it [00:02, 9.30it/s] 23it [00:02, 9.46it/s] 24it [00:02, 9.58it/s] 26it [00:02, 9.77it/s] 28it [00:03, 9.85it/s] 30it [00:03, 9.91it/s] 31it [00:03, 9.93it/s] 32it [00:03, 9.94it/s] 33it [00:03, 9.95it/s] 35it [00:03, 9.98it/s] 36it [00:03, 9.98it/s] 37it [00:04, 9.98it/s] 38it [00:04, 9.97it/s] 40it [00:04, 10.00it/s] 42it [00:04, 10.01it/s] 44it [00:04, 10.03it/s] 46it [00:04, 10.00it/s] 48it [00:05, 10.02it/s] 50it [00:05, 9.66it/s]2025-05-26 06:05:48,871 - INFO - [Epoch 060 | Batch 0050] IWAE-loss 4562.0859 | mean log_px -0.0215 | KL -3308.93 + 51it [00:05, 9.70it/s] 52it [00:05, 9.75it/s] 54it [00:05, 9.84it/s] 55it [00:05, 9.86it/s] 56it [00:06, 9.89it/s] 58it [00:06, 9.59it/s] 59it [00:06, 9.60it/s] 60it [00:06, 9.63it/s] 61it [00:06, 9.68it/s] 62it [00:06, 9.72it/s] 63it [00:06, 9.76it/s] 64it [00:06, 9.69it/s] 65it [00:06, 9.65it/s] 66it [00:07, 9.74it/s] 67it [00:07, 9.80it/s] 68it [00:07, 9.82it/s] 69it [00:07, 9.21it/s] 70it [00:07, 9.42it/s] 72it [00:07, 9.68it/s] 74it [00:07, 9.80it/s] 75it [00:07, 9.83it/s] 76it [00:08, 9.34it/s] 77it [00:08, 9.49it/s] 78it [00:08, 9.59it/s] 79it [00:08, 9.62it/s] 80it [00:08, 9.70it/s] 81it [00:08, 9.71it/s] 82it [00:08, 9.78it/s] 83it [00:08, 9.83it/s] 84it [00:08, 9.87it/s] 86it [00:09, 9.92it/s] 88it [00:09, 9.94it/s] 89it [00:09, 9.55it/s] 90it [00:09, 9.63it/s] 92it [00:09, 9.78it/s] 93it [00:09, 9.81it/s] 94it [00:09, 9.85it/s] 95it [00:10, 9.87it/s] 96it [00:10, 9.89it/s] 97it [00:10, 9.34it/s] 98it [00:10, 9.51it/s] 99it [00:10, 9.64it/s] 100it [00:10, 9.70it/s]2025-05-26 06:05:54,024 - INFO - [Epoch 060 | Batch 0100] IWAE-loss 4293.2979 | mean log_px -0.0141 | KL -3304.83 + 101it [00:10, 9.16it/s] 102it [00:10, 9.26it/s] 103it [00:10, 9.46it/s] 104it [00:10, 9.59it/s] 106it [00:11, 9.78it/s] 107it [00:11, 9.33it/s] 108it [00:11, 9.49it/s] 110it [00:11, 9.71it/s] 112it [00:11, 9.82it/s] 113it [00:11, 9.86it/s] 114it [00:12, 9.89it/s] 116it [00:12, 9.48it/s] 117it [00:12, 9.50it/s] 118it [00:12, 9.19it/s] 119it [00:12, 9.36it/s] 120it [00:12, 9.51it/s] 121it [00:12, 9.64it/s] 122it [00:12, 9.71it/s] 123it [00:12, 9.78it/s] 124it [00:13, 9.81it/s] 126it [00:13, 9.90it/s] 127it [00:13, 9.92it/s] 128it [00:13, 9.90it/s] 129it [00:13, 9.45it/s] 130it [00:13, 9.58it/s] 132it [00:13, 9.78it/s] 133it [00:13, 9.83it/s] 134it [00:14, 9.86it/s] 135it [00:14, 9.89it/s] 136it [00:14, 9.92it/s] 138it [00:14, 9.98it/s] 140it [00:14, 9.99it/s] 142it [00:14, 9.97it/s] 143it [00:14, 9.96it/s] 144it [00:15, 9.97it/s] 146it [00:15, 10.00it/s] 147it [00:15, 10.00it/s] 149it [00:15, 9.59it/s] 150it [00:15, 9.67it/s]2025-05-26 06:05:59,173 - INFO - [Epoch 060 | Batch 0150] IWAE-loss 4515.0557 | mean log_px -0.0186 | KL -3300.35 + 151it [00:15, 9.73it/s] 153it [00:16, 9.86it/s] 154it [00:16, 9.38it/s] 155it [00:16, 9.48it/s] 156it [00:16, 9.58it/s] 157it [00:16, 9.63it/s] 158it [00:16, 9.72it/s] 160it [00:16, 9.86it/s] 161it [00:16, 9.88it/s] 162it [00:16, 9.87it/s] 164it [00:17, 9.93it/s] 166it [00:17, 9.97it/s] 167it [00:17, 9.94it/s] 168it [00:17, 9.94it/s] 169it [00:17, 9.93it/s] 170it [00:17, 9.37it/s] 171it [00:17, 9.52it/s] 172it [00:17, 9.64it/s] 173it [00:18, 9.73it/s] 174it [00:18, 9.76it/s] 176it [00:18, 9.80it/s] 177it [00:18, 9.84it/s] 178it [00:18, 9.80it/s] 180it [00:18, 9.90it/s] 181it [00:18, 9.89it/s] 182it [00:18, 9.92it/s] 184it [00:19, 9.96it/s] 186it [00:19, 9.97it/s] 188it [00:19, 9.60it/s] 190it [00:19, 9.73it/s] 191it [00:19, 9.77it/s] 192it [00:19, 9.81it/s] 193it [00:20, 9.45it/s] 194it [00:20, 9.57it/s] 195it [00:20, 9.28it/s] 196it [00:20, 9.56it/s] +2025-05-26 06:06:03,901 - INFO - Epoch: 60, Objective: tensor([4183.7256], device='cuda:0', grad_fn=), Loss: 0.01641184277832508, KL/n: 67.38818359375 + 0it [00:00, ?it/s]2025-05-26 06:06:04,154 - INFO - [Epoch 061 | Batch 0000] IWAE-loss 4341.6694 | mean log_px -0.0202 | KL -3302.52 + 1it [00:00, 5.25it/s] 2it [00:00, 7.18it/s] 3it [00:00, 8.20it/s] 4it [00:00, 8.72it/s] 6it [00:00, 9.33it/s] 8it [00:00, 9.18it/s] 9it [00:01, 9.34it/s] 10it [00:01, 9.49it/s] 11it [00:01, 9.53it/s] 12it [00:01, 9.63it/s] 14it [00:01, 9.71it/s] 15it [00:01, 9.59it/s] 16it [00:01, 9.69it/s] 18it [00:01, 9.79it/s] 20it [00:02, 9.86it/s] 22it [00:02, 9.92it/s] 23it [00:02, 9.93it/s] 24it [00:02, 9.93it/s] 25it [00:02, 9.94it/s] 26it [00:02, 9.94it/s] 28it [00:02, 9.49it/s] 30it [00:03, 9.69it/s] 32it [00:03, 9.79it/s] 33it [00:03, 9.41it/s] 34it [00:03, 9.52it/s] 36it [00:03, 9.71it/s] 38it [00:03, 9.82it/s] 39it [00:04, 9.84it/s] 41it [00:04, 9.91it/s] 42it [00:04, 9.91it/s] 44it [00:04, 9.95it/s] 46it [00:04, 9.97it/s] 47it [00:04, 9.97it/s] 48it [00:04, 9.97it/s] 50it [00:05, 9.98it/s]2025-05-26 06:06:09,283 - INFO - [Epoch 061 | Batch 0050] IWAE-loss 4877.6030 | mean log_px -0.0282 | KL -3295.02 + 51it [00:05, 9.97it/s] 52it [00:05, 9.94it/s] 54it [00:05, 9.97it/s] 55it [00:05, 9.97it/s] 56it [00:05, 9.96it/s] 57it [00:05, 9.92it/s] 58it [00:06, 9.46it/s] 59it [00:06, 9.59it/s] 60it [00:06, 9.66it/s] 61it [00:06, 9.74it/s] 62it [00:06, 9.81it/s] 63it [00:06, 9.85it/s] 64it [00:06, 9.84it/s] 66it [00:06, 9.57it/s] 67it [00:06, 9.67it/s] 68it [00:07, 9.74it/s] 70it [00:07, 9.85it/s] 71it [00:07, 9.84it/s] 72it [00:07, 9.33it/s] 74it [00:07, 9.59it/s] 75it [00:07, 9.66it/s] 77it [00:07, 9.81it/s] 78it [00:08, 9.84it/s] 80it [00:08, 9.91it/s] 82it [00:08, 9.94it/s] 84it [00:08, 9.96it/s] 85it [00:08, 9.97it/s] 86it [00:08, 9.96it/s] 87it [00:08, 9.96it/s] 88it [00:09, 9.94it/s] 89it [00:09, 9.95it/s] 90it [00:09, 9.46it/s] 91it [00:09, 9.59it/s] 92it [00:09, 9.69it/s] 94it [00:09, 9.83it/s] 95it [00:09, 9.82it/s] 96it [00:09, 9.86it/s] 97it [00:09, 9.88it/s] 98it [00:10, 9.90it/s] 99it [00:10, 9.92it/s] 100it [00:10, 9.90it/s]2025-05-26 06:06:14,383 - INFO - [Epoch 061 | Batch 0100] IWAE-loss 4193.9419 | mean log_px -0.0158 | KL -3287.98 + 101it [00:10, 9.91it/s] 102it [00:10, 9.93it/s] 104it [00:10, 9.97it/s] 105it [00:10, 9.90it/s] 106it [00:10, 9.40it/s] 107it [00:11, 9.55it/s] 108it [00:11, 9.66it/s] 110it [00:11, 9.83it/s] 111it [00:11, 9.27it/s] 112it [00:11, 9.42it/s] 113it [00:11, 9.56it/s] 114it [00:11, 9.67it/s] 116it [00:11, 9.82it/s] 117it [00:12, 9.86it/s] 118it [00:12, 9.89it/s] 119it [00:12, 9.92it/s] 120it [00:12, 9.92it/s] 121it [00:12, 9.92it/s] 122it [00:12, 9.93it/s] 124it [00:12, 9.95it/s] 126it [00:12, 9.54it/s] 127it [00:13, 9.51it/s] 128it [00:13, 9.61it/s] 130it [00:13, 9.78it/s] 131it [00:13, 9.83it/s] 132it [00:13, 9.86it/s] 133it [00:13, 9.85it/s] 134it [00:13, 9.87it/s] 135it [00:13, 9.44it/s] 136it [00:13, 9.58it/s] 138it [00:14, 9.74it/s] 139it [00:14, 9.80it/s] 140it [00:14, 9.84it/s] 142it [00:14, 9.92it/s] 143it [00:14, 9.92it/s] 144it [00:14, 9.93it/s] 145it [00:14, 9.41it/s] 146it [00:15, 9.56it/s] 148it [00:15, 9.77it/s] 150it [00:15, 9.46it/s]2025-05-26 06:06:19,535 - INFO - [Epoch 061 | Batch 0150] IWAE-loss 4477.5815 | mean log_px -0.0203 | KL -3289.90 + 151it [00:15, 9.57it/s] 152it [00:15, 9.65it/s] 154it [00:15, 9.81it/s] 156it [00:16, 9.90it/s] 158it [00:16, 9.92it/s] 160it [00:16, 9.59it/s] 161it [00:16, 9.65it/s] 162it [00:16, 9.37it/s] 164it [00:16, 9.59it/s] 166it [00:17, 9.73it/s] 168it [00:17, 9.83it/s] 169it [00:17, 9.45it/s] 170it [00:17, 9.55it/s] 172it [00:17, 9.71it/s] 173it [00:17, 9.77it/s] 174it [00:17, 9.82it/s] 175it [00:18, 9.86it/s] 176it [00:18, 9.87it/s] 178it [00:18, 9.93it/s] 180it [00:18, 9.96it/s] 181it [00:18, 9.97it/s] 182it [00:18, 9.97it/s] 183it [00:18, 9.97it/s] 184it [00:18, 9.43it/s] 186it [00:19, 9.68it/s] 187it [00:19, 9.75it/s] 188it [00:19, 9.80it/s] 189it [00:19, 9.84it/s] 191it [00:19, 9.92it/s] 192it [00:19, 9.92it/s] 193it [00:19, 9.94it/s] 194it [00:19, 9.94it/s] 195it [00:20, 9.53it/s] 196it [00:20, 9.70it/s] +2025-05-26 06:06:24,236 - INFO - Epoch: 61, Objective: tensor([6526.4443], device='cuda:0', grad_fn=), Loss: 0.049620795994997025, KL/n: 67.15840148925781 + 0it [00:00, ?it/s]2025-05-26 06:06:24,519 - INFO - [Epoch 062 | Batch 0000] IWAE-loss 4576.0898 | mean log_px -0.0238 | KL -3289.67 + 1it [00:00, 4.66it/s] 2it [00:00, 6.77it/s] 4it [00:00, 8.54it/s] 5it [00:00, 8.45it/s] 7it [00:00, 9.15it/s] 9it [00:01, 9.52it/s] 10it [00:01, 9.19it/s] 12it [00:01, 9.52it/s] 14it [00:01, 9.72it/s] 15it [00:01, 9.37it/s] 17it [00:01, 9.63it/s] 19it [00:02, 9.80it/s] 20it [00:02, 9.82it/s] 22it [00:02, 9.93it/s] 24it [00:02, 9.59it/s] 25it [00:02, 9.34it/s] 26it [00:02, 9.31it/s] 27it [00:02, 9.45it/s] 28it [00:03, 9.57it/s] 29it [00:03, 9.14it/s] 30it [00:03, 9.35it/s] 32it [00:03, 9.62it/s] 33it [00:03, 6.46it/s] 34it [00:03, 7.07it/s] 35it [00:03, 7.67it/s] 37it [00:04, 8.57it/s] 38it [00:04, 8.45it/s] 40it [00:04, 9.04it/s] 42it [00:04, 9.42it/s] 44it [00:04, 9.66it/s] 46it [00:05, 9.82it/s] 48it [00:05, 9.93it/s] 50it [00:05, 9.98it/s]2025-05-26 06:06:29,894 - INFO - [Epoch 062 | Batch 0050] IWAE-loss 4915.9707 | mean log_px -0.0268 | KL -3286.16 + 52it [00:05, 10.02it/s] 54it [00:05, 10.03it/s] 56it [00:06, 10.06it/s] 58it [00:06, 10.07it/s] 60it [00:06, 10.08it/s] 62it [00:06, 10.08it/s] 64it [00:06, 10.09it/s] 66it [00:07, 10.10it/s] 68it [00:07, 9.82it/s] 70it [00:07, 9.90it/s] 72it [00:07, 9.97it/s] 74it [00:07, 10.01it/s] 76it [00:08, 10.04it/s] 78it [00:08, 10.07it/s] 80it [00:08, 10.08it/s] 82it [00:08, 10.09it/s] 84it [00:08, 10.09it/s] 86it [00:09, 10.10it/s] 88it [00:09, 10.09it/s] 90it [00:09, 9.73it/s] 92it [00:09, 9.85it/s] 94it [00:09, 9.91it/s] 96it [00:10, 9.66it/s] 98it [00:10, 9.79it/s] 100it [00:10, 9.88it/s]2025-05-26 06:06:34,907 - INFO - [Epoch 062 | Batch 0100] IWAE-loss 4170.7461 | mean log_px -0.0182 | KL -3282.61 + 101it [00:10, 9.54it/s] 103it [00:10, 9.71it/s] 105it [00:10, 9.85it/s] 107it [00:11, 9.92it/s] 109it [00:11, 9.98it/s] 111it [00:11, 10.02it/s] 113it [00:11, 10.05it/s] 115it [00:11, 10.07it/s] 117it [00:12, 10.09it/s] 119it [00:12, 10.11it/s] 121it [00:12, 9.77it/s] 123it [00:12, 9.87it/s] 125it [00:12, 9.94it/s] 127it [00:13, 10.00it/s] 129it [00:13, 10.03it/s] 131it [00:13, 10.06it/s] 133it [00:13, 10.08it/s] 135it [00:14, 9.75it/s] 137it [00:14, 9.86it/s] 139it [00:14, 9.94it/s] 141it [00:14, 9.65it/s] 143it [00:14, 9.79it/s] 145it [00:15, 9.89it/s] 146it [00:15, 9.91it/s] 148it [00:15, 9.97it/s] 150it [00:15, 10.02it/s]2025-05-26 06:06:39,949 - INFO - [Epoch 062 | Batch 0150] IWAE-loss 4884.0713 | mean log_px -0.0360 | KL -3281.47 + 152it [00:15, 9.57it/s] 153it [00:15, 9.30it/s] 155it [00:16, 9.55it/s] 157it [00:16, 9.72it/s] 159it [00:16, 9.83it/s] 160it [00:16, 9.85it/s] 161it [00:16, 9.81it/s] 163it [00:16, 9.92it/s] 165it [00:17, 9.98it/s] 167it [00:17, 10.03it/s] 169it [00:17, 10.06it/s] 171it [00:17, 9.77it/s] 173it [00:17, 9.87it/s] 175it [00:18, 9.94it/s] 177it [00:18, 9.98it/s] 179it [00:18, 10.01it/s] 181it [00:18, 9.71it/s] 183it [00:18, 9.82it/s] 185it [00:19, 9.57it/s] 187it [00:19, 9.72it/s] 189it [00:19, 9.83it/s] 190it [00:19, 9.48it/s] 192it [00:19, 9.68it/s] 194it [00:20, 9.82it/s] 195it [00:20, 9.56it/s] 196it [00:20, 9.35it/s] 196it [00:20, 9.66it/s] +2025-05-26 06:06:44,672 - INFO - Epoch: 62, Objective: tensor([5284.1826], device='cuda:0', grad_fn=), Loss: 0.03511318191885948, KL/n: 66.92284393310547 + 0it [00:00, ?it/s]2025-05-26 06:06:44,951 - INFO - [Epoch 063 | Batch 0000] IWAE-loss 4192.7603 | mean log_px -0.0176 | KL -3279.23 + 1it [00:00, 5.28it/s] 2it [00:00, 6.72it/s] 3it [00:00, 7.88it/s] 4it [00:00, 8.60it/s] 6it [00:00, 9.29it/s] 7it [00:00, 9.13it/s] 8it [00:00, 9.32it/s] 10it [00:01, 9.63it/s] 12it [00:01, 9.79it/s] 13it [00:01, 9.36it/s] 14it [00:01, 9.50it/s] 16it [00:01, 9.70it/s] 18it [00:01, 9.82it/s] 20it [00:02, 9.52it/s] 22it [00:02, 9.67it/s] 24it [00:02, 9.78it/s] 25it [00:02, 9.51it/s] 26it [00:02, 9.60it/s] 27it [00:02, 9.69it/s] 29it [00:03, 9.84it/s] 30it [00:03, 9.86it/s] 32it [00:03, 9.94it/s] 34it [00:03, 9.98it/s] 36it [00:03, 9.62it/s] 38it [00:04, 9.75it/s] 40it [00:04, 9.55it/s] 42it [00:04, 9.70it/s] 44it [00:04, 9.79it/s] 46it [00:04, 9.45it/s] 47it [00:04, 9.50it/s] 48it [00:05, 9.56it/s] 50it [00:05, 9.74it/s]2025-05-26 06:06:50,121 - INFO - [Epoch 063 | Batch 0050] IWAE-loss 4688.5366 | mean log_px -0.0212 | KL -3273.02 + 51it [00:05, 9.32it/s] 52it [00:05, 9.46it/s] 53it [00:05, 9.59it/s] 54it [00:05, 9.25it/s] 56it [00:05, 9.57it/s] 57it [00:06, 9.62it/s] 58it [00:06, 9.67it/s] 60it [00:06, 9.81it/s] 62it [00:06, 9.89it/s] 63it [00:06, 9.87it/s] 64it [00:06, 9.86it/s] 66it [00:06, 9.93it/s] 68it [00:07, 9.98it/s] 70it [00:07, 10.01it/s] 72it [00:07, 10.03it/s] 74it [00:07, 10.05it/s] 76it [00:07, 10.07it/s] 78it [00:08, 10.02it/s] 80it [00:08, 9.69it/s] 82it [00:08, 9.81it/s] 84it [00:08, 9.87it/s] 86it [00:08, 9.59it/s] 88it [00:09, 9.72it/s] 90it [00:09, 9.82it/s] 91it [00:09, 9.48it/s] 92it [00:09, 9.58it/s] 94it [00:09, 9.74it/s] 96it [00:09, 9.84it/s] 98it [00:10, 9.55it/s] 99it [00:10, 9.61it/s]2025-05-26 06:06:55,247 - INFO - [Epoch 063 | Batch 0100] IWAE-loss 4749.5503 | mean log_px -0.0224 | KL -3273.87 + 101it [00:10, 9.39it/s] 102it [00:10, 9.50it/s] 103it [00:10, 9.13it/s] 104it [00:10, 9.33it/s] 106it [00:11, 9.61it/s] 108it [00:11, 9.36it/s] 110it [00:11, 9.57it/s] 112it [00:11, 9.72it/s] 114it [00:11, 9.83it/s] 116it [00:12, 9.89it/s] 117it [00:12, 9.46it/s] 118it [00:12, 9.56it/s] 120it [00:12, 9.74it/s] 122it [00:12, 9.84it/s] 124it [00:12, 9.91it/s] 126it [00:13, 9.96it/s] 128it [00:13, 9.96it/s] 129it [00:13, 9.88it/s] 130it [00:13, 9.22it/s] 131it [00:13, 9.37it/s] 132it [00:13, 9.51it/s] 134it [00:13, 9.72it/s] 135it [00:14, 9.31it/s] 136it [00:14, 9.40it/s] 137it [00:14, 9.54it/s] 139it [00:14, 9.75it/s] 140it [00:14, 9.79it/s] 142it [00:14, 9.80it/s] 143it [00:14, 9.80it/s] 144it [00:14, 9.76it/s] 145it [00:15, 9.68it/s] 146it [00:15, 8.96it/s] 147it [00:15, 9.13it/s] 148it [00:15, 9.27it/s] 149it [00:15, 9.39it/s] 150it [00:15, 9.43it/s]2025-05-26 06:07:00,472 - INFO - [Epoch 063 | Batch 0150] IWAE-loss 3977.1768 | mean log_px -0.0134 | KL -3273.26 + 151it [00:15, 8.92it/s] 152it [00:15, 9.12it/s] 153it [00:15, 9.29it/s] 154it [00:16, 9.40it/s] 155it [00:16, 8.93it/s] 156it [00:16, 9.09it/s] 157it [00:16, 9.29it/s] 158it [00:16, 9.49it/s] 159it [00:16, 9.61it/s] 160it [00:16, 9.73it/s] 162it [00:16, 9.83it/s] 164it [00:17, 9.41it/s] 166it [00:17, 9.62it/s] 168it [00:17, 9.76it/s] 170it [00:17, 9.85it/s] 171it [00:17, 9.87it/s] 172it [00:17, 9.89it/s] 173it [00:18, 9.91it/s] 174it [00:18, 9.26it/s] 175it [00:18, 9.39it/s] 177it [00:18, 9.67it/s] 178it [00:18, 9.72it/s] 180it [00:18, 9.86it/s] 182it [00:18, 9.94it/s] 183it [00:19, 9.95it/s] 184it [00:19, 9.47it/s] 186it [00:19, 9.70it/s] 188it [00:19, 9.82it/s] 189it [00:19, 9.44it/s] 190it [00:19, 9.52it/s] 192it [00:19, 9.73it/s] 194it [00:20, 9.45it/s] 195it [00:20, 9.25it/s] 196it [00:20, 9.58it/s] +2025-05-26 06:07:05,272 - INFO - Epoch: 63, Objective: tensor([5113.3408], device='cuda:0', grad_fn=), Loss: 0.03467189148068428, KL/n: 66.71068572998047 + 0it [00:00, ?it/s]2025-05-26 06:07:05,550 - INFO - [Epoch 064 | Batch 0000] IWAE-loss 4048.0391 | mean log_px -0.0111 | KL -3268.86 + 1it [00:00, 4.70it/s] 2it [00:00, 6.78it/s] 4it [00:00, 8.47it/s] 6it [00:00, 9.16it/s] 7it [00:00, 8.89it/s] 9it [00:01, 9.35it/s] 10it [00:01, 9.46it/s] 12it [00:01, 9.67it/s] 14it [00:01, 9.44it/s] 16it [00:01, 9.60it/s] 17it [00:01, 9.61it/s] 18it [00:01, 9.63it/s] 19it [00:02, 9.65it/s] 20it [00:02, 9.68it/s] 21it [00:02, 9.69it/s] 22it [00:02, 9.73it/s] 23it [00:02, 9.77it/s] 24it [00:02, 9.81it/s] 26it [00:02, 9.91it/s] 28it [00:02, 9.95it/s] 29it [00:03, 9.96it/s] 30it [00:03, 9.95it/s] 32it [00:03, 9.97it/s] 34it [00:03, 9.96it/s] 35it [00:03, 9.52it/s] 36it [00:03, 6.78it/s] 37it [00:04, 7.34it/s] 38it [00:04, 7.87it/s] 40it [00:04, 8.66it/s] 42it [00:04, 9.13it/s] 44it [00:04, 9.19it/s] 45it [00:04, 9.33it/s] 46it [00:05, 9.47it/s] 48it [00:05, 9.68it/s] 49it [00:05, 9.73it/s] 50it [00:05, 9.77it/s]2025-05-26 06:07:10,875 - INFO - [Epoch 064 | Batch 0050] IWAE-loss 4078.9944 | mean log_px -0.0116 | KL -3263.32 + 51it [00:05, 9.30it/s] 53it [00:05, 9.59it/s] 54it [00:05, 9.68it/s] 56it [00:06, 9.80it/s] 57it [00:06, 9.84it/s] 58it [00:06, 9.88it/s] 60it [00:06, 9.94it/s] 61it [00:06, 9.92it/s] 62it [00:06, 9.94it/s] 64it [00:06, 9.96it/s] 66it [00:07, 9.92it/s] 68it [00:07, 9.96it/s] 69it [00:07, 9.97it/s] 70it [00:07, 9.96it/s] 72it [00:07, 10.00it/s] 73it [00:07, 9.98it/s] 74it [00:07, 9.96it/s] 76it [00:08, 9.99it/s] 77it [00:08, 9.99it/s] 78it [00:08, 9.96it/s] 79it [00:08, 9.54it/s] 81it [00:08, 9.75it/s] 83it [00:08, 9.86it/s] 84it [00:08, 9.87it/s] 85it [00:08, 9.79it/s] 86it [00:09, 9.80it/s] 88it [00:09, 9.88it/s] 89it [00:09, 9.77it/s] 90it [00:09, 9.69it/s] 92it [00:09, 9.83it/s] 94it [00:09, 9.91it/s] 96it [00:10, 9.96it/s] 98it [00:10, 9.98it/s] 99it [00:10, 9.97it/s] 100it [00:10, 9.94it/s]2025-05-26 06:07:15,939 - INFO - [Epoch 064 | Batch 0100] IWAE-loss 4177.9673 | mean log_px -0.0192 | KL -3262.71 + 101it [00:10, 9.43it/s] 102it [00:10, 9.56it/s] 104it [00:10, 9.74it/s] 106it [00:11, 9.84it/s] 108it [00:11, 9.89it/s] 109it [00:11, 9.48it/s] 110it [00:11, 9.57it/s] 111it [00:11, 9.65it/s] 112it [00:11, 9.20it/s] 113it [00:11, 9.40it/s] 114it [00:11, 9.53it/s] 115it [00:12, 9.66it/s] 116it [00:12, 9.72it/s] 117it [00:12, 9.32it/s] 118it [00:12, 9.51it/s] 119it [00:12, 9.63it/s] 120it [00:12, 9.71it/s] 121it [00:12, 9.79it/s] 122it [00:12, 9.81it/s] 123it [00:12, 9.86it/s] 124it [00:12, 9.86it/s] 125it [00:13, 9.89it/s] 126it [00:13, 9.90it/s] 127it [00:13, 9.91it/s] 128it [00:13, 9.91it/s] 129it [00:13, 9.93it/s] 130it [00:13, 9.31it/s] 131it [00:13, 9.50it/s] 132it [00:13, 9.62it/s] 133it [00:13, 9.12it/s] 134it [00:14, 9.35it/s] 135it [00:14, 9.53it/s] 136it [00:14, 9.64it/s] 138it [00:14, 9.80it/s] 139it [00:14, 9.32it/s] 140it [00:14, 9.48it/s] 142it [00:14, 9.69it/s] 144it [00:15, 9.80it/s] 145it [00:15, 9.83it/s] 146it [00:15, 9.84it/s] 147it [00:15, 9.86it/s] 148it [00:15, 9.53it/s] 149it [00:15, 9.64it/s] 150it [00:15, 9.73it/s]2025-05-26 06:07:21,131 - INFO - [Epoch 064 | Batch 0150] IWAE-loss 4131.0303 | mean log_px -0.0125 | KL -3256.42 + 151it [00:15, 9.20it/s] 152it [00:15, 9.41it/s] 154it [00:16, 9.66it/s] 155it [00:16, 9.73it/s] 156it [00:16, 9.26it/s] 157it [00:16, 9.43it/s] 158it [00:16, 9.52it/s] 160it [00:16, 9.71it/s] 161it [00:16, 9.78it/s] 162it [00:16, 9.83it/s] 163it [00:17, 9.87it/s] 164it [00:17, 9.89it/s] 165it [00:17, 9.90it/s] 166it [00:17, 9.89it/s] 168it [00:17, 9.95it/s] 169it [00:17, 9.43it/s] 170it [00:17, 9.56it/s] 172it [00:17, 9.73it/s] 173it [00:18, 9.79it/s] 174it [00:18, 9.84it/s] 175it [00:18, 9.88it/s] 176it [00:18, 9.89it/s] 178it [00:18, 9.94it/s] 179it [00:18, 9.95it/s] 180it [00:18, 9.95it/s] 181it [00:18, 9.96it/s] 182it [00:18, 9.96it/s] 183it [00:19, 9.35it/s] 184it [00:19, 9.51it/s] 185it [00:19, 9.63it/s] 186it [00:19, 9.71it/s] 187it [00:19, 9.30it/s] 188it [00:19, 9.50it/s] 189it [00:19, 9.63it/s] 190it [00:19, 9.70it/s] 191it [00:19, 9.78it/s] 192it [00:19, 9.82it/s] 193it [00:20, 9.87it/s] 194it [00:20, 9.88it/s] 195it [00:20, 9.36it/s] 196it [00:20, 9.54it/s] 196it [00:20, 9.57it/s] +2025-05-26 06:07:25,885 - INFO - Epoch: 64, Objective: tensor([4486.4854], device='cuda:0', grad_fn=), Loss: 0.017137622460722923, KL/n: 66.45817565917969 + 0it [00:00, ?it/s]2025-05-26 06:07:26,131 - INFO - [Epoch 065 | Batch 0000] IWAE-loss 4915.1265 | mean log_px -0.0304 | KL -3253.02 + 1it [00:00, 5.42it/s] 2it [00:00, 7.37it/s] 4it [00:00, 8.88it/s] 6it [00:00, 9.42it/s] 8it [00:00, 9.70it/s] 10it [00:01, 9.86it/s] 12it [00:01, 9.94it/s] 14it [00:01, 9.99it/s] 16it [00:01, 10.02it/s] 18it [00:01, 10.05it/s] 20it [00:02, 10.07it/s] 22it [00:02, 10.08it/s] 24it [00:02, 10.08it/s] 26it [00:02, 10.09it/s] 28it [00:02, 10.10it/s] 30it [00:03, 10.11it/s] 32it [00:03, 10.10it/s] 34it [00:03, 10.11it/s] 36it [00:03, 9.75it/s] 38it [00:03, 9.85it/s] 40it [00:04, 9.93it/s] 42it [00:04, 9.97it/s] 44it [00:04, 10.00it/s] 46it [00:04, 10.04it/s] 48it [00:04, 10.05it/s] 50it [00:05, 10.07it/s]2025-05-26 06:07:31,137 - INFO - [Epoch 065 | Batch 0050] IWAE-loss 4041.6321 | mean log_px -0.0125 | KL -3247.29 + 52it [00:05, 9.49it/s] 53it [00:05, 9.48it/s] 55it [00:05, 9.68it/s] 57it [00:05, 9.83it/s] 59it [00:05, 9.92it/s] 61it [00:06, 9.98it/s] 63it [00:06, 9.97it/s] 65it [00:06, 10.00it/s] 66it [00:06, 10.00it/s] 68it [00:06, 10.03it/s] 70it [00:07, 10.06it/s] 72it [00:07, 10.06it/s] 74it [00:07, 10.08it/s] 76it [00:07, 10.08it/s] 78it [00:07, 10.08it/s] 80it [00:08, 10.09it/s] 82it [00:08, 10.08it/s] 84it [00:08, 10.09it/s] 86it [00:08, 9.74it/s] 88it [00:08, 9.84it/s] 90it [00:09, 9.91it/s] 91it [00:09, 9.61it/s] 93it [00:09, 9.74it/s] 95it [00:09, 9.84it/s] 96it [00:09, 9.86it/s] 98it [00:09, 9.94it/s] 100it [00:10, 9.99it/s]2025-05-26 06:07:36,186 - INFO - [Epoch 065 | Batch 0100] IWAE-loss 4149.1934 | mean log_px -0.0150 | KL -3245.47 + 101it [00:10, 9.57it/s] 103it [00:10, 9.76it/s] 105it [00:10, 9.86it/s] 107it [00:10, 9.93it/s] 108it [00:10, 9.94it/s] 110it [00:11, 9.99it/s] 111it [00:11, 9.47it/s] 112it [00:11, 9.56it/s] 114it [00:11, 9.76it/s] 116it [00:11, 9.88it/s] 117it [00:11, 9.88it/s] 119it [00:12, 9.97it/s] 121it [00:12, 10.02it/s] 123it [00:12, 10.04it/s] 125it [00:12, 10.06it/s] 127it [00:12, 10.07it/s] 129it [00:13, 10.07it/s] 131it [00:13, 10.07it/s] 133it [00:13, 10.07it/s] 135it [00:13, 9.70it/s] 136it [00:13, 9.71it/s] 137it [00:13, 9.77it/s] 139it [00:14, 9.88it/s] 141it [00:14, 9.56it/s] 142it [00:14, 9.62it/s] 144it [00:14, 9.77it/s] 146it [00:14, 9.50it/s] 148it [00:15, 9.67it/s] 150it [00:15, 9.79it/s]2025-05-26 06:07:41,280 - INFO - [Epoch 065 | Batch 0150] IWAE-loss 5137.2002 | mean log_px -0.0301 | KL -3244.56 + 151it [00:15, 9.46it/s] 152it [00:15, 9.56it/s] 154it [00:15, 9.75it/s] 156it [00:15, 9.87it/s] 158it [00:16, 9.92it/s] 160it [00:16, 9.97it/s] 162it [00:16, 9.99it/s] 164it [00:16, 10.01it/s] 166it [00:16, 10.03it/s] 168it [00:17, 10.04it/s] 170it [00:17, 10.05it/s] 172it [00:17, 9.61it/s] 174it [00:17, 9.76it/s] 176it [00:17, 9.87it/s] 178it [00:18, 9.94it/s] 180it [00:18, 9.99it/s] 181it [00:18, 9.71it/s] 183it [00:18, 9.84it/s] 184it [00:18, 9.55it/s] 186it [00:18, 9.73it/s] 187it [00:18, 9.38it/s] 189it [00:19, 9.63it/s] 191it [00:19, 9.43it/s] 192it [00:19, 9.53it/s] 194it [00:19, 9.74it/s] 195it [00:19, 9.47it/s] 196it [00:19, 9.81it/s] +2025-05-26 06:07:45,990 - INFO - Epoch: 65, Objective: tensor([4243.4243], device='cuda:0', grad_fn=), Loss: 0.016095492988824844, KL/n: 66.21897888183594 + 0it [00:00, ?it/s]2025-05-26 06:07:46,279 - INFO - [Epoch 066 | Batch 0000] IWAE-loss 4330.0098 | mean log_px -0.0173 | KL -3242.21 + 1it [00:00, 4.48it/s] 2it [00:00, 6.60it/s] 4it [00:00, 8.41it/s] 6it [00:00, 9.15it/s] 7it [00:00, 8.89it/s] 9it [00:01, 9.37it/s] 10it [00:01, 9.50it/s] 12it [00:01, 9.74it/s] 14it [00:01, 9.86it/s] 16it [00:01, 9.94it/s] 18it [00:01, 9.99it/s] 20it [00:02, 10.03it/s] 22it [00:02, 10.05it/s] 24it [00:02, 9.98it/s] 26it [00:02, 10.00it/s] 27it [00:02, 10.00it/s] 28it [00:02, 9.55it/s] 30it [00:03, 9.74it/s] 32it [00:03, 9.86it/s] 34it [00:03, 9.94it/s] 36it [00:03, 9.99it/s] 38it [00:03, 10.01it/s] 39it [00:04, 10.00it/s] 40it [00:04, 6.91it/s] 42it [00:04, 7.81it/s] 43it [00:04, 7.87it/s] 44it [00:04, 8.28it/s] 46it [00:04, 8.90it/s] 48it [00:05, 9.30it/s] 50it [00:05, 9.55it/s]2025-05-26 06:07:51,562 - INFO - [Epoch 066 | Batch 0050] IWAE-loss 5074.5923 | mean log_px -0.0331 | KL -3240.32 + 52it [00:05, 9.70it/s] 54it [00:05, 9.81it/s] 56it [00:05, 9.88it/s] 58it [00:06, 9.94it/s] 60it [00:06, 9.98it/s] 62it [00:06, 10.02it/s] 64it [00:06, 10.01it/s] 66it [00:06, 9.69it/s] 68it [00:07, 9.80it/s] 70it [00:07, 9.88it/s] 72it [00:07, 9.93it/s] 73it [00:07, 9.91it/s] 74it [00:07, 9.93it/s] 76it [00:07, 9.99it/s] 78it [00:08, 10.01it/s] 80it [00:08, 10.04it/s] 82it [00:08, 10.06it/s] 84it [00:08, 10.06it/s] 86it [00:08, 10.07it/s] 88it [00:09, 10.08it/s] 90it [00:09, 10.07it/s] 92it [00:09, 9.71it/s] 94it [00:09, 9.82it/s] 96it [00:09, 9.89it/s] 98it [00:10, 9.94it/s] 100it [00:10, 9.99it/s]2025-05-26 06:07:56,578 - INFO - [Epoch 066 | Batch 0100] IWAE-loss 4414.3447 | mean log_px -0.0179 | KL -3239.95 + 102it [00:10, 10.01it/s] 104it [00:10, 9.70it/s] 106it [00:11, 9.81it/s] 108it [00:11, 9.89it/s] 110it [00:11, 9.95it/s] 112it [00:11, 9.98it/s] 114it [00:11, 10.01it/s] 116it [00:12, 10.04it/s] 118it [00:12, 10.04it/s] 120it [00:12, 10.06it/s] 122it [00:12, 9.73it/s] 124it [00:12, 9.83it/s] 126it [00:13, 9.91it/s] 128it [00:13, 9.92it/s] 130it [00:13, 9.96it/s] 132it [00:13, 10.01it/s] 134it [00:13, 10.03it/s] 136it [00:14, 9.92it/s] 137it [00:14, 9.93it/s] 138it [00:14, 9.94it/s] 140it [00:14, 9.98it/s] 142it [00:14, 10.01it/s] 144it [00:14, 10.01it/s] 146it [00:15, 10.03it/s] 148it [00:15, 9.70it/s] 149it [00:15, 9.75it/s]2025-05-26 06:08:01,623 - INFO - [Epoch 066 | Batch 0150] IWAE-loss 4754.2173 | mean log_px -0.0265 | KL -3233.78 + 151it [00:15, 9.47it/s] 152it [00:15, 9.56it/s] 154it [00:15, 9.73it/s] 155it [00:15, 9.37it/s] 157it [00:16, 9.31it/s] 158it [00:16, 9.43it/s] 160it [00:16, 9.66it/s] 161it [00:16, 9.17it/s] 162it [00:16, 9.07it/s] 163it [00:16, 9.14it/s] 164it [00:16, 9.30it/s] 165it [00:17, 9.45it/s] 166it [00:17, 9.53it/s] 167it [00:17, 9.24it/s] 168it [00:17, 9.41it/s] 169it [00:17, 9.55it/s] 170it [00:17, 9.05it/s] 171it [00:17, 9.27it/s] 172it [00:17, 9.43it/s] 173it [00:17, 9.51it/s] 174it [00:18, 9.64it/s] 175it [00:18, 9.16it/s] 177it [00:18, 9.56it/s] 178it [00:18, 9.56it/s] 179it [00:18, 9.57it/s] 180it [00:18, 9.64it/s] 182it [00:18, 9.82it/s] 183it [00:18, 9.46it/s] 184it [00:19, 9.57it/s] 186it [00:19, 9.44it/s] 188it [00:19, 9.64it/s] 190it [00:19, 9.42it/s] 191it [00:19, 9.52it/s] 192it [00:19, 9.39it/s] 193it [00:20, 9.28it/s] 194it [00:20, 9.03it/s] 195it [00:20, 8.79it/s] 196it [00:20, 9.60it/s] +2025-05-26 06:08:06,548 - INFO - Epoch: 66, Objective: tensor([4165.6123], device='cuda:0', grad_fn=), Loss: 0.015236176550388336, KL/n: 65.961181640625 + 0it [00:00, ?it/s]2025-05-26 06:08:06,825 - INFO - [Epoch 067 | Batch 0000] IWAE-loss 4508.1504 | mean log_px -0.0203 | KL -3233.36 + 1it [00:00, 5.41it/s] 2it [00:00, 7.39it/s] 4it [00:00, 8.88it/s] 6it [00:00, 9.44it/s] 8it [00:00, 9.70it/s] 10it [00:01, 9.85it/s] 12it [00:01, 9.94it/s] 14it [00:01, 9.99it/s] 16it [00:01, 10.01it/s] 18it [00:01, 10.04it/s] 20it [00:02, 10.07it/s] 22it [00:02, 10.08it/s] 24it [00:02, 10.10it/s] 26it [00:02, 10.11it/s] 28it [00:02, 9.86it/s] 29it [00:02, 9.49it/s] 30it [00:03, 9.53it/s] 31it [00:03, 9.52it/s] 32it [00:03, 9.58it/s] 33it [00:03, 9.66it/s] 34it [00:03, 9.68it/s] 35it [00:03, 9.73it/s] 36it [00:03, 9.72it/s] 37it [00:03, 9.78it/s] 38it [00:03, 9.78it/s] 39it [00:04, 9.33it/s] 40it [00:04, 9.41it/s] 41it [00:04, 9.53it/s] 42it [00:04, 9.62it/s] 43it [00:04, 9.70it/s] 44it [00:04, 9.75it/s] 45it [00:04, 9.76it/s] 46it [00:04, 9.62it/s] 47it [00:04, 8.95it/s] 48it [00:04, 9.16it/s] 49it [00:05, 9.35it/s] 50it [00:05, 9.47it/s]2025-05-26 06:08:11,936 - INFO - [Epoch 067 | Batch 0050] IWAE-loss 4197.2188 | mean log_px -0.0214 | KL -3226.38 + 51it [00:05, 9.55it/s] 52it [00:05, 9.63it/s] 53it [00:05, 9.71it/s] 54it [00:05, 9.76it/s] 55it [00:05, 9.67it/s] 56it [00:05, 9.62it/s] 57it [00:05, 9.64it/s] 58it [00:06, 9.68it/s] 59it [00:06, 9.75it/s] 60it [00:06, 9.77it/s] 61it [00:06, 9.82it/s] 62it [00:06, 9.80it/s] 63it [00:06, 9.76it/s] 64it [00:06, 9.77it/s] 65it [00:06, 9.81it/s] 66it [00:06, 9.83it/s] 67it [00:06, 9.84it/s] 68it [00:07, 9.84it/s] 69it [00:07, 9.85it/s] 70it [00:07, 9.84it/s] 71it [00:07, 9.87it/s] 72it [00:07, 9.85it/s] 73it [00:07, 9.86it/s] 74it [00:07, 9.86it/s] 75it [00:07, 9.86it/s] 76it [00:07, 9.85it/s] 77it [00:07, 9.86it/s] 78it [00:08, 9.85it/s] 79it [00:08, 9.86it/s] 80it [00:08, 9.84it/s] 81it [00:08, 9.86it/s] 82it [00:08, 9.84it/s] 83it [00:08, 9.86it/s] 84it [00:08, 9.85it/s] 85it [00:08, 9.86it/s] 86it [00:08, 9.86it/s] 87it [00:08, 9.86it/s] 88it [00:09, 9.85it/s] 89it [00:09, 9.86it/s] 90it [00:09, 9.84it/s] 91it [00:09, 9.86it/s] 92it [00:09, 9.26it/s] 93it [00:09, 9.44it/s] 94it [00:09, 9.56it/s] 95it [00:09, 9.63it/s] 96it [00:09, 9.69it/s] 97it [00:09, 9.75it/s] 98it [00:10, 9.77it/s] 99it [00:10, 9.80it/s] 100it [00:10, 9.81it/s]2025-05-26 06:08:17,045 - INFO - [Epoch 067 | Batch 0100] IWAE-loss 4479.0835 | mean log_px -0.0211 | KL -3224.74 + 101it [00:10, 9.81it/s] 102it [00:10, 9.82it/s] 103it [00:10, 9.83it/s] 104it [00:10, 9.42it/s] 105it [00:10, 9.54it/s] 106it [00:10, 9.23it/s] 107it [00:11, 9.41it/s] 108it [00:11, 9.54it/s] 109it [00:11, 9.65it/s] 110it [00:11, 9.70it/s] 111it [00:11, 9.76it/s] 112it [00:11, 9.77it/s] 113it [00:11, 9.80it/s] 114it [00:11, 9.79it/s] 115it [00:11, 9.82it/s] 116it [00:11, 9.82it/s] 117it [00:12, 9.84it/s] 118it [00:12, 9.84it/s] 119it [00:12, 9.85it/s] 120it [00:12, 9.84it/s] 121it [00:12, 9.86it/s] 122it [00:12, 9.85it/s] 123it [00:12, 9.87it/s] 124it [00:12, 9.85it/s] 125it [00:12, 9.86it/s] 126it [00:12, 9.85it/s] 127it [00:13, 9.85it/s] 128it [00:13, 9.86it/s] 129it [00:13, 9.87it/s] 130it [00:13, 9.81it/s] 131it [00:13, 9.83it/s] 132it [00:13, 9.83it/s] 133it [00:13, 9.86it/s] 134it [00:13, 9.58it/s] 135it [00:13, 9.30it/s] 136it [00:14, 9.44it/s] 137it [00:14, 9.58it/s] 138it [00:14, 9.64it/s] 139it [00:14, 9.72it/s] 140it [00:14, 9.75it/s] 141it [00:14, 9.79it/s] 142it [00:14, 9.81it/s] 143it [00:14, 9.83it/s] 144it [00:14, 9.83it/s] 145it [00:14, 9.84it/s] 146it [00:15, 9.84it/s] 147it [00:15, 9.81it/s] 148it [00:15, 9.81it/s] 149it [00:15, 9.84it/s] 150it [00:15, 9.83it/s]2025-05-26 06:08:22,175 - INFO - [Epoch 067 | Batch 0150] IWAE-loss 4168.6562 | mean log_px -0.0179 | KL -3215.23 + 151it [00:15, 9.83it/s] 152it [00:15, 9.83it/s] 153it [00:15, 9.85it/s] 154it [00:15, 9.84it/s] 155it [00:15, 9.85it/s] 156it [00:16, 9.85it/s] 157it [00:16, 9.87it/s] 158it [00:16, 9.07it/s] 159it [00:16, 9.26it/s] 160it [00:16, 9.43it/s] 161it [00:16, 9.57it/s] 162it [00:16, 9.64it/s] 163it [00:16, 9.72it/s] 164it [00:16, 9.75it/s] 165it [00:16, 9.80it/s] 166it [00:17, 9.82it/s] 167it [00:17, 9.85it/s] 168it [00:17, 9.83it/s] 169it [00:17, 9.85it/s] 170it [00:17, 9.85it/s] 171it [00:17, 9.85it/s] 172it [00:17, 9.85it/s] 173it [00:17, 9.85it/s] 174it [00:17, 9.77it/s] 175it [00:18, 9.80it/s] 176it [00:18, 9.80it/s] 177it [00:18, 9.81it/s] 178it [00:18, 9.81it/s] 179it [00:18, 9.80it/s] 180it [00:18, 9.81it/s] 181it [00:18, 9.83it/s] 182it [00:18, 9.82it/s] 183it [00:18, 9.83it/s] 184it [00:18, 9.83it/s] 185it [00:19, 9.79it/s] 186it [00:19, 9.80it/s] 187it [00:19, 9.83it/s] 188it [00:19, 9.83it/s] 189it [00:19, 9.85it/s] 190it [00:19, 9.84it/s] 191it [00:19, 9.84it/s] 192it [00:19, 9.82it/s] 193it [00:19, 9.83it/s] 194it [00:19, 9.82it/s] 195it [00:20, 9.21it/s] 196it [00:20, 9.69it/s] +2025-05-26 06:08:26,902 - INFO - Epoch: 67, Objective: tensor([4425.1938], device='cuda:0', grad_fn=), Loss: 0.020734276622533798, KL/n: 65.69780731201172 + 0it [00:00, ?it/s]2025-05-26 06:08:27,194 - INFO - [Epoch 068 | Batch 0000] IWAE-loss 4215.6938 | mean log_px -0.0170 | KL -3219.93 + 1it [00:00, 5.15it/s] 2it [00:00, 6.99it/s] 3it [00:00, 7.91it/s] 4it [00:00, 8.50it/s] 5it [00:00, 8.94it/s] 6it [00:00, 9.19it/s] 7it [00:00, 9.25it/s] 8it [00:00, 9.35it/s] 9it [00:01, 9.34it/s] 10it [00:01, 9.37it/s] 11it [00:01, 9.51it/s] 12it [00:01, 9.54it/s] 13it [00:01, 9.43it/s] 14it [00:01, 9.47it/s] 15it [00:01, 9.49it/s] 16it [00:01, 9.46it/s] 17it [00:01, 9.52it/s] 18it [00:01, 9.49it/s] 19it [00:02, 9.50it/s] 20it [00:02, 9.46it/s] 21it [00:02, 9.48it/s] 22it [00:02, 9.47it/s] 23it [00:02, 9.50it/s] 24it [00:02, 9.41it/s] 25it [00:02, 9.47it/s] 26it [00:02, 9.53it/s] 27it [00:02, 9.55it/s] 28it [00:03, 9.52it/s] 29it [00:03, 9.49it/s] 30it [00:03, 9.49it/s] 31it [00:03, 9.47it/s] 32it [00:03, 9.48it/s] 33it [00:03, 9.54it/s] 34it [00:03, 9.56it/s] 35it [00:03, 9.55it/s] 36it [00:03, 9.50it/s] 37it [00:03, 9.50it/s] 38it [00:04, 9.53it/s] 39it [00:04, 9.55it/s] 40it [00:04, 9.47it/s] 41it [00:04, 9.51it/s] 42it [00:04, 9.47it/s] 43it [00:04, 9.49it/s] 44it [00:04, 9.46it/s] 45it [00:04, 9.51it/s] 46it [00:04, 9.51it/s] 47it [00:05, 9.49it/s] 48it [00:05, 9.54it/s] 49it [00:05, 9.52it/s] 50it [00:05, 9.50it/s]2025-05-26 06:08:32,453 - INFO - [Epoch 068 | Batch 0050] IWAE-loss 4135.7124 | mean log_px -0.0192 | KL -3214.93 + 51it [00:05, 9.56it/s] 52it [00:05, 9.56it/s] 53it [00:05, 9.52it/s] 54it [00:05, 9.46it/s] 55it [00:05, 9.46it/s] 56it [00:05, 9.48it/s] 57it [00:06, 8.97it/s] 58it [00:06, 9.15it/s] 59it [00:06, 9.22it/s] 60it [00:06, 9.28it/s] 61it [00:06, 6.16it/s] 62it [00:06, 6.89it/s] 63it [00:06, 7.50it/s] 64it [00:07, 7.89it/s] 65it [00:07, 8.24it/s] 66it [00:07, 8.13it/s] 67it [00:07, 8.52it/s] 68it [00:07, 8.82it/s] 69it [00:07, 9.05it/s] 70it [00:07, 9.14it/s] 71it [00:07, 9.24it/s] 72it [00:07, 9.27it/s] 73it [00:08, 9.31it/s] 74it [00:08, 9.31it/s] 75it [00:08, 9.35it/s] 76it [00:08, 9.02it/s] 77it [00:08, 8.62it/s] 78it [00:08, 8.85it/s] 79it [00:08, 9.02it/s] 80it [00:08, 8.99it/s] 81it [00:08, 9.15it/s] 82it [00:09, 9.20it/s] 83it [00:09, 9.32it/s] 84it [00:09, 9.38it/s] 85it [00:09, 9.43it/s] 86it [00:09, 9.41it/s] 87it [00:09, 9.43it/s] 88it [00:09, 9.50it/s] 89it [00:09, 9.53it/s] 90it [00:09, 9.52it/s] 91it [00:09, 9.53it/s] 92it [00:10, 9.52it/s] 93it [00:10, 9.54it/s] 94it [00:10, 9.53it/s] 95it [00:10, 8.99it/s] 96it [00:10, 9.09it/s] 97it [00:10, 9.01it/s] 98it [00:10, 8.87it/s] 99it [00:10, 9.08it/s] 100it [00:10, 9.20it/s]2025-05-26 06:08:38,042 - INFO - [Epoch 068 | Batch 0100] IWAE-loss 4981.6865 | mean log_px -0.0295 | KL -3210.19 + 101it [00:11, 9.31it/s] 102it [00:11, 9.31it/s] 103it [00:11, 9.37it/s] 104it [00:11, 9.39it/s] 105it [00:11, 9.40it/s] 106it [00:11, 9.41it/s] 107it [00:11, 9.46it/s] 108it [00:11, 9.44it/s] 109it [00:11, 9.45it/s] 110it [00:12, 9.04it/s] 111it [00:12, 9.22it/s] 112it [00:12, 9.26it/s] 113it [00:12, 9.31it/s] 114it [00:12, 9.37it/s] 115it [00:12, 9.39it/s] 116it [00:12, 9.40it/s] 117it [00:12, 9.46it/s] 118it [00:12, 9.44it/s] 119it [00:12, 9.47it/s] 120it [00:13, 9.49it/s] 121it [00:13, 8.96it/s] 122it [00:13, 9.11it/s] 123it [00:13, 9.24it/s] 124it [00:13, 9.30it/s] 125it [00:13, 9.37it/s] 126it [00:13, 9.39it/s] 127it [00:13, 9.44it/s] 128it [00:13, 9.43it/s] 129it [00:14, 9.50it/s] 130it [00:14, 9.48it/s] 131it [00:14, 9.50it/s] 132it [00:14, 9.49it/s] 133it [00:14, 9.53it/s] 134it [00:14, 9.53it/s] 135it [00:14, 9.54it/s] 136it [00:14, 8.93it/s] 137it [00:14, 9.09it/s] 138it [00:15, 9.19it/s] 139it [00:15, 9.32it/s] 140it [00:15, 8.84it/s] 141it [00:15, 9.03it/s] 142it [00:15, 9.12it/s] 143it [00:15, 9.27it/s] 144it [00:15, 8.77it/s] 145it [00:15, 9.02it/s] 146it [00:15, 9.11it/s] 147it [00:15, 9.23it/s] 148it [00:16, 8.78it/s] 149it [00:16, 8.96it/s] 150it [00:16, 9.14it/s]2025-05-26 06:08:43,435 - INFO - [Epoch 068 | Batch 0150] IWAE-loss 3965.0554 | mean log_px -0.0127 | KL -3208.22 + 151it [00:16, 9.25it/s] 152it [00:16, 9.33it/s] 153it [00:16, 9.34it/s] 154it [00:16, 9.41it/s] 155it [00:16, 9.46it/s] 156it [00:16, 9.44it/s] 157it [00:17, 9.48it/s] 158it [00:17, 9.51it/s] 159it [00:17, 8.98it/s] 160it [00:17, 9.14it/s] 161it [00:17, 9.28it/s] 162it [00:17, 9.33it/s] 163it [00:17, 9.38it/s] 164it [00:17, 9.01it/s] 165it [00:17, 9.17it/s] 166it [00:18, 9.27it/s] 167it [00:18, 9.35it/s] 168it [00:18, 9.41it/s] 169it [00:18, 9.04it/s] 170it [00:18, 9.12it/s] 171it [00:18, 9.21it/s] 172it [00:18, 9.27it/s] 173it [00:18, 8.94it/s] 174it [00:18, 9.09it/s] 175it [00:19, 9.23it/s] 176it [00:19, 9.29it/s] 177it [00:19, 9.37it/s] 178it [00:19, 9.39it/s] 179it [00:19, 9.44it/s] 180it [00:19, 9.43it/s] 181it [00:19, 9.47it/s] 182it [00:19, 9.50it/s] 183it [00:19, 9.54it/s] 184it [00:19, 9.49it/s] 185it [00:20, 9.14it/s] 186it [00:20, 9.05it/s] 187it [00:20, 9.17it/s] 188it [00:20, 8.85it/s] 189it [00:20, 9.06it/s] 190it [00:20, 9.19it/s] 191it [00:20, 9.31it/s] 192it [00:20, 9.24it/s] 193it [00:20, 9.31it/s] 194it [00:21, 9.37it/s] 195it [00:21, 8.81it/s] 196it [00:21, 9.00it/s] 196it [00:21, 9.17it/s] +2025-05-26 06:08:48,412 - INFO - Epoch: 68, Objective: tensor([4401.1167], device='cuda:0', grad_fn=), Loss: 0.016813162714242935, KL/n: 65.4537582397461 + 0it [00:00, ?it/s]2025-05-26 06:08:48,690 - INFO - [Epoch 069 | Batch 0000] IWAE-loss 3877.0161 | mean log_px -0.0104 | KL -3203.73 + 1it [00:00, 5.37it/s] 2it [00:00, 7.23it/s] 3it [00:00, 8.13it/s] 4it [00:00, 8.63it/s] 5it [00:00, 8.98it/s] 6it [00:00, 9.18it/s] 7it [00:00, 9.26it/s] 8it [00:00, 9.32it/s] 9it [00:01, 9.42it/s] 10it [00:01, 9.41it/s] 11it [00:01, 9.45it/s] 12it [00:01, 9.45it/s] 13it [00:01, 9.46it/s] 14it [00:01, 9.40it/s] 15it [00:01, 9.39it/s] 16it [00:01, 9.41it/s] 17it [00:01, 9.45it/s] 18it [00:01, 9.46it/s] 19it [00:02, 9.04it/s] 20it [00:02, 9.17it/s] 21it [00:02, 9.31it/s] 22it [00:02, 8.87it/s] 23it [00:02, 9.03it/s] 24it [00:02, 9.15it/s] 25it [00:02, 9.32it/s] 26it [00:02, 9.36it/s] 27it [00:02, 9.40it/s] 28it [00:03, 9.41it/s] 29it [00:03, 9.44it/s] 30it [00:03, 9.46it/s] 31it [00:03, 9.40it/s] 32it [00:03, 9.36it/s] 33it [00:03, 9.40it/s] 34it [00:03, 9.40it/s] 35it [00:03, 9.46it/s] 36it [00:03, 9.47it/s] 37it [00:04, 9.51it/s] 38it [00:04, 9.51it/s] 39it [00:04, 9.50it/s] 40it [00:04, 9.53it/s] 41it [00:04, 9.53it/s] 42it [00:04, 9.52it/s] 43it [00:04, 9.56it/s] 44it [00:04, 9.54it/s] 45it [00:04, 9.55it/s] 46it [00:04, 9.53it/s] 47it [00:05, 9.56it/s] 48it [00:05, 9.54it/s] 49it [00:05, 9.54it/s] 50it [00:05, 9.54it/s]2025-05-26 06:08:53,988 - INFO - [Epoch 069 | Batch 0050] IWAE-loss 3863.5151 | mean log_px -0.0112 | KL -3199.91 + 51it [00:05, 9.49it/s] 52it [00:05, 9.40it/s] 53it [00:05, 9.47it/s] 54it [00:05, 9.50it/s] 55it [00:05, 9.51it/s] 56it [00:06, 9.50it/s] 57it [00:06, 9.45it/s] 58it [00:06, 9.47it/s] 59it [00:06, 9.54it/s] 60it [00:06, 9.51it/s] 61it [00:06, 9.53it/s] 62it [00:06, 9.53it/s] 63it [00:06, 9.54it/s] 64it [00:06, 9.52it/s] 65it [00:06, 9.53it/s] 66it [00:07, 9.51it/s] 67it [00:07, 9.50it/s] 68it [00:07, 9.43it/s] 69it [00:07, 9.43it/s] 70it [00:07, 9.43it/s] 71it [00:07, 9.34it/s] 72it [00:07, 9.39it/s] 73it [00:07, 9.38it/s] 74it [00:07, 9.41it/s] 75it [00:08, 9.45it/s] 76it [00:08, 9.41it/s] 77it [00:08, 9.41it/s] 78it [00:08, 9.41it/s] 79it [00:08, 9.48it/s] 80it [00:08, 8.95it/s] 81it [00:08, 9.08it/s] 82it [00:08, 9.19it/s] 83it [00:08, 9.27it/s] 84it [00:08, 9.33it/s] 85it [00:09, 9.41it/s] 86it [00:09, 9.43it/s] 87it [00:09, 9.42it/s] 88it [00:09, 9.43it/s] 89it [00:09, 9.47it/s] 90it [00:09, 9.49it/s] 91it [00:09, 9.53it/s] 92it [00:09, 9.54it/s] 93it [00:09, 9.57it/s] 94it [00:10, 9.58it/s] 95it [00:10, 9.47it/s] 96it [00:10, 9.52it/s] 97it [00:10, 9.52it/s] 98it [00:10, 9.49it/s] 99it [00:10, 9.47it/s] 100it [00:10, 9.49it/s]2025-05-26 06:08:59,286 - INFO - [Epoch 069 | Batch 0100] IWAE-loss 3742.5066 | mean log_px -0.0079 | KL -3197.15 + 101it [00:10, 9.53it/s] 102it [00:10, 9.51it/s] 103it [00:10, 9.51it/s] 104it [00:11, 9.49it/s] 105it [00:11, 9.51it/s] 106it [00:11, 9.56it/s] 107it [00:11, 9.58it/s] 108it [00:11, 9.56it/s] 109it [00:11, 9.55it/s] 110it [00:11, 9.53it/s] 111it [00:11, 9.53it/s] 112it [00:11, 9.48it/s] 113it [00:12, 9.51it/s] 114it [00:12, 9.50it/s] 115it [00:12, 9.57it/s] 116it [00:12, 9.55it/s] 117it [00:12, 9.58it/s] 118it [00:12, 9.58it/s] 119it [00:12, 9.55it/s] 120it [00:12, 9.52it/s] 121it [00:12, 9.59it/s] 122it [00:12, 9.40it/s] 123it [00:13, 9.13it/s] 124it [00:13, 9.20it/s] 125it [00:13, 9.32it/s] 126it [00:13, 9.41it/s] 127it [00:13, 9.46it/s] 128it [00:13, 9.46it/s] 129it [00:13, 9.47it/s] 130it [00:13, 9.47it/s] 131it [00:13, 9.48it/s] 132it [00:14, 9.46it/s] 133it [00:14, 9.49it/s] 134it [00:14, 9.46it/s] 135it [00:14, 9.46it/s] 136it [00:14, 9.46it/s] 137it [00:14, 9.52it/s] 138it [00:14, 9.52it/s] 139it [00:14, 9.52it/s] 140it [00:14, 9.51it/s] 141it [00:14, 9.57it/s] 142it [00:15, 9.49it/s] 143it [00:15, 9.51it/s] 144it [00:15, 9.47it/s] 145it [00:15, 9.44it/s] 146it [00:15, 9.45it/s] 147it [00:15, 9.48it/s] 148it [00:15, 9.48it/s] 149it [00:15, 9.49it/s] 150it [00:15, 9.49it/s]2025-05-26 06:09:04,557 - INFO - [Epoch 069 | Batch 0150] IWAE-loss 4124.4932 | mean log_px -0.0141 | KL -3199.10 + 151it [00:16, 9.49it/s] 152it [00:16, 9.49it/s] 153it [00:16, 9.57it/s] 154it [00:16, 9.59it/s] 155it [00:16, 9.06it/s] 156it [00:16, 9.21it/s] 157it [00:16, 9.31it/s] 158it [00:16, 9.36it/s] 159it [00:16, 9.38it/s] 160it [00:17, 9.27it/s] 161it [00:17, 9.14it/s] 162it [00:17, 9.26it/s] 163it [00:17, 9.38it/s] 164it [00:17, 9.44it/s] 165it [00:17, 9.48it/s] 166it [00:17, 9.51it/s] 167it [00:17, 9.56it/s] 168it [00:17, 9.59it/s] 169it [00:17, 9.61it/s] 170it [00:18, 9.59it/s] 171it [00:18, 9.57it/s] 172it [00:18, 9.59it/s] 173it [00:18, 9.57it/s] 174it [00:18, 9.47it/s] 175it [00:18, 9.53it/s] 176it [00:18, 9.52it/s] 177it [00:18, 9.54it/s] 178it [00:18, 9.48it/s] 179it [00:19, 9.49it/s] 180it [00:19, 9.49it/s] 181it [00:19, 9.48it/s] 182it [00:19, 9.43it/s] 183it [00:19, 9.50it/s] 184it [00:19, 9.47it/s] 185it [00:19, 9.50it/s] 186it [00:19, 9.49it/s] 187it [00:19, 9.53it/s] 188it [00:19, 9.51it/s] 189it [00:20, 9.53it/s] 190it [00:20, 9.55it/s] 191it [00:20, 9.51it/s] 192it [00:20, 9.52it/s] 193it [00:20, 9.54it/s] 194it [00:20, 8.94it/s] 195it [00:20, 8.53it/s] 196it [00:20, 8.81it/s] 196it [00:20, 9.37it/s] +2025-05-26 06:09:09,457 - INFO - Epoch: 69, Objective: tensor([5429.6377], device='cuda:0', grad_fn=), Loss: 0.039554789662361145, KL/n: 65.18160247802734 +2025-05-26 06:09:09,462 - INFO - Select objective: bbb + 0it [00:00, ?it/s] 2it [00:00, 16.00it/s] 5it [00:00, 22.55it/s] 9it [00:00, 26.29it/s] 12it [00:00, 27.31it/s] 15it [00:00, 27.94it/s] 18it [00:00, 28.43it/s] 21it [00:00, 28.72it/s] 24it [00:00, 29.05it/s] 27it [00:00, 29.16it/s] 30it [00:01, 29.24it/s] 33it [00:01, 28.92it/s] 36it [00:01, 29.19it/s] 39it [00:01, 29.39it/s] 43it [00:01, 29.75it/s] 47it [00:01, 29.85it/s] 51it [00:01, 30.03it/s] 55it [00:01, 30.06it/s] 59it [00:02, 30.03it/s] 63it [00:02, 30.08it/s] 67it [00:02, 30.06it/s] 71it [00:02, 30.13it/s] 75it [00:02, 30.11it/s] 79it [00:02, 30.11it/s] 83it [00:02, 30.08it/s] 87it [00:02, 30.09it/s] 91it [00:03, 30.10it/s] 95it [00:03, 30.17it/s] 99it [00:03, 30.17it/s] 103it [00:03, 30.18it/s] 107it [00:03, 30.20it/s] 111it [00:03, 30.23it/s] 115it [00:03, 30.12it/s] 119it [00:04, 30.00it/s] 123it [00:04, 30.08it/s] 127it [00:04, 30.13it/s] 131it [00:04, 30.07it/s] 135it [00:04, 30.12it/s] 139it [00:04, 30.13it/s] 143it [00:04, 30.17it/s] 147it [00:04, 30.10it/s] 151it [00:05, 30.09it/s] 155it [00:05, 30.11it/s] 159it [00:05, 30.19it/s] 163it [00:05, 30.16it/s] 167it [00:05, 30.19it/s] 171it [00:05, 30.15it/s] 175it [00:05, 30.19it/s] 179it [00:06, 30.12it/s] 183it [00:06, 30.15it/s] 187it [00:06, 30.19it/s] 191it [00:06, 30.17it/s] 195it [00:06, 30.11it/s] 199it [00:06, 30.11it/s] 203it [00:06, 30.19it/s] 207it [00:06, 30.20it/s] 211it [00:07, 30.15it/s] 215it [00:07, 30.23it/s] 219it [00:07, 30.23it/s] 223it [00:07, 30.21it/s] 227it [00:07, 30.23it/s] 231it [00:07, 30.24it/s] 235it [00:07, 30.20it/s] 239it [00:08, 30.22it/s] 243it [00:08, 30.18it/s] 247it [00:08, 30.16it/s] 251it [00:08, 30.16it/s] 255it [00:08, 30.16it/s] 259it [00:08, 30.20it/s] 263it [00:08, 30.22it/s] 267it [00:08, 30.22it/s] 271it [00:09, 30.22it/s] 275it [00:09, 30.20it/s] 279it [00:09, 27.84it/s] 280it [00:09, 29.61it/s] +2025-05-26 06:09:19,259 - INFO - Epoch: 0, Objective: 0.033187031745910645, Loss: 0.030574092641472816, KL/n: 0.0026129374746233225 + 0%| | 0/84 [00:00 Date: Mon, 26 May 2025 20:42:20 +0200 Subject: [PATCH 12/14] addig kl penalty --- core/objective/IWAEObjective.py | 8 +++----- 1 file changed, 3 insertions(+), 5 deletions(-) diff --git a/core/objective/IWAEObjective.py b/core/objective/IWAEObjective.py index 7274302..7954e20 100644 --- a/core/objective/IWAEObjective.py +++ b/core/objective/IWAEObjective.py @@ -14,6 +14,7 @@ def __init__(self, kl_penalty: float, n: int, temperature: float = 1.0) -> None: self.kl_penalty = kl_penalty # usually 1 / |D| self.temperature = temperature self.k = n + logging.debug(f"KL penalty {self.kl_penalty}") logging.debug(f"IWAE temperature {self.temperature}") logging.debug(f"IWAE k {self.k}") @@ -65,9 +66,6 @@ def calculate( scale = dataset_size / batch_size # N / |B| log_ws = [] # list[k] of scalars - temp = self.temperature - beta = 0.001 - for l in range(self.k): # sample w and compute log p(x|w) logits = bounded_call(model, data, pmin) if pmin is not None else model(data) @@ -80,8 +78,8 @@ def calculate( log_lik = scale * log_px.sum() # scalar # global KL part - kl = beta * (self._log_prior(model) - self._log_post(model)) - log_w = log_lik + temp * kl # scalar + kl = self.kl_penalty * (self._log_prior(model) - self._log_post(model)) + log_w = log_lik + kl # scalar log_ws.append(log_w) # -------------------- per-sample logging -------------------- From 083480c3d77da30e1458e84f43a8680b4aa8b091 Mon Sep 17 00:00:00 2001 From: yauhenii Date: Mon, 26 May 2025 23:01:48 +0200 Subject: [PATCH 13/14] add experiments --- ...c_conv15_sigma_0.01_kl_0.0001_lr_0.01.yaml | 63 +++++++++++++++++++ ...onv15_sigma_0.001_kl_0.0001_lr_0.0001.yaml | 62 ++++++++++++++++++ ...nv15_sigma_0.005_kl_0.00005_lr_0.0001.yaml | 62 ++++++++++++++++++ ...onv15_sigma_0.005_kl_0.0001_lr_0.0001.yaml | 62 ++++++++++++++++++ ...conv15_sigma_0.005_kl_0.001_lr_0.0001.yaml | 62 ++++++++++++++++++ ...conv15_sigma_0.01_kl_0.0001_lr_0.0001.yaml | 62 ++++++++++++++++++ 6 files changed, 373 insertions(+) create mode 100644 config/iwae-cifar-penalty/fclassic_conv15_sigma_0.01_kl_0.0001_lr_0.01.yaml create mode 100644 config/iwae-cifar-penalty/iwae_conv15_sigma_0.001_kl_0.0001_lr_0.0001.yaml create mode 100644 config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.00005_lr_0.0001.yaml create mode 100644 config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001.yaml create mode 100644 config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.001_lr_0.0001.yaml create mode 100644 config/iwae-cifar-penalty/iwae_conv15_sigma_0.01_kl_0.0001_lr_0.0001.yaml diff --git a/config/iwae-cifar-penalty/fclassic_conv15_sigma_0.01_kl_0.0001_lr_0.01.yaml b/config/iwae-cifar-penalty/fclassic_conv15_sigma_0.01_kl_0.0001_lr_0.01.yaml new file mode 100644 index 0000000..0edc39c --- /dev/null +++ b/config/iwae-cifar-penalty/fclassic_conv15_sigma_0.01_kl_0.0001_lr_0.01.yaml @@ -0,0 +1,63 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: fclassic + params: + delta: 0.025 + kl_penalty: 1.0 + prior_objective: + name: fclassic + params: + delta: 0.025 + kl_penalty: 0.0001 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.01 + momentum: 0.95 + seed: 1135 +sigma: 0.01 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 diff --git a/config/iwae-cifar-penalty/iwae_conv15_sigma_0.001_kl_0.0001_lr_0.0001.yaml b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.001_kl_0.0001_lr_0.0001.yaml new file mode 100644 index 0000000..9f6e49f --- /dev/null +++ b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.001_kl_0.0001_lr_0.0001.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.0001 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.001 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 diff --git a/config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.00005_lr_0.0001.yaml b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.00005_lr_0.0001.yaml new file mode 100644 index 0000000..bd001be --- /dev/null +++ b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.00005_lr_0.0001.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.00005 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 diff --git a/config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001.yaml b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001.yaml new file mode 100644 index 0000000..a76e7f3 --- /dev/null +++ b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.0001 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 diff --git a/config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.001_lr_0.0001.yaml b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.001_lr_0.0001.yaml new file mode 100644 index 0000000..72e6961 --- /dev/null +++ b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.005_kl_0.001_lr_0.0001.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.001 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 diff --git a/config/iwae-cifar-penalty/iwae_conv15_sigma_0.01_kl_0.0001_lr_0.0001.yaml b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.01_kl_0.0001_lr_0.0001.yaml new file mode 100644 index 0000000..69b504f --- /dev/null +++ b/config/iwae-cifar-penalty/iwae_conv15_sigma_0.01_kl_0.0001_lr_0.0001.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.0001 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.01 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 From ed099bf213b920e8369fb9c72281b1afcdef7635 Mon Sep 17 00:00:00 2001 From: Misipuk Date: Tue, 27 May 2025 23:36:47 +0200 Subject: [PATCH 14/14] added-configs --- ...ma_0.005_kl_0.0001_lr_0.0001_post_bbb.yaml | 62 +++++++++++++++++++ ...a_0.005_kl_0.0001_lr_0.0001_post_iwae.yaml | 62 +++++++++++++++++++ .../iwae_mnist_cifar_v2/test_conv_100_3.yaml | 62 +++++++++++++++++++ 3 files changed, 186 insertions(+) create mode 100644 config/iwae_mnist_cifar_v2/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001_post_bbb.yaml create mode 100644 config/iwae_mnist_cifar_v2/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001_post_iwae.yaml create mode 100644 config/iwae_mnist_cifar_v2/test_conv_100_3.yaml diff --git a/config/iwae_mnist_cifar_v2/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001_post_bbb.yaml b/config/iwae_mnist_cifar_v2/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001_post_bbb.yaml new file mode 100644 index 0000000..ab12f58 --- /dev/null +++ b/config/iwae_mnist_cifar_v2/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001_post_bbb.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.0001 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 diff --git a/config/iwae_mnist_cifar_v2/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001_post_iwae.yaml b/config/iwae_mnist_cifar_v2/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001_post_iwae.yaml new file mode 100644 index 0000000..b019569 --- /dev/null +++ b/config/iwae_mnist_cifar_v2/iwae_conv15_sigma_0.005_kl_0.0001_lr_0.0001_post_iwae.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: cifar10 + params: + dataset_path: ./data/cifar10 + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv15 + params: + dataset: cifar10 + in_channels: 3 + posterior_objective: + name: iwae + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.0001 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 1 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 diff --git a/config/iwae_mnist_cifar_v2/test_conv_100_3.yaml b/config/iwae_mnist_cifar_v2/test_conv_100_3.yaml new file mode 100644 index 0000000..54137a6 --- /dev/null +++ b/config/iwae_mnist_cifar_v2/test_conv_100_3.yaml @@ -0,0 +1,62 @@ +bound: + delta: 0.025 + delta_test: 0.01 +dist_init: + seed: 110 +factory: + bounds: + - kl + - mcallester + data_loader: + name: mnist + params: + dataset_path: ./data/mnist + losses: + - nll_loss + - scaled_nll_loss + - 01_loss + metrics: + - accuracy_micro_metric + - accuracy_macro_metric + - f1_micro_metric + - f1_macro_metric + model: + name: conv + params: + dataset: mnist + in_channels: 1 + posterior_objective: + name: bbb + params: + kl_penalty: 1.0 + prior_objective: + name: iwae + params: + n: 10 + kl_penalty: 0.001 +log_wandb: true +mcsamples: 1000 +pmin: 5.0e-05 +posterior: + training: + epochs: 3 + lr: 0.0001 + momentum: 0.9 + seed: 1135 +prior: + training: + epochs: 100 + lr: 0.0001 + momentum: 0.95 + seed: 1135 +sigma: 0.005 +split_config: + batch_size: 250 + dataset_loader_seed: 112 + seed: 111 +split_strategy: + prior_percent: 0.7 + prior_type: learnt + self_certified: true + train_percent: 1.0 + val_percent: 0.0 \ No newline at end of file