diff --git "a/flowsdvae_500kx512_lgn0p0/log.txt" "b/flowsdvae_500kx512_lgn0p0/log.txt" new file mode 100644--- /dev/null +++ "b/flowsdvae_500kx512_lgn0p0/log.txt" @@ -0,0 +1,5283 @@ +[2025-02-27 15:05:22] Model: DistributedDataParallel( + (module): FlowAE( + (flow): FlowDecoder( + (conv_in): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (mid): Module( + (block_1): ResnetBlock( + (norm1): RMSNorm() + (conv1): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (temb_proj): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1)) + (norm2): RMSNorm() + (dropout): Dropout(p=0.0, inplace=False) + (conv2): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (attn_1): AttnBlock( + (norm): RMSNorm() + (q): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1)) + (k): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1)) + (v): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1)) + (proj_out): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1)) + ) + (block_2): ResnetBlock( + (norm1): RMSNorm() + (conv1): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (temb_proj): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1)) + (norm2): RMSNorm() + (dropout): Dropout(p=0.0, inplace=False) + (conv2): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + ) + (up): ModuleList( + (0): Module( + (block): ModuleList( + (0): ResnetBlock( + (norm1): RMSNorm() + (conv1): Conv2d(256, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (temb_proj): Conv2d(512, 128, kernel_size=(1, 1), stride=(1, 1)) + (norm2): RMSNorm() + (dropout): Dropout(p=0.0, inplace=False) + (conv2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (nin_shortcut): Conv2d(256, 128, kernel_size=(1, 1), stride=(1, 1)) + ) + (1-2): 2 x ResnetBlock( + (norm1): RMSNorm() + (conv1): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (temb_proj): Conv2d(512, 128, kernel_size=(1, 1), stride=(1, 1)) + (norm2): RMSNorm() + (dropout): Dropout(p=0.0, inplace=False) + (conv2): Conv2d(128, 128, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + ) + (attn): ModuleList() + ) + (1): Module( + (block): ModuleList( + (0): ResnetBlock( + (norm1): RMSNorm() + (conv1): Conv2d(512, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (temb_proj): Conv2d(512, 256, kernel_size=(1, 1), stride=(1, 1)) + (norm2): RMSNorm() + (dropout): Dropout(p=0.0, inplace=False) + (conv2): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (nin_shortcut): Conv2d(512, 256, kernel_size=(1, 1), stride=(1, 1)) + ) + (1-2): 2 x ResnetBlock( + (norm1): RMSNorm() + (conv1): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (temb_proj): Conv2d(512, 256, kernel_size=(1, 1), stride=(1, 1)) + (norm2): RMSNorm() + (dropout): Dropout(p=0.0, inplace=False) + (conv2): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + ) + (attn): ModuleList() + (upsample): Upsample( + (conv): Conv2d(256, 256, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + ) + (2-3): 2 x Module( + (block): ModuleList( + (0-2): 3 x ResnetBlock( + (norm1): RMSNorm() + (conv1): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + (temb_proj): Conv2d(512, 512, kernel_size=(1, 1), stride=(1, 1)) + (norm2): RMSNorm() + (dropout): Dropout(p=0.0, inplace=False) + (conv2): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + ) + (attn): ModuleList() + (upsample): Upsample( + (conv): Conv2d(512, 512, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + ) + ) + (norm_out): RMSNorm() + (conv_out): Conv2d(128, 3, kernel_size=(3, 3), stride=(1, 1), padding=(1, 1)) + ) + (t_embedder): TimestepEmbedder( + (mlp): Sequential( + (0): Linear(in_features=256, out_features=512, bias=True) + (1): SiLU() + (2): Linear(in_features=512, out_features=512, bias=True) + ) + ) + (y_embedder): Conv2d(4, 512, kernel_size=(1, 1), stride=(1, 1)) + (x_embedder): PatchEmbed( + (proj): Conv2d(3, 512, kernel_size=(8, 8), stride=(8, 8)) + (norm): Identity() + ) + ) +) +[2025-02-27 15:05:22] FlowVAE Parameters: 55.53M +[2025-02-27 15:05:22] FlowVAE Trainable Parameters: 55.01M +[2025-02-27 15:05:22] Optimizer: AdamW, lr=0.0002, beta2=0.95 +[2025-02-27 15:05:22] module.pos_embed.requires_grad : False +[2025-02-27 15:05:22] module.flow.conv_in.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.conv_in.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_1.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_1.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_1.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_1.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_1.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_1.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_1.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_1.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.attn_1.norm.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.attn_1.q.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.attn_1.q.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.attn_1.k.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.attn_1.k.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.attn_1.v.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.attn_1.v.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.attn_1.proj_out.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.attn_1.proj_out.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_2.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_2.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_2.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_2.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_2.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_2.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_2.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.mid.block_2.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.nin_shortcut.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.0.nin_shortcut.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.1.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.1.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.1.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.1.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.1.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.1.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.1.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.1.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.2.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.2.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.2.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.2.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.2.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.2.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.2.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.0.block.2.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.nin_shortcut.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.0.nin_shortcut.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.1.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.1.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.1.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.1.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.1.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.1.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.1.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.1.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.2.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.2.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.2.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.2.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.2.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.2.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.2.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.block.2.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.upsample.conv.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.1.upsample.conv.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.0.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.0.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.0.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.0.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.0.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.0.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.0.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.0.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.1.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.1.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.1.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.1.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.1.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.1.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.1.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.1.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.2.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.2.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.2.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.2.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.2.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.2.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.2.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.block.2.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.upsample.conv.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.2.upsample.conv.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.0.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.0.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.0.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.0.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.0.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.0.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.0.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.0.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.1.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.1.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.1.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.1.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.1.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.1.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.1.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.1.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.2.norm1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.2.conv1.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.2.conv1.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.2.temb_proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.2.temb_proj.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.2.norm2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.2.conv2.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.block.2.conv2.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.upsample.conv.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.up.3.upsample.conv.bias.requires_grad : True +[2025-02-27 15:05:22] module.flow.norm_out.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.conv_out.weight.requires_grad : True +[2025-02-27 15:05:22] module.flow.conv_out.bias.requires_grad : True +[2025-02-27 15:05:22] module.t_embedder.mlp.0.weight.requires_grad : True +[2025-02-27 15:05:22] module.t_embedder.mlp.0.bias.requires_grad : True +[2025-02-27 15:05:22] module.t_embedder.mlp.2.weight.requires_grad : True +[2025-02-27 15:05:22] module.t_embedder.mlp.2.bias.requires_grad : True +[2025-02-27 15:05:22] module.y_embedder.weight.requires_grad : True +[2025-02-27 15:05:22] module.y_embedder.bias.requires_grad : True +[2025-02-27 15:05:22] module.x_embedder.proj.weight.requires_grad : True +[2025-02-27 15:05:22] module.x_embedder.proj.bias.requires_grad : True +[2025-02-27 15:05:23] Dataset contains 1,281,168 images /data/checkpoints/LanguageBind/offline_feature/offline_sdvae_256_path/imagenet_train_256 +[2025-02-27 15:05:23] Batch size 32 per gpu, with 512 global batch size +[2025-02-27 15:05:23] Train config: {'ckpt_path': '/data/logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0500000.pt', 'data': {'raw_data_dir': '/data/OpenDataLab___ImageNet-1K/raw/ImageNet-1K/train', 'raw_val_data_dir': '/data/OpenDataLab___ImageNet-1K/raw/ImageNet-1K/val', 'data_path': '/data/checkpoints/LanguageBind/offline_feature/offline_sdvae_256_path/imagenet_train_256', 'fid_reference_file': '/data/checkpoints/VIRTUAL_imagenet256_labeled.npz', 'image_size': 256, 'num_classes': 1000, 'num_workers': 32, 'latent_norm': False, 'latent_multiplier': 0.18215}, 'vae': {'vae_type': 'FlowSDVAE', 'model_path': '/data/checkpoints/stabilityai/sd-vae-ft-ema/vae-ft-ema-560000-ema-pruned.safetensors', 'downsample_ratio': 8, 'multi_latent': False, 'add_y_to_x': False, 'norm_type': 'rmsnorm'}, 'model': {'model_type': 'DiT-S/2', 'use_qknorm': True, 'use_swiglu': True, 'use_rope': True, 'use_rmsnorm': True, 'in_chans': 4, 'use_checkpoint': False}, 'train': {'max_steps': 500000, 'global_batch_size': 512, 'global_seed': 0, 'output_dir': '../logs/flow/flowsdvae_500kx512_lgn0p0', 'ckpt': None, 'log_every': 100, 'ckpt_every': 50000, 'eval_every': 50000, 'wandb': True, 'seed': 1234, 'precision': 'bf16', 'resume': False}, 'optimizer': {'lr': 0.0002, 'beta2': 0.95}, 'wandb': {'proj_name': 'flow', 'log_name': 'flowsdvae_500kx512_lgn0p0', 'key': '953e958793b218efb850fa194e85843e2c3bd88b'}, 'scheduler': {'diffusion': False, 'transport': True}, 'diffusion': {'learn_sigma': True, 'diffusion_steps': 1000}, 'transport': {'path_type': 'Linear', 'prediction': 'velocity', 'loss_weight': None, 'sample_eps': None, 'train_eps': None, 'use_cosine_loss': True, 'use_lognorm': True}, 'sample': {'mode': 'ODE', 'sampling_method': 'euler', 'atol': 1e-06, 'rtol': 0.001, 'reverse': False, 'likelihood': False, 'num_sampling_steps': 250, 'cfg_scale': 1.0, 'per_proc_batch_size': 64, 'fid_num': 50000, 'cfg_interval_start': 0.0, 'timestep_shift': 0.0}, 'flowvae_transport': {'path_type': 'Linear', 'prediction': 'velocity', 'loss_weight': None, 'sample_eps': None, 'train_eps': None, 'use_cosine_loss': False, 'use_lognorm': True, 'l2_loss': True, 'shift_lg': True, 'shifted_mu': 0.0, 'timestep_sampling': 'lognorm', 'beta_alpha': None, 'beta_beta': None, 'pareto_alpha': None}, 'flowvae_sample': {'mode': 'ODE', 'sampling_method': 'euler', 'atol': 1e-06, 'rtol': 0.001, 'reverse': False, 'likelihood': False, 'num_sampling_steps': 3, 'cfg_scale': 1.0, 'per_proc_batch_size': 64, 'fid_num': 50000, 'cfg_interval_start': 0.0, 'timestep_shift': 0.0}} +[2025-02-27 15:07:22] (step=0000100) Train Loss: 1.1212, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.84, Grad Norm: 2.0826 +[2025-02-27 15:08:22] (step=0000200) Train Loss: 1.0388, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4600 +[2025-02-27 15:09:22] (step=0000300) Train Loss: 1.0265, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4504 +[2025-02-27 15:10:22] (step=0000400) Train Loss: 1.0087, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4444 +[2025-02-27 15:11:21] (step=0000500) Train Loss: 0.9530, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5989 +[2025-02-27 15:12:21] (step=0000600) Train Loss: 0.8187, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.9897 +[2025-02-27 15:13:21] (step=0000700) Train Loss: 0.6821, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.1270 +[2025-02-27 15:14:20] (step=0000800) Train Loss: 0.5541, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.4289 +[2025-02-27 15:15:20] (step=0000900) Train Loss: 0.4774, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.4954 +[2025-02-27 15:16:20] (step=0001000) Train Loss: 0.4061, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.4940 +[2025-02-27 15:17:20] (step=0001100) Train Loss: 0.3388, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.4667 +[2025-02-27 15:18:19] (step=0001200) Train Loss: 0.2952, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.5525 +[2025-02-27 15:19:19] (step=0001300) Train Loss: 0.2767, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.5831 +[2025-02-27 15:20:19] (step=0001400) Train Loss: 0.2579, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.4519 +[2025-02-27 15:21:19] (step=0001500) Train Loss: 0.2471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.4311 +[2025-02-27 15:22:18] (step=0001600) Train Loss: 0.2390, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.4136 +[2025-02-27 15:23:18] (step=0001700) Train Loss: 0.2325, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.3169 +[2025-02-27 15:24:18] (step=0001800) Train Loss: 0.2270, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.3440 +[2025-02-27 15:25:17] (step=0001900) Train Loss: 0.2213, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.3021 +[2025-02-27 15:26:17] (step=0002000) Train Loss: 0.2150, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.2622 +[2025-02-27 15:27:17] (step=0002100) Train Loss: 0.2114, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.2489 +[2025-02-27 15:28:16] (step=0002200) Train Loss: 0.2079, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.2193 +[2025-02-27 15:29:16] (step=0002300) Train Loss: 0.2071, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.2339 +[2025-02-27 15:30:15] (step=0002400) Train Loss: 0.2002, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.1762 +[2025-02-27 15:31:15] (step=0002500) Train Loss: 0.1982, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.0878 +[2025-02-27 15:32:18] (step=0002600) Train Loss: 0.1947, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 1.1842 +[2025-02-27 15:33:18] (step=0002700) Train Loss: 0.1898, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 1.0616 +[2025-02-27 15:34:17] (step=0002800) Train Loss: 0.1869, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.0956 +[2025-02-27 15:35:17] (step=0002900) Train Loss: 0.1858, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.1287 +[2025-02-27 15:36:17] (step=0003000) Train Loss: 0.1829, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.0132 +[2025-02-27 15:37:16] (step=0003100) Train Loss: 0.1793, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.0156 +[2025-02-27 15:38:16] (step=0003200) Train Loss: 0.1847, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.2264 +[2025-02-27 15:39:16] (step=0003300) Train Loss: 0.1752, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.0344 +[2025-02-27 15:40:15] (step=0003400) Train Loss: 0.1744, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.1092 +[2025-02-27 15:41:15] (step=0003500) Train Loss: 0.1700, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.9700 +[2025-02-27 15:42:15] (step=0003600) Train Loss: 0.1674, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.9942 +[2025-02-27 15:43:14] (step=0003700) Train Loss: 0.1676, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.0268 +[2025-02-27 15:44:14] (step=0003800) Train Loss: 0.1628, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.9702 +[2025-02-27 15:45:14] (step=0003900) Train Loss: 0.1635, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.9962 +[2025-02-27 15:46:13] (step=0004000) Train Loss: 0.1581, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.9767 +[2025-02-27 15:47:13] (step=0004100) Train Loss: 0.1551, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.9627 +[2025-02-27 15:48:13] (step=0004200) Train Loss: 0.1514, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 1.0111 +[2025-02-27 15:49:12] (step=0004300) Train Loss: 0.1447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.9703 +[2025-02-27 15:50:12] (step=0004400) Train Loss: 0.1398, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.9206 +[2025-02-27 15:51:11] (step=0004500) Train Loss: 0.1352, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.9665 +[2025-02-27 15:52:11] (step=0004600) Train Loss: 0.1273, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.8766 +[2025-02-27 15:53:11] (step=0004700) Train Loss: 0.1190, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.8519 +[2025-02-27 15:54:10] (step=0004800) Train Loss: 0.1145, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.8185 +[2025-02-27 15:55:10] (step=0004900) Train Loss: 0.1114, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.8587 +[2025-02-27 15:56:10] (step=0005000) Train Loss: 0.1072, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.7651 +[2025-02-27 15:57:12] (step=0005100) Train Loss: 0.1064, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.7843 +[2025-02-27 15:58:12] (step=0005200) Train Loss: 0.1035, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.7652 +[2025-02-27 15:59:12] (step=0005300) Train Loss: 0.1019, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.7317 +[2025-02-27 16:00:11] (step=0005400) Train Loss: 0.1027, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.8714 +[2025-02-27 16:01:11] (step=0005500) Train Loss: 0.1003, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.7202 +[2025-02-27 16:02:11] (step=0005600) Train Loss: 0.0982, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.7311 +[2025-02-27 16:03:11] (step=0005700) Train Loss: 0.0973, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.7241 +[2025-02-27 16:04:10] (step=0005800) Train Loss: 0.0952, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6965 +[2025-02-27 16:05:10] (step=0005900) Train Loss: 0.0922, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6845 +[2025-02-27 16:06:10] (step=0006000) Train Loss: 0.0865, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6991 +[2025-02-27 16:07:10] (step=0006100) Train Loss: 0.0812, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6774 +[2025-02-27 16:08:09] (step=0006200) Train Loss: 0.0782, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6871 +[2025-02-27 16:09:09] (step=0006300) Train Loss: 0.0764, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6567 +[2025-02-27 16:10:09] (step=0006400) Train Loss: 0.0753, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6684 +[2025-02-27 16:11:09] (step=0006500) Train Loss: 0.0743, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6619 +[2025-02-27 16:12:08] (step=0006600) Train Loss: 0.0733, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6451 +[2025-02-27 16:13:08] (step=0006700) Train Loss: 0.0728, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6859 +[2025-02-27 16:14:08] (step=0006800) Train Loss: 0.0715, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6174 +[2025-02-27 16:15:08] (step=0006900) Train Loss: 0.0710, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6242 +[2025-02-27 16:16:07] (step=0007000) Train Loss: 0.0700, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6231 +[2025-02-27 16:17:07] (step=0007100) Train Loss: 0.0699, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6220 +[2025-02-27 16:18:07] (step=0007200) Train Loss: 0.0691, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6168 +[2025-02-27 16:19:07] (step=0007300) Train Loss: 0.0681, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6053 +[2025-02-27 16:20:06] (step=0007400) Train Loss: 0.0679, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6030 +[2025-02-27 16:21:06] (step=0007500) Train Loss: 0.0678, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.6266 +[2025-02-27 16:22:08] (step=0007600) Train Loss: 0.0669, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.6086 +[2025-02-27 16:23:08] (step=0007700) Train Loss: 0.0665, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5972 +[2025-02-27 16:24:08] (step=0007800) Train Loss: 0.0656, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5678 +[2025-02-27 16:25:08] (step=0007900) Train Loss: 0.0659, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5897 +[2025-02-27 16:26:07] (step=0008000) Train Loss: 0.0651, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5843 +[2025-02-27 16:27:07] (step=0008100) Train Loss: 0.0644, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5903 +[2025-02-27 16:28:07] (step=0008200) Train Loss: 0.0640, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5606 +[2025-02-27 16:29:07] (step=0008300) Train Loss: 0.0633, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5848 +[2025-02-27 16:30:06] (step=0008400) Train Loss: 0.0634, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5598 +[2025-02-27 16:31:06] (step=0008500) Train Loss: 0.0629, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5481 +[2025-02-27 16:32:06] (step=0008600) Train Loss: 0.0633, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5639 +[2025-02-27 16:33:05] (step=0008700) Train Loss: 0.0631, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5737 +[2025-02-27 16:34:05] (step=0008800) Train Loss: 0.0630, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5677 +[2025-02-27 16:35:05] (step=0008900) Train Loss: 0.0620, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5514 +[2025-02-27 16:36:04] (step=0009000) Train Loss: 0.0620, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5481 +[2025-02-27 16:37:04] (step=0009100) Train Loss: 0.0620, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5589 +[2025-02-27 16:38:04] (step=0009200) Train Loss: 0.0616, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5607 +[2025-02-27 16:39:03] (step=0009300) Train Loss: 0.0610, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5466 +[2025-02-27 16:40:03] (step=0009400) Train Loss: 0.0610, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5451 +[2025-02-27 16:41:03] (step=0009500) Train Loss: 0.0605, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5734 +[2025-02-27 16:42:02] (step=0009600) Train Loss: 0.0606, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5367 +[2025-02-27 16:43:02] (step=0009700) Train Loss: 0.0602, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5348 +[2025-02-27 16:44:02] (step=0009800) Train Loss: 0.0603, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5445 +[2025-02-27 16:45:01] (step=0009900) Train Loss: 0.0599, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.5448 +[2025-02-27 16:46:01] (step=0010000) Train Loss: 0.0601, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5534 +[2025-02-27 16:47:04] (step=0010100) Train Loss: 0.0598, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.5417 +[2025-02-27 16:48:03] (step=0010200) Train Loss: 0.0591, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5266 +[2025-02-27 16:49:03] (step=0010300) Train Loss: 0.0598, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5250 +[2025-02-27 16:50:03] (step=0010400) Train Loss: 0.0592, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5332 +[2025-02-27 16:51:03] (step=0010500) Train Loss: 0.0583, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5233 +[2025-02-27 16:52:02] (step=0010600) Train Loss: 0.0588, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5255 +[2025-02-27 16:53:02] (step=0010700) Train Loss: 0.0584, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5250 +[2025-02-27 16:54:02] (step=0010800) Train Loss: 0.0589, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5270 +[2025-02-27 16:55:02] (step=0010900) Train Loss: 0.0581, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5011 +[2025-02-27 16:56:01] (step=0011000) Train Loss: 0.0584, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5281 +[2025-02-27 16:57:01] (step=0011100) Train Loss: 0.0575, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5125 +[2025-02-27 16:58:01] (step=0011200) Train Loss: 0.0579, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5083 +[2025-02-27 16:59:00] (step=0011300) Train Loss: 0.0578, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5138 +[2025-02-27 17:00:00] (step=0011400) Train Loss: 0.0579, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5064 +[2025-02-27 17:01:00] (step=0011500) Train Loss: 0.0574, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5015 +[2025-02-27 17:02:00] (step=0011600) Train Loss: 0.0575, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5147 +[2025-02-27 17:02:59] (step=0011700) Train Loss: 0.0575, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4969 +[2025-02-27 17:03:59] (step=0011800) Train Loss: 0.0572, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4974 +[2025-02-27 17:04:59] (step=0011900) Train Loss: 0.0573, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5020 +[2025-02-27 17:05:58] (step=0012000) Train Loss: 0.0569, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5047 +[2025-02-27 17:06:58] (step=0012100) Train Loss: 0.0572, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4844 +[2025-02-27 17:07:58] (step=0012200) Train Loss: 0.0565, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.5080 +[2025-02-27 17:08:58] (step=0012300) Train Loss: 0.0565, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4737 +[2025-02-27 17:09:57] (step=0012400) Train Loss: 0.0567, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4902 +[2025-02-27 17:10:57] (step=0012500) Train Loss: 0.0562, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4951 +[2025-02-27 17:12:00] (step=0012600) Train Loss: 0.0560, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.4923 +[2025-02-27 17:12:59] (step=0012700) Train Loss: 0.0562, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4821 +[2025-02-27 17:13:59] (step=0012800) Train Loss: 0.0567, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4718 +[2025-02-27 17:14:59] (step=0012900) Train Loss: 0.0566, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4978 +[2025-02-27 17:15:59] (step=0013000) Train Loss: 0.0562, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4912 +[2025-02-27 17:16:58] (step=0013100) Train Loss: 0.0563, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4713 +[2025-02-27 17:17:58] (step=0013200) Train Loss: 0.0562, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4747 +[2025-02-27 17:18:58] (step=0013300) Train Loss: 0.0556, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4668 +[2025-02-27 17:19:57] (step=0013400) Train Loss: 0.0553, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4796 +[2025-02-27 17:20:57] (step=0013500) Train Loss: 0.0559, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4598 +[2025-02-27 17:21:57] (step=0013600) Train Loss: 0.0556, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4676 +[2025-02-27 17:22:57] (step=0013700) Train Loss: 0.0557, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4791 +[2025-02-27 17:23:56] (step=0013800) Train Loss: 0.0556, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4455 +[2025-02-27 17:24:56] (step=0013900) Train Loss: 0.0557, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4734 +[2025-02-27 17:25:56] (step=0014000) Train Loss: 0.0552, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4560 +[2025-02-27 17:26:56] (step=0014100) Train Loss: 0.0551, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4722 +[2025-02-27 17:27:55] (step=0014200) Train Loss: 0.0554, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4559 +[2025-02-27 17:28:55] (step=0014300) Train Loss: 0.0548, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4638 +[2025-02-27 17:29:55] (step=0014400) Train Loss: 0.0545, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4654 +[2025-02-27 17:30:55] (step=0014500) Train Loss: 0.0552, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4665 +[2025-02-27 17:31:54] (step=0014600) Train Loss: 0.0549, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4474 +[2025-02-27 17:32:54] (step=0014700) Train Loss: 0.0550, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4546 +[2025-02-27 17:33:54] (step=0014800) Train Loss: 0.0548, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4425 +[2025-02-27 17:34:53] (step=0014900) Train Loss: 0.0553, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4430 +[2025-02-27 17:35:53] (step=0015000) Train Loss: 0.0547, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4507 +[2025-02-27 17:36:56] (step=0015100) Train Loss: 0.0544, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.4437 +[2025-02-27 17:37:55] (step=0015200) Train Loss: 0.0550, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4509 +[2025-02-27 17:38:55] (step=0015300) Train Loss: 0.0542, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4393 +[2025-02-27 17:39:55] (step=0015400) Train Loss: 0.0543, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4451 +[2025-02-27 17:40:54] (step=0015500) Train Loss: 0.0546, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4302 +[2025-02-27 17:41:54] (step=0015600) Train Loss: 0.0546, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4301 +[2025-02-27 17:42:54] (step=0015700) Train Loss: 0.0544, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4534 +[2025-02-27 17:43:53] (step=0015800) Train Loss: 0.0543, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4190 +[2025-02-27 17:44:53] (step=0015900) Train Loss: 0.0541, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4296 +[2025-02-27 17:45:53] (step=0016000) Train Loss: 0.0540, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4292 +[2025-02-27 17:46:53] (step=0016100) Train Loss: 0.0539, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4290 +[2025-02-27 17:47:52] (step=0016200) Train Loss: 0.0542, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4255 +[2025-02-27 17:48:52] (step=0016300) Train Loss: 0.0540, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4458 +[2025-02-27 17:49:52] (step=0016400) Train Loss: 0.0542, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4257 +[2025-02-27 17:50:51] (step=0016500) Train Loss: 0.0544, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4410 +[2025-02-27 17:51:51] (step=0016600) Train Loss: 0.0535, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4333 +[2025-02-27 17:52:51] (step=0016700) Train Loss: 0.0540, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4396 +[2025-02-27 17:53:50] (step=0016800) Train Loss: 0.0538, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4185 +[2025-02-27 17:54:50] (step=0016900) Train Loss: 0.0543, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4249 +[2025-02-27 17:55:50] (step=0017000) Train Loss: 0.0539, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4267 +[2025-02-27 17:56:49] (step=0017100) Train Loss: 0.0536, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3991 +[2025-02-27 17:57:49] (step=0017200) Train Loss: 0.0537, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4064 +[2025-02-27 17:58:49] (step=0017300) Train Loss: 0.0534, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4264 +[2025-02-27 17:59:49] (step=0017400) Train Loss: 0.0537, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3984 +[2025-02-27 18:00:48] (step=0017500) Train Loss: 0.0535, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.4081 +[2025-02-27 18:01:51] (step=0017600) Train Loss: 0.0535, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.4169 +[2025-02-27 18:02:50] (step=0017700) Train Loss: 0.0533, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4166 +[2025-02-27 18:03:50] (step=0017800) Train Loss: 0.0534, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4080 +[2025-02-27 18:04:50] (step=0017900) Train Loss: 0.0535, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4145 +[2025-02-27 18:05:49] (step=0018000) Train Loss: 0.0533, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4050 +[2025-02-27 18:06:49] (step=0018100) Train Loss: 0.0532, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3937 +[2025-02-27 18:07:49] (step=0018200) Train Loss: 0.0538, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4099 +[2025-02-27 18:08:49] (step=0018300) Train Loss: 0.0533, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4108 +[2025-02-27 18:09:48] (step=0018400) Train Loss: 0.0530, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4008 +[2025-02-27 18:10:48] (step=0018500) Train Loss: 0.0529, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4166 +[2025-02-27 18:11:48] (step=0018600) Train Loss: 0.0528, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3858 +[2025-02-27 18:12:47] (step=0018700) Train Loss: 0.0532, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4141 +[2025-02-27 18:13:47] (step=0018800) Train Loss: 0.0532, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3992 +[2025-02-27 18:14:47] (step=0018900) Train Loss: 0.0531, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3956 +[2025-02-27 18:15:46] (step=0019000) Train Loss: 0.0526, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3953 +[2025-02-27 18:16:46] (step=0019100) Train Loss: 0.0529, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4049 +[2025-02-27 18:17:46] (step=0019200) Train Loss: 0.0527, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4026 +[2025-02-27 18:18:45] (step=0019300) Train Loss: 0.0523, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4082 +[2025-02-27 18:19:45] (step=0019400) Train Loss: 0.0526, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4066 +[2025-02-27 18:20:45] (step=0019500) Train Loss: 0.0528, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3883 +[2025-02-27 18:21:45] (step=0019600) Train Loss: 0.0524, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3890 +[2025-02-27 18:22:44] (step=0019700) Train Loss: 0.0527, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3905 +[2025-02-27 18:23:44] (step=0019800) Train Loss: 0.0528, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3809 +[2025-02-27 18:24:44] (step=0019900) Train Loss: 0.0523, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.4005 +[2025-02-27 18:25:43] (step=0020000) Train Loss: 0.0526, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3898 +[2025-02-27 18:26:46] (step=0020100) Train Loss: 0.0526, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.4048 +[2025-02-27 18:27:46] (step=0020200) Train Loss: 0.0527, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3891 +[2025-02-27 18:28:45] (step=0020300) Train Loss: 0.0523, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3834 +[2025-02-27 18:29:45] (step=0020400) Train Loss: 0.0521, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3910 +[2025-02-27 18:30:45] (step=0020500) Train Loss: 0.0521, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3790 +[2025-02-27 18:31:45] (step=0020600) Train Loss: 0.0525, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3843 +[2025-02-27 18:32:44] (step=0020700) Train Loss: 0.0520, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3896 +[2025-02-27 18:33:44] (step=0020800) Train Loss: 0.0520, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3772 +[2025-02-27 18:34:44] (step=0020900) Train Loss: 0.0522, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3764 +[2025-02-27 18:35:43] (step=0021000) Train Loss: 0.0524, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3787 +[2025-02-27 18:36:43] (step=0021100) Train Loss: 0.0523, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3714 +[2025-02-27 18:37:43] (step=0021200) Train Loss: 0.0518, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3838 +[2025-02-27 18:38:42] (step=0021300) Train Loss: 0.0518, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3644 +[2025-02-27 18:39:42] (step=0021400) Train Loss: 0.0522, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3757 +[2025-02-27 18:40:42] (step=0021500) Train Loss: 0.0527, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3778 +[2025-02-27 18:41:42] (step=0021600) Train Loss: 0.0519, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3980 +[2025-02-27 18:42:41] (step=0021700) Train Loss: 0.0524, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3843 +[2025-02-27 18:43:41] (step=0021800) Train Loss: 0.0523, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3759 +[2025-02-27 18:44:41] (step=0021900) Train Loss: 0.0517, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3807 +[2025-02-27 18:45:40] (step=0022000) Train Loss: 0.0518, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3593 +[2025-02-27 18:46:40] (step=0022100) Train Loss: 0.0521, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3770 +[2025-02-27 18:47:40] (step=0022200) Train Loss: 0.0518, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3699 +[2025-02-27 18:48:39] (step=0022300) Train Loss: 0.0518, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3617 +[2025-02-27 18:49:39] (step=0022400) Train Loss: 0.0521, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3631 +[2025-02-27 18:50:39] (step=0022500) Train Loss: 0.0517, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3565 +[2025-02-27 18:51:41] (step=0022600) Train Loss: 0.0517, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.3599 +[2025-02-27 18:52:41] (step=0022700) Train Loss: 0.0523, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3608 +[2025-02-27 18:53:41] (step=0022800) Train Loss: 0.0520, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3700 +[2025-02-27 18:54:40] (step=0022900) Train Loss: 0.0514, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3604 +[2025-02-27 18:55:40] (step=0023000) Train Loss: 0.0519, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3704 +[2025-02-27 18:56:40] (step=0023100) Train Loss: 0.0518, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3606 +[2025-02-27 18:57:39] (step=0023200) Train Loss: 0.0517, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3721 +[2025-02-27 18:58:39] (step=0023300) Train Loss: 0.0518, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3553 +[2025-02-27 18:59:39] (step=0023400) Train Loss: 0.0516, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3663 +[2025-02-27 19:00:38] (step=0023500) Train Loss: 0.0513, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3638 +[2025-02-27 19:01:38] (step=0023600) Train Loss: 0.0517, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3533 +[2025-02-27 19:02:38] (step=0023700) Train Loss: 0.0515, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3559 +[2025-02-27 19:03:38] (step=0023800) Train Loss: 0.0514, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3585 +[2025-02-27 19:04:37] (step=0023900) Train Loss: 0.0513, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3451 +[2025-02-27 19:05:37] (step=0024000) Train Loss: 0.0514, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3570 +[2025-02-27 19:06:37] (step=0024100) Train Loss: 0.0516, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3574 +[2025-02-27 19:07:36] (step=0024200) Train Loss: 0.0511, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3584 +[2025-02-27 19:08:36] (step=0024300) Train Loss: 0.0516, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3468 +[2025-02-27 19:09:36] (step=0024400) Train Loss: 0.0511, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3577 +[2025-02-27 19:10:35] (step=0024500) Train Loss: 0.0517, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3459 +[2025-02-27 19:11:35] (step=0024600) Train Loss: 0.0514, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3526 +[2025-02-27 19:12:35] (step=0024700) Train Loss: 0.0515, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3457 +[2025-02-27 19:13:34] (step=0024800) Train Loss: 0.0516, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3582 +[2025-02-27 19:14:34] (step=0024900) Train Loss: 0.0513, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3471 +[2025-02-27 19:15:34] (step=0025000) Train Loss: 0.0513, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3366 +[2025-02-27 19:16:36] (step=0025100) Train Loss: 0.0513, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.3548 +[2025-02-27 19:17:36] (step=0025200) Train Loss: 0.0513, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3581 +[2025-02-27 19:18:36] (step=0025300) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3331 +[2025-02-27 19:19:36] (step=0025400) Train Loss: 0.0513, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3545 +[2025-02-27 19:20:35] (step=0025500) Train Loss: 0.0517, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3463 +[2025-02-27 19:21:35] (step=0025600) Train Loss: 0.0513, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3475 +[2025-02-27 19:22:35] (step=0025700) Train Loss: 0.0510, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3551 +[2025-02-27 19:23:34] (step=0025800) Train Loss: 0.0509, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3558 +[2025-02-27 19:24:34] (step=0025900) Train Loss: 0.0509, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3432 +[2025-02-27 19:25:34] (step=0026000) Train Loss: 0.0511, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3527 +[2025-02-27 19:26:34] (step=0026100) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3597 +[2025-02-27 19:27:33] (step=0026200) Train Loss: 0.0509, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3421 +[2025-02-27 19:28:33] (step=0026300) Train Loss: 0.0515, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3353 +[2025-02-27 19:29:33] (step=0026400) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3383 +[2025-02-27 19:30:33] (step=0026500) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3299 +[2025-02-27 19:31:33] (step=0026600) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3315 +[2025-02-27 19:32:32] (step=0026700) Train Loss: 0.0511, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3323 +[2025-02-27 19:33:32] (step=0026800) Train Loss: 0.0510, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3439 +[2025-02-27 19:34:32] (step=0026900) Train Loss: 0.0507, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3488 +[2025-02-27 19:35:32] (step=0027000) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3375 +[2025-02-27 19:36:31] (step=0027100) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3331 +[2025-02-27 19:37:31] (step=0027200) Train Loss: 0.0508, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3322 +[2025-02-27 19:38:31] (step=0027300) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3460 +[2025-02-27 19:39:31] (step=0027400) Train Loss: 0.0509, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3225 +[2025-02-27 19:40:31] (step=0027500) Train Loss: 0.0508, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3429 +[2025-02-27 19:41:33] (step=0027600) Train Loss: 0.0508, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.3313 +[2025-02-27 19:42:33] (step=0027700) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3190 +[2025-02-27 19:43:33] (step=0027800) Train Loss: 0.0507, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3313 +[2025-02-27 19:44:32] (step=0027900) Train Loss: 0.0508, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3340 +[2025-02-27 19:45:32] (step=0028000) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3339 +[2025-02-27 19:46:32] (step=0028100) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3261 +[2025-02-27 19:47:31] (step=0028200) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3238 +[2025-02-27 19:48:31] (step=0028300) Train Loss: 0.0510, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3374 +[2025-02-27 19:49:31] (step=0028400) Train Loss: 0.0508, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3306 +[2025-02-27 19:50:31] (step=0028500) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3215 +[2025-02-27 19:51:30] (step=0028600) Train Loss: 0.0502, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3192 +[2025-02-27 19:52:30] (step=0028700) Train Loss: 0.0507, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3185 +[2025-02-27 19:53:30] (step=0028800) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3178 +[2025-02-27 19:54:29] (step=0028900) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3243 +[2025-02-27 19:55:29] (step=0029000) Train Loss: 0.0507, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3185 +[2025-02-27 19:56:29] (step=0029100) Train Loss: 0.0503, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3162 +[2025-02-27 19:57:28] (step=0029200) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3313 +[2025-02-27 19:58:28] (step=0029300) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3305 +[2025-02-27 19:59:28] (step=0029400) Train Loss: 0.0500, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3346 +[2025-02-27 20:00:27] (step=0029500) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3061 +[2025-02-27 20:01:27] (step=0029600) Train Loss: 0.0503, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3170 +[2025-02-27 20:02:27] (step=0029700) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3177 +[2025-02-27 20:03:27] (step=0029800) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3435 +[2025-02-27 20:04:26] (step=0029900) Train Loss: 0.0505, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3096 +[2025-02-27 20:05:26] (step=0030000) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3309 +[2025-02-27 20:06:28] (step=0030100) Train Loss: 0.0506, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.3322 +[2025-02-27 20:07:28] (step=0030200) Train Loss: 0.0503, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3213 +[2025-02-27 20:08:28] (step=0030300) Train Loss: 0.0500, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3120 +[2025-02-27 20:09:28] (step=0030400) Train Loss: 0.0505, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3098 +[2025-02-27 20:10:27] (step=0030500) Train Loss: 0.0505, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3221 +[2025-02-27 20:11:27] (step=0030600) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3253 +[2025-02-27 20:12:27] (step=0030700) Train Loss: 0.0505, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3216 +[2025-02-27 20:13:27] (step=0030800) Train Loss: 0.0503, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3003 +[2025-02-27 20:14:26] (step=0030900) Train Loss: 0.0503, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3221 +[2025-02-27 20:15:26] (step=0031000) Train Loss: 0.0499, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3147 +[2025-02-27 20:16:26] (step=0031100) Train Loss: 0.0500, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3230 +[2025-02-27 20:17:26] (step=0031200) Train Loss: 0.0502, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3184 +[2025-02-27 20:18:25] (step=0031300) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3130 +[2025-02-27 20:19:25] (step=0031400) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3081 +[2025-02-27 20:20:25] (step=0031500) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3143 +[2025-02-27 20:21:25] (step=0031600) Train Loss: 0.0500, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3065 +[2025-02-27 20:22:24] (step=0031700) Train Loss: 0.0498, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3071 +[2025-02-27 20:23:24] (step=0031800) Train Loss: 0.0499, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3225 +[2025-02-27 20:24:24] (step=0031900) Train Loss: 0.0498, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2981 +[2025-02-27 20:25:23] (step=0032000) Train Loss: 0.0502, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3031 +[2025-02-27 20:26:23] (step=0032100) Train Loss: 0.0502, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3084 +[2025-02-27 20:27:23] (step=0032200) Train Loss: 0.0499, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2969 +[2025-02-27 20:28:23] (step=0032300) Train Loss: 0.0499, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3132 +[2025-02-27 20:29:22] (step=0032400) Train Loss: 0.0498, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3102 +[2025-02-27 20:30:22] (step=0032500) Train Loss: 0.0498, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3081 +[2025-02-27 20:31:25] (step=0032600) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.2910 +[2025-02-27 20:32:24] (step=0032700) Train Loss: 0.0503, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3019 +[2025-02-27 20:33:24] (step=0032800) Train Loss: 0.0502, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2969 +[2025-02-27 20:34:24] (step=0032900) Train Loss: 0.0502, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3125 +[2025-02-27 20:35:24] (step=0033000) Train Loss: 0.0500, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2982 +[2025-02-27 20:36:23] (step=0033100) Train Loss: 0.0504, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.3040 +[2025-02-27 20:37:23] (step=0033200) Train Loss: 0.0497, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2994 +[2025-02-27 20:38:23] (step=0033300) Train Loss: 0.0500, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2948 +[2025-02-27 20:39:22] (step=0033400) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2994 +[2025-02-27 20:40:22] (step=0033500) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2992 +[2025-02-27 20:41:22] (step=0033600) Train Loss: 0.0501, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2983 +[2025-02-27 20:42:21] (step=0033700) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2981 +[2025-02-27 20:43:21] (step=0033800) Train Loss: 0.0499, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2872 +[2025-02-27 20:44:21] (step=0033900) Train Loss: 0.0501, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2988 +[2025-02-27 20:45:21] (step=0034000) Train Loss: 0.0498, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2985 +[2025-02-27 20:46:20] (step=0034100) Train Loss: 0.0500, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3004 +[2025-02-27 20:47:20] (step=0034200) Train Loss: 0.0499, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3051 +[2025-02-27 20:48:20] (step=0034300) Train Loss: 0.0494, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2846 +[2025-02-27 20:49:19] (step=0034400) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3214 +[2025-02-27 20:50:19] (step=0034500) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2881 +[2025-02-27 20:51:19] (step=0034600) Train Loss: 0.0501, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2999 +[2025-02-27 20:52:19] (step=0034700) Train Loss: 0.0492, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2872 +[2025-02-27 20:53:18] (step=0034800) Train Loss: 0.0498, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2969 +[2025-02-27 20:54:18] (step=0034900) Train Loss: 0.0495, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3083 +[2025-02-27 20:55:18] (step=0035000) Train Loss: 0.0497, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2888 +[2025-02-27 20:56:20] (step=0035100) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.2883 +[2025-02-27 20:57:20] (step=0035200) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2893 +[2025-02-27 20:58:20] (step=0035300) Train Loss: 0.0502, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3141 +[2025-02-27 20:59:20] (step=0035400) Train Loss: 0.0498, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2626 +[2025-02-27 21:00:19] (step=0035500) Train Loss: 0.0497, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2966 +[2025-02-27 21:01:19] (step=0035600) Train Loss: 0.0500, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2848 +[2025-02-27 21:02:19] (step=0035700) Train Loss: 0.0499, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2915 +[2025-02-27 21:03:19] (step=0035800) Train Loss: 0.0495, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2846 +[2025-02-27 21:04:18] (step=0035900) Train Loss: 0.0495, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.3000 +[2025-02-27 21:05:18] (step=0036000) Train Loss: 0.0497, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2889 +[2025-02-27 21:06:18] (step=0036100) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2798 +[2025-02-27 21:07:18] (step=0036200) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2866 +[2025-02-27 21:08:17] (step=0036300) Train Loss: 0.0494, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2845 +[2025-02-27 21:09:17] (step=0036400) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2904 +[2025-02-27 21:10:17] (step=0036500) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2981 +[2025-02-27 21:11:17] (step=0036600) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2832 +[2025-02-27 21:12:17] (step=0036700) Train Loss: 0.0494, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2883 +[2025-02-27 21:13:16] (step=0036800) Train Loss: 0.0495, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2906 +[2025-02-27 21:14:16] (step=0036900) Train Loss: 0.0497, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2904 +[2025-02-27 21:15:16] (step=0037000) Train Loss: 0.0494, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2865 +[2025-02-27 21:16:16] (step=0037100) Train Loss: 0.0499, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2937 +[2025-02-27 21:17:15] (step=0037200) Train Loss: 0.0497, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2938 +[2025-02-27 21:18:15] (step=0037300) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2858 +[2025-02-27 21:19:15] (step=0037400) Train Loss: 0.0492, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2734 +[2025-02-27 21:20:15] (step=0037500) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2881 +[2025-02-27 21:21:17] (step=0037600) Train Loss: 0.0492, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.2889 +[2025-02-27 21:22:17] (step=0037700) Train Loss: 0.0492, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2672 +[2025-02-27 21:23:17] (step=0037800) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2836 +[2025-02-27 21:24:17] (step=0037900) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2730 +[2025-02-27 21:25:16] (step=0038000) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2914 +[2025-02-27 21:26:16] (step=0038100) Train Loss: 0.0495, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2930 +[2025-02-27 21:27:16] (step=0038200) Train Loss: 0.0494, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2830 +[2025-02-27 21:28:16] (step=0038300) Train Loss: 0.0495, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2656 +[2025-02-27 21:29:15] (step=0038400) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2793 +[2025-02-27 21:30:15] (step=0038500) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2708 +[2025-02-27 21:31:15] (step=0038600) Train Loss: 0.0495, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2797 +[2025-02-27 21:32:14] (step=0038700) Train Loss: 0.0495, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2696 +[2025-02-27 21:33:14] (step=0038800) Train Loss: 0.0497, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2735 +[2025-02-27 21:34:14] (step=0038900) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2740 +[2025-02-27 21:35:14] (step=0039000) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2813 +[2025-02-27 21:36:13] (step=0039100) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2700 +[2025-02-27 21:37:13] (step=0039200) Train Loss: 0.0491, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2799 +[2025-02-27 21:38:13] (step=0039300) Train Loss: 0.0492, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2756 +[2025-02-27 21:39:13] (step=0039400) Train Loss: 0.0494, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2813 +[2025-02-27 21:40:12] (step=0039500) Train Loss: 0.0491, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2713 +[2025-02-27 21:41:12] (step=0039600) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2725 +[2025-02-27 21:42:12] (step=0039700) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2822 +[2025-02-27 21:43:11] (step=0039800) Train Loss: 0.0492, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2674 +[2025-02-27 21:44:11] (step=0039900) Train Loss: 0.0492, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2909 +[2025-02-27 21:45:11] (step=0040000) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2701 +[2025-02-27 21:46:13] (step=0040100) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.2743 +[2025-02-27 21:47:13] (step=0040200) Train Loss: 0.0491, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2757 +[2025-02-27 21:48:13] (step=0040300) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2700 +[2025-02-27 21:49:13] (step=0040400) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2791 +[2025-02-27 21:50:13] (step=0040500) Train Loss: 0.0492, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2649 +[2025-02-27 21:51:13] (step=0040600) Train Loss: 0.0491, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2650 +[2025-02-27 21:52:12] (step=0040700) Train Loss: 0.0491, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2808 +[2025-02-27 21:53:12] (step=0040800) Train Loss: 0.0494, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2633 +[2025-02-27 21:54:12] (step=0040900) Train Loss: 0.0494, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2554 +[2025-02-27 21:55:12] (step=0041000) Train Loss: 0.0491, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2654 +[2025-02-27 21:56:11] (step=0041100) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2753 +[2025-02-27 21:57:11] (step=0041200) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2615 +[2025-02-27 21:58:11] (step=0041300) Train Loss: 0.0496, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2732 +[2025-02-27 21:59:11] (step=0041400) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2709 +[2025-02-27 22:00:11] (step=0041500) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2710 +[2025-02-27 22:01:10] (step=0041600) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2629 +[2025-02-27 22:02:10] (step=0041700) Train Loss: 0.0491, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2613 +[2025-02-27 22:03:10] (step=0041800) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2722 +[2025-02-27 22:04:09] (step=0041900) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2604 +[2025-02-27 22:05:09] (step=0042000) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2565 +[2025-02-27 22:06:09] (step=0042100) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2612 +[2025-02-27 22:07:09] (step=0042200) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2636 +[2025-02-27 22:08:08] (step=0042300) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2538 +[2025-02-27 22:09:08] (step=0042400) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2620 +[2025-02-27 22:10:08] (step=0042500) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2568 +[2025-02-27 22:11:10] (step=0042600) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.2640 +[2025-02-27 22:12:10] (step=0042700) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2601 +[2025-02-27 22:13:10] (step=0042800) Train Loss: 0.0491, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2663 +[2025-02-27 22:14:09] (step=0042900) Train Loss: 0.0493, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2543 +[2025-02-27 22:15:09] (step=0043000) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2625 +[2025-02-27 22:16:09] (step=0043100) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2689 +[2025-02-27 22:17:09] (step=0043200) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2587 +[2025-02-27 22:18:08] (step=0043300) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2601 +[2025-02-27 22:19:08] (step=0043400) Train Loss: 0.0486, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2657 +[2025-02-27 22:20:08] (step=0043500) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2528 +[2025-02-27 22:21:07] (step=0043600) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2481 +[2025-02-27 22:22:07] (step=0043700) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2640 +[2025-02-27 22:23:07] (step=0043800) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2720 +[2025-02-27 22:24:06] (step=0043900) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2708 +[2025-02-27 22:25:06] (step=0044000) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2550 +[2025-02-27 22:26:06] (step=0044100) Train Loss: 0.0486, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2607 +[2025-02-27 22:27:06] (step=0044200) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2561 +[2025-02-27 22:28:05] (step=0044300) Train Loss: 0.0486, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2591 +[2025-02-27 22:29:05] (step=0044400) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2548 +[2025-02-27 22:30:05] (step=0044500) Train Loss: 0.0491, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2579 +[2025-02-27 22:31:04] (step=0044600) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2535 +[2025-02-27 22:32:04] (step=0044700) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2433 +[2025-02-27 22:33:04] (step=0044800) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2545 +[2025-02-27 22:34:03] (step=0044900) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2539 +[2025-02-27 22:35:03] (step=0045000) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2560 +[2025-02-27 22:36:06] (step=0045100) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.61, Grad Norm: 0.2665 +[2025-02-27 22:37:05] (step=0045200) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2499 +[2025-02-27 22:38:05] (step=0045300) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2574 +[2025-02-27 22:39:05] (step=0045400) Train Loss: 0.0490, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2505 +[2025-02-27 22:40:04] (step=0045500) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2609 +[2025-02-27 22:41:04] (step=0045600) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2463 +[2025-02-27 22:42:04] (step=0045700) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2575 +[2025-02-27 22:43:03] (step=0045800) Train Loss: 0.0486, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2397 +[2025-02-27 22:44:03] (step=0045900) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2555 +[2025-02-27 22:45:03] (step=0046000) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2522 +[2025-02-27 22:46:03] (step=0046100) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2460 +[2025-02-27 22:47:02] (step=0046200) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2604 +[2025-02-27 22:48:02] (step=0046300) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2489 +[2025-02-27 22:49:02] (step=0046400) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2488 +[2025-02-27 22:50:01] (step=0046500) Train Loss: 0.0489, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2514 +[2025-02-27 22:51:01] (step=0046600) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2465 +[2025-02-27 22:52:01] (step=0046700) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2541 +[2025-02-27 22:53:01] (step=0046800) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2534 +[2025-02-27 22:54:00] (step=0046900) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2369 +[2025-02-27 22:55:00] (step=0047000) Train Loss: 0.0486, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2535 +[2025-02-27 22:56:00] (step=0047100) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2296 +[2025-02-27 22:56:59] (step=0047200) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2486 +[2025-02-27 22:57:59] (step=0047300) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2476 +[2025-02-27 22:58:59] (step=0047400) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2468 +[2025-02-27 22:59:59] (step=0047500) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2572 +[2025-02-27 23:01:01] (step=0047600) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.2475 +[2025-02-27 23:02:01] (step=0047700) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2493 +[2025-02-27 23:03:01] (step=0047800) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2456 +[2025-02-27 23:04:00] (step=0047900) Train Loss: 0.0488, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2440 +[2025-02-27 23:05:00] (step=0048000) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2398 +[2025-02-27 23:06:00] (step=0048100) Train Loss: 0.0486, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2415 +[2025-02-27 23:06:59] (step=0048200) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2444 +[2025-02-27 23:07:59] (step=0048300) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2571 +[2025-02-27 23:08:59] (step=0048400) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2453 +[2025-02-27 23:09:58] (step=0048500) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2498 +[2025-02-27 23:10:58] (step=0048600) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2348 +[2025-02-27 23:11:58] (step=0048700) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2493 +[2025-02-27 23:12:57] (step=0048800) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2303 +[2025-02-27 23:13:57] (step=0048900) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2577 +[2025-02-27 23:14:57] (step=0049000) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2401 +[2025-02-27 23:15:56] (step=0049100) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2565 +[2025-02-27 23:16:56] (step=0049200) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2436 +[2025-02-27 23:17:56] (step=0049300) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2377 +[2025-02-27 23:18:55] (step=0049400) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2451 +[2025-02-27 23:19:55] (step=0049500) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2344 +[2025-02-27 23:20:55] (step=0049600) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2457 +[2025-02-27 23:21:55] (step=0049700) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2371 +[2025-02-27 23:22:54] (step=0049800) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2510 +[2025-02-27 23:23:54] (step=0049900) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2525 +[2025-02-27 23:24:54] (step=0050000) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2410 +[2025-02-27 23:24:57] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0050000.pt +[2025-02-27 23:31:18] (step=0050000), Fid=8.871754730314251, PSNR=26.106669029331208, LPIPS=0.24334770441055298, SSIM=0.7058218717575073 +[2025-02-27 23:32:20] (step=0050100) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.22, Grad Norm: 0.2418 +[2025-02-27 23:33:20] (step=0050200) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2424 +[2025-02-27 23:34:20] (step=0050300) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2343 +[2025-02-27 23:35:20] (step=0050400) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2337 +[2025-02-27 23:36:19] (step=0050500) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2336 +[2025-02-27 23:37:19] (step=0050600) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2362 +[2025-02-27 23:38:19] (step=0050700) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2339 +[2025-02-27 23:39:18] (step=0050800) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2434 +[2025-02-27 23:40:18] (step=0050900) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2446 +[2025-02-27 23:41:18] (step=0051000) Train Loss: 0.0486, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2271 +[2025-02-27 23:42:17] (step=0051100) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2358 +[2025-02-27 23:43:17] (step=0051200) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2281 +[2025-02-27 23:44:17] (step=0051300) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2332 +[2025-02-27 23:45:16] (step=0051400) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2357 +[2025-02-27 23:46:16] (step=0051500) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2406 +[2025-02-27 23:47:16] (step=0051600) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2266 +[2025-02-27 23:48:16] (step=0051700) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2323 +[2025-02-27 23:49:15] (step=0051800) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2343 +[2025-02-27 23:50:15] (step=0051900) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2487 +[2025-02-27 23:51:15] (step=0052000) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2302 +[2025-02-27 23:52:14] (step=0052100) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2319 +[2025-02-27 23:53:14] (step=0052200) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2378 +[2025-02-27 23:54:14] (step=0052300) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2284 +[2025-02-27 23:55:13] (step=0052400) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2356 +[2025-02-27 23:56:13] (step=0052500) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2308 +[2025-02-27 23:57:16] (step=0052600) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.2395 +[2025-02-27 23:58:16] (step=0052700) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2264 +[2025-02-27 23:59:16] (step=0052800) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2356 +[2025-02-28 00:00:15] (step=0052900) Train Loss: 0.0487, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2357 +[2025-02-28 00:01:15] (step=0053000) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2223 +[2025-02-28 00:02:15] (step=0053100) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2309 +[2025-02-28 00:03:14] (step=0053200) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2264 +[2025-02-28 00:04:14] (step=0053300) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2332 +[2025-02-28 00:05:14] (step=0053400) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2355 +[2025-02-28 00:06:13] (step=0053500) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2296 +[2025-02-28 00:07:13] (step=0053600) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2279 +[2025-02-28 00:08:13] (step=0053700) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2263 +[2025-02-28 00:09:13] (step=0053800) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2254 +[2025-02-28 00:10:12] (step=0053900) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2370 +[2025-02-28 00:11:12] (step=0054000) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2267 +[2025-02-28 00:12:12] (step=0054100) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2283 +[2025-02-28 00:13:11] (step=0054200) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2267 +[2025-02-28 00:14:11] (step=0054300) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2246 +[2025-02-28 00:15:11] (step=0054400) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2304 +[2025-02-28 00:16:10] (step=0054500) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2272 +[2025-02-28 00:17:10] (step=0054600) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2372 +[2025-02-28 00:18:10] (step=0054700) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2136 +[2025-02-28 00:19:10] (step=0054800) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2287 +[2025-02-28 00:20:09] (step=0054900) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2280 +[2025-02-28 00:21:09] (step=0055000) Train Loss: 0.0485, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2287 +[2025-02-28 00:22:12] (step=0055100) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.2367 +[2025-02-28 00:23:11] (step=0055200) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2257 +[2025-02-28 00:24:11] (step=0055300) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2314 +[2025-02-28 00:25:11] (step=0055400) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2303 +[2025-02-28 00:26:10] (step=0055500) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2191 +[2025-02-28 00:27:10] (step=0055600) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2213 +[2025-02-28 00:28:10] (step=0055700) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2226 +[2025-02-28 00:29:09] (step=0055800) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2335 +[2025-02-28 00:30:09] (step=0055900) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2302 +[2025-02-28 00:31:09] (step=0056000) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2270 +[2025-02-28 00:32:08] (step=0056100) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2160 +[2025-02-28 00:33:08] (step=0056200) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2213 +[2025-02-28 00:34:08] (step=0056300) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2156 +[2025-02-28 00:35:07] (step=0056400) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2199 +[2025-02-28 00:36:07] (step=0056500) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2147 +[2025-02-28 00:37:07] (step=0056600) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2292 +[2025-02-28 00:38:06] (step=0056700) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2231 +[2025-02-28 00:39:06] (step=0056800) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2236 +[2025-02-28 00:40:06] (step=0056900) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2106 +[2025-02-28 00:41:05] (step=0057000) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2176 +[2025-02-28 00:42:05] (step=0057100) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2142 +[2025-02-28 00:43:05] (step=0057200) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2223 +[2025-02-28 00:44:04] (step=0057300) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2208 +[2025-02-28 00:45:04] (step=0057400) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2211 +[2025-02-28 00:46:04] (step=0057500) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2302 +[2025-02-28 00:47:07] (step=0057600) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.2325 +[2025-02-28 00:48:06] (step=0057700) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2192 +[2025-02-28 00:49:06] (step=0057800) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2335 +[2025-02-28 00:50:06] (step=0057900) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2156 +[2025-02-28 00:51:06] (step=0058000) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2215 +[2025-02-28 00:52:06] (step=0058100) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2135 +[2025-02-28 00:53:05] (step=0058200) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2257 +[2025-02-28 00:54:05] (step=0058300) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2074 +[2025-02-28 00:55:05] (step=0058400) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.2198 +[2025-02-28 00:56:05] (step=0058500) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.2128 +[2025-02-28 00:57:05] (step=0058600) Train Loss: 0.0482, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2290 +[2025-02-28 00:58:05] (step=0058700) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2239 +[2025-02-28 00:59:04] (step=0058800) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2208 +[2025-02-28 01:00:04] (step=0058900) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2139 +[2025-02-28 01:01:04] (step=0059000) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2182 +[2025-02-28 01:02:04] (step=0059100) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2215 +[2025-02-28 01:03:03] (step=0059200) Train Loss: 0.0484, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2191 +[2025-02-28 01:04:03] (step=0059300) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2161 +[2025-02-28 01:05:03] (step=0059400) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2234 +[2025-02-28 01:06:03] (step=0059500) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2085 +[2025-02-28 01:07:02] (step=0059600) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2180 +[2025-02-28 01:08:02] (step=0059700) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2046 +[2025-02-28 01:09:01] (step=0059800) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2150 +[2025-02-28 01:10:01] (step=0059900) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2150 +[2025-02-28 01:11:01] (step=0060000) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2078 +[2025-02-28 01:12:04] (step=0060100) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.58, Grad Norm: 0.2184 +[2025-02-28 01:13:04] (step=0060200) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2130 +[2025-02-28 01:14:04] (step=0060300) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2121 +[2025-02-28 01:15:03] (step=0060400) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2130 +[2025-02-28 01:16:03] (step=0060500) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2110 +[2025-02-28 01:17:03] (step=0060600) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2081 +[2025-02-28 01:18:02] (step=0060700) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2172 +[2025-02-28 01:19:02] (step=0060800) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2206 +[2025-02-28 01:20:02] (step=0060900) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2003 +[2025-02-28 01:21:01] (step=0061000) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2047 +[2025-02-28 01:22:01] (step=0061100) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2056 +[2025-02-28 01:23:01] (step=0061200) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2118 +[2025-02-28 01:24:00] (step=0061300) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2108 +[2025-02-28 01:25:00] (step=0061400) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2193 +[2025-02-28 01:25:59] (step=0061500) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2089 +[2025-02-28 01:26:59] (step=0061600) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2161 +[2025-02-28 01:27:59] (step=0061700) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2127 +[2025-02-28 01:28:58] (step=0061800) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2168 +[2025-02-28 01:29:58] (step=0061900) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2072 +[2025-02-28 01:30:58] (step=0062000) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2057 +[2025-02-28 01:31:57] (step=0062100) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2079 +[2025-02-28 01:32:57] (step=0062200) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2146 +[2025-02-28 01:33:57] (step=0062300) Train Loss: 0.0481, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2064 +[2025-02-28 01:34:56] (step=0062400) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2138 +[2025-02-28 01:35:56] (step=0062500) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2141 +[2025-02-28 01:36:59] (step=0062600) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.2141 +[2025-02-28 01:37:58] (step=0062700) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2084 +[2025-02-28 01:38:58] (step=0062800) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2021 +[2025-02-28 01:39:58] (step=0062900) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2163 +[2025-02-28 01:40:57] (step=0063000) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2041 +[2025-02-28 01:41:57] (step=0063100) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2177 +[2025-02-28 01:42:57] (step=0063200) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2116 +[2025-02-28 01:43:56] (step=0063300) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2071 +[2025-02-28 01:44:56] (step=0063400) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2080 +[2025-02-28 01:45:56] (step=0063500) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2101 +[2025-02-28 01:46:55] (step=0063600) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2141 +[2025-02-28 01:47:55] (step=0063700) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2093 +[2025-02-28 01:48:55] (step=0063800) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2135 +[2025-02-28 01:49:54] (step=0063900) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2167 +[2025-02-28 01:50:54] (step=0064000) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2044 +[2025-02-28 01:51:54] (step=0064100) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2041 +[2025-02-28 01:52:53] (step=0064200) Train Loss: 0.0483, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2005 +[2025-02-28 01:53:53] (step=0064300) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2125 +[2025-02-28 01:54:53] (step=0064400) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2013 +[2025-02-28 01:55:52] (step=0064500) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2088 +[2025-02-28 01:56:52] (step=0064600) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2045 +[2025-02-28 01:57:52] (step=0064700) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1990 +[2025-02-28 01:58:51] (step=0064800) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2103 +[2025-02-28 01:59:51] (step=0064900) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2104 +[2025-02-28 02:00:51] (step=0065000) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1988 +[2025-02-28 02:01:54] (step=0065100) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.2102 +[2025-02-28 02:02:53] (step=0065200) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2021 +[2025-02-28 02:03:53] (step=0065300) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1969 +[2025-02-28 02:04:53] (step=0065400) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2082 +[2025-02-28 02:05:52] (step=0065500) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1981 +[2025-02-28 02:06:52] (step=0065600) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2105 +[2025-02-28 02:07:52] (step=0065700) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2032 +[2025-02-28 02:08:51] (step=0065800) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2086 +[2025-02-28 02:09:51] (step=0065900) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1998 +[2025-02-28 02:10:51] (step=0066000) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2047 +[2025-02-28 02:11:50] (step=0066100) Train Loss: 0.0480, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2168 +[2025-02-28 02:12:50] (step=0066200) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2050 +[2025-02-28 02:13:50] (step=0066300) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2050 +[2025-02-28 02:14:50] (step=0066400) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2086 +[2025-02-28 02:15:49] (step=0066500) Train Loss: 0.0479, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2044 +[2025-02-28 02:16:49] (step=0066600) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1930 +[2025-02-28 02:17:49] (step=0066700) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2075 +[2025-02-28 02:18:49] (step=0066800) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2013 +[2025-02-28 02:19:48] (step=0066900) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1981 +[2025-02-28 02:20:48] (step=0067000) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2005 +[2025-02-28 02:21:48] (step=0067100) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1911 +[2025-02-28 02:22:48] (step=0067200) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2069 +[2025-02-28 02:23:47] (step=0067300) Train Loss: 0.0478, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1975 +[2025-02-28 02:24:47] (step=0067400) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2052 +[2025-02-28 02:25:47] (step=0067500) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2009 +[2025-02-28 02:26:50] (step=0067600) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1990 +[2025-02-28 02:27:50] (step=0067700) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2030 +[2025-02-28 02:28:49] (step=0067800) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1958 +[2025-02-28 02:29:49] (step=0067900) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2015 +[2025-02-28 02:30:49] (step=0068000) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1970 +[2025-02-28 02:31:48] (step=0068100) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1976 +[2025-02-28 02:32:48] (step=0068200) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2011 +[2025-02-28 02:33:48] (step=0068300) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1938 +[2025-02-28 02:34:48] (step=0068400) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2003 +[2025-02-28 02:35:47] (step=0068500) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2069 +[2025-02-28 02:36:47] (step=0068600) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1996 +[2025-02-28 02:37:47] (step=0068700) Train Loss: 0.0477, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1971 +[2025-02-28 02:38:46] (step=0068800) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2061 +[2025-02-28 02:39:46] (step=0068900) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2011 +[2025-02-28 02:40:46] (step=0069000) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2061 +[2025-02-28 02:41:46] (step=0069100) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2028 +[2025-02-28 02:42:45] (step=0069200) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1969 +[2025-02-28 02:43:45] (step=0069300) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2021 +[2025-02-28 02:44:45] (step=0069400) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1994 +[2025-02-28 02:45:44] (step=0069500) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2020 +[2025-02-28 02:46:44] (step=0069600) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1987 +[2025-02-28 02:47:44] (step=0069700) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.2118 +[2025-02-28 02:48:44] (step=0069800) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1973 +[2025-02-28 02:49:43] (step=0069900) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1972 +[2025-02-28 02:50:43] (step=0070000) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1975 +[2025-02-28 02:51:46] (step=0070100) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1997 +[2025-02-28 02:52:46] (step=0070200) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1967 +[2025-02-28 02:53:45] (step=0070300) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1922 +[2025-02-28 02:54:45] (step=0070400) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1950 +[2025-02-28 02:55:45] (step=0070500) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1957 +[2025-02-28 02:56:44] (step=0070600) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1933 +[2025-02-28 02:57:44] (step=0070700) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1974 +[2025-02-28 02:58:44] (step=0070800) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1967 +[2025-02-28 02:59:43] (step=0070900) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1958 +[2025-02-28 03:00:43] (step=0071000) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2044 +[2025-02-28 03:01:43] (step=0071100) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1996 +[2025-02-28 03:02:42] (step=0071200) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1950 +[2025-02-28 03:03:42] (step=0071300) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1948 +[2025-02-28 03:04:42] (step=0071400) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1993 +[2025-02-28 03:05:42] (step=0071500) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1915 +[2025-02-28 03:06:41] (step=0071600) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1912 +[2025-02-28 03:07:41] (step=0071700) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1935 +[2025-02-28 03:08:41] (step=0071800) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1855 +[2025-02-28 03:09:40] (step=0071900) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1949 +[2025-02-28 03:10:40] (step=0072000) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1911 +[2025-02-28 03:11:40] (step=0072100) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1946 +[2025-02-28 03:12:39] (step=0072200) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1903 +[2025-02-28 03:13:39] (step=0072300) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1869 +[2025-02-28 03:14:39] (step=0072400) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1898 +[2025-02-28 03:15:39] (step=0072500) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1980 +[2025-02-28 03:16:41] (step=0072600) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1868 +[2025-02-28 03:17:41] (step=0072700) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1911 +[2025-02-28 03:18:41] (step=0072800) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1839 +[2025-02-28 03:19:40] (step=0072900) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1863 +[2025-02-28 03:20:40] (step=0073000) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1887 +[2025-02-28 03:21:40] (step=0073100) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1934 +[2025-02-28 03:22:39] (step=0073200) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1811 +[2025-02-28 03:23:39] (step=0073300) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1900 +[2025-02-28 03:24:39] (step=0073400) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1896 +[2025-02-28 03:25:39] (step=0073500) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1885 +[2025-02-28 03:26:38] (step=0073600) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1905 +[2025-02-28 03:27:38] (step=0073700) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1950 +[2025-02-28 03:28:37] (step=0073800) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1915 +[2025-02-28 03:29:37] (step=0073900) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1866 +[2025-02-28 03:30:37] (step=0074000) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.2007 +[2025-02-28 03:31:36] (step=0074100) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1885 +[2025-02-28 03:32:36] (step=0074200) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1870 +[2025-02-28 03:33:36] (step=0074300) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1922 +[2025-02-28 03:34:35] (step=0074400) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1884 +[2025-02-28 03:35:35] (step=0074500) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1792 +[2025-02-28 03:36:35] (step=0074600) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1844 +[2025-02-28 03:37:34] (step=0074700) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1934 +[2025-02-28 03:38:34] (step=0074800) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1860 +[2025-02-28 03:39:34] (step=0074900) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1910 +[2025-02-28 03:40:33] (step=0075000) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1848 +[2025-02-28 03:41:36] (step=0075100) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1947 +[2025-02-28 03:42:36] (step=0075200) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1796 +[2025-02-28 03:43:36] (step=0075300) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1937 +[2025-02-28 03:44:35] (step=0075400) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1927 +[2025-02-28 03:45:35] (step=0075500) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1988 +[2025-02-28 03:46:35] (step=0075600) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1792 +[2025-02-28 03:47:34] (step=0075700) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1940 +[2025-02-28 03:48:34] (step=0075800) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1972 +[2025-02-28 03:49:33] (step=0075900) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1875 +[2025-02-28 03:50:33] (step=0076000) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1774 +[2025-02-28 03:51:33] (step=0076100) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1899 +[2025-02-28 03:52:32] (step=0076200) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1880 +[2025-02-28 03:53:32] (step=0076300) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1876 +[2025-02-28 03:54:32] (step=0076400) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1893 +[2025-02-28 03:55:31] (step=0076500) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1838 +[2025-02-28 03:56:31] (step=0076600) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1810 +[2025-02-28 03:57:31] (step=0076700) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1818 +[2025-02-28 03:58:30] (step=0076800) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1836 +[2025-02-28 03:59:30] (step=0076900) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1867 +[2025-02-28 04:00:30] (step=0077000) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1875 +[2025-02-28 04:01:29] (step=0077100) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1780 +[2025-02-28 04:02:29] (step=0077200) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1757 +[2025-02-28 04:03:28] (step=0077300) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1906 +[2025-02-28 04:04:28] (step=0077400) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1888 +[2025-02-28 04:05:28] (step=0077500) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1831 +[2025-02-28 04:06:31] (step=0077600) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.1791 +[2025-02-28 04:07:30] (step=0077700) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1954 +[2025-02-28 04:08:30] (step=0077800) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1855 +[2025-02-28 04:09:30] (step=0077900) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1797 +[2025-02-28 04:10:29] (step=0078000) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1812 +[2025-02-28 04:11:29] (step=0078100) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1880 +[2025-02-28 04:12:28] (step=0078200) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1782 +[2025-02-28 04:13:28] (step=0078300) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1806 +[2025-02-28 04:14:28] (step=0078400) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1876 +[2025-02-28 04:15:27] (step=0078500) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1830 +[2025-02-28 04:16:27] (step=0078600) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1777 +[2025-02-28 04:17:27] (step=0078700) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1887 +[2025-02-28 04:18:26] (step=0078800) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1837 +[2025-02-28 04:19:26] (step=0078900) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1767 +[2025-02-28 04:20:26] (step=0079000) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1774 +[2025-02-28 04:21:25] (step=0079100) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1808 +[2025-02-28 04:22:25] (step=0079200) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1820 +[2025-02-28 04:23:25] (step=0079300) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1811 +[2025-02-28 04:24:24] (step=0079400) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1778 +[2025-02-28 04:25:24] (step=0079500) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1855 +[2025-02-28 04:26:24] (step=0079600) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1871 +[2025-02-28 04:27:23] (step=0079700) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1778 +[2025-02-28 04:28:23] (step=0079800) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1763 +[2025-02-28 04:29:23] (step=0079900) Train Loss: 0.0474, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1833 +[2025-02-28 04:30:22] (step=0080000) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1819 +[2025-02-28 04:31:25] (step=0080100) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1808 +[2025-02-28 04:32:25] (step=0080200) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1798 +[2025-02-28 04:33:24] (step=0080300) Train Loss: 0.0476, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1780 +[2025-02-28 04:34:24] (step=0080400) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1813 +[2025-02-28 04:35:24] (step=0080500) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1778 +[2025-02-28 04:36:23] (step=0080600) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1755 +[2025-02-28 04:37:23] (step=0080700) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1791 +[2025-02-28 04:38:23] (step=0080800) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1832 +[2025-02-28 04:39:22] (step=0080900) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1715 +[2025-02-28 04:40:22] (step=0081000) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1861 +[2025-02-28 04:41:22] (step=0081100) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1769 +[2025-02-28 04:42:21] (step=0081200) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1760 +[2025-02-28 04:43:21] (step=0081300) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1855 +[2025-02-28 04:44:21] (step=0081400) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1785 +[2025-02-28 04:45:20] (step=0081500) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1782 +[2025-02-28 04:46:20] (step=0081600) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1757 +[2025-02-28 04:47:20] (step=0081700) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1762 +[2025-02-28 04:48:19] (step=0081800) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1804 +[2025-02-28 04:49:19] (step=0081900) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1717 +[2025-02-28 04:50:19] (step=0082000) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1772 +[2025-02-28 04:51:18] (step=0082100) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1810 +[2025-02-28 04:52:18] (step=0082200) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1715 +[2025-02-28 04:53:18] (step=0082300) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1735 +[2025-02-28 04:54:17] (step=0082400) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1764 +[2025-02-28 04:55:17] (step=0082500) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1799 +[2025-02-28 04:56:20] (step=0082600) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.1753 +[2025-02-28 04:57:20] (step=0082700) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1717 +[2025-02-28 04:58:19] (step=0082800) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1764 +[2025-02-28 04:59:19] (step=0082900) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1759 +[2025-02-28 05:00:19] (step=0083000) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1823 +[2025-02-28 05:01:18] (step=0083100) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1743 +[2025-02-28 05:02:18] (step=0083200) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1779 +[2025-02-28 05:03:18] (step=0083300) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1731 +[2025-02-28 05:04:17] (step=0083400) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1808 +[2025-02-28 05:05:17] (step=0083500) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1624 +[2025-02-28 05:06:17] (step=0083600) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1719 +[2025-02-28 05:07:16] (step=0083700) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1861 +[2025-02-28 05:08:16] (step=0083800) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1738 +[2025-02-28 05:09:16] (step=0083900) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1803 +[2025-02-28 05:10:15] (step=0084000) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1788 +[2025-02-28 05:11:15] (step=0084100) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1804 +[2025-02-28 05:12:15] (step=0084200) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1792 +[2025-02-28 05:13:14] (step=0084300) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1691 +[2025-02-28 05:14:14] (step=0084400) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1787 +[2025-02-28 05:15:14] (step=0084500) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1656 +[2025-02-28 05:16:13] (step=0084600) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1796 +[2025-02-28 05:17:13] (step=0084700) Train Loss: 0.0475, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1710 +[2025-02-28 05:18:13] (step=0084800) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1782 +[2025-02-28 05:19:12] (step=0084900) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1725 +[2025-02-28 05:20:12] (step=0085000) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1682 +[2025-02-28 05:21:15] (step=0085100) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.1735 +[2025-02-28 05:22:14] (step=0085200) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1775 +[2025-02-28 05:23:14] (step=0085300) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1799 +[2025-02-28 05:24:14] (step=0085400) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1754 +[2025-02-28 05:25:13] (step=0085500) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1789 +[2025-02-28 05:26:13] (step=0085600) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1807 +[2025-02-28 05:27:12] (step=0085700) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1839 +[2025-02-28 05:28:12] (step=0085800) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1693 +[2025-02-28 05:29:12] (step=0085900) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1680 +[2025-02-28 05:30:11] (step=0086000) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1693 +[2025-02-28 05:31:11] (step=0086100) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1710 +[2025-02-28 05:32:11] (step=0086200) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1777 +[2025-02-28 05:33:10] (step=0086300) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1629 +[2025-02-28 05:34:10] (step=0086400) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1770 +[2025-02-28 05:35:10] (step=0086500) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1704 +[2025-02-28 05:36:09] (step=0086600) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1711 +[2025-02-28 05:37:09] (step=0086700) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1704 +[2025-02-28 05:38:09] (step=0086800) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1682 +[2025-02-28 05:39:08] (step=0086900) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1754 +[2025-02-28 05:40:08] (step=0087000) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1687 +[2025-02-28 05:41:08] (step=0087100) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1732 +[2025-02-28 05:42:07] (step=0087200) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1672 +[2025-02-28 05:43:07] (step=0087300) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1709 +[2025-02-28 05:44:07] (step=0087400) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1725 +[2025-02-28 05:45:06] (step=0087500) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1697 +[2025-02-28 05:46:09] (step=0087600) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1742 +[2025-02-28 05:47:09] (step=0087700) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1729 +[2025-02-28 05:48:09] (step=0087800) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1729 +[2025-02-28 05:49:08] (step=0087900) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1680 +[2025-02-28 05:50:08] (step=0088000) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1741 +[2025-02-28 05:51:08] (step=0088100) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1723 +[2025-02-28 05:52:07] (step=0088200) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1708 +[2025-02-28 05:53:07] (step=0088300) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1778 +[2025-02-28 05:54:07] (step=0088400) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1736 +[2025-02-28 05:55:06] (step=0088500) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1701 +[2025-02-28 05:56:06] (step=0088600) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1764 +[2025-02-28 05:57:06] (step=0088700) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1749 +[2025-02-28 05:58:05] (step=0088800) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1664 +[2025-02-28 05:59:05] (step=0088900) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1730 +[2025-02-28 06:00:05] (step=0089000) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1744 +[2025-02-28 06:01:04] (step=0089100) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1706 +[2025-02-28 06:02:04] (step=0089200) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1661 +[2025-02-28 06:03:04] (step=0089300) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1665 +[2025-02-28 06:04:03] (step=0089400) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1595 +[2025-02-28 06:05:03] (step=0089500) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1699 +[2025-02-28 06:06:03] (step=0089600) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1696 +[2025-02-28 06:07:02] (step=0089700) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1618 +[2025-02-28 06:08:02] (step=0089800) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1732 +[2025-02-28 06:09:02] (step=0089900) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1707 +[2025-02-28 06:10:01] (step=0090000) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1645 +[2025-02-28 06:11:04] (step=0090100) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1699 +[2025-02-28 06:12:04] (step=0090200) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1774 +[2025-02-28 06:13:04] (step=0090300) Train Loss: 0.0473, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1666 +[2025-02-28 06:14:03] (step=0090400) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1638 +[2025-02-28 06:15:03] (step=0090500) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1716 +[2025-02-28 06:16:03] (step=0090600) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1671 +[2025-02-28 06:17:02] (step=0090700) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1691 +[2025-02-28 06:18:02] (step=0090800) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1653 +[2025-02-28 06:19:02] (step=0090900) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1666 +[2025-02-28 06:20:01] (step=0091000) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1695 +[2025-02-28 06:21:01] (step=0091100) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1650 +[2025-02-28 06:22:00] (step=0091200) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1678 +[2025-02-28 06:23:00] (step=0091300) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1598 +[2025-02-28 06:24:00] (step=0091400) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1696 +[2025-02-28 06:24:59] (step=0091500) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1645 +[2025-02-28 06:25:59] (step=0091600) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1688 +[2025-02-28 06:26:59] (step=0091700) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1682 +[2025-02-28 06:27:58] (step=0091800) Train Loss: 0.0472, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1673 +[2025-02-28 06:28:58] (step=0091900) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1721 +[2025-02-28 06:29:58] (step=0092000) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1633 +[2025-02-28 06:30:58] (step=0092100) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1633 +[2025-02-28 06:31:57] (step=0092200) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1611 +[2025-02-28 06:32:57] (step=0092300) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1637 +[2025-02-28 06:33:57] (step=0092400) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1705 +[2025-02-28 06:34:57] (step=0092500) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1745 +[2025-02-28 06:36:00] (step=0092600) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1664 +[2025-02-28 06:37:00] (step=0092700) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1615 +[2025-02-28 06:37:59] (step=0092800) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1664 +[2025-02-28 06:38:59] (step=0092900) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1709 +[2025-02-28 06:39:59] (step=0093000) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1623 +[2025-02-28 06:40:58] (step=0093100) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1592 +[2025-02-28 06:41:58] (step=0093200) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1613 +[2025-02-28 06:42:58] (step=0093300) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1734 +[2025-02-28 06:43:58] (step=0093400) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1620 +[2025-02-28 06:44:57] (step=0093500) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1680 +[2025-02-28 06:45:57] (step=0093600) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1597 +[2025-02-28 06:46:57] (step=0093700) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1561 +[2025-02-28 06:47:57] (step=0093800) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1597 +[2025-02-28 06:48:56] (step=0093900) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1713 +[2025-02-28 06:49:56] (step=0094000) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1531 +[2025-02-28 06:50:56] (step=0094100) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1594 +[2025-02-28 06:51:56] (step=0094200) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1650 +[2025-02-28 06:52:55] (step=0094300) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1635 +[2025-02-28 06:53:55] (step=0094400) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1605 +[2025-02-28 06:54:55] (step=0094500) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1608 +[2025-02-28 06:55:55] (step=0094600) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1651 +[2025-02-28 06:56:54] (step=0094700) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1664 +[2025-02-28 06:57:54] (step=0094800) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1589 +[2025-02-28 06:58:54] (step=0094900) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1596 +[2025-02-28 06:59:54] (step=0095000) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1586 +[2025-02-28 07:00:56] (step=0095100) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1627 +[2025-02-28 07:01:56] (step=0095200) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1666 +[2025-02-28 07:02:56] (step=0095300) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1644 +[2025-02-28 07:03:56] (step=0095400) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1696 +[2025-02-28 07:04:55] (step=0095500) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1662 +[2025-02-28 07:05:55] (step=0095600) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1626 +[2025-02-28 07:06:55] (step=0095700) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1603 +[2025-02-28 07:07:54] (step=0095800) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1610 +[2025-02-28 07:08:54] (step=0095900) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1632 +[2025-02-28 07:09:54] (step=0096000) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1641 +[2025-02-28 07:10:53] (step=0096100) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1588 +[2025-02-28 07:11:53] (step=0096200) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1672 +[2025-02-28 07:12:53] (step=0096300) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1672 +[2025-02-28 07:13:52] (step=0096400) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1595 +[2025-02-28 07:14:52] (step=0096500) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1585 +[2025-02-28 07:15:52] (step=0096600) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1644 +[2025-02-28 07:16:52] (step=0096700) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1579 +[2025-02-28 07:17:51] (step=0096800) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1647 +[2025-02-28 07:18:51] (step=0096900) Train Loss: 0.0470, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1655 +[2025-02-28 07:19:51] (step=0097000) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1572 +[2025-02-28 07:20:50] (step=0097100) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1582 +[2025-02-28 07:21:50] (step=0097200) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1525 +[2025-02-28 07:22:50] (step=0097300) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1577 +[2025-02-28 07:23:49] (step=0097400) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1608 +[2025-02-28 07:24:49] (step=0097500) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1672 +[2025-02-28 07:25:52] (step=0097600) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1553 +[2025-02-28 07:26:52] (step=0097700) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1576 +[2025-02-28 07:27:51] (step=0097800) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1586 +[2025-02-28 07:28:51] (step=0097900) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1548 +[2025-02-28 07:29:51] (step=0098000) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1628 +[2025-02-28 07:30:50] (step=0098100) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1640 +[2025-02-28 07:31:50] (step=0098200) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1589 +[2025-02-28 07:32:50] (step=0098300) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1680 +[2025-02-28 07:33:49] (step=0098400) Train Loss: 0.0471, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1512 +[2025-02-28 07:34:49] (step=0098500) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1623 +[2025-02-28 07:35:49] (step=0098600) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1478 +[2025-02-28 07:36:49] (step=0098700) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1608 +[2025-02-28 07:37:48] (step=0098800) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1541 +[2025-02-28 07:38:48] (step=0098900) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1606 +[2025-02-28 07:39:48] (step=0099000) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1593 +[2025-02-28 07:40:47] (step=0099100) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1630 +[2025-02-28 07:41:47] (step=0099200) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1569 +[2025-02-28 07:42:47] (step=0099300) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1581 +[2025-02-28 07:43:47] (step=0099400) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1541 +[2025-02-28 07:44:46] (step=0099500) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1527 +[2025-02-28 07:45:46] (step=0099600) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1601 +[2025-02-28 07:46:46] (step=0099700) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1612 +[2025-02-28 07:47:45] (step=0099800) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1535 +[2025-02-28 07:48:45] (step=0099900) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1630 +[2025-02-28 07:49:45] (step=0100000) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1620 +[2025-02-28 07:49:48] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0100000.pt +[2025-02-28 07:55:29] (step=0100000), Fid=11.432212264136467, PSNR=26.724181042742728, LPIPS=0.22398734092712402, SSIM=0.7371894717216492 +[2025-02-28 07:56:32] (step=0100100) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.25, Grad Norm: 0.1559 +[2025-02-28 07:57:32] (step=0100200) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1572 +[2025-02-28 07:58:32] (step=0100300) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1538 +[2025-02-28 07:59:31] (step=0100400) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1531 +[2025-02-28 08:00:31] (step=0100500) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1593 +[2025-02-28 08:01:31] (step=0100600) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1555 +[2025-02-28 08:02:31] (step=0100700) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1582 +[2025-02-28 08:03:30] (step=0100800) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1545 +[2025-02-28 08:04:30] (step=0100900) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1586 +[2025-02-28 08:05:30] (step=0101000) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1537 +[2025-02-28 08:06:29] (step=0101100) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1538 +[2025-02-28 08:07:29] (step=0101200) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1598 +[2025-02-28 08:08:28] (step=0101300) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1513 +[2025-02-28 08:09:28] (step=0101400) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1568 +[2025-02-28 08:10:28] (step=0101500) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1526 +[2025-02-28 08:11:27] (step=0101600) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1518 +[2025-02-28 08:12:27] (step=0101700) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1594 +[2025-02-28 08:13:26] (step=0101800) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1530 +[2025-02-28 08:14:26] (step=0101900) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1528 +[2025-02-28 08:15:26] (step=0102000) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1548 +[2025-02-28 08:16:25] (step=0102100) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1562 +[2025-02-28 08:17:25] (step=0102200) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1587 +[2025-02-28 08:18:24] (step=0102300) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1497 +[2025-02-28 08:19:24] (step=0102400) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1590 +[2025-02-28 08:20:24] (step=0102500) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1555 +[2025-02-28 08:21:26] (step=0102600) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1528 +[2025-02-28 08:22:26] (step=0102700) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1593 +[2025-02-28 08:23:26] (step=0102800) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1578 +[2025-02-28 08:24:26] (step=0102900) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1533 +[2025-02-28 08:25:25] (step=0103000) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1491 +[2025-02-28 08:26:25] (step=0103100) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1571 +[2025-02-28 08:27:25] (step=0103200) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1539 +[2025-02-28 08:28:25] (step=0103300) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1473 +[2025-02-28 08:29:24] (step=0103400) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1547 +[2025-02-28 08:30:24] (step=0103500) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1522 +[2025-02-28 08:31:24] (step=0103600) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1514 +[2025-02-28 08:32:23] (step=0103700) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1459 +[2025-02-28 08:33:23] (step=0103800) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1570 +[2025-02-28 08:34:22] (step=0103900) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1457 +[2025-02-28 08:35:22] (step=0104000) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1523 +[2025-02-28 08:36:22] (step=0104100) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1517 +[2025-02-28 08:37:21] (step=0104200) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1525 +[2025-02-28 08:38:21] (step=0104300) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1564 +[2025-02-28 08:39:20] (step=0104400) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1524 +[2025-02-28 08:40:20] (step=0104500) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1486 +[2025-02-28 08:41:20] (step=0104600) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1480 +[2025-02-28 08:42:19] (step=0104700) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1524 +[2025-02-28 08:43:19] (step=0104800) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1556 +[2025-02-28 08:44:18] (step=0104900) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1552 +[2025-02-28 08:45:18] (step=0105000) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1495 +[2025-02-28 08:46:21] (step=0105100) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1551 +[2025-02-28 08:47:21] (step=0105200) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1479 +[2025-02-28 08:48:20] (step=0105300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1622 +[2025-02-28 08:49:20] (step=0105400) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1526 +[2025-02-28 08:50:19] (step=0105500) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1558 +[2025-02-28 08:51:19] (step=0105600) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1553 +[2025-02-28 08:52:19] (step=0105700) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1590 +[2025-02-28 08:53:18] (step=0105800) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1468 +[2025-02-28 08:54:18] (step=0105900) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1529 +[2025-02-28 08:55:18] (step=0106000) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1472 +[2025-02-28 08:56:17] (step=0106100) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1527 +[2025-02-28 08:57:17] (step=0106200) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1459 +[2025-02-28 08:58:16] (step=0106300) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1523 +[2025-02-28 08:59:16] (step=0106400) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1482 +[2025-02-28 09:00:16] (step=0106500) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1505 +[2025-02-28 09:01:15] (step=0106600) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1503 +[2025-02-28 09:02:15] (step=0106700) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1460 +[2025-02-28 09:03:14] (step=0106800) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1454 +[2025-02-28 09:04:14] (step=0106900) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1499 +[2025-02-28 09:05:14] (step=0107000) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1516 +[2025-02-28 09:06:13] (step=0107100) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1526 +[2025-02-28 09:07:13] (step=0107200) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1491 +[2025-02-28 09:08:12] (step=0107300) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1528 +[2025-02-28 09:09:12] (step=0107400) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1520 +[2025-02-28 09:10:11] (step=0107500) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1528 +[2025-02-28 09:11:14] (step=0107600) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1511 +[2025-02-28 09:12:14] (step=0107700) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1463 +[2025-02-28 09:13:14] (step=0107800) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1413 +[2025-02-28 09:14:13] (step=0107900) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1541 +[2025-02-28 09:15:13] (step=0108000) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1446 +[2025-02-28 09:16:12] (step=0108100) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1479 +[2025-02-28 09:17:12] (step=0108200) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1534 +[2025-02-28 09:18:12] (step=0108300) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1498 +[2025-02-28 09:19:11] (step=0108400) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1526 +[2025-02-28 09:20:11] (step=0108500) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1457 +[2025-02-28 09:21:10] (step=0108600) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1524 +[2025-02-28 09:22:10] (step=0108700) Train Loss: 0.0469, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1517 +[2025-02-28 09:23:09] (step=0108800) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1460 +[2025-02-28 09:24:09] (step=0108900) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1495 +[2025-02-28 09:25:09] (step=0109000) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1462 +[2025-02-28 09:26:08] (step=0109100) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1432 +[2025-02-28 09:27:08] (step=0109200) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1469 +[2025-02-28 09:28:07] (step=0109300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1507 +[2025-02-28 09:29:07] (step=0109400) Train Loss: 0.0468, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1483 +[2025-02-28 09:30:07] (step=0109500) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1458 +[2025-02-28 09:31:07] (step=0109600) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1486 +[2025-02-28 09:32:06] (step=0109700) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1487 +[2025-02-28 09:33:06] (step=0109800) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1506 +[2025-02-28 09:34:06] (step=0109900) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1471 +[2025-02-28 09:35:05] (step=0110000) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1474 +[2025-02-28 09:36:08] (step=0110100) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1528 +[2025-02-28 09:37:08] (step=0110200) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1495 +[2025-02-28 09:38:08] (step=0110300) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1508 +[2025-02-28 09:39:07] (step=0110400) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1454 +[2025-02-28 09:40:07] (step=0110500) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1505 +[2025-02-28 09:41:06] (step=0110600) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1516 +[2025-02-28 09:42:06] (step=0110700) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1528 +[2025-02-28 09:43:06] (step=0110800) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1512 +[2025-02-28 09:44:05] (step=0110900) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1520 +[2025-02-28 09:45:05] (step=0111000) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1468 +[2025-02-28 09:46:04] (step=0111100) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1449 +[2025-02-28 09:47:04] (step=0111200) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1478 +[2025-02-28 09:48:03] (step=0111300) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1509 +[2025-02-28 09:49:03] (step=0111400) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1421 +[2025-02-28 09:50:03] (step=0111500) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1433 +[2025-02-28 09:51:02] (step=0111600) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1480 +[2025-02-28 09:52:02] (step=0111700) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1466 +[2025-02-28 09:53:01] (step=0111800) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1462 +[2025-02-28 09:54:01] (step=0111900) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1502 +[2025-02-28 09:55:01] (step=0112000) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1438 +[2025-02-28 09:56:00] (step=0112100) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1419 +[2025-02-28 09:57:00] (step=0112200) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1484 +[2025-02-28 09:57:59] (step=0112300) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1460 +[2025-02-28 09:58:59] (step=0112400) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1460 +[2025-02-28 09:59:58] (step=0112500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1476 +[2025-02-28 10:01:01] (step=0112600) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1458 +[2025-02-28 10:02:01] (step=0112700) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1441 +[2025-02-28 10:03:01] (step=0112800) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1455 +[2025-02-28 10:04:00] (step=0112900) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1431 +[2025-02-28 10:05:00] (step=0113000) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1416 +[2025-02-28 10:05:59] (step=0113100) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1458 +[2025-02-28 10:06:59] (step=0113200) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1448 +[2025-02-28 10:07:59] (step=0113300) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1426 +[2025-02-28 10:08:58] (step=0113400) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1479 +[2025-02-28 10:09:58] (step=0113500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1499 +[2025-02-28 10:10:57] (step=0113600) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1411 +[2025-02-28 10:11:57] (step=0113700) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1501 +[2025-02-28 10:12:57] (step=0113800) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1419 +[2025-02-28 10:13:56] (step=0113900) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1421 +[2025-02-28 10:14:56] (step=0114000) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1393 +[2025-02-28 10:15:56] (step=0114100) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1450 +[2025-02-28 10:16:55] (step=0114200) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1407 +[2025-02-28 10:17:55] (step=0114300) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1468 +[2025-02-28 10:18:55] (step=0114400) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1377 +[2025-02-28 10:19:54] (step=0114500) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1388 +[2025-02-28 10:20:54] (step=0114600) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1452 +[2025-02-28 10:21:53] (step=0114700) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1422 +[2025-02-28 10:22:53] (step=0114800) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1396 +[2025-02-28 10:23:53] (step=0114900) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1440 +[2025-02-28 10:24:52] (step=0115000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1402 +[2025-02-28 10:25:55] (step=0115100) Train Loss: 0.0466, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1468 +[2025-02-28 10:26:55] (step=0115200) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1402 +[2025-02-28 10:27:55] (step=0115300) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1429 +[2025-02-28 10:28:55] (step=0115400) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1475 +[2025-02-28 10:29:54] (step=0115500) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1450 +[2025-02-28 10:30:54] (step=0115600) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1459 +[2025-02-28 10:31:53] (step=0115700) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1454 +[2025-02-28 10:32:53] (step=0115800) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1403 +[2025-02-28 10:33:53] (step=0115900) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1474 +[2025-02-28 10:34:52] (step=0116000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1430 +[2025-02-28 10:35:52] (step=0116100) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1436 +[2025-02-28 10:36:52] (step=0116200) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1474 +[2025-02-28 10:37:51] (step=0116300) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1411 +[2025-02-28 10:38:51] (step=0116400) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1438 +[2025-02-28 10:39:51] (step=0116500) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1453 +[2025-02-28 10:40:50] (step=0116600) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1444 +[2025-02-28 10:41:50] (step=0116700) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1476 +[2025-02-28 10:42:50] (step=0116800) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1410 +[2025-02-28 10:43:50] (step=0116900) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1426 +[2025-02-28 10:44:49] (step=0117000) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1436 +[2025-02-28 10:45:49] (step=0117100) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1392 +[2025-02-28 10:46:48] (step=0117200) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1463 +[2025-02-28 10:47:48] (step=0117300) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1373 +[2025-02-28 10:48:47] (step=0117400) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1428 +[2025-02-28 10:49:47] (step=0117500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1405 +[2025-02-28 10:50:50] (step=0117600) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1344 +[2025-02-28 10:51:50] (step=0117700) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1405 +[2025-02-28 10:52:49] (step=0117800) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1428 +[2025-02-28 10:53:49] (step=0117900) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1354 +[2025-02-28 10:54:49] (step=0118000) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1371 +[2025-02-28 10:55:48] (step=0118100) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1354 +[2025-02-28 10:56:48] (step=0118200) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1426 +[2025-02-28 10:57:47] (step=0118300) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1394 +[2025-02-28 10:58:47] (step=0118400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1344 +[2025-02-28 10:59:46] (step=0118500) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1419 +[2025-02-28 11:00:46] (step=0118600) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1389 +[2025-02-28 11:01:45] (step=0118700) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1410 +[2025-02-28 11:02:45] (step=0118800) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1384 +[2025-02-28 11:03:44] (step=0118900) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1433 +[2025-02-28 11:04:44] (step=0119000) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1379 +[2025-02-28 11:05:43] (step=0119100) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1442 +[2025-02-28 11:06:42] (step=0119200) Train Loss: 0.0467, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1330 +[2025-02-28 11:07:42] (step=0119300) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1372 +[2025-02-28 11:08:42] (step=0119400) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1420 +[2025-02-28 11:09:41] (step=0119500) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1396 +[2025-02-28 11:10:41] (step=0119600) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1376 +[2025-02-28 11:11:40] (step=0119700) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1392 +[2025-02-28 11:12:39] (step=0119800) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1387 +[2025-02-28 11:13:39] (step=0119900) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1347 +[2025-02-28 11:14:38] (step=0120000) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1375 +[2025-02-28 11:15:41] (step=0120100) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.1414 +[2025-02-28 11:16:41] (step=0120200) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1395 +[2025-02-28 11:17:40] (step=0120300) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1334 +[2025-02-28 11:18:40] (step=0120400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1404 +[2025-02-28 11:19:40] (step=0120500) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1383 +[2025-02-28 11:20:39] (step=0120600) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1366 +[2025-02-28 11:21:39] (step=0120700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1391 +[2025-02-28 11:22:38] (step=0120800) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1410 +[2025-02-28 11:23:38] (step=0120900) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1354 +[2025-02-28 11:24:37] (step=0121000) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1350 +[2025-02-28 11:25:37] (step=0121100) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1346 +[2025-02-28 11:26:37] (step=0121200) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1399 +[2025-02-28 11:27:36] (step=0121300) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1378 +[2025-02-28 11:28:36] (step=0121400) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1368 +[2025-02-28 11:29:35] (step=0121500) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1391 +[2025-02-28 11:30:35] (step=0121600) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1366 +[2025-02-28 11:31:34] (step=0121700) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1383 +[2025-02-28 11:32:34] (step=0121800) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1350 +[2025-02-28 11:33:34] (step=0121900) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1364 +[2025-02-28 11:34:33] (step=0122000) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1424 +[2025-02-28 11:35:33] (step=0122100) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1345 +[2025-02-28 11:36:32] (step=0122200) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1342 +[2025-02-28 11:37:32] (step=0122300) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1333 +[2025-02-28 11:38:31] (step=0122400) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1384 +[2025-02-28 11:39:31] (step=0122500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1384 +[2025-02-28 11:40:34] (step=0122600) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1353 +[2025-02-28 11:41:34] (step=0122700) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1347 +[2025-02-28 11:42:33] (step=0122800) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1357 +[2025-02-28 11:43:33] (step=0122900) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1441 +[2025-02-28 11:44:32] (step=0123000) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1378 +[2025-02-28 11:45:32] (step=0123100) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1331 +[2025-02-28 11:46:31] (step=0123200) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1369 +[2025-02-28 11:47:30] (step=0123300) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1363 +[2025-02-28 11:48:30] (step=0123400) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1391 +[2025-02-28 11:49:29] (step=0123500) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1442 +[2025-02-28 11:50:29] (step=0123600) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1336 +[2025-02-28 11:51:28] (step=0123700) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1421 +[2025-02-28 11:52:28] (step=0123800) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1329 +[2025-02-28 11:53:27] (step=0123900) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1334 +[2025-02-28 11:54:27] (step=0124000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1391 +[2025-02-28 11:55:26] (step=0124100) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1375 +[2025-02-28 11:56:26] (step=0124200) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1359 +[2025-02-28 11:57:25] (step=0124300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1373 +[2025-02-28 11:58:24] (step=0124400) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1349 +[2025-02-28 11:59:24] (step=0124500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1338 +[2025-02-28 12:00:23] (step=0124600) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1381 +[2025-02-28 12:01:23] (step=0124700) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1364 +[2025-02-28 12:02:22] (step=0124800) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1261 +[2025-02-28 12:03:22] (step=0124900) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1353 +[2025-02-28 12:04:21] (step=0125000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1310 +[2025-02-28 12:05:22] (step=0125100) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.1393 +[2025-02-28 12:06:24] (step=0125200) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.61, Grad Norm: 0.1358 +[2025-02-28 12:07:23] (step=0125300) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1349 +[2025-02-28 12:08:23] (step=0125400) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1385 +[2025-02-28 12:09:22] (step=0125500) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1385 +[2025-02-28 12:10:22] (step=0125600) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1300 +[2025-02-28 12:11:22] (step=0125700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1361 +[2025-02-28 12:12:21] (step=0125800) Train Loss: 0.0465, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1340 +[2025-02-28 12:13:21] (step=0125900) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1348 +[2025-02-28 12:14:20] (step=0126000) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1368 +[2025-02-28 12:15:20] (step=0126100) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1375 +[2025-02-28 12:16:19] (step=0126200) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1346 +[2025-02-28 12:17:19] (step=0126300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1386 +[2025-02-28 12:18:18] (step=0126400) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1382 +[2025-02-28 12:19:18] (step=0126500) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1289 +[2025-02-28 12:20:17] (step=0126600) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1339 +[2025-02-28 12:21:17] (step=0126700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1374 +[2025-02-28 12:22:17] (step=0126800) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1391 +[2025-02-28 12:23:16] (step=0126900) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1343 +[2025-02-28 12:24:16] (step=0127000) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1285 +[2025-02-28 12:25:15] (step=0127100) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1334 +[2025-02-28 12:26:15] (step=0127200) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1306 +[2025-02-28 12:27:14] (step=0127300) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1349 +[2025-02-28 12:28:14] (step=0127400) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1349 +[2025-02-28 12:29:13] (step=0127500) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1372 +[2025-02-28 12:30:13] (step=0127600) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1327 +[2025-02-28 12:31:16] (step=0127700) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1410 +[2025-02-28 12:32:15] (step=0127800) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1296 +[2025-02-28 12:33:15] (step=0127900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1342 +[2025-02-28 12:34:15] (step=0128000) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1329 +[2025-02-28 12:35:14] (step=0128100) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1375 +[2025-02-28 12:36:14] (step=0128200) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1353 +[2025-02-28 12:37:13] (step=0128300) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1332 +[2025-02-28 12:38:13] (step=0128400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1406 +[2025-02-28 12:39:12] (step=0128500) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1410 +[2025-02-28 12:40:12] (step=0128600) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1270 +[2025-02-28 12:41:11] (step=0128700) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1294 +[2025-02-28 12:42:11] (step=0128800) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1357 +[2025-02-28 12:43:10] (step=0128900) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1308 +[2025-02-28 12:44:10] (step=0129000) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1352 +[2025-02-28 12:45:09] (step=0129100) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1301 +[2025-02-28 12:46:09] (step=0129200) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1341 +[2025-02-28 12:47:08] (step=0129300) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1343 +[2025-02-28 12:48:08] (step=0129400) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1286 +[2025-02-28 12:49:07] (step=0129500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1299 +[2025-02-28 12:50:07] (step=0129600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1360 +[2025-02-28 12:51:07] (step=0129700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1320 +[2025-02-28 12:52:06] (step=0129800) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1323 +[2025-02-28 12:53:06] (step=0129900) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1309 +[2025-02-28 12:54:05] (step=0130000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1272 +[2025-02-28 12:55:05] (step=0130100) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1338 +[2025-02-28 12:56:08] (step=0130200) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.58, Grad Norm: 0.1382 +[2025-02-28 12:57:07] (step=0130300) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1282 +[2025-02-28 12:58:07] (step=0130400) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1346 +[2025-02-28 12:59:06] (step=0130500) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1306 +[2025-02-28 13:00:06] (step=0130600) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1307 +[2025-02-28 13:01:06] (step=0130700) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1325 +[2025-02-28 13:02:05] (step=0130800) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1292 +[2025-02-28 13:03:05] (step=0130900) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1335 +[2025-02-28 13:04:04] (step=0131000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1302 +[2025-02-28 13:05:04] (step=0131100) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1335 +[2025-02-28 13:06:03] (step=0131200) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1347 +[2025-02-28 13:07:03] (step=0131300) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1274 +[2025-02-28 13:08:02] (step=0131400) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1329 +[2025-02-28 13:09:02] (step=0131500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1314 +[2025-02-28 13:10:01] (step=0131600) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1306 +[2025-02-28 13:11:01] (step=0131700) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1310 +[2025-02-28 13:12:00] (step=0131800) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1279 +[2025-02-28 13:13:00] (step=0131900) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1289 +[2025-02-28 13:13:59] (step=0132000) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1300 +[2025-02-28 13:14:59] (step=0132100) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1338 +[2025-02-28 13:15:58] (step=0132200) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1257 +[2025-02-28 13:16:58] (step=0132300) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1352 +[2025-02-28 13:17:57] (step=0132400) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1355 +[2025-02-28 13:18:57] (step=0132500) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1362 +[2025-02-28 13:19:56] (step=0132600) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1340 +[2025-02-28 13:20:59] (step=0132700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1301 +[2025-02-28 13:21:59] (step=0132800) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1331 +[2025-02-28 13:22:59] (step=0132900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1298 +[2025-02-28 13:23:58] (step=0133000) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1275 +[2025-02-28 13:24:58] (step=0133100) Train Loss: 0.0463, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1317 +[2025-02-28 13:25:57] (step=0133200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1257 +[2025-02-28 13:26:57] (step=0133300) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1279 +[2025-02-28 13:27:56] (step=0133400) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1340 +[2025-02-28 13:28:56] (step=0133500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1262 +[2025-02-28 13:29:55] (step=0133600) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1353 +[2025-02-28 13:30:55] (step=0133700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1288 +[2025-02-28 13:31:54] (step=0133800) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1296 +[2025-02-28 13:32:54] (step=0133900) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1298 +[2025-02-28 13:33:53] (step=0134000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1347 +[2025-02-28 13:34:53] (step=0134100) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1284 +[2025-02-28 13:35:52] (step=0134200) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1299 +[2025-02-28 13:36:52] (step=0134300) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1305 +[2025-02-28 13:37:51] (step=0134400) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1238 +[2025-02-28 13:38:51] (step=0134500) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1287 +[2025-02-28 13:39:51] (step=0134600) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1315 +[2025-02-28 13:40:50] (step=0134700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1249 +[2025-02-28 13:41:50] (step=0134800) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1242 +[2025-02-28 13:42:49] (step=0134900) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1282 +[2025-02-28 13:43:49] (step=0135000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1269 +[2025-02-28 13:44:48] (step=0135100) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1278 +[2025-02-28 13:45:51] (step=0135200) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1301 +[2025-02-28 13:46:51] (step=0135300) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1333 +[2025-02-28 13:47:50] (step=0135400) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1267 +[2025-02-28 13:48:50] (step=0135500) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1310 +[2025-02-28 13:49:49] (step=0135600) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1290 +[2025-02-28 13:50:49] (step=0135700) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1287 +[2025-02-28 13:51:48] (step=0135800) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1289 +[2025-02-28 13:52:48] (step=0135900) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1286 +[2025-02-28 13:53:47] (step=0136000) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1266 +[2025-02-28 13:54:47] (step=0136100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1260 +[2025-02-28 13:55:46] (step=0136200) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1243 +[2025-02-28 13:56:46] (step=0136300) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1282 +[2025-02-28 13:57:45] (step=0136400) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1305 +[2025-02-28 13:58:45] (step=0136500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1181 +[2025-02-28 13:59:44] (step=0136600) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1347 +[2025-02-28 14:00:44] (step=0136700) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1258 +[2025-02-28 14:01:44] (step=0136800) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1314 +[2025-02-28 14:02:43] (step=0136900) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1289 +[2025-02-28 14:03:43] (step=0137000) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1330 +[2025-02-28 14:04:42] (step=0137100) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1307 +[2025-02-28 14:05:42] (step=0137200) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1330 +[2025-02-28 14:06:41] (step=0137300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1313 +[2025-02-28 14:07:41] (step=0137400) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1279 +[2025-02-28 14:08:40] (step=0137500) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1328 +[2025-02-28 14:09:40] (step=0137600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1247 +[2025-02-28 14:10:43] (step=0137700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1192 +[2025-02-28 14:11:42] (step=0137800) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1337 +[2025-02-28 14:12:42] (step=0137900) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1221 +[2025-02-28 14:13:41] (step=0138000) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1241 +[2025-02-28 14:14:41] (step=0138100) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1233 +[2025-02-28 14:15:41] (step=0138200) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1303 +[2025-02-28 14:16:40] (step=0138300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1277 +[2025-02-28 14:17:40] (step=0138400) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1281 +[2025-02-28 14:18:39] (step=0138500) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1300 +[2025-02-28 14:19:39] (step=0138600) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1276 +[2025-02-28 14:20:39] (step=0138700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1318 +[2025-02-28 14:21:38] (step=0138800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1271 +[2025-02-28 14:22:38] (step=0138900) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1284 +[2025-02-28 14:23:37] (step=0139000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1233 +[2025-02-28 14:24:37] (step=0139100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1209 +[2025-02-28 14:25:36] (step=0139200) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1315 +[2025-02-28 14:26:36] (step=0139300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1251 +[2025-02-28 14:27:35] (step=0139400) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1308 +[2025-02-28 14:28:35] (step=0139500) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1287 +[2025-02-28 14:29:34] (step=0139600) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1285 +[2025-02-28 14:30:34] (step=0139700) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1327 +[2025-02-28 14:31:33] (step=0139800) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1266 +[2025-02-28 14:32:33] (step=0139900) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1228 +[2025-02-28 14:33:33] (step=0140000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1276 +[2025-02-28 14:34:32] (step=0140100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1291 +[2025-02-28 14:35:35] (step=0140200) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.1246 +[2025-02-28 14:36:34] (step=0140300) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1287 +[2025-02-28 14:37:34] (step=0140400) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1232 +[2025-02-28 14:38:33] (step=0140500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1305 +[2025-02-28 14:39:33] (step=0140600) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1274 +[2025-02-28 14:40:32] (step=0140700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1322 +[2025-02-28 14:41:32] (step=0140800) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1180 +[2025-02-28 14:42:32] (step=0140900) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1230 +[2025-02-28 14:43:31] (step=0141000) Train Loss: 0.0464, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1258 +[2025-02-28 14:44:31] (step=0141100) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1200 +[2025-02-28 14:45:30] (step=0141200) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1275 +[2025-02-28 14:46:30] (step=0141300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1257 +[2025-02-28 14:47:29] (step=0141400) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1287 +[2025-02-28 14:48:29] (step=0141500) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1244 +[2025-02-28 14:49:28] (step=0141600) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1291 +[2025-02-28 14:50:28] (step=0141700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1232 +[2025-02-28 14:51:27] (step=0141800) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1299 +[2025-02-28 14:52:27] (step=0141900) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1246 +[2025-02-28 14:53:26] (step=0142000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1271 +[2025-02-28 14:54:26] (step=0142100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1212 +[2025-02-28 14:55:25] (step=0142200) Train Loss: 0.0462, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1221 +[2025-02-28 14:56:25] (step=0142300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1241 +[2025-02-28 14:57:25] (step=0142400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1236 +[2025-02-28 14:58:24] (step=0142500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1242 +[2025-02-28 14:59:24] (step=0142600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1232 +[2025-02-28 15:00:27] (step=0142700) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1236 +[2025-02-28 15:01:26] (step=0142800) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1240 +[2025-02-28 15:02:26] (step=0142900) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1237 +[2025-02-28 15:03:25] (step=0143000) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1234 +[2025-02-28 15:04:25] (step=0143100) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1305 +[2025-02-28 15:05:24] (step=0143200) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1190 +[2025-02-28 15:06:24] (step=0143300) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1327 +[2025-02-28 15:07:23] (step=0143400) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1177 +[2025-02-28 15:08:23] (step=0143500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1248 +[2025-02-28 15:09:22] (step=0143600) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1223 +[2025-02-28 15:10:22] (step=0143700) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1277 +[2025-02-28 15:11:21] (step=0143800) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1173 +[2025-02-28 15:12:21] (step=0143900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1273 +[2025-02-28 15:13:20] (step=0144000) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1245 +[2025-02-28 15:14:20] (step=0144100) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1266 +[2025-02-28 15:15:19] (step=0144200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1238 +[2025-02-28 15:16:19] (step=0144300) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1251 +[2025-02-28 15:17:19] (step=0144400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1207 +[2025-02-28 15:18:18] (step=0144500) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1221 +[2025-02-28 15:19:18] (step=0144600) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1237 +[2025-02-28 15:20:17] (step=0144700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1227 +[2025-02-28 15:21:17] (step=0144800) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1212 +[2025-02-28 15:22:16] (step=0144900) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1222 +[2025-02-28 15:23:16] (step=0145000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1187 +[2025-02-28 15:24:15] (step=0145100) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1201 +[2025-02-28 15:25:18] (step=0145200) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1226 +[2025-02-28 15:26:18] (step=0145300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1265 +[2025-02-28 15:27:17] (step=0145400) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1217 +[2025-02-28 15:28:17] (step=0145500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1213 +[2025-02-28 15:29:17] (step=0145600) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1226 +[2025-02-28 15:30:16] (step=0145700) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1217 +[2025-02-28 15:31:16] (step=0145800) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1212 +[2025-02-28 15:32:15] (step=0145900) Train Loss: 0.0461, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1201 +[2025-02-28 15:33:15] (step=0146000) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1187 +[2025-02-28 15:34:14] (step=0146100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1217 +[2025-02-28 15:35:14] (step=0146200) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1201 +[2025-02-28 15:36:13] (step=0146300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1203 +[2025-02-28 15:37:13] (step=0146400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1211 +[2025-02-28 15:38:12] (step=0146500) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1217 +[2025-02-28 15:39:12] (step=0146600) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1239 +[2025-02-28 15:40:11] (step=0146700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1180 +[2025-02-28 15:41:11] (step=0146800) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1250 +[2025-02-28 15:42:10] (step=0146900) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1287 +[2025-02-28 15:43:10] (step=0147000) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1180 +[2025-02-28 15:44:10] (step=0147100) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1206 +[2025-02-28 15:45:09] (step=0147200) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1209 +[2025-02-28 15:46:09] (step=0147300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1236 +[2025-02-28 15:47:08] (step=0147400) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1297 +[2025-02-28 15:48:08] (step=0147500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1180 +[2025-02-28 15:49:07] (step=0147600) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1253 +[2025-02-28 15:50:10] (step=0147700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1266 +[2025-02-28 15:51:10] (step=0147800) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1298 +[2025-02-28 15:52:09] (step=0147900) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1223 +[2025-02-28 15:53:09] (step=0148000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1221 +[2025-02-28 15:54:08] (step=0148100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1166 +[2025-02-28 15:55:08] (step=0148200) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1238 +[2025-02-28 15:56:08] (step=0148300) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1163 +[2025-02-28 15:57:07] (step=0148400) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1182 +[2025-02-28 15:58:07] (step=0148500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1169 +[2025-02-28 15:59:06] (step=0148600) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1200 +[2025-02-28 16:00:06] (step=0148700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1201 +[2025-02-28 16:01:05] (step=0148800) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1190 +[2025-02-28 16:02:05] (step=0148900) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1137 +[2025-02-28 16:03:04] (step=0149000) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1198 +[2025-02-28 16:04:04] (step=0149100) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1172 +[2025-02-28 16:05:03] (step=0149200) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1200 +[2025-02-28 16:06:03] (step=0149300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1173 +[2025-02-28 16:07:02] (step=0149400) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1201 +[2025-02-28 16:08:02] (step=0149500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1177 +[2025-02-28 16:09:02] (step=0149600) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1157 +[2025-02-28 16:10:01] (step=0149700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1195 +[2025-02-28 16:11:01] (step=0149800) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1213 +[2025-02-28 16:12:00] (step=0149900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1207 +[2025-02-28 16:13:00] (step=0150000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1190 +[2025-02-28 16:13:03] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0150000.pt +[2025-02-28 16:18:34] (step=0150000), Fid=12.033696733859415, PSNR=26.874297228240966, LPIPS=0.2253125160932541, SSIM=0.7429574131965637 +[2025-02-28 16:19:33] (step=0150100) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.25, Grad Norm: 0.1165 +[2025-02-28 16:20:36] (step=0150200) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1151 +[2025-02-28 16:21:36] (step=0150300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1207 +[2025-02-28 16:22:36] (step=0150400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1225 +[2025-02-28 16:23:35] (step=0150500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1199 +[2025-02-28 16:24:35] (step=0150600) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1218 +[2025-02-28 16:25:35] (step=0150700) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1172 +[2025-02-28 16:26:35] (step=0150800) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1227 +[2025-02-28 16:27:34] (step=0150900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1145 +[2025-02-28 16:28:34] (step=0151000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1198 +[2025-02-28 16:29:34] (step=0151100) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1246 +[2025-02-28 16:30:34] (step=0151200) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1112 +[2025-02-28 16:31:33] (step=0151300) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1230 +[2025-02-28 16:32:33] (step=0151400) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1161 +[2025-02-28 16:33:33] (step=0151500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1228 +[2025-02-28 16:34:32] (step=0151600) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1254 +[2025-02-28 16:35:32] (step=0151700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1181 +[2025-02-28 16:36:32] (step=0151800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1187 +[2025-02-28 16:37:31] (step=0151900) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1169 +[2025-02-28 16:38:31] (step=0152000) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1226 +[2025-02-28 16:39:31] (step=0152100) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1175 +[2025-02-28 16:40:31] (step=0152200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1144 +[2025-02-28 16:41:30] (step=0152300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1159 +[2025-02-28 16:42:30] (step=0152400) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1195 +[2025-02-28 16:43:30] (step=0152500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1151 +[2025-02-28 16:44:30] (step=0152600) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1225 +[2025-02-28 16:45:32] (step=0152700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1174 +[2025-02-28 16:46:32] (step=0152800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1172 +[2025-02-28 16:47:32] (step=0152900) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1179 +[2025-02-28 16:48:31] (step=0153000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1153 +[2025-02-28 16:49:31] (step=0153100) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1186 +[2025-02-28 16:50:31] (step=0153200) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1113 +[2025-02-28 16:51:30] (step=0153300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1195 +[2025-02-28 16:52:30] (step=0153400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1156 +[2025-02-28 16:53:30] (step=0153500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1183 +[2025-02-28 16:54:29] (step=0153600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1228 +[2025-02-28 16:55:29] (step=0153700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1188 +[2025-02-28 16:56:29] (step=0153800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1192 +[2025-02-28 16:57:28] (step=0153900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1206 +[2025-02-28 16:58:28] (step=0154000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1123 +[2025-02-28 16:59:28] (step=0154100) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1164 +[2025-02-28 17:00:27] (step=0154200) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1188 +[2025-02-28 17:01:27] (step=0154300) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1160 +[2025-02-28 17:02:27] (step=0154400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1147 +[2025-02-28 17:03:26] (step=0154500) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1192 +[2025-02-28 17:04:26] (step=0154600) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1174 +[2025-02-28 17:05:26] (step=0154700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1225 +[2025-02-28 17:06:25] (step=0154800) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1173 +[2025-02-28 17:07:25] (step=0154900) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1213 +[2025-02-28 17:08:25] (step=0155000) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1172 +[2025-02-28 17:09:25] (step=0155100) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1180 +[2025-02-28 17:10:27] (step=0155200) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1163 +[2025-02-28 17:11:27] (step=0155300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1127 +[2025-02-28 17:12:27] (step=0155400) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1184 +[2025-02-28 17:13:26] (step=0155500) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1126 +[2025-02-28 17:14:26] (step=0155600) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1192 +[2025-02-28 17:15:26] (step=0155700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1144 +[2025-02-28 17:16:25] (step=0155800) Train Loss: 0.0460, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1183 +[2025-02-28 17:17:25] (step=0155900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1151 +[2025-02-28 17:18:25] (step=0156000) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1229 +[2025-02-28 17:19:24] (step=0156100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1105 +[2025-02-28 17:20:24] (step=0156200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1137 +[2025-02-28 17:21:24] (step=0156300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1182 +[2025-02-28 17:22:23] (step=0156400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1124 +[2025-02-28 17:23:23] (step=0156500) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1193 +[2025-02-28 17:24:23] (step=0156600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1157 +[2025-02-28 17:25:22] (step=0156700) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1159 +[2025-02-28 17:26:22] (step=0156800) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1164 +[2025-02-28 17:27:22] (step=0156900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1155 +[2025-02-28 17:28:21] (step=0157000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1213 +[2025-02-28 17:29:21] (step=0157100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1114 +[2025-02-28 17:30:21] (step=0157200) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1203 +[2025-02-28 17:31:20] (step=0157300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1114 +[2025-02-28 17:32:20] (step=0157400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1155 +[2025-02-28 17:33:20] (step=0157500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1148 +[2025-02-28 17:34:19] (step=0157600) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1142 +[2025-02-28 17:35:22] (step=0157700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1094 +[2025-02-28 17:36:22] (step=0157800) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1168 +[2025-02-28 17:37:22] (step=0157900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1149 +[2025-02-28 17:38:21] (step=0158000) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1169 +[2025-02-28 17:39:21] (step=0158100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1135 +[2025-02-28 17:40:21] (step=0158200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1138 +[2025-02-28 17:41:20] (step=0158300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1163 +[2025-02-28 17:42:20] (step=0158400) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1167 +[2025-02-28 17:43:20] (step=0158500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1144 +[2025-02-28 17:44:19] (step=0158600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1165 +[2025-02-28 17:45:19] (step=0158700) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1141 +[2025-02-28 17:46:19] (step=0158800) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1227 +[2025-02-28 17:47:18] (step=0158900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1157 +[2025-02-28 17:48:18] (step=0159000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1124 +[2025-02-28 17:49:18] (step=0159100) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1196 +[2025-02-28 17:50:17] (step=0159200) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1098 +[2025-02-28 17:51:17] (step=0159300) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1180 +[2025-02-28 17:52:17] (step=0159400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1142 +[2025-02-28 17:53:16] (step=0159500) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1152 +[2025-02-28 17:54:16] (step=0159600) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1192 +[2025-02-28 17:55:15] (step=0159700) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1121 +[2025-02-28 17:56:15] (step=0159800) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1220 +[2025-02-28 17:57:15] (step=0159900) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1119 +[2025-02-28 17:58:14] (step=0160000) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1169 +[2025-02-28 17:59:14] (step=0160100) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1105 +[2025-02-28 18:00:17] (step=0160200) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1169 +[2025-02-28 18:01:17] (step=0160300) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1154 +[2025-02-28 18:02:17] (step=0160400) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1099 +[2025-02-28 18:03:16] (step=0160500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1196 +[2025-02-28 18:04:16] (step=0160600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1187 +[2025-02-28 18:05:16] (step=0160700) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1113 +[2025-02-28 18:06:15] (step=0160800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1191 +[2025-02-28 18:07:15] (step=0160900) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1175 +[2025-02-28 18:08:15] (step=0161000) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1114 +[2025-02-28 18:09:14] (step=0161100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1160 +[2025-02-28 18:10:14] (step=0161200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1152 +[2025-02-28 18:11:14] (step=0161300) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1111 +[2025-02-28 18:12:14] (step=0161400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1127 +[2025-02-28 18:13:13] (step=0161500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1143 +[2025-02-28 18:14:13] (step=0161600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1184 +[2025-02-28 18:15:13] (step=0161700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1134 +[2025-02-28 18:16:12] (step=0161800) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1107 +[2025-02-28 18:17:12] (step=0161900) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1137 +[2025-02-28 18:18:12] (step=0162000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1169 +[2025-02-28 18:19:12] (step=0162100) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1174 +[2025-02-28 18:20:11] (step=0162200) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1116 +[2025-02-28 18:21:11] (step=0162300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1118 +[2025-02-28 18:22:11] (step=0162400) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1129 +[2025-02-28 18:23:11] (step=0162500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1145 +[2025-02-28 18:24:10] (step=0162600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1101 +[2025-02-28 18:25:13] (step=0162700) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1118 +[2025-02-28 18:26:13] (step=0162800) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1157 +[2025-02-28 18:27:13] (step=0162900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1151 +[2025-02-28 18:28:12] (step=0163000) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1112 +[2025-02-28 18:29:12] (step=0163100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1103 +[2025-02-28 18:30:12] (step=0163200) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1135 +[2025-02-28 18:31:11] (step=0163300) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1109 +[2025-02-28 18:32:11] (step=0163400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1114 +[2025-02-28 18:33:11] (step=0163500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1126 +[2025-02-28 18:34:10] (step=0163600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1142 +[2025-02-28 18:35:10] (step=0163700) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1133 +[2025-02-28 18:36:10] (step=0163800) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1152 +[2025-02-28 18:37:09] (step=0163900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1115 +[2025-02-28 18:38:09] (step=0164000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1135 +[2025-02-28 18:39:08] (step=0164100) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1149 +[2025-02-28 18:40:08] (step=0164200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1109 +[2025-02-28 18:41:08] (step=0164300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1139 +[2025-02-28 18:42:07] (step=0164400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1100 +[2025-02-28 18:43:07] (step=0164500) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1084 +[2025-02-28 18:44:07] (step=0164600) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1139 +[2025-02-28 18:45:06] (step=0164700) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1127 +[2025-02-28 18:46:06] (step=0164800) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1106 +[2025-02-28 18:47:06] (step=0164900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1132 +[2025-02-28 18:48:05] (step=0165000) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1097 +[2025-02-28 18:49:05] (step=0165100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1135 +[2025-02-28 18:50:08] (step=0165200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.1137 +[2025-02-28 18:51:07] (step=0165300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1113 +[2025-02-28 18:52:07] (step=0165400) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1133 +[2025-02-28 18:53:07] (step=0165500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1152 +[2025-02-28 18:54:06] (step=0165600) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1160 +[2025-02-28 18:55:06] (step=0165700) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1136 +[2025-02-28 18:56:06] (step=0165800) Train Loss: 0.0459, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1059 +[2025-02-28 18:57:05] (step=0165900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1082 +[2025-02-28 18:58:05] (step=0166000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1102 +[2025-02-28 18:59:05] (step=0166100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1091 +[2025-02-28 19:00:04] (step=0166200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1080 +[2025-02-28 19:01:04] (step=0166300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1160 +[2025-02-28 19:02:04] (step=0166400) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1096 +[2025-02-28 19:03:03] (step=0166500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1059 +[2025-02-28 19:04:03] (step=0166600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1120 +[2025-02-28 19:05:03] (step=0166700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1118 +[2025-02-28 19:06:02] (step=0166800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1107 +[2025-02-28 19:07:02] (step=0166900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1095 +[2025-02-28 19:08:02] (step=0167000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1075 +[2025-02-28 19:09:02] (step=0167100) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1122 +[2025-02-28 19:10:01] (step=0167200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1144 +[2025-02-28 19:11:01] (step=0167300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1114 +[2025-02-28 19:12:01] (step=0167400) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1089 +[2025-02-28 19:13:01] (step=0167500) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1117 +[2025-02-28 19:14:01] (step=0167600) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1085 +[2025-02-28 19:15:03] (step=0167700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1070 +[2025-02-28 19:16:03] (step=0167800) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1141 +[2025-02-28 19:17:03] (step=0167900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1103 +[2025-02-28 19:18:03] (step=0168000) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1125 +[2025-02-28 19:19:02] (step=0168100) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1118 +[2025-02-28 19:20:02] (step=0168200) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1088 +[2025-02-28 19:21:02] (step=0168300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1107 +[2025-02-28 19:22:02] (step=0168400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1109 +[2025-02-28 19:23:01] (step=0168500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1117 +[2025-02-28 19:24:01] (step=0168600) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1098 +[2025-02-28 19:25:01] (step=0168700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1128 +[2025-02-28 19:26:00] (step=0168800) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1131 +[2025-02-28 19:27:00] (step=0168900) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1075 +[2025-02-28 19:28:00] (step=0169000) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1039 +[2025-02-28 19:29:00] (step=0169100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1130 +[2025-02-28 19:29:59] (step=0169200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1085 +[2025-02-28 19:30:59] (step=0169300) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1069 +[2025-02-28 19:31:59] (step=0169400) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1073 +[2025-02-28 19:32:59] (step=0169500) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1102 +[2025-02-28 19:33:58] (step=0169600) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1055 +[2025-02-28 19:34:58] (step=0169700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1083 +[2025-02-28 19:35:58] (step=0169800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1086 +[2025-02-28 19:36:57] (step=0169900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1136 +[2025-02-28 19:37:57] (step=0170000) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1107 +[2025-02-28 19:38:57] (step=0170100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1112 +[2025-02-28 19:40:00] (step=0170200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1057 +[2025-02-28 19:41:00] (step=0170300) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1120 +[2025-02-28 19:41:59] (step=0170400) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1096 +[2025-02-28 19:42:59] (step=0170500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1141 +[2025-02-28 19:43:59] (step=0170600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1126 +[2025-02-28 19:44:58] (step=0170700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1144 +[2025-02-28 19:45:58] (step=0170800) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1131 +[2025-02-28 19:46:58] (step=0170900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1059 +[2025-02-28 19:47:57] (step=0171000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1123 +[2025-02-28 19:48:57] (step=0171100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1106 +[2025-02-28 19:49:57] (step=0171200) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1082 +[2025-02-28 19:50:57] (step=0171300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1123 +[2025-02-28 19:51:56] (step=0171400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1050 +[2025-02-28 19:52:56] (step=0171500) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1109 +[2025-02-28 19:53:56] (step=0171600) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1080 +[2025-02-28 19:54:55] (step=0171700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1080 +[2025-02-28 19:55:55] (step=0171800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1096 +[2025-02-28 19:56:55] (step=0171900) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1105 +[2025-02-28 19:57:54] (step=0172000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1077 +[2025-02-28 19:58:54] (step=0172100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1161 +[2025-02-28 19:59:54] (step=0172200) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1013 +[2025-02-28 20:00:53] (step=0172300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1084 +[2025-02-28 20:01:53] (step=0172400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1066 +[2025-02-28 20:02:53] (step=0172500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1142 +[2025-02-28 20:03:52] (step=0172600) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1113 +[2025-02-28 20:04:55] (step=0172700) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1148 +[2025-02-28 20:05:55] (step=0172800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1100 +[2025-02-28 20:06:55] (step=0172900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1127 +[2025-02-28 20:07:54] (step=0173000) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1148 +[2025-02-28 20:08:54] (step=0173100) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1100 +[2025-02-28 20:09:54] (step=0173200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1053 +[2025-02-28 20:10:54] (step=0173300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1084 +[2025-02-28 20:11:53] (step=0173400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1076 +[2025-02-28 20:12:53] (step=0173500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1075 +[2025-02-28 20:13:53] (step=0173600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1090 +[2025-02-28 20:14:53] (step=0173700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1046 +[2025-02-28 20:15:53] (step=0173800) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1104 +[2025-02-28 20:16:52] (step=0173900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1076 +[2025-02-28 20:17:52] (step=0174000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1069 +[2025-02-28 20:18:52] (step=0174100) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1118 +[2025-02-28 20:19:51] (step=0174200) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1101 +[2025-02-28 20:20:51] (step=0174300) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1070 +[2025-02-28 20:21:51] (step=0174400) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1074 +[2025-02-28 20:22:50] (step=0174500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1088 +[2025-02-28 20:23:50] (step=0174600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1101 +[2025-02-28 20:24:50] (step=0174700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1095 +[2025-02-28 20:25:50] (step=0174800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1060 +[2025-02-28 20:26:49] (step=0174900) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1104 +[2025-02-28 20:27:49] (step=0175000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1102 +[2025-02-28 20:28:49] (step=0175100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1090 +[2025-02-28 20:29:52] (step=0175200) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1113 +[2025-02-28 20:30:52] (step=0175300) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.1084 +[2025-02-28 20:31:51] (step=0175400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1112 +[2025-02-28 20:32:51] (step=0175500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1107 +[2025-02-28 20:33:51] (step=0175600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1110 +[2025-02-28 20:34:51] (step=0175700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1062 +[2025-02-28 20:35:51] (step=0175800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1077 +[2025-02-28 20:36:50] (step=0175900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1027 +[2025-02-28 20:37:50] (step=0176000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1101 +[2025-02-28 20:38:50] (step=0176100) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1078 +[2025-02-28 20:39:49] (step=0176200) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1063 +[2025-02-28 20:40:49] (step=0176300) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1048 +[2025-02-28 20:41:49] (step=0176400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1117 +[2025-02-28 20:42:48] (step=0176500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1071 +[2025-02-28 20:43:48] (step=0176600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1083 +[2025-02-28 20:44:48] (step=0176700) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1070 +[2025-02-28 20:45:47] (step=0176800) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1046 +[2025-02-28 20:46:47] (step=0176900) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1106 +[2025-02-28 20:47:47] (step=0177000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1046 +[2025-02-28 20:48:46] (step=0177100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1080 +[2025-02-28 20:49:46] (step=0177200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1100 +[2025-02-28 20:50:46] (step=0177300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1135 +[2025-02-28 20:51:45] (step=0177400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1074 +[2025-02-28 20:52:45] (step=0177500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1112 +[2025-02-28 20:53:44] (step=0177600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1060 +[2025-02-28 20:54:47] (step=0177700) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1047 +[2025-02-28 20:55:47] (step=0177800) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1086 +[2025-02-28 20:56:47] (step=0177900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1071 +[2025-02-28 20:57:47] (step=0178000) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1076 +[2025-02-28 20:58:46] (step=0178100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1067 +[2025-02-28 20:59:46] (step=0178200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1105 +[2025-02-28 21:00:45] (step=0178300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1027 +[2025-02-28 21:01:45] (step=0178400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1089 +[2025-02-28 21:02:45] (step=0178500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1067 +[2025-02-28 21:03:44] (step=0178600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1077 +[2025-02-28 21:04:44] (step=0178700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1039 +[2025-02-28 21:05:44] (step=0178800) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1015 +[2025-02-28 21:06:43] (step=0178900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1076 +[2025-02-28 21:07:43] (step=0179000) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1058 +[2025-02-28 21:08:43] (step=0179100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1086 +[2025-02-28 21:09:42] (step=0179200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1023 +[2025-02-28 21:10:42] (step=0179300) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1038 +[2025-02-28 21:11:42] (step=0179400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1080 +[2025-02-28 21:12:41] (step=0179500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1036 +[2025-02-28 21:13:41] (step=0179600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1082 +[2025-02-28 21:14:41] (step=0179700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1047 +[2025-02-28 21:15:40] (step=0179800) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1038 +[2025-02-28 21:16:40] (step=0179900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1073 +[2025-02-28 21:17:40] (step=0180000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1071 +[2025-02-28 21:18:39] (step=0180100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1041 +[2025-02-28 21:19:42] (step=0180200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1068 +[2025-02-28 21:20:42] (step=0180300) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1060 +[2025-02-28 21:21:42] (step=0180400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1061 +[2025-02-28 21:22:41] (step=0180500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1052 +[2025-02-28 21:23:41] (step=0180600) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1044 +[2025-02-28 21:24:41] (step=0180700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1068 +[2025-02-28 21:25:40] (step=0180800) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1009 +[2025-02-28 21:26:40] (step=0180900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1067 +[2025-02-28 21:27:39] (step=0181000) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1039 +[2025-02-28 21:28:39] (step=0181100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1074 +[2025-02-28 21:29:39] (step=0181200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1097 +[2025-02-28 21:30:38] (step=0181300) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0996 +[2025-02-28 21:31:38] (step=0181400) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1050 +[2025-02-28 21:32:38] (step=0181500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1045 +[2025-02-28 21:33:37] (step=0181600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1040 +[2025-02-28 21:34:37] (step=0181700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1015 +[2025-02-28 21:35:37] (step=0181800) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1056 +[2025-02-28 21:36:36] (step=0181900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1063 +[2025-02-28 21:37:36] (step=0182000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1074 +[2025-02-28 21:38:36] (step=0182100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1052 +[2025-02-28 21:39:35] (step=0182200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1081 +[2025-02-28 21:40:35] (step=0182300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1053 +[2025-02-28 21:41:35] (step=0182400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1029 +[2025-02-28 21:42:34] (step=0182500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1038 +[2025-02-28 21:43:34] (step=0182600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1083 +[2025-02-28 21:44:37] (step=0182700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1037 +[2025-02-28 21:45:37] (step=0182800) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1073 +[2025-02-28 21:46:36] (step=0182900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1035 +[2025-02-28 21:47:36] (step=0183000) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1082 +[2025-02-28 21:48:36] (step=0183100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1040 +[2025-02-28 21:49:35] (step=0183200) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1045 +[2025-02-28 21:50:35] (step=0183300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1081 +[2025-02-28 21:51:35] (step=0183400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1010 +[2025-02-28 21:52:34] (step=0183500) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1052 +[2025-02-28 21:53:34] (step=0183600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0992 +[2025-02-28 21:54:34] (step=0183700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1040 +[2025-02-28 21:55:33] (step=0183800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1014 +[2025-02-28 21:56:33] (step=0183900) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0973 +[2025-02-28 21:57:33] (step=0184000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1078 +[2025-02-28 21:58:32] (step=0184100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1062 +[2025-02-28 21:59:32] (step=0184200) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1012 +[2025-02-28 22:00:32] (step=0184300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1043 +[2025-02-28 22:01:31] (step=0184400) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1013 +[2025-02-28 22:02:31] (step=0184500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1038 +[2025-02-28 22:03:31] (step=0184600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1004 +[2025-02-28 22:04:31] (step=0184700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1067 +[2025-02-28 22:05:30] (step=0184800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1017 +[2025-02-28 22:06:30] (step=0184900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1077 +[2025-02-28 22:07:30] (step=0185000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1012 +[2025-02-28 22:08:29] (step=0185100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1040 +[2025-02-28 22:09:32] (step=0185200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.0993 +[2025-02-28 22:10:32] (step=0185300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1082 +[2025-02-28 22:11:31] (step=0185400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1029 +[2025-02-28 22:12:31] (step=0185500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1024 +[2025-02-28 22:13:31] (step=0185600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1001 +[2025-02-28 22:14:30] (step=0185700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1031 +[2025-02-28 22:15:30] (step=0185800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1025 +[2025-02-28 22:16:30] (step=0185900) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0995 +[2025-02-28 22:17:29] (step=0186000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1011 +[2025-02-28 22:18:29] (step=0186100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1019 +[2025-02-28 22:19:29] (step=0186200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1022 +[2025-02-28 22:20:28] (step=0186300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0999 +[2025-02-28 22:21:28] (step=0186400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1023 +[2025-02-28 22:22:28] (step=0186500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1001 +[2025-02-28 22:23:27] (step=0186600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1008 +[2025-02-28 22:24:27] (step=0186700) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1015 +[2025-02-28 22:25:27] (step=0186800) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1027 +[2025-02-28 22:26:26] (step=0186900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1031 +[2025-02-28 22:27:26] (step=0187000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1060 +[2025-02-28 22:28:26] (step=0187100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1011 +[2025-02-28 22:29:25] (step=0187200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1023 +[2025-02-28 22:30:25] (step=0187300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1029 +[2025-02-28 22:31:25] (step=0187400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1025 +[2025-02-28 22:32:24] (step=0187500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1015 +[2025-02-28 22:33:24] (step=0187600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1102 +[2025-02-28 22:34:27] (step=0187700) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1012 +[2025-02-28 22:35:27] (step=0187800) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1059 +[2025-02-28 22:36:26] (step=0187900) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1018 +[2025-02-28 22:37:26] (step=0188000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1061 +[2025-02-28 22:38:26] (step=0188100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1040 +[2025-02-28 22:39:25] (step=0188200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1045 +[2025-02-28 22:40:25] (step=0188300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1046 +[2025-02-28 22:41:25] (step=0188400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1079 +[2025-02-28 22:42:24] (step=0188500) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1035 +[2025-02-28 22:43:24] (step=0188600) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1021 +[2025-02-28 22:44:24] (step=0188700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1004 +[2025-02-28 22:45:23] (step=0188800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1031 +[2025-02-28 22:46:23] (step=0188900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1051 +[2025-02-28 22:47:23] (step=0189000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1004 +[2025-02-28 22:48:22] (step=0189100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1069 +[2025-02-28 22:49:22] (step=0189200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1030 +[2025-02-28 22:50:22] (step=0189300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1017 +[2025-02-28 22:51:21] (step=0189400) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1007 +[2025-02-28 22:52:21] (step=0189500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1014 +[2025-02-28 22:53:21] (step=0189600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0979 +[2025-02-28 22:54:20] (step=0189700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1072 +[2025-02-28 22:55:20] (step=0189800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1039 +[2025-02-28 22:56:20] (step=0189900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1091 +[2025-02-28 22:57:19] (step=0190000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1046 +[2025-02-28 22:58:19] (step=0190100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0988 +[2025-02-28 22:59:22] (step=0190200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1052 +[2025-02-28 23:00:22] (step=0190300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1018 +[2025-02-28 23:01:21] (step=0190400) Train Loss: 0.0458, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1088 +[2025-02-28 23:02:21] (step=0190500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1021 +[2025-02-28 23:03:21] (step=0190600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1016 +[2025-02-28 23:04:20] (step=0190700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1003 +[2025-02-28 23:05:20] (step=0190800) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1052 +[2025-02-28 23:06:20] (step=0190900) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0941 +[2025-02-28 23:07:19] (step=0191000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1031 +[2025-02-28 23:08:19] (step=0191100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0996 +[2025-02-28 23:09:19] (step=0191200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1066 +[2025-02-28 23:10:18] (step=0191300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1009 +[2025-02-28 23:11:18] (step=0191400) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0995 +[2025-02-28 23:12:18] (step=0191500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1010 +[2025-02-28 23:13:17] (step=0191600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1010 +[2025-02-28 23:14:17] (step=0191700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0971 +[2025-02-28 23:15:17] (step=0191800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1087 +[2025-02-28 23:16:16] (step=0191900) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1011 +[2025-02-28 23:17:16] (step=0192000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1074 +[2025-02-28 23:18:16] (step=0192100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1019 +[2025-02-28 23:19:15] (step=0192200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0984 +[2025-02-28 23:20:15] (step=0192300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1040 +[2025-02-28 23:21:15] (step=0192400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1016 +[2025-02-28 23:22:14] (step=0192500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1008 +[2025-02-28 23:23:14] (step=0192600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1009 +[2025-02-28 23:24:17] (step=0192700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0969 +[2025-02-28 23:25:16] (step=0192800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1034 +[2025-02-28 23:26:16] (step=0192900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0994 +[2025-02-28 23:27:16] (step=0193000) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1024 +[2025-02-28 23:28:15] (step=0193100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1017 +[2025-02-28 23:29:15] (step=0193200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1020 +[2025-02-28 23:30:15] (step=0193300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1007 +[2025-02-28 23:31:14] (step=0193400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1032 +[2025-02-28 23:32:14] (step=0193500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1029 +[2025-02-28 23:33:14] (step=0193600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1034 +[2025-02-28 23:34:13] (step=0193700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0991 +[2025-02-28 23:35:13] (step=0193800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1041 +[2025-02-28 23:36:13] (step=0193900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1006 +[2025-02-28 23:37:12] (step=0194000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1014 +[2025-02-28 23:38:12] (step=0194100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0971 +[2025-02-28 23:39:12] (step=0194200) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0987 +[2025-02-28 23:40:11] (step=0194300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0990 +[2025-02-28 23:41:11] (step=0194400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0994 +[2025-02-28 23:42:10] (step=0194500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1060 +[2025-02-28 23:43:10] (step=0194600) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1011 +[2025-02-28 23:44:10] (step=0194700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0960 +[2025-02-28 23:45:09] (step=0194800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1043 +[2025-02-28 23:46:09] (step=0194900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1006 +[2025-02-28 23:47:09] (step=0195000) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1023 +[2025-02-28 23:48:08] (step=0195100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1037 +[2025-02-28 23:49:11] (step=0195200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1005 +[2025-02-28 23:50:11] (step=0195300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1014 +[2025-02-28 23:51:11] (step=0195400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1042 +[2025-02-28 23:52:10] (step=0195500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0984 +[2025-02-28 23:53:10] (step=0195600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1013 +[2025-02-28 23:54:10] (step=0195700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1020 +[2025-02-28 23:55:09] (step=0195800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1022 +[2025-02-28 23:56:09] (step=0195900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0991 +[2025-02-28 23:57:09] (step=0196000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1046 +[2025-02-28 23:58:08] (step=0196100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0960 +[2025-02-28 23:59:08] (step=0196200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1002 +[2025-03-01 00:00:08] (step=0196300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0994 +[2025-03-01 00:01:07] (step=0196400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1005 +[2025-03-01 00:02:07] (step=0196500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0998 +[2025-03-01 00:03:07] (step=0196600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0987 +[2025-03-01 00:04:06] (step=0196700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0981 +[2025-03-01 00:05:06] (step=0196800) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1011 +[2025-03-01 00:06:06] (step=0196900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1013 +[2025-03-01 00:07:05] (step=0197000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0996 +[2025-03-01 00:08:05] (step=0197100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1062 +[2025-03-01 00:09:05] (step=0197200) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1042 +[2025-03-01 00:10:04] (step=0197300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0989 +[2025-03-01 00:11:04] (step=0197400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1039 +[2025-03-01 00:12:04] (step=0197500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0989 +[2025-03-01 00:13:03] (step=0197600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1001 +[2025-03-01 00:14:06] (step=0197700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0992 +[2025-03-01 00:15:06] (step=0197800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1012 +[2025-03-01 00:16:05] (step=0197900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1020 +[2025-03-01 00:17:05] (step=0198000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0954 +[2025-03-01 00:18:05] (step=0198100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0976 +[2025-03-01 00:19:05] (step=0198200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0969 +[2025-03-01 00:20:04] (step=0198300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0979 +[2025-03-01 00:21:04] (step=0198400) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0969 +[2025-03-01 00:22:04] (step=0198500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0995 +[2025-03-01 00:23:03] (step=0198600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1007 +[2025-03-01 00:24:03] (step=0198700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1008 +[2025-03-01 00:25:03] (step=0198800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0940 +[2025-03-01 00:26:02] (step=0198900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1013 +[2025-03-01 00:27:02] (step=0199000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0936 +[2025-03-01 00:28:02] (step=0199100) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1004 +[2025-03-01 00:29:02] (step=0199200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1006 +[2025-03-01 00:30:01] (step=0199300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0983 +[2025-03-01 00:31:01] (step=0199400) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1004 +[2025-03-01 00:32:01] (step=0199500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0944 +[2025-03-01 00:33:00] (step=0199600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1003 +[2025-03-01 00:34:00] (step=0199700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0947 +[2025-03-01 00:35:00] (step=0199800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1020 +[2025-03-01 00:36:00] (step=0199900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1011 +[2025-03-01 00:36:59] (step=0200000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0974 +[2025-03-01 00:37:03] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0200000.pt +[2025-03-01 00:42:29] (step=0200000), Fid=12.332113330929246, PSNR=26.964778727793693, LPIPS=0.2257547527551651, SSIM=0.7459940314292908 +[2025-03-01 00:43:29] (step=0200100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.26, Grad Norm: 0.0967 +[2025-03-01 00:44:32] (step=0200200) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.1020 +[2025-03-01 00:45:32] (step=0200300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1000 +[2025-03-01 00:46:32] (step=0200400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1012 +[2025-03-01 00:47:31] (step=0200500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0983 +[2025-03-01 00:48:31] (step=0200600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0972 +[2025-03-01 00:49:31] (step=0200700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0955 +[2025-03-01 00:50:30] (step=0200800) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0988 +[2025-03-01 00:51:30] (step=0200900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0965 +[2025-03-01 00:52:30] (step=0201000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0967 +[2025-03-01 00:53:30] (step=0201100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0954 +[2025-03-01 00:54:29] (step=0201200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0975 +[2025-03-01 00:55:29] (step=0201300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0944 +[2025-03-01 00:56:29] (step=0201400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1009 +[2025-03-01 00:57:28] (step=0201500) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0972 +[2025-03-01 00:58:28] (step=0201600) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0958 +[2025-03-01 00:59:28] (step=0201700) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0979 +[2025-03-01 01:00:28] (step=0201800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0951 +[2025-03-01 01:01:27] (step=0201900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0980 +[2025-03-01 01:02:27] (step=0202000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0938 +[2025-03-01 01:03:27] (step=0202100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0947 +[2025-03-01 01:04:26] (step=0202200) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0967 +[2025-03-01 01:05:26] (step=0202300) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0947 +[2025-03-01 01:06:26] (step=0202400) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0946 +[2025-03-01 01:07:26] (step=0202500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0961 +[2025-03-01 01:08:25] (step=0202600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1006 +[2025-03-01 01:09:28] (step=0202700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0978 +[2025-03-01 01:10:28] (step=0202800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0976 +[2025-03-01 01:11:27] (step=0202900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0957 +[2025-03-01 01:12:27] (step=0203000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0959 +[2025-03-01 01:13:27] (step=0203100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0977 +[2025-03-01 01:14:27] (step=0203200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0994 +[2025-03-01 01:15:26] (step=0203300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0997 +[2025-03-01 01:16:26] (step=0203400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0977 +[2025-03-01 01:17:26] (step=0203500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0945 +[2025-03-01 01:18:25] (step=0203600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0972 +[2025-03-01 01:19:25] (step=0203700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0962 +[2025-03-01 01:20:25] (step=0203800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0940 +[2025-03-01 01:21:25] (step=0203900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0932 +[2025-03-01 01:22:24] (step=0204000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0985 +[2025-03-01 01:23:24] (step=0204100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0948 +[2025-03-01 01:24:24] (step=0204200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0975 +[2025-03-01 01:25:23] (step=0204300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0952 +[2025-03-01 01:26:23] (step=0204400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0980 +[2025-03-01 01:27:23] (step=0204500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0964 +[2025-03-01 01:28:22] (step=0204600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0943 +[2025-03-01 01:29:22] (step=0204700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0950 +[2025-03-01 01:30:22] (step=0204800) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0969 +[2025-03-01 01:31:21] (step=0204900) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0935 +[2025-03-01 01:32:21] (step=0205000) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0985 +[2025-03-01 01:33:21] (step=0205100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0947 +[2025-03-01 01:34:24] (step=0205200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0971 +[2025-03-01 01:35:23] (step=0205300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0957 +[2025-03-01 01:36:23] (step=0205400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0961 +[2025-03-01 01:37:23] (step=0205500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0978 +[2025-03-01 01:38:22] (step=0205600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0925 +[2025-03-01 01:39:22] (step=0205700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0979 +[2025-03-01 01:40:22] (step=0205800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0962 +[2025-03-01 01:41:21] (step=0205900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.1021 +[2025-03-01 01:42:21] (step=0206000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0969 +[2025-03-01 01:43:20] (step=0206100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0958 +[2025-03-01 01:44:20] (step=0206200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0944 +[2025-03-01 01:45:20] (step=0206300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0938 +[2025-03-01 01:46:19] (step=0206400) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0995 +[2025-03-01 01:47:19] (step=0206500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0919 +[2025-03-01 01:48:19] (step=0206600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0974 +[2025-03-01 01:49:18] (step=0206700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0959 +[2025-03-01 01:50:18] (step=0206800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0937 +[2025-03-01 01:51:18] (step=0206900) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0974 +[2025-03-01 01:52:18] (step=0207000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0993 +[2025-03-01 01:53:17] (step=0207100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0962 +[2025-03-01 01:54:17] (step=0207200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0975 +[2025-03-01 01:55:17] (step=0207300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0923 +[2025-03-01 01:56:17] (step=0207400) Train Loss: 0.0456, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1022 +[2025-03-01 01:57:16] (step=0207500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0939 +[2025-03-01 01:58:16] (step=0207600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0959 +[2025-03-01 01:59:19] (step=0207700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0946 +[2025-03-01 02:00:19] (step=0207800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0983 +[2025-03-01 02:01:19] (step=0207900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0939 +[2025-03-01 02:02:18] (step=0208000) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0997 +[2025-03-01 02:03:18] (step=0208100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0980 +[2025-03-01 02:04:18] (step=0208200) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0961 +[2025-03-01 02:05:17] (step=0208300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0931 +[2025-03-01 02:06:17] (step=0208400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0930 +[2025-03-01 02:07:17] (step=0208500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0969 +[2025-03-01 02:08:16] (step=0208600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0958 +[2025-03-01 02:09:16] (step=0208700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0979 +[2025-03-01 02:10:16] (step=0208800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0928 +[2025-03-01 02:11:15] (step=0208900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0920 +[2025-03-01 02:12:15] (step=0209000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0953 +[2025-03-01 02:13:15] (step=0209100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0960 +[2025-03-01 02:14:15] (step=0209200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0967 +[2025-03-01 02:15:14] (step=0209300) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0997 +[2025-03-01 02:16:14] (step=0209400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0979 +[2025-03-01 02:17:14] (step=0209500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0962 +[2025-03-01 02:18:13] (step=0209600) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0953 +[2025-03-01 02:19:13] (step=0209700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0932 +[2025-03-01 02:20:13] (step=0209800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0927 +[2025-03-01 02:21:13] (step=0209900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0954 +[2025-03-01 02:22:12] (step=0210000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0918 +[2025-03-01 02:23:12] (step=0210100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0976 +[2025-03-01 02:24:15] (step=0210200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0986 +[2025-03-01 02:25:15] (step=0210300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0932 +[2025-03-01 02:26:14] (step=0210400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0953 +[2025-03-01 02:27:14] (step=0210500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0985 +[2025-03-01 02:28:14] (step=0210600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0956 +[2025-03-01 02:29:13] (step=0210700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0936 +[2025-03-01 02:30:13] (step=0210800) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0948 +[2025-03-01 02:31:13] (step=0210900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0981 +[2025-03-01 02:32:13] (step=0211000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0965 +[2025-03-01 02:33:12] (step=0211100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0921 +[2025-03-01 02:34:12] (step=0211200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0963 +[2025-03-01 02:35:12] (step=0211300) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0948 +[2025-03-01 02:36:11] (step=0211400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0920 +[2025-03-01 02:37:11] (step=0211500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0996 +[2025-03-01 02:38:11] (step=0211600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0967 +[2025-03-01 02:39:11] (step=0211700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0997 +[2025-03-01 02:40:10] (step=0211800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0943 +[2025-03-01 02:41:10] (step=0211900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0918 +[2025-03-01 02:42:10] (step=0212000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0956 +[2025-03-01 02:43:09] (step=0212100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0946 +[2025-03-01 02:44:09] (step=0212200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0935 +[2025-03-01 02:45:09] (step=0212300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.1003 +[2025-03-01 02:46:09] (step=0212400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0930 +[2025-03-01 02:47:08] (step=0212500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0920 +[2025-03-01 02:48:08] (step=0212600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0929 +[2025-03-01 02:49:11] (step=0212700) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0941 +[2025-03-01 02:50:11] (step=0212800) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0951 +[2025-03-01 02:51:10] (step=0212900) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0963 +[2025-03-01 02:52:10] (step=0213000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0916 +[2025-03-01 02:53:10] (step=0213100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0936 +[2025-03-01 02:54:10] (step=0213200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0926 +[2025-03-01 02:55:09] (step=0213300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0963 +[2025-03-01 02:56:09] (step=0213400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0955 +[2025-03-01 02:57:09] (step=0213500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0922 +[2025-03-01 02:58:09] (step=0213600) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0940 +[2025-03-01 02:59:08] (step=0213700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0919 +[2025-03-01 03:00:08] (step=0213800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0943 +[2025-03-01 03:01:08] (step=0213900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0925 +[2025-03-01 03:02:08] (step=0214000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0942 +[2025-03-01 03:03:07] (step=0214100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0961 +[2025-03-01 03:04:07] (step=0214200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0918 +[2025-03-01 03:05:07] (step=0214300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0983 +[2025-03-01 03:06:07] (step=0214400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0925 +[2025-03-01 03:07:06] (step=0214500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0920 +[2025-03-01 03:08:06] (step=0214600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0939 +[2025-03-01 03:09:06] (step=0214700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0916 +[2025-03-01 03:10:06] (step=0214800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0894 +[2025-03-01 03:11:05] (step=0214900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0945 +[2025-03-01 03:12:05] (step=0215000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0926 +[2025-03-01 03:13:05] (step=0215100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0916 +[2025-03-01 03:14:08] (step=0215200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0914 +[2025-03-01 03:15:08] (step=0215300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0964 +[2025-03-01 03:16:07] (step=0215400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0902 +[2025-03-01 03:17:07] (step=0215500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0935 +[2025-03-01 03:18:07] (step=0215600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0938 +[2025-03-01 03:19:07] (step=0215700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0902 +[2025-03-01 03:20:06] (step=0215800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0964 +[2025-03-01 03:21:06] (step=0215900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0944 +[2025-03-01 03:22:06] (step=0216000) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0939 +[2025-03-01 03:23:05] (step=0216100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0898 +[2025-03-01 03:24:05] (step=0216200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0932 +[2025-03-01 03:25:05] (step=0216300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0945 +[2025-03-01 03:26:05] (step=0216400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0872 +[2025-03-01 03:27:04] (step=0216500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0957 +[2025-03-01 03:28:04] (step=0216600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0928 +[2025-03-01 03:29:04] (step=0216700) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0944 +[2025-03-01 03:30:04] (step=0216800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0923 +[2025-03-01 03:31:03] (step=0216900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0929 +[2025-03-01 03:32:03] (step=0217000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0965 +[2025-03-01 03:33:03] (step=0217100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0912 +[2025-03-01 03:34:02] (step=0217200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0973 +[2025-03-01 03:35:02] (step=0217300) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0978 +[2025-03-01 03:36:02] (step=0217400) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0946 +[2025-03-01 03:37:02] (step=0217500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0962 +[2025-03-01 03:38:01] (step=0217600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0904 +[2025-03-01 03:39:04] (step=0217700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0923 +[2025-03-01 03:40:04] (step=0217800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0913 +[2025-03-01 03:41:04] (step=0217900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0962 +[2025-03-01 03:42:04] (step=0218000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0952 +[2025-03-01 03:43:03] (step=0218100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0925 +[2025-03-01 03:44:03] (step=0218200) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0907 +[2025-03-01 03:45:03] (step=0218300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0955 +[2025-03-01 03:46:03] (step=0218400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0915 +[2025-03-01 03:47:02] (step=0218500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0922 +[2025-03-01 03:48:02] (step=0218600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0934 +[2025-03-01 03:49:02] (step=0218700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0949 +[2025-03-01 03:50:01] (step=0218800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0931 +[2025-03-01 03:51:01] (step=0218900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0915 +[2025-03-01 03:52:01] (step=0219000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0948 +[2025-03-01 03:53:01] (step=0219100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0906 +[2025-03-01 03:54:00] (step=0219200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0908 +[2025-03-01 03:55:00] (step=0219300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0935 +[2025-03-01 03:56:00] (step=0219400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0939 +[2025-03-01 03:57:00] (step=0219500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0925 +[2025-03-01 03:57:59] (step=0219600) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0919 +[2025-03-01 03:58:59] (step=0219700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0942 +[2025-03-01 03:59:59] (step=0219800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0890 +[2025-03-01 04:00:58] (step=0219900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0947 +[2025-03-01 04:01:58] (step=0220000) Train Loss: 0.0454, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0953 +[2025-03-01 04:02:58] (step=0220100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0950 +[2025-03-01 04:04:01] (step=0220200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0910 +[2025-03-01 04:05:00] (step=0220300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0898 +[2025-03-01 04:06:00] (step=0220400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0977 +[2025-03-01 04:07:00] (step=0220500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0919 +[2025-03-01 04:08:00] (step=0220600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0961 +[2025-03-01 04:08:59] (step=0220700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0903 +[2025-03-01 04:09:59] (step=0220800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0948 +[2025-03-01 04:10:59] (step=0220900) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0934 +[2025-03-01 04:11:59] (step=0221000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0916 +[2025-03-01 04:12:58] (step=0221100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0897 +[2025-03-01 04:13:58] (step=0221200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0893 +[2025-03-01 04:14:58] (step=0221300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0896 +[2025-03-01 04:15:57] (step=0221400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0892 +[2025-03-01 04:16:57] (step=0221500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0938 +[2025-03-01 04:17:57] (step=0221600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0868 +[2025-03-01 04:18:56] (step=0221700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0947 +[2025-03-01 04:19:56] (step=0221800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0912 +[2025-03-01 04:20:56] (step=0221900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0907 +[2025-03-01 04:21:56] (step=0222000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0945 +[2025-03-01 04:22:55] (step=0222100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0932 +[2025-03-01 04:23:55] (step=0222200) Train Loss: 0.0455, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0926 +[2025-03-01 04:24:55] (step=0222300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0901 +[2025-03-01 04:25:54] (step=0222400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0923 +[2025-03-01 04:26:54] (step=0222500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0907 +[2025-03-01 04:27:54] (step=0222600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0917 +[2025-03-01 04:28:57] (step=0222700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0896 +[2025-03-01 04:29:56] (step=0222800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0865 +[2025-03-01 04:30:56] (step=0222900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0933 +[2025-03-01 04:31:56] (step=0223000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0925 +[2025-03-01 04:32:55] (step=0223100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0902 +[2025-03-01 04:33:55] (step=0223200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0923 +[2025-03-01 04:34:55] (step=0223300) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0881 +[2025-03-01 04:35:55] (step=0223400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0921 +[2025-03-01 04:36:54] (step=0223500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0914 +[2025-03-01 04:37:54] (step=0223600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0898 +[2025-03-01 04:38:54] (step=0223700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0952 +[2025-03-01 04:39:54] (step=0223800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0864 +[2025-03-01 04:40:53] (step=0223900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0927 +[2025-03-01 04:41:53] (step=0224000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0912 +[2025-03-01 04:42:53] (step=0224100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0896 +[2025-03-01 04:43:53] (step=0224200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0918 +[2025-03-01 04:44:52] (step=0224300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0856 +[2025-03-01 04:45:52] (step=0224400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0897 +[2025-03-01 04:46:52] (step=0224500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0901 +[2025-03-01 04:47:52] (step=0224600) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0864 +[2025-03-01 04:48:51] (step=0224700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0893 +[2025-03-01 04:49:51] (step=0224800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0916 +[2025-03-01 04:50:51] (step=0224900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0904 +[2025-03-01 04:51:50] (step=0225000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0882 +[2025-03-01 04:52:50] (step=0225100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0876 +[2025-03-01 04:53:53] (step=0225200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0859 +[2025-03-01 04:54:53] (step=0225300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0895 +[2025-03-01 04:55:52] (step=0225400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0902 +[2025-03-01 04:56:52] (step=0225500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0905 +[2025-03-01 04:57:52] (step=0225600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0894 +[2025-03-01 04:58:51] (step=0225700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0913 +[2025-03-01 04:59:51] (step=0225800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0906 +[2025-03-01 05:00:51] (step=0225900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0927 +[2025-03-01 05:01:50] (step=0226000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0918 +[2025-03-01 05:02:50] (step=0226100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0926 +[2025-03-01 05:03:50] (step=0226200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0906 +[2025-03-01 05:04:49] (step=0226300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0878 +[2025-03-01 05:05:49] (step=0226400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0891 +[2025-03-01 05:06:49] (step=0226500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0903 +[2025-03-01 05:07:48] (step=0226600) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0898 +[2025-03-01 05:08:48] (step=0226700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0855 +[2025-03-01 05:09:48] (step=0226800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0938 +[2025-03-01 05:10:47] (step=0226900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0895 +[2025-03-01 05:11:47] (step=0227000) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0881 +[2025-03-01 05:12:47] (step=0227100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0883 +[2025-03-01 05:13:46] (step=0227200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0919 +[2025-03-01 05:14:46] (step=0227300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0936 +[2025-03-01 05:15:46] (step=0227400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0884 +[2025-03-01 05:16:45] (step=0227500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0942 +[2025-03-01 05:17:45] (step=0227600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0892 +[2025-03-01 05:18:48] (step=0227700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0933 +[2025-03-01 05:19:48] (step=0227800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0896 +[2025-03-01 05:20:48] (step=0227900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0891 +[2025-03-01 05:21:47] (step=0228000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0909 +[2025-03-01 05:22:47] (step=0228100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0911 +[2025-03-01 05:23:47] (step=0228200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0895 +[2025-03-01 05:24:46] (step=0228300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0908 +[2025-03-01 05:25:46] (step=0228400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0915 +[2025-03-01 05:26:46] (step=0228500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0918 +[2025-03-01 05:27:45] (step=0228600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0905 +[2025-03-01 05:28:45] (step=0228700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0886 +[2025-03-01 05:29:44] (step=0228800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0952 +[2025-03-01 05:30:44] (step=0228900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0929 +[2025-03-01 05:31:44] (step=0229000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0885 +[2025-03-01 05:32:43] (step=0229100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0908 +[2025-03-01 05:33:43] (step=0229200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0881 +[2025-03-01 05:34:43] (step=0229300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0888 +[2025-03-01 05:35:43] (step=0229400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0931 +[2025-03-01 05:36:42] (step=0229500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0883 +[2025-03-01 05:37:42] (step=0229600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0900 +[2025-03-01 05:38:41] (step=0229700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0876 +[2025-03-01 05:39:41] (step=0229800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0862 +[2025-03-01 05:40:41] (step=0229900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0890 +[2025-03-01 05:41:40] (step=0230000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0914 +[2025-03-01 05:42:40] (step=0230100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0871 +[2025-03-01 05:43:43] (step=0230200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0863 +[2025-03-01 05:44:43] (step=0230300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0904 +[2025-03-01 05:45:43] (step=0230400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0902 +[2025-03-01 05:46:42] (step=0230500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0880 +[2025-03-01 05:47:43] (step=0230600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.0868 +[2025-03-01 05:48:43] (step=0230700) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0890 +[2025-03-01 05:49:42] (step=0230800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0929 +[2025-03-01 05:50:42] (step=0230900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0896 +[2025-03-01 05:51:41] (step=0231000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0905 +[2025-03-01 05:52:41] (step=0231100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0897 +[2025-03-01 05:53:41] (step=0231200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0878 +[2025-03-01 05:54:40] (step=0231300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0884 +[2025-03-01 05:55:40] (step=0231400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0879 +[2025-03-01 05:56:40] (step=0231500) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0952 +[2025-03-01 05:57:39] (step=0231600) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0886 +[2025-03-01 05:58:39] (step=0231700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0920 +[2025-03-01 05:59:39] (step=0231800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0897 +[2025-03-01 06:00:39] (step=0231900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0916 +[2025-03-01 06:01:39] (step=0232000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0914 +[2025-03-01 06:02:38] (step=0232100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0852 +[2025-03-01 06:03:38] (step=0232200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0889 +[2025-03-01 06:04:38] (step=0232300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0891 +[2025-03-01 06:05:37] (step=0232400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0873 +[2025-03-01 06:06:37] (step=0232500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0884 +[2025-03-01 06:07:36] (step=0232600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0893 +[2025-03-01 06:08:39] (step=0232700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0850 +[2025-03-01 06:09:40] (step=0232800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.0888 +[2025-03-01 06:10:40] (step=0232900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0903 +[2025-03-01 06:11:39] (step=0233000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0869 +[2025-03-01 06:12:39] (step=0233100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0935 +[2025-03-01 06:13:39] (step=0233200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0878 +[2025-03-01 06:14:38] (step=0233300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0892 +[2025-03-01 06:15:38] (step=0233400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0902 +[2025-03-01 06:16:37] (step=0233500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0879 +[2025-03-01 06:17:37] (step=0233600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0877 +[2025-03-01 06:18:37] (step=0233700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0864 +[2025-03-01 06:19:36] (step=0233800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0905 +[2025-03-01 06:20:36] (step=0233900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0888 +[2025-03-01 06:21:36] (step=0234000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0897 +[2025-03-01 06:22:35] (step=0234100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0874 +[2025-03-01 06:23:35] (step=0234200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0883 +[2025-03-01 06:24:35] (step=0234300) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0926 +[2025-03-01 06:25:34] (step=0234400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0874 +[2025-03-01 06:26:34] (step=0234500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0852 +[2025-03-01 06:27:34] (step=0234600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0872 +[2025-03-01 06:28:33] (step=0234700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0888 +[2025-03-01 06:29:33] (step=0234800) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0920 +[2025-03-01 06:30:33] (step=0234900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0868 +[2025-03-01 06:31:32] (step=0235000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0915 +[2025-03-01 06:32:32] (step=0235100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0885 +[2025-03-01 06:33:35] (step=0235200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0900 +[2025-03-01 06:34:35] (step=0235300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0898 +[2025-03-01 06:35:34] (step=0235400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0866 +[2025-03-01 06:36:34] (step=0235500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0888 +[2025-03-01 06:37:33] (step=0235600) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0893 +[2025-03-01 06:38:33] (step=0235700) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0884 +[2025-03-01 06:39:33] (step=0235800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0906 +[2025-03-01 06:40:32] (step=0235900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0894 +[2025-03-01 06:41:32] (step=0236000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0900 +[2025-03-01 06:42:31] (step=0236100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0898 +[2025-03-01 06:43:31] (step=0236200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0833 +[2025-03-01 06:44:30] (step=0236300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0870 +[2025-03-01 06:45:30] (step=0236400) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0843 +[2025-03-01 06:46:30] (step=0236500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0861 +[2025-03-01 06:47:29] (step=0236600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0859 +[2025-03-01 06:48:29] (step=0236700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0872 +[2025-03-01 06:49:28] (step=0236800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0863 +[2025-03-01 06:50:28] (step=0236900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0841 +[2025-03-01 06:51:28] (step=0237000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0870 +[2025-03-01 06:52:27] (step=0237100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0899 +[2025-03-01 06:53:27] (step=0237200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0831 +[2025-03-01 06:54:26] (step=0237300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0885 +[2025-03-01 06:55:26] (step=0237400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0851 +[2025-03-01 06:56:26] (step=0237500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0857 +[2025-03-01 06:57:25] (step=0237600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0916 +[2025-03-01 06:58:28] (step=0237700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0849 +[2025-03-01 06:59:28] (step=0237800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0871 +[2025-03-01 07:00:28] (step=0237900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0897 +[2025-03-01 07:01:27] (step=0238000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0878 +[2025-03-01 07:02:27] (step=0238100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0835 +[2025-03-01 07:03:26] (step=0238200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0882 +[2025-03-01 07:04:26] (step=0238300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0865 +[2025-03-01 07:05:26] (step=0238400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0863 +[2025-03-01 07:06:25] (step=0238500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0842 +[2025-03-01 07:07:25] (step=0238600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0880 +[2025-03-01 07:08:25] (step=0238700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0840 +[2025-03-01 07:09:24] (step=0238800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0855 +[2025-03-01 07:10:24] (step=0238900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0881 +[2025-03-01 07:11:23] (step=0239000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0848 +[2025-03-01 07:12:23] (step=0239100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0868 +[2025-03-01 07:13:23] (step=0239200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0855 +[2025-03-01 07:14:22] (step=0239300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0859 +[2025-03-01 07:15:22] (step=0239400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0857 +[2025-03-01 07:16:21] (step=0239500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0887 +[2025-03-01 07:17:21] (step=0239600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0890 +[2025-03-01 07:18:21] (step=0239700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0860 +[2025-03-01 07:19:20] (step=0239800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0895 +[2025-03-01 07:20:20] (step=0239900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0864 +[2025-03-01 07:21:20] (step=0240000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0848 +[2025-03-01 07:22:19] (step=0240100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0851 +[2025-03-01 07:23:22] (step=0240200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0842 +[2025-03-01 07:24:22] (step=0240300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0855 +[2025-03-01 07:25:21] (step=0240400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0883 +[2025-03-01 07:26:21] (step=0240500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0862 +[2025-03-01 07:27:21] (step=0240600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0863 +[2025-03-01 07:28:20] (step=0240700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0856 +[2025-03-01 07:29:20] (step=0240800) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0849 +[2025-03-01 07:30:20] (step=0240900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0879 +[2025-03-01 07:31:19] (step=0241000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0865 +[2025-03-01 07:32:19] (step=0241100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0861 +[2025-03-01 07:33:19] (step=0241200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0862 +[2025-03-01 07:34:18] (step=0241300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0871 +[2025-03-01 07:35:18] (step=0241400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0835 +[2025-03-01 07:36:18] (step=0241500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0873 +[2025-03-01 07:37:17] (step=0241600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0850 +[2025-03-01 07:38:17] (step=0241700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0871 +[2025-03-01 07:39:17] (step=0241800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0858 +[2025-03-01 07:40:16] (step=0241900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0890 +[2025-03-01 07:41:16] (step=0242000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0893 +[2025-03-01 07:42:16] (step=0242100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0837 +[2025-03-01 07:43:15] (step=0242200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0871 +[2025-03-01 07:44:15] (step=0242300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0866 +[2025-03-01 07:45:15] (step=0242400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0878 +[2025-03-01 07:46:14] (step=0242500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0900 +[2025-03-01 07:47:14] (step=0242600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0853 +[2025-03-01 07:48:17] (step=0242700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0856 +[2025-03-01 07:49:17] (step=0242800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0867 +[2025-03-01 07:50:16] (step=0242900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0879 +[2025-03-01 07:51:16] (step=0243000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0856 +[2025-03-01 07:52:16] (step=0243100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0877 +[2025-03-01 07:53:15] (step=0243200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0855 +[2025-03-01 07:54:15] (step=0243300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0848 +[2025-03-01 07:55:14] (step=0243400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0884 +[2025-03-01 07:56:14] (step=0243500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0829 +[2025-03-01 07:57:13] (step=0243600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0886 +[2025-03-01 07:58:13] (step=0243700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0859 +[2025-03-01 07:59:13] (step=0243800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0866 +[2025-03-01 08:00:12] (step=0243900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0894 +[2025-03-01 08:01:12] (step=0244000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0839 +[2025-03-01 08:02:11] (step=0244100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0850 +[2025-03-01 08:03:11] (step=0244200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0883 +[2025-03-01 08:04:11] (step=0244300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0846 +[2025-03-01 08:05:10] (step=0244400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0869 +[2025-03-01 08:06:10] (step=0244500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0830 +[2025-03-01 08:07:09] (step=0244600) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0863 +[2025-03-01 08:08:09] (step=0244700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0857 +[2025-03-01 08:09:08] (step=0244800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0837 +[2025-03-01 08:10:08] (step=0244900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0860 +[2025-03-01 08:11:08] (step=0245000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0850 +[2025-03-01 08:12:07] (step=0245100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0881 +[2025-03-01 08:13:10] (step=0245200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0891 +[2025-03-01 08:14:10] (step=0245300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0884 +[2025-03-01 08:15:10] (step=0245400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0875 +[2025-03-01 08:16:09] (step=0245500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0855 +[2025-03-01 08:17:09] (step=0245600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0871 +[2025-03-01 08:18:08] (step=0245700) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0879 +[2025-03-01 08:19:08] (step=0245800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0842 +[2025-03-01 08:20:07] (step=0245900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0845 +[2025-03-01 08:21:07] (step=0246000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0840 +[2025-03-01 08:22:07] (step=0246100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0880 +[2025-03-01 08:23:06] (step=0246200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0847 +[2025-03-01 08:24:06] (step=0246300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0837 +[2025-03-01 08:25:05] (step=0246400) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0834 +[2025-03-01 08:26:05] (step=0246500) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0860 +[2025-03-01 08:27:05] (step=0246600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0867 +[2025-03-01 08:28:04] (step=0246700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0883 +[2025-03-01 08:29:04] (step=0246800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0820 +[2025-03-01 08:30:03] (step=0246900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0870 +[2025-03-01 08:31:03] (step=0247000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0861 +[2025-03-01 08:32:03] (step=0247100) Train Loss: 0.0453, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0858 +[2025-03-01 08:33:02] (step=0247200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0839 +[2025-03-01 08:34:02] (step=0247300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0854 +[2025-03-01 08:35:01] (step=0247400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0834 +[2025-03-01 08:36:01] (step=0247500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0815 +[2025-03-01 08:37:01] (step=0247600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0834 +[2025-03-01 08:38:03] (step=0247700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0823 +[2025-03-01 08:39:03] (step=0247800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0869 +[2025-03-01 08:40:03] (step=0247900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0837 +[2025-03-01 08:41:02] (step=0248000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0856 +[2025-03-01 08:42:02] (step=0248100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0841 +[2025-03-01 08:43:01] (step=0248200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0879 +[2025-03-01 08:44:01] (step=0248300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0872 +[2025-03-01 08:45:00] (step=0248400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0851 +[2025-03-01 08:46:00] (step=0248500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0822 +[2025-03-01 08:46:59] (step=0248600) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0870 +[2025-03-01 08:47:59] (step=0248700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0843 +[2025-03-01 08:48:59] (step=0248800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0820 +[2025-03-01 08:49:58] (step=0248900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0831 +[2025-03-01 08:50:58] (step=0249000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0828 +[2025-03-01 08:51:57] (step=0249100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0819 +[2025-03-01 08:52:57] (step=0249200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0838 +[2025-03-01 08:53:56] (step=0249300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0816 +[2025-03-01 08:54:56] (step=0249400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0850 +[2025-03-01 08:55:55] (step=0249500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0855 +[2025-03-01 08:56:55] (step=0249600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0864 +[2025-03-01 08:57:55] (step=0249700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0831 +[2025-03-01 08:58:54] (step=0249800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0859 +[2025-03-01 08:59:54] (step=0249900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0838 +[2025-03-01 09:00:53] (step=0250000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0829 +[2025-03-01 09:00:57] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0250000.pt +[2025-03-01 09:06:24] (step=0250000), Fid=12.368762294021963, PSNR=27.016703526735306, LPIPS=0.22542835772037506, SSIM=0.7476117014884949 +[2025-03-01 09:07:24] (step=0250100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.26, Grad Norm: 0.0868 +[2025-03-01 09:08:25] (step=0250200) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.65, Grad Norm: 0.0850 +[2025-03-01 09:09:26] (step=0250300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.62, Grad Norm: 0.0824 +[2025-03-01 09:10:26] (step=0250400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0854 +[2025-03-01 09:11:26] (step=0250500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0877 +[2025-03-01 09:12:26] (step=0250600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0821 +[2025-03-01 09:13:25] (step=0250700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0863 +[2025-03-01 09:14:25] (step=0250800) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0852 +[2025-03-01 09:15:25] (step=0250900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0829 +[2025-03-01 09:16:24] (step=0251000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0857 +[2025-03-01 09:17:24] (step=0251100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0844 +[2025-03-01 09:18:24] (step=0251200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0879 +[2025-03-01 09:19:24] (step=0251300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0840 +[2025-03-01 09:20:23] (step=0251400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0859 +[2025-03-01 09:21:23] (step=0251500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0834 +[2025-03-01 09:22:23] (step=0251600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0839 +[2025-03-01 09:23:23] (step=0251700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0809 +[2025-03-01 09:24:22] (step=0251800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0834 +[2025-03-01 09:25:22] (step=0251900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0828 +[2025-03-01 09:26:22] (step=0252000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0817 +[2025-03-01 09:27:21] (step=0252100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0866 +[2025-03-01 09:28:21] (step=0252200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0831 +[2025-03-01 09:29:21] (step=0252300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0834 +[2025-03-01 09:30:21] (step=0252400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0794 +[2025-03-01 09:31:20] (step=0252500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0828 +[2025-03-01 09:32:20] (step=0252600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0851 +[2025-03-01 09:33:20] (step=0252700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0819 +[2025-03-01 09:34:23] (step=0252800) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.58, Grad Norm: 0.0816 +[2025-03-01 09:35:22] (step=0252900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0838 +[2025-03-01 09:36:22] (step=0253000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0831 +[2025-03-01 09:37:22] (step=0253100) Train Loss: 0.0457, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0791 +[2025-03-01 09:38:21] (step=0253200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0856 +[2025-03-01 09:39:21] (step=0253300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0794 +[2025-03-01 09:40:21] (step=0253400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0848 +[2025-03-01 09:41:20] (step=0253500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0832 +[2025-03-01 09:42:20] (step=0253600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0835 +[2025-03-01 09:43:20] (step=0253700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0859 +[2025-03-01 09:44:19] (step=0253800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0878 +[2025-03-01 09:45:19] (step=0253900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0849 +[2025-03-01 09:46:19] (step=0254000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0863 +[2025-03-01 09:47:18] (step=0254100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0839 +[2025-03-01 09:48:18] (step=0254200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0865 +[2025-03-01 09:49:17] (step=0254300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0892 +[2025-03-01 09:50:17] (step=0254400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0837 +[2025-03-01 09:51:17] (step=0254500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0849 +[2025-03-01 09:52:16] (step=0254600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0833 +[2025-03-01 09:53:16] (step=0254700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0855 +[2025-03-01 09:54:16] (step=0254800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0836 +[2025-03-01 09:55:15] (step=0254900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0853 +[2025-03-01 09:56:15] (step=0255000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0835 +[2025-03-01 09:57:15] (step=0255100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0861 +[2025-03-01 09:58:14] (step=0255200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0848 +[2025-03-01 09:59:17] (step=0255300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.58, Grad Norm: 0.0850 +[2025-03-01 10:00:17] (step=0255400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0866 +[2025-03-01 10:01:17] (step=0255500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0847 +[2025-03-01 10:02:17] (step=0255600) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0845 +[2025-03-01 10:03:16] (step=0255700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0838 +[2025-03-01 10:04:16] (step=0255800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0823 +[2025-03-01 10:05:16] (step=0255900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0841 +[2025-03-01 10:06:15] (step=0256000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0822 +[2025-03-01 10:07:15] (step=0256100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0809 +[2025-03-01 10:08:14] (step=0256200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0863 +[2025-03-01 10:09:14] (step=0256300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0796 +[2025-03-01 10:10:14] (step=0256400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0858 +[2025-03-01 10:11:13] (step=0256500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0859 +[2025-03-01 10:12:13] (step=0256600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0839 +[2025-03-01 10:13:13] (step=0256700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0821 +[2025-03-01 10:14:12] (step=0256800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0804 +[2025-03-01 10:15:12] (step=0256900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0829 +[2025-03-01 10:16:12] (step=0257000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0830 +[2025-03-01 10:17:11] (step=0257100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0849 +[2025-03-01 10:18:11] (step=0257200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0831 +[2025-03-01 10:19:11] (step=0257300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0823 +[2025-03-01 10:20:10] (step=0257400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0811 +[2025-03-01 10:21:10] (step=0257500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0830 +[2025-03-01 10:22:10] (step=0257600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0810 +[2025-03-01 10:23:09] (step=0257700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0862 +[2025-03-01 10:24:12] (step=0257800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0814 +[2025-03-01 10:25:12] (step=0257900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0813 +[2025-03-01 10:26:12] (step=0258000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0823 +[2025-03-01 10:27:11] (step=0258100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0831 +[2025-03-01 10:28:11] (step=0258200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0850 +[2025-03-01 10:29:10] (step=0258300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0813 +[2025-03-01 10:30:10] (step=0258400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0870 +[2025-03-01 10:31:10] (step=0258500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0853 +[2025-03-01 10:32:09] (step=0258600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0851 +[2025-03-01 10:33:09] (step=0258700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0867 +[2025-03-01 10:34:09] (step=0258800) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0842 +[2025-03-01 10:35:08] (step=0258900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0835 +[2025-03-01 10:36:08] (step=0259000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0821 +[2025-03-01 10:37:07] (step=0259100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0810 +[2025-03-01 10:38:07] (step=0259200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0843 +[2025-03-01 10:39:07] (step=0259300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0807 +[2025-03-01 10:40:06] (step=0259400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0826 +[2025-03-01 10:41:06] (step=0259500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0810 +[2025-03-01 10:42:06] (step=0259600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0817 +[2025-03-01 10:43:05] (step=0259700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0814 +[2025-03-01 10:44:05] (step=0259800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0857 +[2025-03-01 10:45:04] (step=0259900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0844 +[2025-03-01 10:46:04] (step=0260000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0818 +[2025-03-01 10:47:04] (step=0260100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0862 +[2025-03-01 10:48:03] (step=0260200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0819 +[2025-03-01 10:49:06] (step=0260300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0840 +[2025-03-01 10:50:06] (step=0260400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0859 +[2025-03-01 10:51:06] (step=0260500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0822 +[2025-03-01 10:52:06] (step=0260600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0848 +[2025-03-01 10:53:05] (step=0260700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0828 +[2025-03-01 10:54:05] (step=0260800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0827 +[2025-03-01 10:55:05] (step=0260900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0798 +[2025-03-01 10:56:04] (step=0261000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0821 +[2025-03-01 10:57:04] (step=0261100) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0836 +[2025-03-01 10:58:03] (step=0261200) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0841 +[2025-03-01 10:59:03] (step=0261300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0812 +[2025-03-01 11:00:02] (step=0261400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0822 +[2025-03-01 11:01:02] (step=0261500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0807 +[2025-03-01 11:02:02] (step=0261600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0835 +[2025-03-01 11:03:01] (step=0261700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0814 +[2025-03-01 11:04:01] (step=0261800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0808 +[2025-03-01 11:05:00] (step=0261900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0808 +[2025-03-01 11:06:00] (step=0262000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0811 +[2025-03-01 11:07:00] (step=0262100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0856 +[2025-03-01 11:07:59] (step=0262200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0815 +[2025-03-01 11:08:59] (step=0262300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0804 +[2025-03-01 11:09:58] (step=0262400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0827 +[2025-03-01 11:10:58] (step=0262500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0796 +[2025-03-01 11:11:58] (step=0262600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0862 +[2025-03-01 11:12:57] (step=0262700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0801 +[2025-03-01 11:14:00] (step=0262800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0808 +[2025-03-01 11:15:00] (step=0262900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0799 +[2025-03-01 11:16:00] (step=0263000) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0838 +[2025-03-01 11:16:59] (step=0263100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0794 +[2025-03-01 11:17:59] (step=0263200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0832 +[2025-03-01 11:18:59] (step=0263300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0797 +[2025-03-01 11:19:58] (step=0263400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0821 +[2025-03-01 11:20:58] (step=0263500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0828 +[2025-03-01 11:21:57] (step=0263600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0845 +[2025-03-01 11:22:57] (step=0263700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0776 +[2025-03-01 11:23:56] (step=0263800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0788 +[2025-03-01 11:24:56] (step=0263900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0808 +[2025-03-01 11:25:56] (step=0264000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0789 +[2025-03-01 11:26:55] (step=0264100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0798 +[2025-03-01 11:27:55] (step=0264200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0796 +[2025-03-01 11:28:54] (step=0264300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0809 +[2025-03-01 11:29:54] (step=0264400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0803 +[2025-03-01 11:30:54] (step=0264500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0819 +[2025-03-01 11:31:53] (step=0264600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0790 +[2025-03-01 11:32:53] (step=0264700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0798 +[2025-03-01 11:33:52] (step=0264800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0852 +[2025-03-01 11:34:52] (step=0264900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0808 +[2025-03-01 11:35:52] (step=0265000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0834 +[2025-03-01 11:36:51] (step=0265100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0797 +[2025-03-01 11:37:51] (step=0265200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0794 +[2025-03-01 11:38:54] (step=0265300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0817 +[2025-03-01 11:39:53] (step=0265400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0758 +[2025-03-01 11:40:53] (step=0265500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0804 +[2025-03-01 11:41:53] (step=0265600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0803 +[2025-03-01 11:42:52] (step=0265700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0798 +[2025-03-01 11:43:52] (step=0265800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0798 +[2025-03-01 11:44:52] (step=0265900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0805 +[2025-03-01 11:45:52] (step=0266000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0810 +[2025-03-01 11:46:51] (step=0266100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0828 +[2025-03-01 11:47:51] (step=0266200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0808 +[2025-03-01 11:48:51] (step=0266300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0798 +[2025-03-01 11:49:50] (step=0266400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0828 +[2025-03-01 11:50:50] (step=0266500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0817 +[2025-03-01 11:51:49] (step=0266600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0769 +[2025-03-01 11:52:49] (step=0266700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0804 +[2025-03-01 11:53:49] (step=0266800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0806 +[2025-03-01 11:54:48] (step=0266900) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0830 +[2025-03-01 11:55:48] (step=0267000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0823 +[2025-03-01 11:56:48] (step=0267100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0833 +[2025-03-01 11:57:47] (step=0267200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0808 +[2025-03-01 11:58:47] (step=0267300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 11:59:47] (step=0267400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0793 +[2025-03-01 12:00:46] (step=0267500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0787 +[2025-03-01 12:01:46] (step=0267600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0793 +[2025-03-01 12:02:46] (step=0267700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0807 +[2025-03-01 12:03:49] (step=0267800) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0819 +[2025-03-01 12:04:48] (step=0267900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0780 +[2025-03-01 12:05:48] (step=0268000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0785 +[2025-03-01 12:06:48] (step=0268100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0788 +[2025-03-01 12:07:47] (step=0268200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0810 +[2025-03-01 12:08:47] (step=0268300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0767 +[2025-03-01 12:09:46] (step=0268400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0798 +[2025-03-01 12:10:46] (step=0268500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0818 +[2025-03-01 12:11:46] (step=0268600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0799 +[2025-03-01 12:12:45] (step=0268700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0856 +[2025-03-01 12:13:45] (step=0268800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0767 +[2025-03-01 12:14:44] (step=0268900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0799 +[2025-03-01 12:15:44] (step=0269000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0798 +[2025-03-01 12:16:44] (step=0269100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0797 +[2025-03-01 12:17:43] (step=0269200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0823 +[2025-03-01 12:18:43] (step=0269300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0808 +[2025-03-01 12:19:42] (step=0269400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0820 +[2025-03-01 12:20:42] (step=0269500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0751 +[2025-03-01 12:21:42] (step=0269600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0834 +[2025-03-01 12:22:41] (step=0269700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0787 +[2025-03-01 12:23:41] (step=0269800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0793 +[2025-03-01 12:24:40] (step=0269900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0808 +[2025-03-01 12:25:40] (step=0270000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0784 +[2025-03-01 12:26:40] (step=0270100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0818 +[2025-03-01 12:27:39] (step=0270200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0782 +[2025-03-01 12:28:42] (step=0270300) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0822 +[2025-03-01 12:29:42] (step=0270400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0775 +[2025-03-01 12:30:41] (step=0270500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0790 +[2025-03-01 12:31:41] (step=0270600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0825 +[2025-03-01 12:32:40] (step=0270700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0797 +[2025-03-01 12:33:40] (step=0270800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0812 +[2025-03-01 12:34:40] (step=0270900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0797 +[2025-03-01 12:35:39] (step=0271000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0792 +[2025-03-01 12:36:39] (step=0271100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0795 +[2025-03-01 12:37:38] (step=0271200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0843 +[2025-03-01 12:38:38] (step=0271300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0778 +[2025-03-01 12:39:38] (step=0271400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0810 +[2025-03-01 12:40:37] (step=0271500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0817 +[2025-03-01 12:41:37] (step=0271600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0792 +[2025-03-01 12:42:36] (step=0271700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0772 +[2025-03-01 12:43:36] (step=0271800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0817 +[2025-03-01 12:44:36] (step=0271900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0775 +[2025-03-01 12:45:35] (step=0272000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0786 +[2025-03-01 12:46:35] (step=0272100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0788 +[2025-03-01 12:47:34] (step=0272200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0819 +[2025-03-01 12:48:34] (step=0272300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0810 +[2025-03-01 12:49:34] (step=0272400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0815 +[2025-03-01 12:50:33] (step=0272500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 12:51:33] (step=0272600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0799 +[2025-03-01 12:52:32] (step=0272700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0798 +[2025-03-01 12:53:35] (step=0272800) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0796 +[2025-03-01 12:54:35] (step=0272900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0803 +[2025-03-01 12:55:35] (step=0273000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0812 +[2025-03-01 12:56:34] (step=0273100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0796 +[2025-03-01 12:57:34] (step=0273200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0789 +[2025-03-01 12:58:34] (step=0273300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0776 +[2025-03-01 12:59:34] (step=0273400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0814 +[2025-03-01 13:00:33] (step=0273500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0813 +[2025-03-01 13:01:33] (step=0273600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0802 +[2025-03-01 13:02:32] (step=0273700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0784 +[2025-03-01 13:03:32] (step=0273800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0776 +[2025-03-01 13:04:32] (step=0273900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 13:05:31] (step=0274000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0787 +[2025-03-01 13:06:31] (step=0274100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0800 +[2025-03-01 13:07:30] (step=0274200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0760 +[2025-03-01 13:08:30] (step=0274300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 13:09:30] (step=0274400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0760 +[2025-03-01 13:10:29] (step=0274500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0752 +[2025-03-01 13:11:29] (step=0274600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0832 +[2025-03-01 13:12:29] (step=0274700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0741 +[2025-03-01 13:13:28] (step=0274800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0761 +[2025-03-01 13:14:28] (step=0274900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0803 +[2025-03-01 13:15:27] (step=0275000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0800 +[2025-03-01 13:16:27] (step=0275100) Train Loss: 0.0452, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0790 +[2025-03-01 13:17:27] (step=0275200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0793 +[2025-03-01 13:18:29] (step=0275300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0764 +[2025-03-01 13:19:29] (step=0275400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0755 +[2025-03-01 13:20:29] (step=0275500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0793 +[2025-03-01 13:21:29] (step=0275600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0789 +[2025-03-01 13:22:28] (step=0275700) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0796 +[2025-03-01 13:23:28] (step=0275800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0799 +[2025-03-01 13:24:27] (step=0275900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0769 +[2025-03-01 13:25:27] (step=0276000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0796 +[2025-03-01 13:26:27] (step=0276100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 13:27:26] (step=0276200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0792 +[2025-03-01 13:28:26] (step=0276300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0814 +[2025-03-01 13:29:25] (step=0276400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0774 +[2025-03-01 13:30:25] (step=0276500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 13:31:25] (step=0276600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0811 +[2025-03-01 13:32:24] (step=0276700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0804 +[2025-03-01 13:33:24] (step=0276800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 13:34:24] (step=0276900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0813 +[2025-03-01 13:35:23] (step=0277000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0775 +[2025-03-01 13:36:23] (step=0277100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0804 +[2025-03-01 13:37:22] (step=0277200) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0775 +[2025-03-01 13:38:22] (step=0277300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0806 +[2025-03-01 13:39:22] (step=0277400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0775 +[2025-03-01 13:40:21] (step=0277500) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0767 +[2025-03-01 13:41:21] (step=0277600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0790 +[2025-03-01 13:42:21] (step=0277700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0814 +[2025-03-01 13:43:23] (step=0277800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0769 +[2025-03-01 13:44:23] (step=0277900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0782 +[2025-03-01 13:45:23] (step=0278000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0789 +[2025-03-01 13:46:22] (step=0278100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0761 +[2025-03-01 13:47:22] (step=0278200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0800 +[2025-03-01 13:48:21] (step=0278300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0812 +[2025-03-01 13:49:21] (step=0278400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0811 +[2025-03-01 13:50:21] (step=0278500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0757 +[2025-03-01 13:51:20] (step=0278600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0803 +[2025-03-01 13:52:20] (step=0278700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 13:53:19] (step=0278800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0788 +[2025-03-01 13:54:19] (step=0278900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0796 +[2025-03-01 13:55:19] (step=0279000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0776 +[2025-03-01 13:56:18] (step=0279100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0791 +[2025-03-01 13:57:18] (step=0279200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0802 +[2025-03-01 13:58:17] (step=0279300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0773 +[2025-03-01 13:59:17] (step=0279400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0772 +[2025-03-01 14:00:17] (step=0279500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0778 +[2025-03-01 14:01:16] (step=0279600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0755 +[2025-03-01 14:02:16] (step=0279700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0766 +[2025-03-01 14:03:15] (step=0279800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0784 +[2025-03-01 14:04:15] (step=0279900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0779 +[2025-03-01 14:05:15] (step=0280000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0774 +[2025-03-01 14:06:14] (step=0280100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0778 +[2025-03-01 14:07:14] (step=0280200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0753 +[2025-03-01 14:08:17] (step=0280300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0756 +[2025-03-01 14:09:16] (step=0280400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0771 +[2025-03-01 14:10:16] (step=0280500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0790 +[2025-03-01 14:11:16] (step=0280600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0786 +[2025-03-01 14:12:15] (step=0280700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0806 +[2025-03-01 14:13:15] (step=0280800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0751 +[2025-03-01 14:14:15] (step=0280900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0780 +[2025-03-01 14:15:14] (step=0281000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0772 +[2025-03-01 14:16:14] (step=0281100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0785 +[2025-03-01 14:17:13] (step=0281200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0752 +[2025-03-01 14:18:13] (step=0281300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0782 +[2025-03-01 14:19:12] (step=0281400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0736 +[2025-03-01 14:20:12] (step=0281500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0794 +[2025-03-01 14:21:12] (step=0281600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0747 +[2025-03-01 14:22:11] (step=0281700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0776 +[2025-03-01 14:23:11] (step=0281800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0783 +[2025-03-01 14:24:10] (step=0281900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0766 +[2025-03-01 14:25:10] (step=0282000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0760 +[2025-03-01 14:26:09] (step=0282100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 14:27:09] (step=0282200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0765 +[2025-03-01 14:28:09] (step=0282300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0766 +[2025-03-01 14:29:08] (step=0282400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0780 +[2025-03-01 14:30:08] (step=0282500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 14:31:07] (step=0282600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0760 +[2025-03-01 14:32:07] (step=0282700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0784 +[2025-03-01 14:33:10] (step=0282800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0787 +[2025-03-01 14:34:10] (step=0282900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0745 +[2025-03-01 14:35:09] (step=0283000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 14:36:09] (step=0283100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0783 +[2025-03-01 14:37:09] (step=0283200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0799 +[2025-03-01 14:38:08] (step=0283300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0753 +[2025-03-01 14:39:08] (step=0283400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0805 +[2025-03-01 14:40:07] (step=0283500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0782 +[2025-03-01 14:41:07] (step=0283600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0766 +[2025-03-01 14:42:06] (step=0283700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0767 +[2025-03-01 14:43:06] (step=0283800) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0773 +[2025-03-01 14:44:05] (step=0283900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0754 +[2025-03-01 14:45:05] (step=0284000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0749 +[2025-03-01 14:46:05] (step=0284100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0747 +[2025-03-01 14:47:04] (step=0284200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0749 +[2025-03-01 14:48:04] (step=0284300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0756 +[2025-03-01 14:49:03] (step=0284400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 14:50:03] (step=0284500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0779 +[2025-03-01 14:51:02] (step=0284600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0758 +[2025-03-01 14:52:02] (step=0284700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 14:53:01] (step=0284800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0772 +[2025-03-01 14:54:01] (step=0284900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0758 +[2025-03-01 14:55:01] (step=0285000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0757 +[2025-03-01 14:56:00] (step=0285100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0817 +[2025-03-01 14:57:00] (step=0285200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0755 +[2025-03-01 14:58:03] (step=0285300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.58, Grad Norm: 0.0820 +[2025-03-01 14:59:03] (step=0285400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0763 +[2025-03-01 15:00:02] (step=0285500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0795 +[2025-03-01 15:01:02] (step=0285600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0743 +[2025-03-01 15:02:01] (step=0285700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0801 +[2025-03-01 15:03:01] (step=0285800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0799 +[2025-03-01 15:04:00] (step=0285900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0756 +[2025-03-01 15:05:00] (step=0286000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0742 +[2025-03-01 15:05:59] (step=0286100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0790 +[2025-03-01 15:06:59] (step=0286200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 15:07:58] (step=0286300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0759 +[2025-03-01 15:08:58] (step=0286400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0785 +[2025-03-01 15:09:57] (step=0286500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0764 +[2025-03-01 15:10:57] (step=0286600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0773 +[2025-03-01 15:11:56] (step=0286700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0759 +[2025-03-01 15:12:56] (step=0286800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0758 +[2025-03-01 15:13:56] (step=0286900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0776 +[2025-03-01 15:14:55] (step=0287000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0794 +[2025-03-01 15:15:55] (step=0287100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0796 +[2025-03-01 15:16:54] (step=0287200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0780 +[2025-03-01 15:17:54] (step=0287300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0743 +[2025-03-01 15:18:53] (step=0287400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 15:19:53] (step=0287500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0754 +[2025-03-01 15:20:52] (step=0287600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 15:21:52] (step=0287700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 15:22:55] (step=0287800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0799 +[2025-03-01 15:23:54] (step=0287900) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0786 +[2025-03-01 15:24:55] (step=0288000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0760 +[2025-03-01 15:25:54] (step=0288100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0758 +[2025-03-01 15:26:54] (step=0288200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0801 +[2025-03-01 15:27:53] (step=0288300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0769 +[2025-03-01 15:28:53] (step=0288400) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0779 +[2025-03-01 15:29:53] (step=0288500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0783 +[2025-03-01 15:30:52] (step=0288600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 15:31:52] (step=0288700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0774 +[2025-03-01 15:32:51] (step=0288800) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0774 +[2025-03-01 15:33:51] (step=0288900) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0751 +[2025-03-01 15:34:51] (step=0289000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0750 +[2025-03-01 15:35:50] (step=0289100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 15:36:50] (step=0289200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0751 +[2025-03-01 15:37:49] (step=0289300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0772 +[2025-03-01 15:38:49] (step=0289400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0742 +[2025-03-01 15:39:49] (step=0289500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0775 +[2025-03-01 15:40:48] (step=0289600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0752 +[2025-03-01 15:41:48] (step=0289700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0804 +[2025-03-01 15:42:47] (step=0289800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0770 +[2025-03-01 15:43:47] (step=0289900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0737 +[2025-03-01 15:44:47] (step=0290000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0743 +[2025-03-01 15:45:46] (step=0290100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0732 +[2025-03-01 15:46:46] (step=0290200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0760 +[2025-03-01 15:47:49] (step=0290300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0763 +[2025-03-01 15:48:49] (step=0290400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0757 +[2025-03-01 15:49:49] (step=0290500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-01 15:50:48] (step=0290600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0763 +[2025-03-01 15:51:48] (step=0290700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.0749 +[2025-03-01 15:52:48] (step=0290800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0765 +[2025-03-01 15:53:47] (step=0290900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0763 +[2025-03-01 15:54:47] (step=0291000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0782 +[2025-03-01 15:55:47] (step=0291100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0733 +[2025-03-01 15:56:47] (step=0291200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0778 +[2025-03-01 15:57:46] (step=0291300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0777 +[2025-03-01 15:58:46] (step=0291400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 15:59:45] (step=0291500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0755 +[2025-03-01 16:00:45] (step=0291600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0763 +[2025-03-01 16:01:44] (step=0291700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0797 +[2025-03-01 16:02:44] (step=0291800) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0767 +[2025-03-01 16:03:43] (step=0291900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0750 +[2025-03-01 16:04:43] (step=0292000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0776 +[2025-03-01 16:05:42] (step=0292100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0769 +[2025-03-01 16:06:42] (step=0292200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0784 +[2025-03-01 16:07:41] (step=0292300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0788 +[2025-03-01 16:08:41] (step=0292400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0764 +[2025-03-01 16:09:41] (step=0292500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 16:10:40] (step=0292600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0758 +[2025-03-01 16:11:40] (step=0292700) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0780 +[2025-03-01 16:12:43] (step=0292800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0751 +[2025-03-01 16:13:42] (step=0292900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 16:14:42] (step=0293000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0769 +[2025-03-01 16:15:41] (step=0293100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0788 +[2025-03-01 16:16:41] (step=0293200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0797 +[2025-03-01 16:17:41] (step=0293300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0798 +[2025-03-01 16:18:40] (step=0293400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0713 +[2025-03-01 16:19:40] (step=0293500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0779 +[2025-03-01 16:20:39] (step=0293600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0724 +[2025-03-01 16:21:39] (step=0293700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0752 +[2025-03-01 16:22:38] (step=0293800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0770 +[2025-03-01 16:23:38] (step=0293900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0776 +[2025-03-01 16:24:37] (step=0294000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0736 +[2025-03-01 16:25:37] (step=0294100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0770 +[2025-03-01 16:26:37] (step=0294200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0748 +[2025-03-01 16:27:36] (step=0294300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0752 +[2025-03-01 16:28:36] (step=0294400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0775 +[2025-03-01 16:29:36] (step=0294500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0725 +[2025-03-01 16:30:35] (step=0294600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0777 +[2025-03-01 16:31:35] (step=0294700) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0756 +[2025-03-01 16:32:34] (step=0294800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0777 +[2025-03-01 16:33:34] (step=0294900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 16:34:34] (step=0295000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0781 +[2025-03-01 16:35:33] (step=0295100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 16:36:33] (step=0295200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0752 +[2025-03-01 16:37:36] (step=0295300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0767 +[2025-03-01 16:38:35] (step=0295400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0753 +[2025-03-01 16:39:35] (step=0295500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0762 +[2025-03-01 16:40:35] (step=0295600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0740 +[2025-03-01 16:41:34] (step=0295700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0742 +[2025-03-01 16:42:34] (step=0295800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0754 +[2025-03-01 16:43:33] (step=0295900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0758 +[2025-03-01 16:44:33] (step=0296000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 16:45:32] (step=0296100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0750 +[2025-03-01 16:46:32] (step=0296200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0779 +[2025-03-01 16:47:31] (step=0296300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0740 +[2025-03-01 16:48:31] (step=0296400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0752 +[2025-03-01 16:49:30] (step=0296500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 16:50:30] (step=0296600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0724 +[2025-03-01 16:51:30] (step=0296700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 16:52:29] (step=0296800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0757 +[2025-03-01 16:53:29] (step=0296900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0736 +[2025-03-01 16:54:28] (step=0297000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0739 +[2025-03-01 16:55:28] (step=0297100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0748 +[2025-03-01 16:56:27] (step=0297200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0779 +[2025-03-01 16:57:27] (step=0297300) Train Loss: 0.0451, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0725 +[2025-03-01 16:58:26] (step=0297400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0792 +[2025-03-01 16:59:26] (step=0297500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0747 +[2025-03-01 17:00:26] (step=0297600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0726 +[2025-03-01 17:01:25] (step=0297700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0777 +[2025-03-01 17:02:28] (step=0297800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0741 +[2025-03-01 17:03:28] (step=0297900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0760 +[2025-03-01 17:04:27] (step=0298000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0740 +[2025-03-01 17:05:27] (step=0298100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0759 +[2025-03-01 17:06:26] (step=0298200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0711 +[2025-03-01 17:07:26] (step=0298300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 17:08:25] (step=0298400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0745 +[2025-03-01 17:09:25] (step=0298500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 17:10:24] (step=0298600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0785 +[2025-03-01 17:11:24] (step=0298700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0728 +[2025-03-01 17:12:24] (step=0298800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0752 +[2025-03-01 17:13:23] (step=0298900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0751 +[2025-03-01 17:14:23] (step=0299000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0765 +[2025-03-01 17:15:22] (step=0299100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0765 +[2025-03-01 17:16:22] (step=0299200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0743 +[2025-03-01 17:17:21] (step=0299300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0731 +[2025-03-01 17:18:21] (step=0299400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0730 +[2025-03-01 17:19:20] (step=0299500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0756 +[2025-03-01 17:20:20] (step=0299600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0737 +[2025-03-01 17:21:19] (step=0299700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 17:22:19] (step=0299800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 17:23:18] (step=0299900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0719 +[2025-03-01 17:24:18] (step=0300000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0760 +[2025-03-01 17:24:21] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0300000.pt +[2025-03-01 17:29:48] (step=0300000), Fid=12.176650524120078, PSNR=27.054235615444185, LPIPS=0.22435395419597626, SSIM=0.7486523985862732 +[2025-03-01 17:30:48] (step=0300100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.26, Grad Norm: 0.0750 +[2025-03-01 17:31:48] (step=0300200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0722 +[2025-03-01 17:32:51] (step=0300300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0747 +[2025-03-01 17:33:51] (step=0300400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0743 +[2025-03-01 17:34:50] (step=0300500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0712 +[2025-03-01 17:35:50] (step=0300600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 17:36:50] (step=0300700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0728 +[2025-03-01 17:37:49] (step=0300800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0751 +[2025-03-01 17:38:49] (step=0300900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0729 +[2025-03-01 17:39:49] (step=0301000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 17:40:48] (step=0301100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0733 +[2025-03-01 17:41:48] (step=0301200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0756 +[2025-03-01 17:42:48] (step=0301300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0711 +[2025-03-01 17:43:48] (step=0301400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0750 +[2025-03-01 17:44:48] (step=0301500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0774 +[2025-03-01 17:45:47] (step=0301600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0711 +[2025-03-01 17:46:47] (step=0301700) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0754 +[2025-03-01 17:47:47] (step=0301800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0775 +[2025-03-01 17:48:46] (step=0301900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 17:49:46] (step=0302000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0764 +[2025-03-01 17:50:45] (step=0302100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0767 +[2025-03-01 17:51:45] (step=0302200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0764 +[2025-03-01 17:52:44] (step=0302300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0747 +[2025-03-01 17:53:44] (step=0302400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0730 +[2025-03-01 17:54:44] (step=0302500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0734 +[2025-03-01 17:55:43] (step=0302600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 17:56:43] (step=0302700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0745 +[2025-03-01 17:57:45] (step=0302800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0723 +[2025-03-01 17:58:45] (step=0302900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0720 +[2025-03-01 17:59:45] (step=0303000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0732 +[2025-03-01 18:00:45] (step=0303100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0770 +[2025-03-01 18:01:44] (step=0303200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0774 +[2025-03-01 18:02:44] (step=0303300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0759 +[2025-03-01 18:03:44] (step=0303400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0726 +[2025-03-01 18:04:43] (step=0303500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0741 +[2025-03-01 18:05:43] (step=0303600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0740 +[2025-03-01 18:06:42] (step=0303700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 18:07:42] (step=0303800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0746 +[2025-03-01 18:08:41] (step=0303900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 18:09:41] (step=0304000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0715 +[2025-03-01 18:10:41] (step=0304100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0777 +[2025-03-01 18:11:40] (step=0304200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 18:12:40] (step=0304300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0750 +[2025-03-01 18:13:39] (step=0304400) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0774 +[2025-03-01 18:14:39] (step=0304500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 18:15:38] (step=0304600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0796 +[2025-03-01 18:16:38] (step=0304700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0748 +[2025-03-01 18:17:37] (step=0304800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0775 +[2025-03-01 18:18:37] (step=0304900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0749 +[2025-03-01 18:19:36] (step=0305000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0737 +[2025-03-01 18:20:36] (step=0305100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0761 +[2025-03-01 18:21:36] (step=0305200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0757 +[2025-03-01 18:22:38] (step=0305300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0748 +[2025-03-01 18:23:38] (step=0305400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0762 +[2025-03-01 18:24:38] (step=0305500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0733 +[2025-03-01 18:25:38] (step=0305600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0746 +[2025-03-01 18:26:37] (step=0305700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 18:27:37] (step=0305800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0784 +[2025-03-01 18:28:36] (step=0305900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0752 +[2025-03-01 18:29:36] (step=0306000) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 18:30:35] (step=0306100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0726 +[2025-03-01 18:31:35] (step=0306200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0768 +[2025-03-01 18:32:35] (step=0306300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0759 +[2025-03-01 18:33:34] (step=0306400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-01 18:34:34] (step=0306500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 18:35:33] (step=0306600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0728 +[2025-03-01 18:36:33] (step=0306700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0743 +[2025-03-01 18:37:32] (step=0306800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0772 +[2025-03-01 18:38:32] (step=0306900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 18:39:32] (step=0307000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 18:40:31] (step=0307100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0743 +[2025-03-01 18:41:31] (step=0307200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0732 +[2025-03-01 18:42:30] (step=0307300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 18:43:30] (step=0307400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 18:44:29] (step=0307500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0725 +[2025-03-01 18:45:29] (step=0307600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-01 18:46:28] (step=0307700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0730 +[2025-03-01 18:47:31] (step=0307800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0728 +[2025-03-01 18:48:31] (step=0307900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0765 +[2025-03-01 18:49:31] (step=0308000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0729 +[2025-03-01 18:50:30] (step=0308100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0753 +[2025-03-01 18:51:30] (step=0308200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0719 +[2025-03-01 18:52:30] (step=0308300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0748 +[2025-03-01 18:53:30] (step=0308400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0774 +[2025-03-01 18:54:29] (step=0308500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0732 +[2025-03-01 18:55:29] (step=0308600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0749 +[2025-03-01 18:56:29] (step=0308700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0748 +[2025-03-01 18:57:28] (step=0308800) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0716 +[2025-03-01 18:58:28] (step=0308900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 18:59:28] (step=0309000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 19:00:27] (step=0309100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0723 +[2025-03-01 19:01:27] (step=0309200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0725 +[2025-03-01 19:02:26] (step=0309300) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0731 +[2025-03-01 19:03:26] (step=0309400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0723 +[2025-03-01 19:04:25] (step=0309500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0753 +[2025-03-01 19:05:25] (step=0309600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0733 +[2025-03-01 19:06:24] (step=0309700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0732 +[2025-03-01 19:07:24] (step=0309800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0731 +[2025-03-01 19:08:23] (step=0309900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0729 +[2025-03-01 19:09:23] (step=0310000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0730 +[2025-03-01 19:10:23] (step=0310100) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0720 +[2025-03-01 19:11:22] (step=0310200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0743 +[2025-03-01 19:12:25] (step=0310300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0738 +[2025-03-01 19:13:25] (step=0310400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0706 +[2025-03-01 19:14:24] (step=0310500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 19:15:24] (step=0310600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0721 +[2025-03-01 19:16:23] (step=0310700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0748 +[2025-03-01 19:17:23] (step=0310800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0721 +[2025-03-01 19:18:23] (step=0310900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0731 +[2025-03-01 19:19:22] (step=0311000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0718 +[2025-03-01 19:20:22] (step=0311100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0728 +[2025-03-01 19:21:21] (step=0311200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-01 19:22:21] (step=0311300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0732 +[2025-03-01 19:23:20] (step=0311400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0739 +[2025-03-01 19:24:20] (step=0311500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0732 +[2025-03-01 19:25:20] (step=0311600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0712 +[2025-03-01 19:26:19] (step=0311700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 19:27:19] (step=0311800) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0716 +[2025-03-01 19:28:18] (step=0311900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 19:29:18] (step=0312000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0728 +[2025-03-01 19:30:18] (step=0312100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-01 19:31:17] (step=0312200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 19:32:17] (step=0312300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0733 +[2025-03-01 19:33:16] (step=0312400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0747 +[2025-03-01 19:34:16] (step=0312500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0729 +[2025-03-01 19:35:15] (step=0312600) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0748 +[2025-03-01 19:36:15] (step=0312700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0734 +[2025-03-01 19:37:18] (step=0312800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0742 +[2025-03-01 19:38:18] (step=0312900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0718 +[2025-03-01 19:39:17] (step=0313000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0720 +[2025-03-01 19:40:17] (step=0313100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0737 +[2025-03-01 19:41:17] (step=0313200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0745 +[2025-03-01 19:42:16] (step=0313300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0713 +[2025-03-01 19:43:16] (step=0313400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0749 +[2025-03-01 19:44:15] (step=0313500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0696 +[2025-03-01 19:45:15] (step=0313600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-01 19:46:14] (step=0313700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 19:47:14] (step=0313800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0733 +[2025-03-01 19:48:13] (step=0313900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-01 19:49:13] (step=0314000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-01 19:50:12] (step=0314100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0721 +[2025-03-01 19:51:12] (step=0314200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0736 +[2025-03-01 19:52:11] (step=0314300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0688 +[2025-03-01 19:53:11] (step=0314400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 19:54:10] (step=0314500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0732 +[2025-03-01 19:55:10] (step=0314600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0732 +[2025-03-01 19:56:09] (step=0314700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0730 +[2025-03-01 19:57:09] (step=0314800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 19:58:08] (step=0314900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0716 +[2025-03-01 19:59:08] (step=0315000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0713 +[2025-03-01 20:00:08] (step=0315100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0718 +[2025-03-01 20:01:07] (step=0315200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0718 +[2025-03-01 20:02:10] (step=0315300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0710 +[2025-03-01 20:03:10] (step=0315400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0717 +[2025-03-01 20:04:09] (step=0315500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0708 +[2025-03-01 20:05:09] (step=0315600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0729 +[2025-03-01 20:06:09] (step=0315700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0749 +[2025-03-01 20:07:08] (step=0315800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-01 20:08:08] (step=0315900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-01 20:09:07] (step=0316000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0731 +[2025-03-01 20:10:07] (step=0316100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0722 +[2025-03-01 20:11:06] (step=0316200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0729 +[2025-03-01 20:12:06] (step=0316300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0764 +[2025-03-01 20:13:05] (step=0316400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-01 20:14:05] (step=0316500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0764 +[2025-03-01 20:15:04] (step=0316600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-01 20:16:04] (step=0316700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0721 +[2025-03-01 20:17:04] (step=0316800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0720 +[2025-03-01 20:18:03] (step=0316900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0738 +[2025-03-01 20:19:03] (step=0317000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0728 +[2025-03-01 20:20:03] (step=0317100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0734 +[2025-03-01 20:21:02] (step=0317200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0730 +[2025-03-01 20:22:02] (step=0317300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-01 20:23:02] (step=0317400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0698 +[2025-03-01 20:24:01] (step=0317500) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0724 +[2025-03-01 20:25:01] (step=0317600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0741 +[2025-03-01 20:26:01] (step=0317700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0738 +[2025-03-01 20:27:04] (step=0317800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0678 +[2025-03-01 20:28:03] (step=0317900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0740 +[2025-03-01 20:29:03] (step=0318000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 20:30:03] (step=0318100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0704 +[2025-03-01 20:31:02] (step=0318200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0693 +[2025-03-01 20:32:02] (step=0318300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0713 +[2025-03-01 20:33:01] (step=0318400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0704 +[2025-03-01 20:34:01] (step=0318500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0745 +[2025-03-01 20:35:01] (step=0318600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0736 +[2025-03-01 20:36:00] (step=0318700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0696 +[2025-03-01 20:37:00] (step=0318800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 20:37:59] (step=0318900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-01 20:38:59] (step=0319000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-01 20:39:59] (step=0319100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0744 +[2025-03-01 20:40:58] (step=0319200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0730 +[2025-03-01 20:41:58] (step=0319300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-01 20:42:57] (step=0319400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0751 +[2025-03-01 20:43:57] (step=0319500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-01 20:44:56] (step=0319600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0725 +[2025-03-01 20:45:56] (step=0319700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0722 +[2025-03-01 20:46:56] (step=0319800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0712 +[2025-03-01 20:47:55] (step=0319900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0724 +[2025-03-01 20:48:55] (step=0320000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0735 +[2025-03-01 20:49:54] (step=0320100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0733 +[2025-03-01 20:50:54] (step=0320200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0718 +[2025-03-01 20:51:57] (step=0320300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0730 +[2025-03-01 20:52:57] (step=0320400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0708 +[2025-03-01 20:53:56] (step=0320500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0712 +[2025-03-01 20:54:56] (step=0320600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0709 +[2025-03-01 20:55:56] (step=0320700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0734 +[2025-03-01 20:56:55] (step=0320800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0728 +[2025-03-01 20:57:55] (step=0320900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 20:58:54] (step=0321000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-01 20:59:54] (step=0321100) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0723 +[2025-03-01 21:00:53] (step=0321200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 21:01:53] (step=0321300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-01 21:02:53] (step=0321400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 21:03:52] (step=0321500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0715 +[2025-03-01 21:04:52] (step=0321600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0715 +[2025-03-01 21:05:51] (step=0321700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0715 +[2025-03-01 21:06:51] (step=0321800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-01 21:07:51] (step=0321900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0703 +[2025-03-01 21:08:50] (step=0322000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0703 +[2025-03-01 21:09:50] (step=0322100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0724 +[2025-03-01 21:10:49] (step=0322200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-01 21:11:49] (step=0322300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0703 +[2025-03-01 21:12:49] (step=0322400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0772 +[2025-03-01 21:13:48] (step=0322500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0721 +[2025-03-01 21:14:48] (step=0322600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0753 +[2025-03-01 21:15:47] (step=0322700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0766 +[2025-03-01 21:16:50] (step=0322800) Train Loss: 0.0449, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0714 +[2025-03-01 21:17:50] (step=0322900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0751 +[2025-03-01 21:18:50] (step=0323000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0724 +[2025-03-01 21:19:49] (step=0323100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0725 +[2025-03-01 21:20:49] (step=0323200) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0729 +[2025-03-01 21:21:48] (step=0323300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0740 +[2025-03-01 21:22:48] (step=0323400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0741 +[2025-03-01 21:23:48] (step=0323500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0706 +[2025-03-01 21:24:47] (step=0323600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0713 +[2025-03-01 21:25:47] (step=0323700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0721 +[2025-03-01 21:26:46] (step=0323800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-01 21:27:46] (step=0323900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0720 +[2025-03-01 21:28:46] (step=0324000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-01 21:29:45] (step=0324100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0739 +[2025-03-01 21:30:45] (step=0324200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0709 +[2025-03-01 21:31:44] (step=0324300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-01 21:32:44] (step=0324400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0740 +[2025-03-01 21:33:44] (step=0324500) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-01 21:34:43] (step=0324600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0736 +[2025-03-01 21:35:43] (step=0324700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0703 +[2025-03-01 21:36:42] (step=0324800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-01 21:37:42] (step=0324900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-01 21:38:42] (step=0325000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0719 +[2025-03-01 21:39:41] (step=0325100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0713 +[2025-03-01 21:40:41] (step=0325200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0698 +[2025-03-01 21:41:44] (step=0325300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0700 +[2025-03-01 21:42:44] (step=0325400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0722 +[2025-03-01 21:43:43] (step=0325500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0700 +[2025-03-01 21:44:43] (step=0325600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-01 21:45:43] (step=0325700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0706 +[2025-03-01 21:46:42] (step=0325800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0681 +[2025-03-01 21:47:42] (step=0325900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0684 +[2025-03-01 21:48:41] (step=0326000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0726 +[2025-03-01 21:49:41] (step=0326100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-01 21:50:41] (step=0326200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0726 +[2025-03-01 21:51:40] (step=0326300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0706 +[2025-03-01 21:52:40] (step=0326400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0720 +[2025-03-01 21:53:39] (step=0326500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0713 +[2025-03-01 21:54:39] (step=0326600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-01 21:55:38] (step=0326700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0699 +[2025-03-01 21:56:38] (step=0326800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-01 21:57:38] (step=0326900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0694 +[2025-03-01 21:58:37] (step=0327000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0719 +[2025-03-01 21:59:37] (step=0327100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0698 +[2025-03-01 22:00:36] (step=0327200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0724 +[2025-03-01 22:01:36] (step=0327300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0716 +[2025-03-01 22:02:36] (step=0327400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0697 +[2025-03-01 22:03:35] (step=0327500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0722 +[2025-03-01 22:04:35] (step=0327600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0692 +[2025-03-01 22:05:34] (step=0327700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0722 +[2025-03-01 22:06:37] (step=0327800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0695 +[2025-03-01 22:07:37] (step=0327900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0721 +[2025-03-01 22:08:37] (step=0328000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-01 22:09:36] (step=0328100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0728 +[2025-03-01 22:10:36] (step=0328200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-01 22:11:35] (step=0328300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0725 +[2025-03-01 22:12:35] (step=0328400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-01 22:13:35] (step=0328500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0713 +[2025-03-01 22:14:34] (step=0328600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0719 +[2025-03-01 22:15:34] (step=0328700) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0693 +[2025-03-01 22:16:33] (step=0328800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-01 22:17:33] (step=0328900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0690 +[2025-03-01 22:18:33] (step=0329000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-01 22:19:32] (step=0329100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-01 22:20:32] (step=0329200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0688 +[2025-03-01 22:21:31] (step=0329300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0718 +[2025-03-01 22:22:31] (step=0329400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-01 22:23:30] (step=0329500) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0707 +[2025-03-01 22:24:30] (step=0329600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0703 +[2025-03-01 22:25:30] (step=0329700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0709 +[2025-03-01 22:26:29] (step=0329800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0729 +[2025-03-01 22:27:29] (step=0329900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0715 +[2025-03-01 22:28:28] (step=0330000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0705 +[2025-03-01 22:29:28] (step=0330100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0721 +[2025-03-01 22:30:28] (step=0330200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-01 22:31:30] (step=0330300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0689 +[2025-03-01 22:32:30] (step=0330400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0722 +[2025-03-01 22:33:30] (step=0330500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0690 +[2025-03-01 22:34:29] (step=0330600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-01 22:35:29] (step=0330700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0749 +[2025-03-01 22:36:29] (step=0330800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0697 +[2025-03-01 22:37:28] (step=0330900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0729 +[2025-03-01 22:38:28] (step=0331000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0699 +[2025-03-01 22:39:27] (step=0331100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0723 +[2025-03-01 22:40:27] (step=0331200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0720 +[2025-03-01 22:41:27] (step=0331300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0751 +[2025-03-01 22:42:26] (step=0331400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-01 22:43:26] (step=0331500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0690 +[2025-03-01 22:44:25] (step=0331600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-01 22:45:25] (step=0331700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-01 22:46:24] (step=0331800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0727 +[2025-03-01 22:47:24] (step=0331900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-01 22:48:24] (step=0332000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0715 +[2025-03-01 22:49:23] (step=0332100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-01 22:50:23] (step=0332200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0702 +[2025-03-01 22:51:22] (step=0332300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0701 +[2025-03-01 22:52:22] (step=0332400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0692 +[2025-03-01 22:53:22] (step=0332500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0726 +[2025-03-01 22:54:21] (step=0332600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0711 +[2025-03-01 22:55:21] (step=0332700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0706 +[2025-03-01 22:56:24] (step=0332800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0724 +[2025-03-01 22:57:23] (step=0332900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0716 +[2025-03-01 22:58:23] (step=0333000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0719 +[2025-03-01 22:59:22] (step=0333100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0716 +[2025-03-01 23:00:22] (step=0333200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-01 23:01:21] (step=0333300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0711 +[2025-03-01 23:02:21] (step=0333400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0706 +[2025-03-01 23:03:21] (step=0333500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0668 +[2025-03-01 23:04:20] (step=0333600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0716 +[2025-03-01 23:05:20] (step=0333700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-01 23:06:19] (step=0333800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-01 23:07:19] (step=0333900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-01 23:08:18] (step=0334000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0730 +[2025-03-01 23:09:18] (step=0334100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0706 +[2025-03-01 23:10:17] (step=0334200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-01 23:11:17] (step=0334300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0698 +[2025-03-01 23:12:17] (step=0334400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-01 23:13:16] (step=0334500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0683 +[2025-03-01 23:14:16] (step=0334600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-01 23:15:15] (step=0334700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-01 23:16:15] (step=0334800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0692 +[2025-03-01 23:17:14] (step=0334900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0718 +[2025-03-01 23:18:14] (step=0335000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0693 +[2025-03-01 23:19:13] (step=0335100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0696 +[2025-03-01 23:20:13] (step=0335200) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0694 +[2025-03-01 23:21:16] (step=0335300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0686 +[2025-03-01 23:22:16] (step=0335400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0700 +[2025-03-01 23:23:15] (step=0335500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0673 +[2025-03-01 23:24:15] (step=0335600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0724 +[2025-03-01 23:25:14] (step=0335700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0698 +[2025-03-01 23:26:14] (step=0335800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-01 23:27:13] (step=0335900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-01 23:28:13] (step=0336000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-01 23:29:13] (step=0336100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0721 +[2025-03-01 23:30:12] (step=0336200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0704 +[2025-03-01 23:31:12] (step=0336300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0681 +[2025-03-01 23:32:11] (step=0336400) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-01 23:33:11] (step=0336500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-01 23:34:10] (step=0336600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0707 +[2025-03-01 23:35:10] (step=0336700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0696 +[2025-03-01 23:36:09] (step=0336800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0699 +[2025-03-01 23:37:09] (step=0336900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-01 23:38:08] (step=0337000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0715 +[2025-03-01 23:39:08] (step=0337100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-01 23:40:07] (step=0337200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-01 23:41:07] (step=0337300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-01 23:42:06] (step=0337400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-01 23:43:06] (step=0337500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0683 +[2025-03-01 23:44:05] (step=0337600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0723 +[2025-03-01 23:45:05] (step=0337700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0686 +[2025-03-01 23:46:08] (step=0337800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0698 +[2025-03-01 23:47:08] (step=0337900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0707 +[2025-03-01 23:48:07] (step=0338000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-01 23:49:07] (step=0338100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0703 +[2025-03-01 23:50:06] (step=0338200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-01 23:51:06] (step=0338300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0699 +[2025-03-01 23:52:05] (step=0338400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0697 +[2025-03-01 23:53:05] (step=0338500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-01 23:54:04] (step=0338600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0690 +[2025-03-01 23:55:04] (step=0338700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0707 +[2025-03-01 23:56:03] (step=0338800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0698 +[2025-03-01 23:57:03] (step=0338900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-01 23:58:02] (step=0339000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0686 +[2025-03-01 23:59:02] (step=0339100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0724 +[2025-03-02 00:00:01] (step=0339200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0694 +[2025-03-02 00:01:01] (step=0339300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0707 +[2025-03-02 00:02:00] (step=0339400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0687 +[2025-03-02 00:03:00] (step=0339500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-02 00:03:59] (step=0339600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-02 00:04:59] (step=0339700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0686 +[2025-03-02 00:05:59] (step=0339800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-02 00:06:58] (step=0339900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0667 +[2025-03-02 00:07:58] (step=0340000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0687 +[2025-03-02 00:08:57] (step=0340100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0730 +[2025-03-02 00:09:57] (step=0340200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0703 +[2025-03-02 00:10:59] (step=0340300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0700 +[2025-03-02 00:11:59] (step=0340400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0695 +[2025-03-02 00:12:59] (step=0340500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0704 +[2025-03-02 00:13:59] (step=0340600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0725 +[2025-03-02 00:14:58] (step=0340700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-02 00:15:58] (step=0340800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0704 +[2025-03-02 00:16:57] (step=0340900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0693 +[2025-03-02 00:17:57] (step=0341000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0684 +[2025-03-02 00:18:56] (step=0341100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0692 +[2025-03-02 00:19:56] (step=0341200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-02 00:20:55] (step=0341300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0694 +[2025-03-02 00:21:55] (step=0341400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-02 00:22:54] (step=0341500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0697 +[2025-03-02 00:23:54] (step=0341600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0692 +[2025-03-02 00:24:53] (step=0341700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0701 +[2025-03-02 00:25:53] (step=0341800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0696 +[2025-03-02 00:26:52] (step=0341900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-02 00:27:52] (step=0342000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0679 +[2025-03-02 00:28:52] (step=0342100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-02 00:29:51] (step=0342200) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0697 +[2025-03-02 00:30:51] (step=0342300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0693 +[2025-03-02 00:31:50] (step=0342400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-02 00:32:50] (step=0342500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 00:33:49] (step=0342600) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0705 +[2025-03-02 00:34:49] (step=0342700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0657 +[2025-03-02 00:35:52] (step=0342800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0682 +[2025-03-02 00:36:51] (step=0342900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0696 +[2025-03-02 00:37:51] (step=0343000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0677 +[2025-03-02 00:38:51] (step=0343100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0675 +[2025-03-02 00:39:50] (step=0343200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0692 +[2025-03-02 00:40:50] (step=0343300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0704 +[2025-03-02 00:41:49] (step=0343400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 00:42:49] (step=0343500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-02 00:43:49] (step=0343600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-02 00:44:48] (step=0343700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-02 00:45:48] (step=0343800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-02 00:46:48] (step=0343900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0675 +[2025-03-02 00:47:47] (step=0344000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 00:48:47] (step=0344100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0726 +[2025-03-02 00:49:47] (step=0344200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 00:50:46] (step=0344300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0688 +[2025-03-02 00:51:46] (step=0344400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 00:52:46] (step=0344500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0711 +[2025-03-02 00:53:45] (step=0344600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0692 +[2025-03-02 00:54:45] (step=0344700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0693 +[2025-03-02 00:55:45] (step=0344800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0702 +[2025-03-02 00:56:44] (step=0344900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-02 00:57:44] (step=0345000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0699 +[2025-03-02 00:58:44] (step=0345100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0681 +[2025-03-02 00:59:43] (step=0345200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0719 +[2025-03-02 01:00:46] (step=0345300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0718 +[2025-03-02 01:01:47] (step=0345400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.0719 +[2025-03-02 01:02:46] (step=0345500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-02 01:03:46] (step=0345600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0695 +[2025-03-02 01:04:46] (step=0345700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0675 +[2025-03-02 01:05:45] (step=0345800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-02 01:06:45] (step=0345900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 01:07:45] (step=0346000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0681 +[2025-03-02 01:08:44] (step=0346100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-02 01:09:44] (step=0346200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0697 +[2025-03-02 01:10:44] (step=0346300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0686 +[2025-03-02 01:11:43] (step=0346400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0666 +[2025-03-02 01:12:43] (step=0346500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0673 +[2025-03-02 01:13:42] (step=0346600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-02 01:14:42] (step=0346700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-02 01:15:42] (step=0346800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0686 +[2025-03-02 01:16:41] (step=0346900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0684 +[2025-03-02 01:17:41] (step=0347000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0706 +[2025-03-02 01:18:41] (step=0347100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0694 +[2025-03-02 01:19:40] (step=0347200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0706 +[2025-03-02 01:20:40] (step=0347300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0712 +[2025-03-02 01:21:40] (step=0347400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0702 +[2025-03-02 01:22:39] (step=0347500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0671 +[2025-03-02 01:23:39] (step=0347600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0683 +[2025-03-02 01:24:38] (step=0347700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-02 01:25:41] (step=0347800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.58, Grad Norm: 0.0680 +[2025-03-02 01:26:42] (step=0347900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.0705 +[2025-03-02 01:27:42] (step=0348000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0686 +[2025-03-02 01:28:41] (step=0348100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0684 +[2025-03-02 01:29:41] (step=0348200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 01:30:40] (step=0348300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0703 +[2025-03-02 01:31:40] (step=0348400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0680 +[2025-03-02 01:32:40] (step=0348500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 01:33:40] (step=0348600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0683 +[2025-03-02 01:34:39] (step=0348700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0708 +[2025-03-02 01:35:39] (step=0348800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0703 +[2025-03-02 01:36:39] (step=0348900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0711 +[2025-03-02 01:37:38] (step=0349000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0705 +[2025-03-02 01:38:38] (step=0349100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0681 +[2025-03-02 01:39:38] (step=0349200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0726 +[2025-03-02 01:40:37] (step=0349300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-02 01:41:37] (step=0349400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-02 01:42:36] (step=0349500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-02 01:43:36] (step=0349600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0692 +[2025-03-02 01:44:36] (step=0349700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0687 +[2025-03-02 01:45:35] (step=0349800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0681 +[2025-03-02 01:46:35] (step=0349900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-02 01:47:34] (step=0350000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-02 01:47:38] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0350000.pt +[2025-03-02 01:53:02] (step=0350000), Fid=12.29196212904668, PSNR=27.088790105342866, LPIPS=0.22448259592056274, SSIM=0.7497131824493408 +[2025-03-02 01:54:02] (step=0350100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.26, Grad Norm: 0.0701 +[2025-03-02 01:55:02] (step=0350200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0686 +[2025-03-02 01:56:05] (step=0350300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0664 +[2025-03-02 01:57:05] (step=0350400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0683 +[2025-03-02 01:58:04] (step=0350500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0669 +[2025-03-02 01:59:04] (step=0350600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0677 +[2025-03-02 02:00:04] (step=0350700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0666 +[2025-03-02 02:01:04] (step=0350800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0681 +[2025-03-02 02:02:03] (step=0350900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 02:03:03] (step=0351000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0683 +[2025-03-02 02:04:03] (step=0351100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0683 +[2025-03-02 02:05:02] (step=0351200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 02:06:02] (step=0351300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0687 +[2025-03-02 02:07:02] (step=0351400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0704 +[2025-03-02 02:08:01] (step=0351500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0670 +[2025-03-02 02:09:01] (step=0351600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0680 +[2025-03-02 02:10:01] (step=0351700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0680 +[2025-03-02 02:11:00] (step=0351800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0693 +[2025-03-02 02:12:00] (step=0351900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 02:12:59] (step=0352000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0696 +[2025-03-02 02:13:59] (step=0352100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0658 +[2025-03-02 02:14:59] (step=0352200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0688 +[2025-03-02 02:15:58] (step=0352300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0683 +[2025-03-02 02:16:58] (step=0352400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-02 02:17:58] (step=0352500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0690 +[2025-03-02 02:18:57] (step=0352600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0701 +[2025-03-02 02:19:57] (step=0352700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0701 +[2025-03-02 02:21:00] (step=0352800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0668 +[2025-03-02 02:22:00] (step=0352900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0706 +[2025-03-02 02:22:59] (step=0353000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0680 +[2025-03-02 02:23:59] (step=0353100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 02:24:59] (step=0353200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 02:25:58] (step=0353300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0681 +[2025-03-02 02:26:58] (step=0353400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0676 +[2025-03-02 02:27:58] (step=0353500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0668 +[2025-03-02 02:28:57] (step=0353600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0712 +[2025-03-02 02:29:57] (step=0353700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0657 +[2025-03-02 02:30:56] (step=0353800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0698 +[2025-03-02 02:31:56] (step=0353900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-02 02:32:56] (step=0354000) Train Loss: 0.0450, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 02:33:55] (step=0354100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0668 +[2025-03-02 02:34:55] (step=0354200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0683 +[2025-03-02 02:35:54] (step=0354300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 02:36:54] (step=0354400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0659 +[2025-03-02 02:37:54] (step=0354500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-02 02:38:53] (step=0354600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-02 02:39:53] (step=0354700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-02 02:40:52] (step=0354800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0728 +[2025-03-02 02:41:52] (step=0354900) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-02 02:42:52] (step=0355000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-02 02:43:51] (step=0355100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0711 +[2025-03-02 02:44:51] (step=0355200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0684 +[2025-03-02 02:45:54] (step=0355300) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0670 +[2025-03-02 02:46:54] (step=0355400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0700 +[2025-03-02 02:47:53] (step=0355500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0690 +[2025-03-02 02:48:53] (step=0355600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0702 +[2025-03-02 02:49:53] (step=0355700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-02 02:50:52] (step=0355800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0666 +[2025-03-02 02:51:52] (step=0355900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-02 02:52:51] (step=0356000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0665 +[2025-03-02 02:53:51] (step=0356100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0684 +[2025-03-02 02:54:51] (step=0356200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 02:55:50] (step=0356300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0671 +[2025-03-02 02:56:50] (step=0356400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0698 +[2025-03-02 02:57:49] (step=0356500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 02:58:49] (step=0356600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0665 +[2025-03-02 02:59:49] (step=0356700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 03:00:48] (step=0356800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0659 +[2025-03-02 03:01:48] (step=0356900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 03:02:47] (step=0357000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0673 +[2025-03-02 03:03:47] (step=0357100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 03:04:47] (step=0357200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0699 +[2025-03-02 03:05:46] (step=0357300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0669 +[2025-03-02 03:06:46] (step=0357400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0679 +[2025-03-02 03:07:45] (step=0357500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0653 +[2025-03-02 03:08:45] (step=0357600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 03:09:45] (step=0357700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 03:10:48] (step=0357800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0676 +[2025-03-02 03:11:47] (step=0357900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0688 +[2025-03-02 03:12:47] (step=0358000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0677 +[2025-03-02 03:13:47] (step=0358100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0665 +[2025-03-02 03:14:46] (step=0358200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0705 +[2025-03-02 03:15:46] (step=0358300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0665 +[2025-03-02 03:16:45] (step=0358400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0660 +[2025-03-02 03:17:45] (step=0358500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-02 03:18:44] (step=0358600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0653 +[2025-03-02 03:19:44] (step=0358700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0686 +[2025-03-02 03:20:44] (step=0358800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-02 03:21:43] (step=0358900) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0659 +[2025-03-02 03:22:43] (step=0359000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0680 +[2025-03-02 03:23:42] (step=0359100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0683 +[2025-03-02 03:24:42] (step=0359200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 03:25:41] (step=0359300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-02 03:26:41] (step=0359400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0667 +[2025-03-02 03:27:40] (step=0359500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0673 +[2025-03-02 03:28:40] (step=0359600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0648 +[2025-03-02 03:29:40] (step=0359700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0700 +[2025-03-02 03:30:39] (step=0359800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0676 +[2025-03-02 03:31:39] (step=0359900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 03:32:38] (step=0360000) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-02 03:33:38] (step=0360100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-02 03:34:37] (step=0360200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0665 +[2025-03-02 03:35:40] (step=0360300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0677 +[2025-03-02 03:36:40] (step=0360400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0687 +[2025-03-02 03:37:39] (step=0360500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0669 +[2025-03-02 03:38:39] (step=0360600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 03:39:39] (step=0360700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-02 03:40:38] (step=0360800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-02 03:41:38] (step=0360900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0670 +[2025-03-02 03:42:38] (step=0361000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 03:43:37] (step=0361100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 03:44:37] (step=0361200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0698 +[2025-03-02 03:45:37] (step=0361300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 03:46:36] (step=0361400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0688 +[2025-03-02 03:47:36] (step=0361500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0668 +[2025-03-02 03:48:35] (step=0361600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0696 +[2025-03-02 03:49:35] (step=0361700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0659 +[2025-03-02 03:50:35] (step=0361800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0669 +[2025-03-02 03:51:34] (step=0361900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-02 03:52:34] (step=0362000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-02 03:53:33] (step=0362100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 03:54:33] (step=0362200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0671 +[2025-03-02 03:55:33] (step=0362300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0690 +[2025-03-02 03:56:32] (step=0362400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0708 +[2025-03-02 03:57:32] (step=0362500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0649 +[2025-03-02 03:58:32] (step=0362600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0688 +[2025-03-02 03:59:31] (step=0362700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0668 +[2025-03-02 04:00:34] (step=0362800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0663 +[2025-03-02 04:01:34] (step=0362900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0658 +[2025-03-02 04:02:33] (step=0363000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0714 +[2025-03-02 04:03:33] (step=0363100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 04:04:33] (step=0363200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0702 +[2025-03-02 04:05:32] (step=0363300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 04:06:32] (step=0363400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0710 +[2025-03-02 04:07:31] (step=0363500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0670 +[2025-03-02 04:08:31] (step=0363600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 04:09:31] (step=0363700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0717 +[2025-03-02 04:10:30] (step=0363800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0673 +[2025-03-02 04:11:30] (step=0363900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0694 +[2025-03-02 04:12:29] (step=0364000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0673 +[2025-03-02 04:13:29] (step=0364100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0680 +[2025-03-02 04:14:28] (step=0364200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0676 +[2025-03-02 04:15:28] (step=0364300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0668 +[2025-03-02 04:16:28] (step=0364400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0648 +[2025-03-02 04:17:27] (step=0364500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0654 +[2025-03-02 04:18:27] (step=0364600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 04:19:26] (step=0364700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0660 +[2025-03-02 04:20:26] (step=0364800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0679 +[2025-03-02 04:21:26] (step=0364900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 04:22:25] (step=0365000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 04:23:25] (step=0365100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 04:24:24] (step=0365200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0670 +[2025-03-02 04:25:27] (step=0365300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.0676 +[2025-03-02 04:26:27] (step=0365400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 04:27:26] (step=0365500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0673 +[2025-03-02 04:28:26] (step=0365600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 04:29:25] (step=0365700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 04:30:25] (step=0365800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0673 +[2025-03-02 04:31:25] (step=0365900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 04:32:24] (step=0366000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 04:33:24] (step=0366100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0665 +[2025-03-02 04:34:23] (step=0366200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 04:35:23] (step=0366300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 04:36:23] (step=0366400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-02 04:37:22] (step=0366500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0670 +[2025-03-02 04:38:22] (step=0366600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0667 +[2025-03-02 04:39:21] (step=0366700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0702 +[2025-03-02 04:40:21] (step=0366800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0687 +[2025-03-02 04:41:21] (step=0366900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0680 +[2025-03-02 04:42:20] (step=0367000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0697 +[2025-03-02 04:43:20] (step=0367100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 04:44:20] (step=0367200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0680 +[2025-03-02 04:45:19] (step=0367300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0669 +[2025-03-02 04:46:19] (step=0367400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 04:47:18] (step=0367500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 04:48:18] (step=0367600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 04:49:18] (step=0367700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0650 +[2025-03-02 04:50:20] (step=0367800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.0666 +[2025-03-02 04:51:20] (step=0367900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0705 +[2025-03-02 04:52:20] (step=0368000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0681 +[2025-03-02 04:53:19] (step=0368100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 04:54:19] (step=0368200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 04:55:18] (step=0368300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 04:56:18] (step=0368400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0653 +[2025-03-02 04:57:18] (step=0368500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 04:58:17] (step=0368600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 04:59:17] (step=0368700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0671 +[2025-03-02 05:00:16] (step=0368800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 05:01:16] (step=0368900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 05:02:16] (step=0369000) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0668 +[2025-03-02 05:03:15] (step=0369100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-02 05:04:15] (step=0369200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0657 +[2025-03-02 05:05:14] (step=0369300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0665 +[2025-03-02 05:06:14] (step=0369400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0671 +[2025-03-02 05:07:14] (step=0369500) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0652 +[2025-03-02 05:08:13] (step=0369600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 05:09:13] (step=0369700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 05:10:12] (step=0369800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0696 +[2025-03-02 05:11:12] (step=0369900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0654 +[2025-03-02 05:12:12] (step=0370000) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0666 +[2025-03-02 05:13:11] (step=0370100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 05:14:11] (step=0370200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0650 +[2025-03-02 05:15:13] (step=0370300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.0698 +[2025-03-02 05:16:13] (step=0370400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0675 +[2025-03-02 05:17:13] (step=0370500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 05:18:12] (step=0370600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0671 +[2025-03-02 05:19:12] (step=0370700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0691 +[2025-03-02 05:20:12] (step=0370800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 05:21:11] (step=0370900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-02 05:22:11] (step=0371000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0658 +[2025-03-02 05:23:10] (step=0371100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0669 +[2025-03-02 05:24:10] (step=0371200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0649 +[2025-03-02 05:25:10] (step=0371300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-02 05:26:09] (step=0371400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 05:27:09] (step=0371500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0649 +[2025-03-02 05:28:08] (step=0371600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0670 +[2025-03-02 05:29:08] (step=0371700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0658 +[2025-03-02 05:30:07] (step=0371800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-02 05:31:07] (step=0371900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 05:32:07] (step=0372000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0684 +[2025-03-02 05:33:06] (step=0372100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 05:34:06] (step=0372200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 05:35:05] (step=0372300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0659 +[2025-03-02 05:36:05] (step=0372400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0665 +[2025-03-02 05:37:05] (step=0372500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0667 +[2025-03-02 05:38:04] (step=0372600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 05:39:04] (step=0372700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 05:40:07] (step=0372800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0655 +[2025-03-02 05:41:06] (step=0372900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0659 +[2025-03-02 05:42:06] (step=0373000) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 05:43:06] (step=0373100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 05:44:05] (step=0373200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-02 05:45:05] (step=0373300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0682 +[2025-03-02 05:46:04] (step=0373400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0675 +[2025-03-02 05:47:04] (step=0373500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 05:48:04] (step=0373600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-02 05:49:03] (step=0373700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-02 05:50:03] (step=0373800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 05:51:02] (step=0373900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 05:52:02] (step=0374000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0667 +[2025-03-02 05:53:01] (step=0374100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0681 +[2025-03-02 05:54:01] (step=0374200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0661 +[2025-03-02 05:55:01] (step=0374300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 05:56:00] (step=0374400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 05:57:00] (step=0374500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 05:57:59] (step=0374600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 05:58:59] (step=0374700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 05:59:58] (step=0374800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0654 +[2025-03-02 06:00:58] (step=0374900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0667 +[2025-03-02 06:01:58] (step=0375000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0671 +[2025-03-02 06:02:57] (step=0375100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 06:03:57] (step=0375200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 06:04:57] (step=0375300) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.65, Grad Norm: 0.0699 +[2025-03-02 06:05:59] (step=0375400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.61, Grad Norm: 0.0649 +[2025-03-02 06:06:59] (step=0375500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0670 +[2025-03-02 06:07:59] (step=0375600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0658 +[2025-03-02 06:08:58] (step=0375700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 06:09:58] (step=0375800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 06:10:57] (step=0375900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 06:11:57] (step=0376000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-02 06:12:56] (step=0376100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 06:13:56] (step=0376200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-02 06:14:55] (step=0376300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0658 +[2025-03-02 06:15:55] (step=0376400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0648 +[2025-03-02 06:16:55] (step=0376500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0669 +[2025-03-02 06:17:54] (step=0376600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0649 +[2025-03-02 06:18:54] (step=0376700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0668 +[2025-03-02 06:19:53] (step=0376800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0673 +[2025-03-02 06:20:53] (step=0376900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 06:21:52] (step=0377000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 06:22:52] (step=0377100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 06:23:52] (step=0377200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-02 06:24:51] (step=0377300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0650 +[2025-03-02 06:25:51] (step=0377400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-02 06:26:50] (step=0377500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0675 +[2025-03-02 06:27:50] (step=0377600) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0675 +[2025-03-02 06:28:49] (step=0377700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 06:29:49] (step=0377800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 06:30:52] (step=0377900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.0681 +[2025-03-02 06:31:51] (step=0378000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 06:32:51] (step=0378100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0685 +[2025-03-02 06:33:50] (step=0378200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0669 +[2025-03-02 06:34:50] (step=0378300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0633 +[2025-03-02 06:35:50] (step=0378400) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0672 +[2025-03-02 06:36:49] (step=0378500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 06:37:49] (step=0378600) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 06:38:48] (step=0378700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0676 +[2025-03-02 06:39:48] (step=0378800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 06:40:47] (step=0378900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 06:41:47] (step=0379000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 06:42:46] (step=0379100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0667 +[2025-03-02 06:43:46] (step=0379200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 06:44:46] (step=0379300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 06:45:45] (step=0379400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 06:46:45] (step=0379500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 06:47:44] (step=0379600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0665 +[2025-03-02 06:48:44] (step=0379700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 06:49:43] (step=0379800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 06:50:43] (step=0379900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 06:51:42] (step=0380000) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0677 +[2025-03-02 06:52:42] (step=0380100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 06:53:42] (step=0380200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0687 +[2025-03-02 06:54:41] (step=0380300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 06:55:44] (step=0380400) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0653 +[2025-03-02 06:56:44] (step=0380500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0625 +[2025-03-02 06:57:43] (step=0380600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0661 +[2025-03-02 06:58:43] (step=0380700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0678 +[2025-03-02 06:59:42] (step=0380800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0649 +[2025-03-02 07:00:42] (step=0380900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0634 +[2025-03-02 07:01:42] (step=0381000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0689 +[2025-03-02 07:02:41] (step=0381100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 07:03:41] (step=0381200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 07:04:40] (step=0381300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0650 +[2025-03-02 07:05:40] (step=0381400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 07:06:39] (step=0381500) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 07:07:39] (step=0381600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 07:08:38] (step=0381700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 07:09:38] (step=0381800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 07:10:38] (step=0381900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0675 +[2025-03-02 07:11:37] (step=0382000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 07:12:37] (step=0382100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0650 +[2025-03-02 07:13:36] (step=0382200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0657 +[2025-03-02 07:14:36] (step=0382300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 07:15:35] (step=0382400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0657 +[2025-03-02 07:16:35] (step=0382500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 07:17:34] (step=0382600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 07:18:34] (step=0382700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 07:19:34] (step=0382800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 07:20:37] (step=0382900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0625 +[2025-03-02 07:21:36] (step=0383000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0679 +[2025-03-02 07:22:36] (step=0383100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0636 +[2025-03-02 07:23:35] (step=0383200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0649 +[2025-03-02 07:24:35] (step=0383300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0643 +[2025-03-02 07:25:35] (step=0383400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0636 +[2025-03-02 07:26:34] (step=0383500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 07:27:34] (step=0383600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 07:28:33] (step=0383700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 07:29:33] (step=0383800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0654 +[2025-03-02 07:30:32] (step=0383900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0658 +[2025-03-02 07:31:32] (step=0384000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0657 +[2025-03-02 07:32:31] (step=0384100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 07:33:31] (step=0384200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0661 +[2025-03-02 07:34:31] (step=0384300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0653 +[2025-03-02 07:35:30] (step=0384400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 07:36:30] (step=0384500) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0650 +[2025-03-02 07:37:29] (step=0384600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0643 +[2025-03-02 07:38:29] (step=0384700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 07:39:28] (step=0384800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 07:40:28] (step=0384900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0625 +[2025-03-02 07:41:27] (step=0385000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0659 +[2025-03-02 07:42:27] (step=0385100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0644 +[2025-03-02 07:43:26] (step=0385200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 07:44:26] (step=0385300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0634 +[2025-03-02 07:45:29] (step=0385400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0644 +[2025-03-02 07:46:29] (step=0385500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0645 +[2025-03-02 07:47:28] (step=0385600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 07:48:28] (step=0385700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0667 +[2025-03-02 07:49:28] (step=0385800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 07:50:27] (step=0385900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 07:51:27] (step=0386000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0670 +[2025-03-02 07:52:26] (step=0386100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 07:53:26] (step=0386200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 07:54:25] (step=0386300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 07:55:25] (step=0386400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0636 +[2025-03-02 07:56:24] (step=0386500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0636 +[2025-03-02 07:57:24] (step=0386600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 07:58:24] (step=0386700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0651 +[2025-03-02 07:59:23] (step=0386800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 08:00:23] (step=0386900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0663 +[2025-03-02 08:01:22] (step=0387000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 08:02:22] (step=0387100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 08:03:21] (step=0387200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 08:04:21] (step=0387300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 08:05:20] (step=0387400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 08:06:20] (step=0387500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 08:07:19] (step=0387600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0654 +[2025-03-02 08:08:19] (step=0387700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 08:09:19] (step=0387800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 08:10:21] (step=0387900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0637 +[2025-03-02 08:11:21] (step=0388000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0636 +[2025-03-02 08:12:21] (step=0388100) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 08:13:20] (step=0388200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 08:14:20] (step=0388300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 08:15:19] (step=0388400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0654 +[2025-03-02 08:16:19] (step=0388500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 08:17:18] (step=0388600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0649 +[2025-03-02 08:18:18] (step=0388700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 08:19:18] (step=0388800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0671 +[2025-03-02 08:20:17] (step=0388900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0676 +[2025-03-02 08:21:17] (step=0389000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 08:22:16] (step=0389100) Train Loss: 0.0448, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0649 +[2025-03-02 08:23:16] (step=0389200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 08:24:15] (step=0389300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 08:25:15] (step=0389400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0674 +[2025-03-02 08:26:14] (step=0389500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 08:27:14] (step=0389600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 08:28:13] (step=0389700) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 08:29:13] (step=0389800) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 08:30:13] (step=0389900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0653 +[2025-03-02 08:31:12] (step=0390000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 08:32:12] (step=0390100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 08:33:11] (step=0390200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0643 +[2025-03-02 08:34:11] (step=0390300) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0650 +[2025-03-02 08:35:14] (step=0390400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0625 +[2025-03-02 08:36:14] (step=0390500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0653 +[2025-03-02 08:37:13] (step=0390600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 08:38:13] (step=0390700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0631 +[2025-03-02 08:39:12] (step=0390800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0657 +[2025-03-02 08:40:12] (step=0390900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0648 +[2025-03-02 08:41:11] (step=0391000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0644 +[2025-03-02 08:42:11] (step=0391100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0653 +[2025-03-02 08:43:10] (step=0391200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0657 +[2025-03-02 08:44:10] (step=0391300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 08:45:10] (step=0391400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0634 +[2025-03-02 08:46:09] (step=0391500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0646 +[2025-03-02 08:47:09] (step=0391600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0673 +[2025-03-02 08:48:08] (step=0391700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 08:49:08] (step=0391800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 08:50:07] (step=0391900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0651 +[2025-03-02 08:51:07] (step=0392000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 08:52:06] (step=0392100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0659 +[2025-03-02 08:53:06] (step=0392200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0648 +[2025-03-02 08:54:05] (step=0392300) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 08:55:05] (step=0392400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0643 +[2025-03-02 08:56:05] (step=0392500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 08:57:04] (step=0392600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 08:58:04] (step=0392700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 08:59:03] (step=0392800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 09:00:06] (step=0392900) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0631 +[2025-03-02 09:01:06] (step=0393000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0636 +[2025-03-02 09:02:06] (step=0393100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0649 +[2025-03-02 09:03:05] (step=0393200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 09:04:05] (step=0393300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 09:05:04] (step=0393400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0615 +[2025-03-02 09:06:04] (step=0393500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 09:07:03] (step=0393600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0633 +[2025-03-02 09:08:03] (step=0393700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 09:09:03] (step=0393800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 09:10:02] (step=0393900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 09:11:02] (step=0394000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 09:12:01] (step=0394100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 09:13:01] (step=0394200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0650 +[2025-03-02 09:14:00] (step=0394300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 09:15:00] (step=0394400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 09:15:59] (step=0394500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 09:16:59] (step=0394600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 09:17:59] (step=0394700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0662 +[2025-03-02 09:18:58] (step=0394800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 09:19:58] (step=0394900) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 09:20:57] (step=0395000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0661 +[2025-03-02 09:21:57] (step=0395100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 09:22:56] (step=0395200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0660 +[2025-03-02 09:23:56] (step=0395300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 09:24:59] (step=0395400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0663 +[2025-03-02 09:25:59] (step=0395500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0666 +[2025-03-02 09:26:58] (step=0395600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0661 +[2025-03-02 09:27:58] (step=0395700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 09:28:57] (step=0395800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0634 +[2025-03-02 09:29:57] (step=0395900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0695 +[2025-03-02 09:30:57] (step=0396000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 09:31:56] (step=0396100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 09:32:56] (step=0396200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 09:33:55] (step=0396300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 09:34:55] (step=0396400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 09:35:54] (step=0396500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 09:36:54] (step=0396600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0669 +[2025-03-02 09:37:53] (step=0396700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0615 +[2025-03-02 09:38:53] (step=0396800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 09:39:52] (step=0396900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 09:40:52] (step=0397000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0631 +[2025-03-02 09:41:52] (step=0397100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0660 +[2025-03-02 09:42:51] (step=0397200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 09:43:51] (step=0397300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 09:44:50] (step=0397400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0654 +[2025-03-02 09:45:50] (step=0397500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0659 +[2025-03-02 09:46:49] (step=0397600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0630 +[2025-03-02 09:47:49] (step=0397700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 09:48:48] (step=0397800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 09:49:51] (step=0397900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0627 +[2025-03-02 09:50:51] (step=0398000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 09:51:50] (step=0398100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 09:52:50] (step=0398200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 09:53:49] (step=0398300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0658 +[2025-03-02 09:54:49] (step=0398400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 09:55:49] (step=0398500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 09:56:48] (step=0398600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0648 +[2025-03-02 09:57:48] (step=0398700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 09:58:47] (step=0398800) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 09:59:47] (step=0398900) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 10:00:46] (step=0399000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0667 +[2025-03-02 10:01:46] (step=0399100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0631 +[2025-03-02 10:02:45] (step=0399200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 10:03:45] (step=0399300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0626 +[2025-03-02 10:04:45] (step=0399400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0651 +[2025-03-02 10:05:44] (step=0399500) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 10:06:44] (step=0399600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 10:07:43] (step=0399700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 10:08:43] (step=0399800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 10:09:42] (step=0399900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0644 +[2025-03-02 10:10:42] (step=0400000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 10:10:45] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0400000.pt +[2025-03-02 10:16:09] (step=0400000), Fid=12.238605679240948, PSNR=27.11142971665859, LPIPS=0.22398853302001953, SSIM=0.7503665089607239 +[2025-03-02 10:17:09] (step=0400100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.26, Grad Norm: 0.0624 +[2025-03-02 10:18:09] (step=0400200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0636 +[2025-03-02 10:19:09] (step=0400300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0632 +[2025-03-02 10:20:12] (step=0400400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0615 +[2025-03-02 10:21:12] (step=0400500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0641 +[2025-03-02 10:22:12] (step=0400600) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0618 +[2025-03-02 10:23:11] (step=0400700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0602 +[2025-03-02 10:24:11] (step=0400800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0648 +[2025-03-02 10:25:11] (step=0400900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 10:26:10] (step=0401000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0616 +[2025-03-02 10:27:10] (step=0401100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0636 +[2025-03-02 10:28:10] (step=0401200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 10:29:09] (step=0401300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 10:30:09] (step=0401400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 10:31:08] (step=0401500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 10:32:08] (step=0401600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 10:33:07] (step=0401700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0664 +[2025-03-02 10:34:07] (step=0401800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 10:35:06] (step=0401900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 10:36:06] (step=0402000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 10:37:06] (step=0402100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0648 +[2025-03-02 10:38:05] (step=0402200) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0648 +[2025-03-02 10:39:05] (step=0402300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 10:40:04] (step=0402400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 10:41:04] (step=0402500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0628 +[2025-03-02 10:42:04] (step=0402600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 10:43:03] (step=0402700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 10:44:03] (step=0402800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 10:45:06] (step=0402900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.58, Grad Norm: 0.0647 +[2025-03-02 10:46:06] (step=0403000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.0638 +[2025-03-02 10:47:06] (step=0403100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0638 +[2025-03-02 10:48:06] (step=0403200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0636 +[2025-03-02 10:49:06] (step=0403300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0595 +[2025-03-02 10:50:06] (step=0403400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0659 +[2025-03-02 10:51:06] (step=0403500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0626 +[2025-03-02 10:52:05] (step=0403600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0636 +[2025-03-02 10:53:05] (step=0403700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0633 +[2025-03-02 10:54:05] (step=0403800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0626 +[2025-03-02 10:55:05] (step=0403900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0638 +[2025-03-02 10:56:05] (step=0404000) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0636 +[2025-03-02 10:57:04] (step=0404100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0650 +[2025-03-02 10:58:04] (step=0404200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0634 +[2025-03-02 10:59:04] (step=0404300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0642 +[2025-03-02 11:00:04] (step=0404400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0637 +[2025-03-02 11:01:03] (step=0404500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0656 +[2025-03-02 11:02:03] (step=0404600) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0655 +[2025-03-02 11:03:03] (step=0404700) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0660 +[2025-03-02 11:04:02] (step=0404800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0646 +[2025-03-02 11:05:02] (step=0404900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0649 +[2025-03-02 11:06:02] (step=0405000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0651 +[2025-03-02 11:07:02] (step=0405100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0680 +[2025-03-02 11:08:01] (step=0405200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0652 +[2025-03-02 11:09:01] (step=0405300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0665 +[2025-03-02 11:10:04] (step=0405400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0676 +[2025-03-02 11:11:04] (step=0405500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0645 +[2025-03-02 11:12:04] (step=0405600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 11:13:03] (step=0405700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0651 +[2025-03-02 11:14:03] (step=0405800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0666 +[2025-03-02 11:15:03] (step=0405900) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 11:16:02] (step=0406000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 11:17:02] (step=0406100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 11:18:02] (step=0406200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 11:19:01] (step=0406300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0626 +[2025-03-02 11:20:01] (step=0406400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0626 +[2025-03-02 11:21:01] (step=0406500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 11:22:00] (step=0406600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 11:23:00] (step=0406700) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 11:24:00] (step=0406800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 11:24:59] (step=0406900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 11:25:59] (step=0407000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 11:26:59] (step=0407100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 11:27:58] (step=0407200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 11:28:58] (step=0407300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 11:29:58] (step=0407400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 11:30:57] (step=0407500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 11:31:57] (step=0407600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 11:32:57] (step=0407700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0630 +[2025-03-02 11:33:57] (step=0407800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0630 +[2025-03-02 11:34:59] (step=0407900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0626 +[2025-03-02 11:35:59] (step=0408000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0615 +[2025-03-02 11:36:59] (step=0408100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0633 +[2025-03-02 11:37:59] (step=0408200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0609 +[2025-03-02 11:38:58] (step=0408300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0638 +[2025-03-02 11:39:58] (step=0408400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0638 +[2025-03-02 11:40:58] (step=0408500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0629 +[2025-03-02 11:41:58] (step=0408600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0624 +[2025-03-02 11:42:58] (step=0408700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0622 +[2025-03-02 11:43:57] (step=0408800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0656 +[2025-03-02 11:44:57] (step=0408900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 11:45:57] (step=0409000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 11:46:56] (step=0409100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 11:47:56] (step=0409200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 11:48:55] (step=0409300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 11:49:55] (step=0409400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 11:50:54] (step=0409500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 11:51:54] (step=0409600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 11:52:53] (step=0409700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 11:53:53] (step=0409800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 11:54:52] (step=0409900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0622 +[2025-03-02 11:55:52] (step=0410000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0634 +[2025-03-02 11:56:51] (step=0410100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 11:57:51] (step=0410200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 11:58:50] (step=0410300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 11:59:53] (step=0410400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0608 +[2025-03-02 12:00:53] (step=0410500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0630 +[2025-03-02 12:01:53] (step=0410600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0628 +[2025-03-02 12:02:53] (step=0410700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0626 +[2025-03-02 12:03:52] (step=0410800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0636 +[2025-03-02 12:04:52] (step=0410900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0619 +[2025-03-02 12:05:52] (step=0411000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0645 +[2025-03-02 12:06:51] (step=0411100) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0621 +[2025-03-02 12:07:51] (step=0411200) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0662 +[2025-03-02 12:08:51] (step=0411300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0643 +[2025-03-02 12:09:51] (step=0411400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0619 +[2025-03-02 12:10:50] (step=0411500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0633 +[2025-03-02 12:11:50] (step=0411600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0647 +[2025-03-02 12:12:50] (step=0411700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0621 +[2025-03-02 12:13:50] (step=0411800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0642 +[2025-03-02 12:14:49] (step=0411900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0627 +[2025-03-02 12:15:49] (step=0412000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0629 +[2025-03-02 12:16:49] (step=0412100) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0642 +[2025-03-02 12:17:48] (step=0412200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0608 +[2025-03-02 12:18:48] (step=0412300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0620 +[2025-03-02 12:19:48] (step=0412400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0625 +[2025-03-02 12:20:48] (step=0412500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0626 +[2025-03-02 12:21:47] (step=0412600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0617 +[2025-03-02 12:22:47] (step=0412700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0635 +[2025-03-02 12:23:47] (step=0412800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0625 +[2025-03-02 12:24:50] (step=0412900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0627 +[2025-03-02 12:25:49] (step=0413000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0591 +[2025-03-02 12:26:49] (step=0413100) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0630 +[2025-03-02 12:27:48] (step=0413200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 12:28:48] (step=0413300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 12:29:47] (step=0413400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 12:30:47] (step=0413500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 12:31:46] (step=0413600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0647 +[2025-03-02 12:32:46] (step=0413700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 12:33:45] (step=0413800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0631 +[2025-03-02 12:34:45] (step=0413900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 12:35:45] (step=0414000) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 12:36:44] (step=0414100) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0634 +[2025-03-02 12:37:44] (step=0414200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0650 +[2025-03-02 12:38:43] (step=0414300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 12:39:43] (step=0414400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 12:40:42] (step=0414500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0631 +[2025-03-02 12:41:42] (step=0414600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 12:42:41] (step=0414700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 12:43:41] (step=0414800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 12:44:40] (step=0414900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0648 +[2025-03-02 12:45:40] (step=0415000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 12:46:39] (step=0415100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 12:47:39] (step=0415200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 12:48:38] (step=0415300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 12:49:41] (step=0415400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0643 +[2025-03-02 12:50:41] (step=0415500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0622 +[2025-03-02 12:51:41] (step=0415600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0622 +[2025-03-02 12:52:40] (step=0415700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 12:53:40] (step=0415800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 12:54:40] (step=0415900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0655 +[2025-03-02 12:55:39] (step=0416000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 12:56:39] (step=0416100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 12:57:39] (step=0416200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0643 +[2025-03-02 12:58:38] (step=0416300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0601 +[2025-03-02 12:59:38] (step=0416400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 13:00:38] (step=0416500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 13:01:38] (step=0416600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 13:02:37] (step=0416700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0624 +[2025-03-02 13:03:37] (step=0416800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0635 +[2025-03-02 13:04:37] (step=0416900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 13:05:36] (step=0417000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 13:06:36] (step=0417100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 13:07:35] (step=0417200) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 13:08:35] (step=0417300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 13:09:34] (step=0417400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 13:10:34] (step=0417500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0625 +[2025-03-02 13:11:33] (step=0417600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 13:12:33] (step=0417700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 13:13:32] (step=0417800) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 13:14:35] (step=0417900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0631 +[2025-03-02 13:15:35] (step=0418000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0635 +[2025-03-02 13:16:35] (step=0418100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0626 +[2025-03-02 13:17:34] (step=0418200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0631 +[2025-03-02 13:18:34] (step=0418300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0649 +[2025-03-02 13:19:34] (step=0418400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-02 13:20:33] (step=0418500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0630 +[2025-03-02 13:21:33] (step=0418600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0626 +[2025-03-02 13:22:33] (step=0418700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 13:23:32] (step=0418800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 13:24:32] (step=0418900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0600 +[2025-03-02 13:25:32] (step=0419000) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 13:26:31] (step=0419100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 13:27:31] (step=0419200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 13:28:31] (step=0419300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 13:29:30] (step=0419400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 13:30:30] (step=0419500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 13:31:30] (step=0419600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 13:32:29] (step=0419700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 13:33:29] (step=0419800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0641 +[2025-03-02 13:34:29] (step=0419900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 13:35:28] (step=0420000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 13:36:28] (step=0420100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 13:37:28] (step=0420200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 13:38:27] (step=0420300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 13:39:30] (step=0420400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0615 +[2025-03-02 13:40:30] (step=0420500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0623 +[2025-03-02 13:41:29] (step=0420600) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 13:42:29] (step=0420700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 13:43:28] (step=0420800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 13:44:28] (step=0420900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 13:45:27] (step=0421000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0625 +[2025-03-02 13:46:27] (step=0421100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 13:47:27] (step=0421200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 13:48:26] (step=0421300) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 13:49:26] (step=0421400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 13:50:25] (step=0421500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 13:51:25] (step=0421600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 13:52:24] (step=0421700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 13:53:24] (step=0421800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 13:54:23] (step=0421900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 13:55:23] (step=0422000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 13:56:22] (step=0422100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 13:57:22] (step=0422200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 13:58:21] (step=0422300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0622 +[2025-03-02 13:59:21] (step=0422400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 14:00:20] (step=0422500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 14:01:20] (step=0422600) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0644 +[2025-03-02 14:02:19] (step=0422700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 14:03:19] (step=0422800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 14:04:22] (step=0422900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0610 +[2025-03-02 14:05:21] (step=0423000) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 14:06:21] (step=0423100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 14:07:21] (step=0423200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 14:08:20] (step=0423300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0633 +[2025-03-02 14:09:20] (step=0423400) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 14:10:20] (step=0423500) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 14:11:19] (step=0423600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0661 +[2025-03-02 14:12:19] (step=0423700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0593 +[2025-03-02 14:13:19] (step=0423800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0638 +[2025-03-02 14:14:18] (step=0423900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-02 14:15:18] (step=0424000) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 14:16:18] (step=0424100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 14:17:17] (step=0424200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 14:18:17] (step=0424300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 14:19:17] (step=0424400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 14:20:16] (step=0424500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 14:21:16] (step=0424600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 14:22:16] (step=0424700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 14:23:15] (step=0424800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 14:24:15] (step=0424900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 14:25:15] (step=0425000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0645 +[2025-03-02 14:26:14] (step=0425100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 14:27:14] (step=0425200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 14:28:13] (step=0425300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0631 +[2025-03-02 14:29:16] (step=0425400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0617 +[2025-03-02 14:30:16] (step=0425500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 14:31:15] (step=0425600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 14:32:15] (step=0425700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 14:33:14] (step=0425800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 14:34:14] (step=0425900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 14:35:14] (step=0426000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 14:36:13] (step=0426100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 14:37:13] (step=0426200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 14:38:12] (step=0426300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 14:39:12] (step=0426400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 14:40:11] (step=0426500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0642 +[2025-03-02 14:41:11] (step=0426600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 14:42:10] (step=0426700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 14:43:10] (step=0426800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 14:44:09] (step=0426900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 14:45:09] (step=0427000) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 14:46:08] (step=0427100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 14:47:08] (step=0427200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 14:48:07] (step=0427300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 14:49:07] (step=0427400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 14:50:06] (step=0427500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 14:51:06] (step=0427600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 14:52:05] (step=0427700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 14:53:05] (step=0427800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 14:54:07] (step=0427900) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0606 +[2025-03-02 14:55:07] (step=0428000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0619 +[2025-03-02 14:56:07] (step=0428100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0646 +[2025-03-02 14:57:07] (step=0428200) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0635 +[2025-03-02 14:58:06] (step=0428300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 14:59:06] (step=0428400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 15:00:06] (step=0428500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 15:01:05] (step=0428600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 15:02:05] (step=0428700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 15:03:05] (step=0428800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 15:04:04] (step=0428900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0636 +[2025-03-02 15:05:04] (step=0429000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0630 +[2025-03-02 15:06:03] (step=0429100) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0633 +[2025-03-02 15:07:03] (step=0429200) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 15:08:03] (step=0429300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 15:09:02] (step=0429400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0626 +[2025-03-02 15:10:02] (step=0429500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 15:11:01] (step=0429600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0644 +[2025-03-02 15:12:01] (step=0429700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0622 +[2025-03-02 15:13:00] (step=0429800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 15:14:00] (step=0429900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 15:14:59] (step=0430000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 15:15:59] (step=0430100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 15:16:58] (step=0430200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 15:17:58] (step=0430300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 15:19:01] (step=0430400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0614 +[2025-03-02 15:20:00] (step=0430500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0597 +[2025-03-02 15:21:00] (step=0430600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0600 +[2025-03-02 15:22:00] (step=0430700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 15:22:59] (step=0430800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-02 15:23:59] (step=0430900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 15:24:58] (step=0431000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0585 +[2025-03-02 15:25:58] (step=0431100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 15:26:57] (step=0431200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 15:27:57] (step=0431300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 15:28:57] (step=0431400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 15:29:56] (step=0431500) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 15:30:56] (step=0431600) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-02 15:31:55] (step=0431700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0627 +[2025-03-02 15:32:55] (step=0431800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 15:33:54] (step=0431900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 15:34:54] (step=0432000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 15:35:53] (step=0432100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 15:36:53] (step=0432200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 15:37:52] (step=0432300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 15:38:52] (step=0432400) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 15:39:52] (step=0432500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 15:40:51] (step=0432600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 15:41:51] (step=0432700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0659 +[2025-03-02 15:42:50] (step=0432800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 15:43:53] (step=0432900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0634 +[2025-03-02 15:44:53] (step=0433000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0598 +[2025-03-02 15:45:53] (step=0433100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 15:46:52] (step=0433200) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 15:47:52] (step=0433300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 15:48:52] (step=0433400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 15:49:51] (step=0433500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 15:50:51] (step=0433600) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 15:51:50] (step=0433700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 15:52:50] (step=0433800) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 15:53:50] (step=0433900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 15:54:49] (step=0434000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0615 +[2025-03-02 15:55:49] (step=0434100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 15:56:48] (step=0434200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 15:57:48] (step=0434300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 15:58:48] (step=0434400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0643 +[2025-03-02 15:59:47] (step=0434500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 16:00:47] (step=0434600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0635 +[2025-03-02 16:01:46] (step=0434700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0639 +[2025-03-02 16:02:46] (step=0434800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 16:03:46] (step=0434900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 16:04:45] (step=0435000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 16:05:45] (step=0435100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 16:06:44] (step=0435200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 16:07:44] (step=0435300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 16:08:47] (step=0435400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0600 +[2025-03-02 16:09:47] (step=0435500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0618 +[2025-03-02 16:10:46] (step=0435600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 16:11:46] (step=0435700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 16:12:46] (step=0435800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 16:13:45] (step=0435900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 16:14:45] (step=0436000) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 16:15:45] (step=0436100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 16:16:44] (step=0436200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 16:17:44] (step=0436300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 16:18:44] (step=0436400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 16:19:43] (step=0436500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 16:20:43] (step=0436600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0600 +[2025-03-02 16:21:42] (step=0436700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 16:22:42] (step=0436800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 16:23:42] (step=0436900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 16:24:41] (step=0437000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 16:25:41] (step=0437100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 16:26:40] (step=0437200) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 16:27:40] (step=0437300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0658 +[2025-03-02 16:28:40] (step=0437400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-02 16:29:39] (step=0437500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 16:30:39] (step=0437600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 16:31:38] (step=0437700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0637 +[2025-03-02 16:32:38] (step=0437800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 16:33:41] (step=0437900) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0636 +[2025-03-02 16:34:41] (step=0438000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0632 +[2025-03-02 16:35:40] (step=0438100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 16:36:40] (step=0438200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 16:37:39] (step=0438300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0615 +[2025-03-02 16:38:39] (step=0438400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 16:39:39] (step=0438500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 16:40:38] (step=0438600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 16:41:38] (step=0438700) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 16:42:37] (step=0438800) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 16:43:37] (step=0438900) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 16:44:36] (step=0439000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0600 +[2025-03-02 16:45:36] (step=0439100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 16:46:36] (step=0439200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 16:47:35] (step=0439300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 16:48:35] (step=0439400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0615 +[2025-03-02 16:49:34] (step=0439500) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 16:50:34] (step=0439600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 16:51:34] (step=0439700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 16:52:33] (step=0439800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 16:53:33] (step=0439900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0626 +[2025-03-02 16:54:32] (step=0440000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 16:55:32] (step=0440100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 16:56:31] (step=0440200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 16:57:31] (step=0440300) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 16:58:34] (step=0440400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0599 +[2025-03-02 16:59:34] (step=0440500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 17:00:33] (step=0440600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 17:01:33] (step=0440700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 17:02:33] (step=0440800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 17:03:32] (step=0440900) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 17:04:32] (step=0441000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 17:05:31] (step=0441100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-02 17:06:31] (step=0441200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0625 +[2025-03-02 17:07:30] (step=0441300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 17:08:30] (step=0441400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 17:09:30] (step=0441500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0615 +[2025-03-02 17:10:29] (step=0441600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 17:11:29] (step=0441700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0600 +[2025-03-02 17:12:28] (step=0441800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-02 17:13:28] (step=0441900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 17:14:28] (step=0442000) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 17:15:27] (step=0442100) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0593 +[2025-03-02 17:16:27] (step=0442200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 17:17:26] (step=0442300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 17:18:26] (step=0442400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0625 +[2025-03-02 17:19:26] (step=0442500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 17:20:25] (step=0442600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 17:21:25] (step=0442700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 17:22:24] (step=0442800) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 17:23:27] (step=0442900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0606 +[2025-03-02 17:24:27] (step=0443000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0623 +[2025-03-02 17:25:27] (step=0443100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 17:26:26] (step=0443200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 17:27:26] (step=0443300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 17:28:25] (step=0443400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 17:29:25] (step=0443500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 17:30:25] (step=0443600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 17:31:24] (step=0443700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0633 +[2025-03-02 17:32:24] (step=0443800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-02 17:33:23] (step=0443900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0626 +[2025-03-02 17:34:23] (step=0444000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 17:35:23] (step=0444100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 17:36:22] (step=0444200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-02 17:37:22] (step=0444300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0622 +[2025-03-02 17:38:21] (step=0444400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-02 17:39:21] (step=0444500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 17:40:20] (step=0444600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 17:41:20] (step=0444700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 17:42:20] (step=0444800) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 17:43:19] (step=0444900) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0572 +[2025-03-02 17:44:19] (step=0445000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 17:45:18] (step=0445100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 17:46:18] (step=0445200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0622 +[2025-03-02 17:47:18] (step=0445300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 17:48:21] (step=0445400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0612 +[2025-03-02 17:49:20] (step=0445500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 17:50:20] (step=0445600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 17:51:19] (step=0445700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 17:52:19] (step=0445800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 17:53:19] (step=0445900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 17:54:18] (step=0446000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 17:55:18] (step=0446100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 17:56:17] (step=0446200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 17:57:17] (step=0446300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 17:58:16] (step=0446400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0618 +[2025-03-02 17:59:16] (step=0446500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 18:00:16] (step=0446600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0633 +[2025-03-02 18:01:15] (step=0446700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 18:02:15] (step=0446800) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 18:03:15] (step=0446900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 18:04:14] (step=0447000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 18:05:14] (step=0447100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 18:06:13] (step=0447200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-02 18:07:13] (step=0447300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0625 +[2025-03-02 18:08:13] (step=0447400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0593 +[2025-03-02 18:09:12] (step=0447500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 18:10:12] (step=0447600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 18:11:11] (step=0447700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 18:12:11] (step=0447800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-02 18:13:14] (step=0447900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0582 +[2025-03-02 18:14:13] (step=0448000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 18:15:13] (step=0448100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 18:16:13] (step=0448200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 18:17:12] (step=0448300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 18:18:12] (step=0448400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 18:19:11] (step=0448500) Train Loss: 0.0446, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0619 +[2025-03-02 18:20:11] (step=0448600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0615 +[2025-03-02 18:21:10] (step=0448700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-02 18:22:10] (step=0448800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 18:23:10] (step=0448900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 18:24:09] (step=0449000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 18:25:09] (step=0449100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 18:26:08] (step=0449200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 18:27:08] (step=0449300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-02 18:28:08] (step=0449400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 18:29:07] (step=0449500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 18:30:07] (step=0449600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 18:31:06] (step=0449700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 18:32:06] (step=0449800) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 18:33:05] (step=0449900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 18:34:05] (step=0450000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 18:34:08] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0450000.pt +[2025-03-02 18:39:33] (step=0450000), Fid=12.330832423249944, PSNR=27.134465019989015, LPIPS=0.22432295978069305, SSIM=0.751068115234375 +[2025-03-02 18:40:33] (step=0450100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 0.26, Grad Norm: 0.0625 +[2025-03-02 18:41:33] (step=0450200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0632 +[2025-03-02 18:42:33] (step=0450300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0583 +[2025-03-02 18:43:36] (step=0450400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0601 +[2025-03-02 18:44:35] (step=0450500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0603 +[2025-03-02 18:45:35] (step=0450600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0600 +[2025-03-02 18:46:35] (step=0450700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0611 +[2025-03-02 18:47:35] (step=0450800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0595 +[2025-03-02 18:48:34] (step=0450900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 18:49:34] (step=0451000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 18:50:33] (step=0451100) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 18:51:33] (step=0451200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 18:52:33] (step=0451300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 18:53:32] (step=0451400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 18:54:32] (step=0451500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 18:55:32] (step=0451600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 18:56:31] (step=0451700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 18:57:31] (step=0451800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0625 +[2025-03-02 18:58:30] (step=0451900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0626 +[2025-03-02 18:59:30] (step=0452000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0634 +[2025-03-02 19:00:30] (step=0452100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0633 +[2025-03-02 19:01:29] (step=0452200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 19:02:29] (step=0452300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-02 19:03:28] (step=0452400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 19:04:28] (step=0452500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 19:05:28] (step=0452600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 19:06:27] (step=0452700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0593 +[2025-03-02 19:07:27] (step=0452800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-02 19:08:29] (step=0452900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.0612 +[2025-03-02 19:09:29] (step=0453000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0605 +[2025-03-02 19:10:29] (step=0453100) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0575 +[2025-03-02 19:11:28] (step=0453200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 19:12:28] (step=0453300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 19:13:28] (step=0453400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 19:14:27] (step=0453500) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 19:15:27] (step=0453600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-02 19:16:26] (step=0453700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 19:17:26] (step=0453800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 19:18:26] (step=0453900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-02 19:19:25] (step=0454000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 19:20:25] (step=0454100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-02 19:21:24] (step=0454200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 19:22:24] (step=0454300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 19:23:24] (step=0454400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0570 +[2025-03-02 19:24:23] (step=0454500) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0600 +[2025-03-02 19:25:23] (step=0454600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0570 +[2025-03-02 19:26:22] (step=0454700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-02 19:27:22] (step=0454800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-02 19:28:22] (step=0454900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 19:29:21] (step=0455000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-02 19:30:21] (step=0455100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0631 +[2025-03-02 19:31:20] (step=0455200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0615 +[2025-03-02 19:32:20] (step=0455300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 19:33:23] (step=0455400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0601 +[2025-03-02 19:34:23] (step=0455500) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0601 +[2025-03-02 19:35:22] (step=0455600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0591 +[2025-03-02 19:36:22] (step=0455700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0604 +[2025-03-02 19:37:22] (step=0455800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 19:38:21] (step=0455900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0644 +[2025-03-02 19:39:21] (step=0456000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 19:40:21] (step=0456100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 19:41:20] (step=0456200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 19:42:20] (step=0456300) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-02 19:43:19] (step=0456400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 19:44:19] (step=0456500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-02 19:45:19] (step=0456600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-02 19:46:18] (step=0456700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-02 19:47:18] (step=0456800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-02 19:48:17] (step=0456900) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 19:49:17] (step=0457000) Train Loss: 0.0434, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-02 19:50:16] (step=0457100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-02 19:51:16] (step=0457200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 19:52:16] (step=0457300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0573 +[2025-03-02 19:53:15] (step=0457400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 19:54:15] (step=0457500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 19:55:14] (step=0457600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-02 19:56:14] (step=0457700) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0633 +[2025-03-02 19:57:13] (step=0457800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 19:58:16] (step=0457900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0572 +[2025-03-02 19:59:17] (step=0458000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.66, Grad Norm: 0.0612 +[2025-03-02 20:00:16] (step=0458100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 20:01:16] (step=0458200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0598 +[2025-03-02 20:02:16] (step=0458300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0617 +[2025-03-02 20:03:15] (step=0458400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0623 +[2025-03-02 20:04:15] (step=0458500) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0598 +[2025-03-02 20:05:15] (step=0458600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 20:06:14] (step=0458700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-02 20:07:14] (step=0458800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 20:08:13] (step=0458900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 20:09:13] (step=0459000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 20:10:12] (step=0459100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-02 20:11:12] (step=0459200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-02 20:12:12] (step=0459300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 20:13:11] (step=0459400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0604 +[2025-03-02 20:14:11] (step=0459500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0581 +[2025-03-02 20:15:11] (step=0459600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 20:16:10] (step=0459700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0593 +[2025-03-02 20:17:10] (step=0459800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-02 20:18:09] (step=0459900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 20:19:09] (step=0460000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 20:20:09] (step=0460100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-02 20:21:08] (step=0460200) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-02 20:22:08] (step=0460300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0628 +[2025-03-02 20:23:11] (step=0460400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0605 +[2025-03-02 20:24:11] (step=0460500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0576 +[2025-03-02 20:25:11] (step=0460600) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0608 +[2025-03-02 20:26:10] (step=0460700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0603 +[2025-03-02 20:27:10] (step=0460800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0640 +[2025-03-02 20:28:10] (step=0460900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0593 +[2025-03-02 20:29:09] (step=0461000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0631 +[2025-03-02 20:30:09] (step=0461100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0586 +[2025-03-02 20:31:09] (step=0461200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0607 +[2025-03-02 20:32:09] (step=0461300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-02 20:33:08] (step=0461400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-02 20:34:08] (step=0461500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-02 20:35:08] (step=0461600) Train Loss: 0.0434, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0588 +[2025-03-02 20:36:07] (step=0461700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-02 20:37:07] (step=0461800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-02 20:38:06] (step=0461900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-02 20:39:06] (step=0462000) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 20:40:05] (step=0462100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 20:41:05] (step=0462200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 20:42:05] (step=0462300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0586 +[2025-03-02 20:43:04] (step=0462400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-02 20:44:04] (step=0462500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 20:45:03] (step=0462600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-02 20:46:03] (step=0462700) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 20:47:02] (step=0462800) Train Loss: 0.0447, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-02 20:48:05] (step=0462900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0612 +[2025-03-02 20:49:05] (step=0463000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0596 +[2025-03-02 20:50:05] (step=0463100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 20:51:04] (step=0463200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-02 20:52:04] (step=0463300) Train Loss: 0.0434, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 20:53:03] (step=0463400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-02 20:54:03] (step=0463500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 20:55:02] (step=0463600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 20:56:02] (step=0463700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 20:57:02] (step=0463800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0600 +[2025-03-02 20:58:01] (step=0463900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0643 +[2025-03-02 20:59:01] (step=0464000) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 21:00:00] (step=0464100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 21:01:00] (step=0464200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 21:01:59] (step=0464300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 21:02:59] (step=0464400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 21:03:59] (step=0464500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0620 +[2025-03-02 21:04:58] (step=0464600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 21:05:58] (step=0464700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0557 +[2025-03-02 21:06:57] (step=0464800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-02 21:07:57] (step=0464900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-02 21:08:56] (step=0465000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 21:09:56] (step=0465100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0570 +[2025-03-02 21:10:55] (step=0465200) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-02 21:11:55] (step=0465300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 21:12:58] (step=0465400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0588 +[2025-03-02 21:13:58] (step=0465500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0579 +[2025-03-02 21:14:57] (step=0465600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 21:15:57] (step=0465700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 21:16:57] (step=0465800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 21:17:56] (step=0465900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0608 +[2025-03-02 21:18:56] (step=0466000) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-02 21:19:56] (step=0466100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-02 21:20:55] (step=0466200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 21:21:55] (step=0466300) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 21:22:54] (step=0466400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 21:23:54] (step=0466500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 21:24:53] (step=0466600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 21:25:53] (step=0466700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 21:26:53] (step=0466800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 21:27:52] (step=0466900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-02 21:28:52] (step=0467000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0572 +[2025-03-02 21:29:51] (step=0467100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 21:30:51] (step=0467200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 21:31:50] (step=0467300) Train Loss: 0.0434, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-02 21:32:50] (step=0467400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0573 +[2025-03-02 21:33:49] (step=0467500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 21:34:49] (step=0467600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-02 21:35:49] (step=0467700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 21:36:48] (step=0467800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 21:37:51] (step=0467900) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0573 +[2025-03-02 21:38:51] (step=0468000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0599 +[2025-03-02 21:39:50] (step=0468100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-02 21:40:50] (step=0468200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-02 21:41:50] (step=0468300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-02 21:42:49] (step=0468400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 21:43:49] (step=0468500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-02 21:44:48] (step=0468600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 21:45:48] (step=0468700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0557 +[2025-03-02 21:46:48] (step=0468800) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-02 21:47:47] (step=0468900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 21:48:47] (step=0469000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0560 +[2025-03-02 21:49:46] (step=0469100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 21:50:46] (step=0469200) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-02 21:51:45] (step=0469300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 21:52:45] (step=0469400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 21:53:44] (step=0469500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-02 21:54:44] (step=0469600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 21:55:44] (step=0469700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-02 21:56:43] (step=0469800) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-02 21:57:43] (step=0469900) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 21:58:42] (step=0470000) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-02 21:59:42] (step=0470100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0616 +[2025-03-02 22:00:41] (step=0470200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 22:01:41] (step=0470300) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0603 +[2025-03-02 22:02:44] (step=0470400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0605 +[2025-03-02 22:03:44] (step=0470500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0598 +[2025-03-02 22:04:43] (step=0470600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0611 +[2025-03-02 22:05:43] (step=0470700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0585 +[2025-03-02 22:06:43] (step=0470800) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-02 22:07:42] (step=0470900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-02 22:08:42] (step=0471000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0600 +[2025-03-02 22:09:42] (step=0471100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-02 22:10:41] (step=0471200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0624 +[2025-03-02 22:11:41] (step=0471300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0573 +[2025-03-02 22:12:41] (step=0471400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 22:13:40] (step=0471500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 22:14:40] (step=0471600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-02 22:15:39] (step=0471700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 22:16:39] (step=0471800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-02 22:17:39] (step=0471900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 22:18:38] (step=0472000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 22:19:38] (step=0472100) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0556 +[2025-03-02 22:20:37] (step=0472200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0656 +[2025-03-02 22:21:37] (step=0472300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0557 +[2025-03-02 22:22:37] (step=0472400) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-02 22:23:36] (step=0472500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 22:24:36] (step=0472600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0615 +[2025-03-02 22:25:35] (step=0472700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0586 +[2025-03-02 22:26:35] (step=0472800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 22:27:38] (step=0472900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0588 +[2025-03-02 22:28:38] (step=0473000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0595 +[2025-03-02 22:29:37] (step=0473100) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0592 +[2025-03-02 22:30:37] (step=0473200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0599 +[2025-03-02 22:31:37] (step=0473300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0610 +[2025-03-02 22:32:37] (step=0473400) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 22:33:36] (step=0473500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 22:34:36] (step=0473600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 22:35:35] (step=0473700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0573 +[2025-03-02 22:36:35] (step=0473800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 22:37:35] (step=0473900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0566 +[2025-03-02 22:38:34] (step=0474000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 22:39:34] (step=0474100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-02 22:40:33] (step=0474200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-02 22:41:33] (step=0474300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 22:42:32] (step=0474400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-02 22:43:32] (step=0474500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-02 22:44:32] (step=0474600) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 22:45:31] (step=0474700) Train Loss: 0.0434, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0570 +[2025-03-02 22:46:31] (step=0474800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 22:47:30] (step=0474900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-02 22:48:30] (step=0475000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-02 22:49:30] (step=0475100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0585 +[2025-03-02 22:50:29] (step=0475200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0586 +[2025-03-02 22:51:29] (step=0475300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-02 22:52:31] (step=0475400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0587 +[2025-03-02 22:53:31] (step=0475500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0588 +[2025-03-02 22:54:31] (step=0475600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0586 +[2025-03-02 22:55:31] (step=0475700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0576 +[2025-03-02 22:56:30] (step=0475800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-02 22:57:30] (step=0475900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 22:58:30] (step=0476000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-02 22:59:29] (step=0476100) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-02 23:00:29] (step=0476200) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-02 23:01:28] (step=0476300) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-02 23:02:28] (step=0476400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 23:03:28] (step=0476500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 23:04:27] (step=0476600) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-02 23:05:27] (step=0476700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-02 23:06:26] (step=0476800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-02 23:07:26] (step=0476900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 23:08:26] (step=0477000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-02 23:09:25] (step=0477100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-02 23:10:25] (step=0477200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0577 +[2025-03-02 23:11:24] (step=0477300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0568 +[2025-03-02 23:12:24] (step=0477400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-02 23:13:23] (step=0477500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0609 +[2025-03-02 23:14:23] (step=0477600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0563 +[2025-03-02 23:15:23] (step=0477700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-02 23:16:22] (step=0477800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0585 +[2025-03-02 23:17:25] (step=0477900) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0606 +[2025-03-02 23:18:25] (step=0478000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0614 +[2025-03-02 23:19:25] (step=0478100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 23:20:24] (step=0478200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-02 23:21:24] (step=0478300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-02 23:22:23] (step=0478400) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-02 23:23:23] (step=0478500) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-02 23:24:22] (step=0478600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-02 23:25:22] (step=0478700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 23:26:22] (step=0478800) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-02 23:27:21] (step=0478900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0600 +[2025-03-02 23:28:21] (step=0479000) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-02 23:29:20] (step=0479100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-02 23:30:20] (step=0479200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-02 23:31:19] (step=0479300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0566 +[2025-03-02 23:32:19] (step=0479400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-02 23:33:19] (step=0479500) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-02 23:34:18] (step=0479600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0557 +[2025-03-02 23:35:18] (step=0479700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0577 +[2025-03-02 23:36:17] (step=0479800) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0577 +[2025-03-02 23:37:17] (step=0479900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-02 23:38:16] (step=0480000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0608 +[2025-03-02 23:39:16] (step=0480100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-02 23:40:16] (step=0480200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-02 23:41:15] (step=0480300) Train Loss: 0.0434, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0572 +[2025-03-02 23:42:18] (step=0480400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0582 +[2025-03-02 23:43:18] (step=0480500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0581 +[2025-03-02 23:44:17] (step=0480600) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0545 +[2025-03-02 23:45:17] (step=0480700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-02 23:46:17] (step=0480800) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-02 23:47:16] (step=0480900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-02 23:48:16] (step=0481000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-02 23:49:15] (step=0481100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-02 23:50:15] (step=0481200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0577 +[2025-03-02 23:51:14] (step=0481300) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0577 +[2025-03-02 23:52:14] (step=0481400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0558 +[2025-03-02 23:53:13] (step=0481500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-02 23:54:13] (step=0481600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0564 +[2025-03-02 23:55:13] (step=0481700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-02 23:56:12] (step=0481800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-02 23:57:12] (step=0481900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-02 23:58:11] (step=0482000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0570 +[2025-03-02 23:59:11] (step=0482100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-03 00:00:10] (step=0482200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-03 00:01:10] (step=0482300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0563 +[2025-03-03 00:02:09] (step=0482400) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-03 00:03:09] (step=0482500) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0570 +[2025-03-03 00:04:09] (step=0482600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0562 +[2025-03-03 00:05:08] (step=0482700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-03 00:06:08] (step=0482800) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0569 +[2025-03-03 00:07:10] (step=0482900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.60, Grad Norm: 0.0596 +[2025-03-03 00:08:10] (step=0483000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0586 +[2025-03-03 00:09:10] (step=0483100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-03 00:10:09] (step=0483200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-03 00:11:09] (step=0483300) Train Loss: 0.0444, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0573 +[2025-03-03 00:12:09] (step=0483400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0570 +[2025-03-03 00:13:08] (step=0483500) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0595 +[2025-03-03 00:14:08] (step=0483600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-03 00:15:07] (step=0483700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-03 00:16:07] (step=0483800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0554 +[2025-03-03 00:17:07] (step=0483900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-03 00:18:06] (step=0484000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-03 00:19:06] (step=0484100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0569 +[2025-03-03 00:20:05] (step=0484200) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0586 +[2025-03-03 00:21:05] (step=0484300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-03 00:22:05] (step=0484400) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0559 +[2025-03-03 00:23:04] (step=0484500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-03 00:24:04] (step=0484600) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0552 +[2025-03-03 00:25:03] (step=0484700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0585 +[2025-03-03 00:26:03] (step=0484800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0550 +[2025-03-03 00:27:03] (step=0484900) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0602 +[2025-03-03 00:28:02] (step=0485000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-03 00:29:02] (step=0485100) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-03 00:30:01] (step=0485200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0536 +[2025-03-03 00:31:01] (step=0485300) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-03 00:32:04] (step=0485400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0577 +[2025-03-03 00:33:03] (step=0485500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0610 +[2025-03-03 00:34:03] (step=0485600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-03 00:35:03] (step=0485700) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0577 +[2025-03-03 00:36:02] (step=0485800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-03 00:37:02] (step=0485900) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-03 00:38:01] (step=0486000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-03 00:39:01] (step=0486100) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0562 +[2025-03-03 00:40:00] (step=0486200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0550 +[2025-03-03 00:41:00] (step=0486300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-03 00:41:59] (step=0486400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-03 00:42:59] (step=0486500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0566 +[2025-03-03 00:43:59] (step=0486600) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0568 +[2025-03-03 00:44:58] (step=0486700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0567 +[2025-03-03 00:45:58] (step=0486800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-03 00:46:57] (step=0486900) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0566 +[2025-03-03 00:47:57] (step=0487000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0597 +[2025-03-03 00:48:56] (step=0487100) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0585 +[2025-03-03 00:49:56] (step=0487200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0590 +[2025-03-03 00:50:55] (step=0487300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-03 00:51:55] (step=0487400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-03 00:52:54] (step=0487500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0629 +[2025-03-03 00:53:54] (step=0487600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-03 00:54:53] (step=0487700) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0593 +[2025-03-03 00:55:53] (step=0487800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-03 00:56:56] (step=0487900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0573 +[2025-03-03 00:57:56] (step=0488000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0573 +[2025-03-03 00:58:55] (step=0488100) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-03 00:59:55] (step=0488200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-03 01:00:54] (step=0488300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-03 01:01:54] (step=0488400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-03 01:02:53] (step=0488500) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0612 +[2025-03-03 01:03:53] (step=0488600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-03 01:04:53] (step=0488700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0556 +[2025-03-03 01:05:52] (step=0488800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-03 01:06:52] (step=0488900) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0577 +[2025-03-03 01:07:51] (step=0489000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-03 01:08:51] (step=0489100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-03 01:09:50] (step=0489200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-03 01:10:50] (step=0489300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0564 +[2025-03-03 01:11:49] (step=0489400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-03 01:12:49] (step=0489500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-03 01:13:49] (step=0489600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-03 01:14:48] (step=0489700) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0586 +[2025-03-03 01:15:48] (step=0489800) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-03 01:16:47] (step=0489900) Train Loss: 0.0433, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0559 +[2025-03-03 01:17:47] (step=0490000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0614 +[2025-03-03 01:18:46] (step=0490100) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-03 01:19:46] (step=0490200) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-03 01:20:45] (step=0490300) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0572 +[2025-03-03 01:21:48] (step=0490400) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0529 +[2025-03-03 01:22:48] (step=0490500) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0575 +[2025-03-03 01:23:48] (step=0490600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-03 01:24:47] (step=0490700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0559 +[2025-03-03 01:25:47] (step=0490800) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0565 +[2025-03-03 01:26:46] (step=0490900) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0572 +[2025-03-03 01:27:46] (step=0491000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-03 01:28:45] (step=0491100) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0559 +[2025-03-03 01:29:45] (step=0491200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0561 +[2025-03-03 01:30:44] (step=0491300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-03 01:31:44] (step=0491400) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0563 +[2025-03-03 01:32:44] (step=0491500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0556 +[2025-03-03 01:33:43] (step=0491600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-03 01:34:43] (step=0491700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-03 01:35:42] (step=0491800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0564 +[2025-03-03 01:36:42] (step=0491900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0586 +[2025-03-03 01:37:41] (step=0492000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-03 01:38:41] (step=0492100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0605 +[2025-03-03 01:39:40] (step=0492200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0569 +[2025-03-03 01:40:40] (step=0492300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-03 01:41:39] (step=0492400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-03 01:42:39] (step=0492500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0599 +[2025-03-03 01:43:38] (step=0492600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0568 +[2025-03-03 01:44:38] (step=0492700) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-03 01:45:38] (step=0492800) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0610 +[2025-03-03 01:46:41] (step=0492900) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0590 +[2025-03-03 01:47:40] (step=0493000) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0612 +[2025-03-03 01:48:40] (step=0493100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0578 +[2025-03-03 01:49:40] (step=0493200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-03 01:50:39] (step=0493300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0591 +[2025-03-03 01:51:39] (step=0493400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0613 +[2025-03-03 01:52:38] (step=0493500) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0557 +[2025-03-03 01:53:38] (step=0493600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-03 01:54:37] (step=0493700) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0577 +[2025-03-03 01:55:37] (step=0493800) Train Loss: 0.0445, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0592 +[2025-03-03 01:56:36] (step=0493900) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0584 +[2025-03-03 01:57:36] (step=0494000) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-03 01:58:36] (step=0494100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0566 +[2025-03-03 01:59:35] (step=0494200) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0601 +[2025-03-03 02:00:35] (step=0494300) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-03 02:01:34] (step=0494400) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-03 02:02:34] (step=0494500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-03 02:03:33] (step=0494600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0598 +[2025-03-03 02:04:33] (step=0494700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-03 02:05:32] (step=0494800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0588 +[2025-03-03 02:06:32] (step=0494900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0572 +[2025-03-03 02:07:31] (step=0495000) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0585 +[2025-03-03 02:08:31] (step=0495100) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-03 02:09:31] (step=0495200) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-03 02:10:30] (step=0495300) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0577 +[2025-03-03 02:11:33] (step=0495400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0600 +[2025-03-03 02:12:33] (step=0495500) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0595 +[2025-03-03 02:13:32] (step=0495600) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0585 +[2025-03-03 02:14:32] (step=0495700) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0596 +[2025-03-03 02:15:31] (step=0495800) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0562 +[2025-03-03 02:16:31] (step=0495900) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-03 02:17:31] (step=0496000) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0566 +[2025-03-03 02:18:30] (step=0496100) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0604 +[2025-03-03 02:19:30] (step=0496200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-03 02:20:29] (step=0496300) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0562 +[2025-03-03 02:21:29] (step=0496400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-03 02:22:28] (step=0496500) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-03 02:23:28] (step=0496600) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0576 +[2025-03-03 02:24:27] (step=0496700) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-03 02:25:27] (step=0496800) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-03 02:26:26] (step=0496900) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0606 +[2025-03-03 02:27:26] (step=0497000) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0585 +[2025-03-03 02:28:26] (step=0497100) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0571 +[2025-03-03 02:29:25] (step=0497200) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0578 +[2025-03-03 02:30:25] (step=0497300) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-03 02:31:24] (step=0497400) Train Loss: 0.0436, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0580 +[2025-03-03 02:32:24] (step=0497500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0594 +[2025-03-03 02:33:23] (step=0497600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0583 +[2025-03-03 02:34:23] (step=0497700) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0607 +[2025-03-03 02:35:22] (step=0497800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0587 +[2025-03-03 02:36:25] (step=0497900) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.59, Grad Norm: 0.0578 +[2025-03-03 02:37:25] (step=0498000) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.67, Grad Norm: 0.0571 +[2025-03-03 02:38:24] (step=0498100) Train Loss: 0.0443, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0621 +[2025-03-03 02:39:24] (step=0498200) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0564 +[2025-03-03 02:40:23] (step=0498300) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0555 +[2025-03-03 02:41:23] (step=0498400) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-03 02:42:23] (step=0498500) Train Loss: 0.0440, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0559 +[2025-03-03 02:43:22] (step=0498600) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-03 02:44:22] (step=0498700) Train Loss: 0.0442, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-03 02:45:21] (step=0498800) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0557 +[2025-03-03 02:46:21] (step=0498900) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0581 +[2025-03-03 02:47:20] (step=0499000) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-03 02:48:20] (step=0499100) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0562 +[2025-03-03 02:49:19] (step=0499200) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0589 +[2025-03-03 02:50:19] (step=0499300) Train Loss: 0.0438, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0579 +[2025-03-03 02:51:19] (step=0499400) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0575 +[2025-03-03 02:52:18] (step=0499500) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0554 +[2025-03-03 02:53:18] (step=0499600) Train Loss: 0.0441, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0567 +[2025-03-03 02:54:17] (step=0499700) Train Loss: 0.0435, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0582 +[2025-03-03 02:55:17] (step=0499800) Train Loss: 0.0439, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0611 +[2025-03-03 02:56:16] (step=0499900) Train Loss: 0.0434, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0565 +[2025-03-03 02:57:16] (step=0500000) Train Loss: 0.0437, Perceptual Loss: 0.0000, Cos Loss: 0.0000, Train Steps/Sec: 1.68, Grad Norm: 0.0574 +[2025-03-03 02:57:19] Saved checkpoint to ../logs/flow/flowsdvae_500kx512_lgn0p0/checkpoints/0500000.pt +[2025-03-03 03:02:42] (step=0500000), Fid=12.283589701087067, PSNR=27.15035362932682, LPIPS=0.2239067405462265, SSIM=0.7515549659729004 +[2025-03-03 03:02:43] Done!