diff --git a/.ipynb_checkpoints/config-checkpoint.yaml b/.ipynb_checkpoints/config-checkpoint.yaml new file mode 100644 index 0000000000000000000000000000000000000000..79aa97cc4800999b4e477e20f9d9e3b226f709af --- /dev/null +++ b/.ipynb_checkpoints/config-checkpoint.yaml @@ -0,0 +1,56 @@ +tracker_project_name: memo +output_dir: outputs +resume_from_checkpoint: null +model_name_or_path: memoavatar/memo +vae: stabilityai/sd-vae-ft-mse +gradient_checkpointing: true +gradient_accumulation_steps: 1 +train_batch_size: 2 +max_train_steps: 3500 +num_train_epochs: -1 +enable_xformers_memory_efficient_attention: true +checkpoints_total_limit: 3 +robust_training: true +learning_rate: 1e-5 +max_grad_norm: 1.0 +scale_lr: false +lr_scheduler: constant +lr_warmup_steps: 0 +seed: 42 +mixed_precision: bf16 +use_8bit_adam: false +allow_tf32: true +use_ema: false +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_weight_decay: 0.01 +adam_epsilon: 1e-08 +dataloader_num_workers: 16 +prefetch_factor: 4 +checkpointing_steps: 5000 +data: + width: 512 + height: 512 + num_past_frames: 16 + dynamic_past_frames: false + n_sample_frames: 16 + audio_margin: 2 + metadata_paths: + - assets/embedding/metadata.jsonl +weighting_scheme: logit_normal +logit_mean: 0.0 +logit_std: 1.0 +mode_scale: 1.29 +noise_scheduler_kwargs: + num_train_timesteps: 1000 +train_reference_net: true +train_diffusion_net: true +train_image_proj: true +train_audio_proj: true +trainable_modules: + - to_q + - to_k + - to_v +uncond_img_ratio: 0.05 +uncond_audio_ratio: 0.05 +start_ratio: 0.05 \ No newline at end of file diff --git a/checkpoint-3500/audio_proj/config.json b/checkpoint-3500/audio_proj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bf7703bd940f8da5794d46ea0bcd9a6d4ad381a4 --- /dev/null +++ b/checkpoint-3500/audio_proj/config.json @@ -0,0 +1,5 @@ +{ + "_class_name": "AudioProjModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo" +} diff --git a/checkpoint-3500/audio_proj/diffusion_pytorch_model.safetensors b/checkpoint-3500/audio_proj/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d668d104f4cbd7cbae2f67cc0bb6832e39b3903 --- /dev/null +++ b/checkpoint-3500/audio_proj/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc1c7d4583571f4648f5bf82b70246671d4576837154be38436327f3e8c0e8cc +size 72930976 diff --git a/checkpoint-3500/diffusion_net/config.json b/checkpoint-3500/diffusion_net/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2a8bbbd76d4f42260484e1188f782c049dca4e58 --- /dev/null +++ b/checkpoint-3500/diffusion_net/config.json @@ -0,0 +1,88 @@ +{ + "_center_input_sample": false, + "_class_name": "UNet3DConditionModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo", + "_out_channels": 4, + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "audio_attention_dim": 768, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock3D", + "CrossAttnDownBlock3D", + "CrossAttnDownBlock3D", + "DownBlock3D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "emo_drop_rate": 0.05, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock3DCrossAttn", + "motion_module_kwargs": { + "attention_block_types": [ + "Temporal_Self", + "Temporal_Self" + ], + "num_attention_heads": 8, + "num_transformer_block": 1, + "temporal_attention_dim_div": 1, + "temporal_position_encoding": true, + "temporal_position_encoding_max_len": 32 + }, + "motion_module_resolutions": [ + 1, + 2, + 4, + 8 + ], + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "unet_use_cross_frame_attention": false, + "unet_use_temporal_attention": false, + "up_block_types": [ + "UpBlock3D", + "CrossAttnUpBlock3D", + "CrossAttnUpBlock3D", + "CrossAttnUpBlock3D" + ], + "upcast_attention": false, + "use_inflated_groupnorm": true, + "use_linear_projection": false +} diff --git a/checkpoint-3500/diffusion_net/diffusion_pytorch_model.safetensors b/checkpoint-3500/diffusion_net/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..5c94d023fe6a3028be624fdc67a9b2b7678af675 --- /dev/null +++ b/checkpoint-3500/diffusion_net/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03162a8af72c47e34bff41edb6b1a5d42d6a6e3056f80d2ede70adfb92832572 +size 3356369240 diff --git a/checkpoint-3500/image_proj/config.json b/checkpoint-3500/image_proj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c2c0acbea19270f45543f13d528b2e4830a28370 --- /dev/null +++ b/checkpoint-3500/image_proj/config.json @@ -0,0 +1,5 @@ +{ + "_class_name": "ImageProjModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo" +} diff --git a/checkpoint-3500/image_proj/diffusion_pytorch_model.safetensors b/checkpoint-3500/image_proj/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..087c6a61477663dcf587d17ae8bf03d654ea7bb6 --- /dev/null +++ b/checkpoint-3500/image_proj/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9855dabf683d8c17b265567737bc90e5a0b032db7551b78f028cd9b03439abe5 +size 3155280 diff --git a/checkpoint-3500/optimizer.bin b/checkpoint-3500/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..b566502792f4e960a0720e9ff36ec8b466714f0e --- /dev/null +++ b/checkpoint-3500/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f2ff2008a029d4fb3bea5a39259d9cc3d1b304699aba98f39ddcff257f4a7d1 +size 3270385552 diff --git a/checkpoint-3500/random_states_0.pkl b/checkpoint-3500/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..ad32e0c670c82fc28f13bb5e32c904b4a3363b09 --- /dev/null +++ b/checkpoint-3500/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a9b3d3f1680675aba9b613e2d6261cba04f9f18471e2e84747bbd9e621bf725 +size 14408 diff --git a/checkpoint-3500/reference_net/config.json b/checkpoint-3500/reference_net/config.json new file mode 100644 index 0000000000000000000000000000000000000000..468b6a964243c2158d8899bd46df0df333b110fe --- /dev/null +++ b/checkpoint-3500/reference_net/config.json @@ -0,0 +1,66 @@ +{ + "_center_input_sample": false, + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo", + "_out_channels": 4, + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-3500/reference_net/diffusion_pytorch_model.safetensors b/checkpoint-3500/reference_net/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68202efe149f6eda5567ecb02df46bed5dca4b36 --- /dev/null +++ b/checkpoint-3500/reference_net/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0550a76a5df4c295610040f90075b3bbf64f7d6be58cfc93a9722be1377b2486 +size 1714214152 diff --git a/checkpoint-3500/scheduler.bin b/checkpoint-3500/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..f3290a51934a912d4984ad282affd1f94290c78f --- /dev/null +++ b/checkpoint-3500/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6802221f6347629ca3a6e377a3bbcf1d2a6c0b7ef7e83794854e08587237ffd4 +size 1000 diff --git a/checkpoint-5000/audio_proj/config.json b/checkpoint-5000/audio_proj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bf7703bd940f8da5794d46ea0bcd9a6d4ad381a4 --- /dev/null +++ b/checkpoint-5000/audio_proj/config.json @@ -0,0 +1,5 @@ +{ + "_class_name": "AudioProjModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo" +} diff --git a/checkpoint-5000/audio_proj/diffusion_pytorch_model.safetensors b/checkpoint-5000/audio_proj/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d668d104f4cbd7cbae2f67cc0bb6832e39b3903 --- /dev/null +++ b/checkpoint-5000/audio_proj/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc1c7d4583571f4648f5bf82b70246671d4576837154be38436327f3e8c0e8cc +size 72930976 diff --git a/checkpoint-5000/diffusion_net/config.json b/checkpoint-5000/diffusion_net/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2a8bbbd76d4f42260484e1188f782c049dca4e58 --- /dev/null +++ b/checkpoint-5000/diffusion_net/config.json @@ -0,0 +1,88 @@ +{ + "_center_input_sample": false, + "_class_name": "UNet3DConditionModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo", + "_out_channels": 4, + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "audio_attention_dim": 768, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock3D", + "CrossAttnDownBlock3D", + "CrossAttnDownBlock3D", + "DownBlock3D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "emo_drop_rate": 0.05, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock3DCrossAttn", + "motion_module_kwargs": { + "attention_block_types": [ + "Temporal_Self", + "Temporal_Self" + ], + "num_attention_heads": 8, + "num_transformer_block": 1, + "temporal_attention_dim_div": 1, + "temporal_position_encoding": true, + "temporal_position_encoding_max_len": 32 + }, + "motion_module_resolutions": [ + 1, + 2, + 4, + 8 + ], + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "unet_use_cross_frame_attention": false, + "unet_use_temporal_attention": false, + "up_block_types": [ + "UpBlock3D", + "CrossAttnUpBlock3D", + "CrossAttnUpBlock3D", + "CrossAttnUpBlock3D" + ], + "upcast_attention": false, + "use_inflated_groupnorm": true, + "use_linear_projection": false +} diff --git a/checkpoint-5000/diffusion_net/diffusion_pytorch_model.safetensors b/checkpoint-5000/diffusion_net/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..a1feca0facd9e2a7a9dfc160c4952cfcd7475a6e --- /dev/null +++ b/checkpoint-5000/diffusion_net/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53f04a95f121794e54554f6b8746a239354167a03c70c2d3e6829cabd517754f +size 3356369240 diff --git a/checkpoint-5000/image_proj/config.json b/checkpoint-5000/image_proj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c2c0acbea19270f45543f13d528b2e4830a28370 --- /dev/null +++ b/checkpoint-5000/image_proj/config.json @@ -0,0 +1,5 @@ +{ + "_class_name": "ImageProjModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo" +} diff --git a/checkpoint-5000/image_proj/diffusion_pytorch_model.safetensors b/checkpoint-5000/image_proj/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..087c6a61477663dcf587d17ae8bf03d654ea7bb6 --- /dev/null +++ b/checkpoint-5000/image_proj/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9855dabf683d8c17b265567737bc90e5a0b032db7551b78f028cd9b03439abe5 +size 3155280 diff --git a/checkpoint-5000/optimizer.bin b/checkpoint-5000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..a6cc54fe6c63e329fdb347563286202ab31a805c --- /dev/null +++ b/checkpoint-5000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5932ca6ad987609976876f0e8473b54ee286a9e62778f4152c1de736a8b98c30 +size 3270385552 diff --git a/checkpoint-5000/random_states_0.pkl b/checkpoint-5000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..3e3b6c622c8138de7738f8ec8bc6a9969347efdd --- /dev/null +++ b/checkpoint-5000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0dc7aef135da1cc848c02bc449b185f15582060d87aa35e527e7d944cd090bd +size 14344 diff --git a/checkpoint-5000/reference_net/config.json b/checkpoint-5000/reference_net/config.json new file mode 100644 index 0000000000000000000000000000000000000000..468b6a964243c2158d8899bd46df0df333b110fe --- /dev/null +++ b/checkpoint-5000/reference_net/config.json @@ -0,0 +1,66 @@ +{ + "_center_input_sample": false, + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo", + "_out_channels": 4, + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-5000/reference_net/diffusion_pytorch_model.safetensors b/checkpoint-5000/reference_net/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68202efe149f6eda5567ecb02df46bed5dca4b36 --- /dev/null +++ b/checkpoint-5000/reference_net/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0550a76a5df4c295610040f90075b3bbf64f7d6be58cfc93a9722be1377b2486 +size 1714214152 diff --git a/checkpoint-5000/scheduler.bin b/checkpoint-5000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..976a27de201da5488bc7b42ce6d3ddff38320cae --- /dev/null +++ b/checkpoint-5000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920333155b08e76154b89a85170c320833074db7b84649a9cfe79fd10b6bf2d9 +size 1000 diff --git a/checkpoint-7000/audio_proj/config.json b/checkpoint-7000/audio_proj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..bf7703bd940f8da5794d46ea0bcd9a6d4ad381a4 --- /dev/null +++ b/checkpoint-7000/audio_proj/config.json @@ -0,0 +1,5 @@ +{ + "_class_name": "AudioProjModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo" +} diff --git a/checkpoint-7000/audio_proj/diffusion_pytorch_model.safetensors b/checkpoint-7000/audio_proj/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..6d668d104f4cbd7cbae2f67cc0bb6832e39b3903 --- /dev/null +++ b/checkpoint-7000/audio_proj/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc1c7d4583571f4648f5bf82b70246671d4576837154be38436327f3e8c0e8cc +size 72930976 diff --git a/checkpoint-7000/diffusion_net/config.json b/checkpoint-7000/diffusion_net/config.json new file mode 100644 index 0000000000000000000000000000000000000000..2a8bbbd76d4f42260484e1188f782c049dca4e58 --- /dev/null +++ b/checkpoint-7000/diffusion_net/config.json @@ -0,0 +1,88 @@ +{ + "_center_input_sample": false, + "_class_name": "UNet3DConditionModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo", + "_out_channels": 4, + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "audio_attention_dim": 768, + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock3D", + "CrossAttnDownBlock3D", + "CrossAttnDownBlock3D", + "DownBlock3D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "emo_drop_rate": 0.05, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock3DCrossAttn", + "motion_module_kwargs": { + "attention_block_types": [ + "Temporal_Self", + "Temporal_Self" + ], + "num_attention_heads": 8, + "num_transformer_block": 1, + "temporal_attention_dim_div": 1, + "temporal_position_encoding": true, + "temporal_position_encoding_max_len": 32 + }, + "motion_module_resolutions": [ + 1, + 2, + 4, + 8 + ], + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "unet_use_cross_frame_attention": false, + "unet_use_temporal_attention": false, + "up_block_types": [ + "UpBlock3D", + "CrossAttnUpBlock3D", + "CrossAttnUpBlock3D", + "CrossAttnUpBlock3D" + ], + "upcast_attention": false, + "use_inflated_groupnorm": true, + "use_linear_projection": false +} diff --git a/checkpoint-7000/diffusion_net/diffusion_pytorch_model.safetensors b/checkpoint-7000/diffusion_net/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..8209ee3e0f5cda2a82496b6f01aec3960c5072d9 --- /dev/null +++ b/checkpoint-7000/diffusion_net/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e24b052422aa8c6dc6b0ed81d03492b83928fc0c25d437cecfda6c65b52348c1 +size 3356369240 diff --git a/checkpoint-7000/image_proj/config.json b/checkpoint-7000/image_proj/config.json new file mode 100644 index 0000000000000000000000000000000000000000..c2c0acbea19270f45543f13d528b2e4830a28370 --- /dev/null +++ b/checkpoint-7000/image_proj/config.json @@ -0,0 +1,5 @@ +{ + "_class_name": "ImageProjModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo" +} diff --git a/checkpoint-7000/image_proj/diffusion_pytorch_model.safetensors b/checkpoint-7000/image_proj/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..087c6a61477663dcf587d17ae8bf03d654ea7bb6 --- /dev/null +++ b/checkpoint-7000/image_proj/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9855dabf683d8c17b265567737bc90e5a0b032db7551b78f028cd9b03439abe5 +size 3155280 diff --git a/checkpoint-7000/optimizer.bin b/checkpoint-7000/optimizer.bin new file mode 100644 index 0000000000000000000000000000000000000000..d129b452237c7ed0c6e9b1e791ed9073d386b6ea --- /dev/null +++ b/checkpoint-7000/optimizer.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e6bee6eb8cfb1c8bd3314731385820e5ee5dbb0bd57dbb1a55c1ba676f34c2a +size 3270385552 diff --git a/checkpoint-7000/random_states_0.pkl b/checkpoint-7000/random_states_0.pkl new file mode 100644 index 0000000000000000000000000000000000000000..0492a6e7eaf07cb01234fc90d5fc0149a58c4260 --- /dev/null +++ b/checkpoint-7000/random_states_0.pkl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bc142465f2d168b5cbd99f93129ea9d61c76a52d868f8d39dbbaed3581a6afd +size 14344 diff --git a/checkpoint-7000/reference_net/config.json b/checkpoint-7000/reference_net/config.json new file mode 100644 index 0000000000000000000000000000000000000000..468b6a964243c2158d8899bd46df0df333b110fe --- /dev/null +++ b/checkpoint-7000/reference_net/config.json @@ -0,0 +1,66 @@ +{ + "_center_input_sample": false, + "_class_name": "UNet2DConditionModel", + "_diffusers_version": "0.31.0", + "_name_or_path": "memoavatar/memo", + "_out_channels": 4, + "act_fn": "silu", + "addition_embed_type": null, + "addition_embed_type_num_heads": 64, + "addition_time_embed_dim": null, + "attention_head_dim": 8, + "attention_type": "default", + "block_out_channels": [ + 320, + 640, + 1280, + 1280 + ], + "center_input_sample": false, + "class_embed_type": null, + "class_embeddings_concat": false, + "conv_in_kernel": 3, + "cross_attention_dim": 768, + "down_block_types": [ + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "CrossAttnDownBlock2D", + "DownBlock2D" + ], + "downsample_padding": 1, + "dropout": 0.0, + "dual_cross_attention": false, + "encoder_hid_dim": null, + "encoder_hid_dim_type": null, + "flip_sin_to_cos": true, + "freq_shift": 0, + "in_channels": 4, + "layers_per_block": 2, + "mid_block_only_cross_attention": null, + "mid_block_scale_factor": 1, + "mid_block_type": "UNetMidBlock2DCrossAttn", + "norm_eps": 1e-05, + "norm_num_groups": 32, + "num_attention_heads": null, + "num_class_embeds": null, + "only_cross_attention": false, + "out_channels": 4, + "projection_class_embeddings_input_dim": null, + "resnet_time_scale_shift": "default", + "reverse_transformer_layers_per_block": null, + "sample_size": 64, + "time_cond_proj_dim": null, + "time_embedding_act_fn": null, + "time_embedding_dim": null, + "time_embedding_type": "positional", + "timestep_post_act": null, + "transformer_layers_per_block": 1, + "up_block_types": [ + "UpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D", + "CrossAttnUpBlock2D" + ], + "upcast_attention": false, + "use_linear_projection": false +} diff --git a/checkpoint-7000/reference_net/diffusion_pytorch_model.safetensors b/checkpoint-7000/reference_net/diffusion_pytorch_model.safetensors new file mode 100644 index 0000000000000000000000000000000000000000..68202efe149f6eda5567ecb02df46bed5dca4b36 --- /dev/null +++ b/checkpoint-7000/reference_net/diffusion_pytorch_model.safetensors @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0550a76a5df4c295610040f90075b3bbf64f7d6be58cfc93a9722be1377b2486 +size 1714214152 diff --git a/checkpoint-7000/scheduler.bin b/checkpoint-7000/scheduler.bin new file mode 100644 index 0000000000000000000000000000000000000000..060d6467a94bb456ae140a069e7c9fc0d0d9eefe --- /dev/null +++ b/checkpoint-7000/scheduler.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4f80bd4cf789dadaabab339ee4bbcf7677008e876201ba9229aae4c3d8860b1 +size 1000 diff --git a/config.yaml b/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..ae8903e8f2b660e17edd731ea6970c7a6ef658d5 --- /dev/null +++ b/config.yaml @@ -0,0 +1,55 @@ +tracker_project_name: memo +output_dir: outputs/finetune +resume_from_checkpoint: null +model_name_or_path: memoavatar/memo +vae: stabilityai/sd-vae-ft-mse +gradient_checkpointing: true +gradient_accumulation_steps: 1 +train_batch_size: 1 +max_train_steps: 3500 +num_train_epochs: -1 +enable_xformers_memory_efficient_attention: true +checkpoints_total_limit: 3 +robust_training: true +learning_rate: 1.0e-05 +max_grad_norm: 1.0 +scale_lr: false +lr_scheduler: constant +lr_warmup_steps: 0 +seed: 42 +mixed_precision: bf16 +use_8bit_adam: false +allow_tf32: true +use_ema: false +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_weight_decay: 0.01 +adam_epsilon: 1.0e-08 +dataloader_num_workers: 16 +prefetch_factor: 4 +checkpointing_steps: 5000 +data: + width: 512 + height: 512 + num_past_frames: 16 + dynamic_past_frames: false + n_sample_frames: 16 + audio_margin: 2 + metadata_paths: + - assets/embedding/metadata.jsonl +weighting_scheme: logit_normal +logit_mean: 0.0 +logit_std: 1.0 +mode_scale: 1.29 +noise_scheduler_kwargs: + num_train_timesteps: 1000 +train_reference_net: false +train_diffusion_net: true +train_image_proj: false +train_audio_proj: false +trainable_modules: +- motion_modules +- audio_modules +uncond_img_ratio: 0.05 +uncond_audio_ratio: 0.05 +start_ratio: 0.05 diff --git a/logs/memo/1741022678.2856228/events.out.tfevents.1741022678.3c52c6a06e3b b/logs/memo/1741022678.2856228/events.out.tfevents.1741022678.3c52c6a06e3b new file mode 100644 index 0000000000000000000000000000000000000000..24881d5ec65890ac9cca6df0f9725e11a5d8fe20 --- /dev/null +++ b/logs/memo/1741022678.2856228/events.out.tfevents.1741022678.3c52c6a06e3b @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82468bdd6d38c969094750adaf19ce3778a9c50fd26b45c2e643f9852bcd80fd +size 2329 diff --git a/logs/memo/1741022678.2878249/hparams.yml b/logs/memo/1741022678.2878249/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..c05b5d01f644eace9cb291f5531dd5ae3e3e32e1 --- /dev/null +++ b/logs/memo/1741022678.2878249/hparams.yml @@ -0,0 +1,55 @@ +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_epsilon: 1.0e-08 +adam_weight_decay: 0.01 +allow_tf32: true +checkpointing_steps: 5000 +checkpoints_total_limit: 20 +data: + audio_margin: 2 + dynamic_past_frames: false + height: 512 + metadata_paths: + - data/embedding/metadata.jsonl + n_sample_frames: 16 + num_past_frames: 16 + width: 512 +dataloader_num_workers: 16 +enable_xformers_memory_efficient_attention: true +gradient_accumulation_steps: 1 +gradient_checkpointing: true +learning_rate: 1.0e-05 +logit_mean: 0.0 +logit_std: 1.0 +lr_scheduler: constant +lr_warmup_steps: 0 +max_grad_norm: 1.0 +max_train_steps: 3500 +mixed_precision: bf16 +mode_scale: 1.29 +model_name_or_path: memoavatar/memo +noise_scheduler_kwargs: + num_train_timesteps: 1000 +num_train_epochs: 350 +output_dir: outputs/finetune +prefetch_factor: 4 +resume_from_checkpoint: null +robust_training: true +scale_lr: false +seed: 42 +start_ratio: 0.05 +tracker_project_name: memo +train_audio_proj: false +train_batch_size: 1 +train_diffusion_net: true +train_image_proj: false +train_reference_net: false +trainable_modules: +- motion_modules +- audio_modules +uncond_audio_ratio: 0.05 +uncond_img_ratio: 0.05 +use_8bit_adam: false +use_ema: false +vae: stabilityai/sd-vae-ft-mse +weighting_scheme: logit_normal diff --git a/logs/memo/1741046967.6854546/events.out.tfevents.1741046967.369f90aa7051 b/logs/memo/1741046967.6854546/events.out.tfevents.1741046967.369f90aa7051 new file mode 100644 index 0000000000000000000000000000000000000000..6c70bd85bea3ebb2108a865aa488158967084479 --- /dev/null +++ b/logs/memo/1741046967.6854546/events.out.tfevents.1741046967.369f90aa7051 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:516216cf24c6ea13cf020b0b334970a9d7dcaef079db3a8fd0d3cdbc21aa1b58 +size 2329 diff --git a/logs/memo/1741046967.688156/.ipynb_checkpoints/hparams-checkpoint.yml b/logs/memo/1741046967.688156/.ipynb_checkpoints/hparams-checkpoint.yml new file mode 100644 index 0000000000000000000000000000000000000000..e88e51d9c6a89ea42615575c9021b23aebc20a69 --- /dev/null +++ b/logs/memo/1741046967.688156/.ipynb_checkpoints/hparams-checkpoint.yml @@ -0,0 +1,55 @@ +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_epsilon: 1.0e-08 +adam_weight_decay: 0.01 +allow_tf32: true +checkpointing_steps: 5000 +checkpoints_total_limit: 20 +data: + audio_margin: 2 + dynamic_past_frames: false + height: 512 + metadata_paths: + - data/embedding/metadata.jsonl + n_sample_frames: 16 + num_past_frames: 16 + width: 512 +dataloader_num_workers: 16 +enable_xformers_memory_efficient_attention: true +gradient_accumulation_steps: 1 +gradient_checkpointing: true +learning_rate: 1.0e-05 +logit_mean: 0.0 +logit_std: 1.0 +lr_scheduler: constant +lr_warmup_steps: 0 +max_grad_norm: 1.0 +max_train_steps: 3500 +mixed_precision: bf16 +mode_scale: 1.29 +model_name_or_path: memoavatar/memo +noise_scheduler_kwargs: + num_train_timesteps: 1000 +num_train_epochs: 700 +output_dir: outputs/finetune +prefetch_factor: 4 +resume_from_checkpoint: null +robust_training: true +scale_lr: false +seed: 42 +start_ratio: 0.05 +tracker_project_name: memo +train_audio_proj: false +train_batch_size: 2 +train_diffusion_net: true +train_image_proj: false +train_reference_net: false +trainable_modules: +- motion_modules +- audio_modules +uncond_audio_ratio: 0.05 +uncond_img_ratio: 0.05 +use_8bit_adam: true +use_ema: false +vae: stabilityai/sd-vae-ft-mse +weighting_scheme: logit_normal diff --git a/logs/memo/1741046967.688156/hparams.yml b/logs/memo/1741046967.688156/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..e88e51d9c6a89ea42615575c9021b23aebc20a69 --- /dev/null +++ b/logs/memo/1741046967.688156/hparams.yml @@ -0,0 +1,55 @@ +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_epsilon: 1.0e-08 +adam_weight_decay: 0.01 +allow_tf32: true +checkpointing_steps: 5000 +checkpoints_total_limit: 20 +data: + audio_margin: 2 + dynamic_past_frames: false + height: 512 + metadata_paths: + - data/embedding/metadata.jsonl + n_sample_frames: 16 + num_past_frames: 16 + width: 512 +dataloader_num_workers: 16 +enable_xformers_memory_efficient_attention: true +gradient_accumulation_steps: 1 +gradient_checkpointing: true +learning_rate: 1.0e-05 +logit_mean: 0.0 +logit_std: 1.0 +lr_scheduler: constant +lr_warmup_steps: 0 +max_grad_norm: 1.0 +max_train_steps: 3500 +mixed_precision: bf16 +mode_scale: 1.29 +model_name_or_path: memoavatar/memo +noise_scheduler_kwargs: + num_train_timesteps: 1000 +num_train_epochs: 700 +output_dir: outputs/finetune +prefetch_factor: 4 +resume_from_checkpoint: null +robust_training: true +scale_lr: false +seed: 42 +start_ratio: 0.05 +tracker_project_name: memo +train_audio_proj: false +train_batch_size: 2 +train_diffusion_net: true +train_image_proj: false +train_reference_net: false +trainable_modules: +- motion_modules +- audio_modules +uncond_audio_ratio: 0.05 +uncond_img_ratio: 0.05 +use_8bit_adam: true +use_ema: false +vae: stabilityai/sd-vae-ft-mse +weighting_scheme: logit_normal diff --git a/logs/memo/1741060237.980531/events.out.tfevents.1741060237.369f90aa7051 b/logs/memo/1741060237.980531/events.out.tfevents.1741060237.369f90aa7051 new file mode 100644 index 0000000000000000000000000000000000000000..c01b078b89aa10c87df1f8030446c353683b834e --- /dev/null +++ b/logs/memo/1741060237.980531/events.out.tfevents.1741060237.369f90aa7051 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:657998ec24fdf97d92613eada6193a47b49c50fb100f3b8f5ec4e25dd8d11249 +size 2329 diff --git a/logs/memo/1741060237.983221/hparams.yml b/logs/memo/1741060237.983221/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..e88e51d9c6a89ea42615575c9021b23aebc20a69 --- /dev/null +++ b/logs/memo/1741060237.983221/hparams.yml @@ -0,0 +1,55 @@ +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_epsilon: 1.0e-08 +adam_weight_decay: 0.01 +allow_tf32: true +checkpointing_steps: 5000 +checkpoints_total_limit: 20 +data: + audio_margin: 2 + dynamic_past_frames: false + height: 512 + metadata_paths: + - data/embedding/metadata.jsonl + n_sample_frames: 16 + num_past_frames: 16 + width: 512 +dataloader_num_workers: 16 +enable_xformers_memory_efficient_attention: true +gradient_accumulation_steps: 1 +gradient_checkpointing: true +learning_rate: 1.0e-05 +logit_mean: 0.0 +logit_std: 1.0 +lr_scheduler: constant +lr_warmup_steps: 0 +max_grad_norm: 1.0 +max_train_steps: 3500 +mixed_precision: bf16 +mode_scale: 1.29 +model_name_or_path: memoavatar/memo +noise_scheduler_kwargs: + num_train_timesteps: 1000 +num_train_epochs: 700 +output_dir: outputs/finetune +prefetch_factor: 4 +resume_from_checkpoint: null +robust_training: true +scale_lr: false +seed: 42 +start_ratio: 0.05 +tracker_project_name: memo +train_audio_proj: false +train_batch_size: 2 +train_diffusion_net: true +train_image_proj: false +train_reference_net: false +trainable_modules: +- motion_modules +- audio_modules +uncond_audio_ratio: 0.05 +uncond_img_ratio: 0.05 +use_8bit_adam: true +use_ema: false +vae: stabilityai/sd-vae-ft-mse +weighting_scheme: logit_normal diff --git a/logs/memo/1741060310.7917793/events.out.tfevents.1741060310.369f90aa7051 b/logs/memo/1741060310.7917793/events.out.tfevents.1741060310.369f90aa7051 new file mode 100644 index 0000000000000000000000000000000000000000..b04eb668d23c135293f347a034a69d6f8cf3c068 --- /dev/null +++ b/logs/memo/1741060310.7917793/events.out.tfevents.1741060310.369f90aa7051 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ab603a92f4ae6f27f318a54ebff660a0c9e707799e389f65f2440b9eb176a2 +size 2329 diff --git a/logs/memo/1741060310.7946274/hparams.yml b/logs/memo/1741060310.7946274/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..90d06df871df18abd2fe1b1cf45d2e86bc27d2b9 --- /dev/null +++ b/logs/memo/1741060310.7946274/hparams.yml @@ -0,0 +1,55 @@ +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_epsilon: 1.0e-08 +adam_weight_decay: 0.01 +allow_tf32: true +checkpointing_steps: 5000 +checkpoints_total_limit: 20 +data: + audio_margin: 2 + dynamic_past_frames: false + height: 512 + metadata_paths: + - data/embedding/metadata.jsonl + n_sample_frames: 16 + num_past_frames: 16 + width: 512 +dataloader_num_workers: 16 +enable_xformers_memory_efficient_attention: true +gradient_accumulation_steps: 1 +gradient_checkpointing: true +learning_rate: 1.0e-05 +logit_mean: 0.0 +logit_std: 1.0 +lr_scheduler: constant +lr_warmup_steps: 0 +max_grad_norm: 1.0 +max_train_steps: 3500 +mixed_precision: bf16 +mode_scale: 1.29 +model_name_or_path: memoavatar/memo +noise_scheduler_kwargs: + num_train_timesteps: 1000 +num_train_epochs: 875 +output_dir: outputs/finetune +prefetch_factor: 4 +resume_from_checkpoint: null +robust_training: true +scale_lr: false +seed: 42 +start_ratio: 0.05 +tracker_project_name: memo +train_audio_proj: false +train_batch_size: 3 +train_diffusion_net: true +train_image_proj: false +train_reference_net: false +trainable_modules: +- motion_modules +- audio_modules +uncond_audio_ratio: 0.05 +uncond_img_ratio: 0.05 +use_8bit_adam: true +use_ema: false +vae: stabilityai/sd-vae-ft-mse +weighting_scheme: logit_normal diff --git a/logs/memo/1741060338.6906004/events.out.tfevents.1741060338.369f90aa7051 b/logs/memo/1741060338.6906004/events.out.tfevents.1741060338.369f90aa7051 new file mode 100644 index 0000000000000000000000000000000000000000..54ed1da3ec88ffd7f78e24bc014758f54cd0682e --- /dev/null +++ b/logs/memo/1741060338.6906004/events.out.tfevents.1741060338.369f90aa7051 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5e705e83cd16356a16b87991f60c4e05562b9765a3ef319ff245e211feaf078 +size 2329 diff --git a/logs/memo/1741060338.6932552/hparams.yml b/logs/memo/1741060338.6932552/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..4b349508ba235d2e1d7eba7e7d57b97a33107a82 --- /dev/null +++ b/logs/memo/1741060338.6932552/hparams.yml @@ -0,0 +1,55 @@ +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_epsilon: 1.0e-08 +adam_weight_decay: 0.01 +allow_tf32: true +checkpointing_steps: 5000 +checkpoints_total_limit: 20 +data: + audio_margin: 2 + dynamic_past_frames: false + height: 512 + metadata_paths: + - data/embedding/metadata.jsonl + n_sample_frames: 16 + num_past_frames: 16 + width: 512 +dataloader_num_workers: 16 +enable_xformers_memory_efficient_attention: true +gradient_accumulation_steps: 1 +gradient_checkpointing: true +learning_rate: 1.0e-05 +logit_mean: 0.0 +logit_std: 1.0 +lr_scheduler: constant +lr_warmup_steps: 0 +max_grad_norm: 1.0 +max_train_steps: 3500 +mixed_precision: bf16 +mode_scale: 1.29 +model_name_or_path: memoavatar/memo +noise_scheduler_kwargs: + num_train_timesteps: 1000 +num_train_epochs: 350 +output_dir: outputs/finetune +prefetch_factor: 4 +resume_from_checkpoint: null +robust_training: true +scale_lr: false +seed: 42 +start_ratio: 0.05 +tracker_project_name: memo +train_audio_proj: false +train_batch_size: 1 +train_diffusion_net: true +train_image_proj: false +train_reference_net: false +trainable_modules: +- motion_modules +- audio_modules +uncond_audio_ratio: 0.05 +uncond_img_ratio: 0.05 +use_8bit_adam: true +use_ema: false +vae: stabilityai/sd-vae-ft-mse +weighting_scheme: logit_normal diff --git a/logs/memo/1741145698.900579/events.out.tfevents.1741145698.16e2a27e51cb b/logs/memo/1741145698.900579/events.out.tfevents.1741145698.16e2a27e51cb new file mode 100644 index 0000000000000000000000000000000000000000..de213e0869748bdb66e526d357bc673a35195d97 --- /dev/null +++ b/logs/memo/1741145698.900579/events.out.tfevents.1741145698.16e2a27e51cb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ce7a3b494bd3470fb3b8c6543ac40d7612c5c71a2c1290c5b5fd711fd79ec93 +size 2329 diff --git a/logs/memo/1741145698.903226/hparams.yml b/logs/memo/1741145698.903226/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..4b349508ba235d2e1d7eba7e7d57b97a33107a82 --- /dev/null +++ b/logs/memo/1741145698.903226/hparams.yml @@ -0,0 +1,55 @@ +adam_beta1: 0.9 +adam_beta2: 0.999 +adam_epsilon: 1.0e-08 +adam_weight_decay: 0.01 +allow_tf32: true +checkpointing_steps: 5000 +checkpoints_total_limit: 20 +data: + audio_margin: 2 + dynamic_past_frames: false + height: 512 + metadata_paths: + - data/embedding/metadata.jsonl + n_sample_frames: 16 + num_past_frames: 16 + width: 512 +dataloader_num_workers: 16 +enable_xformers_memory_efficient_attention: true +gradient_accumulation_steps: 1 +gradient_checkpointing: true +learning_rate: 1.0e-05 +logit_mean: 0.0 +logit_std: 1.0 +lr_scheduler: constant +lr_warmup_steps: 0 +max_grad_norm: 1.0 +max_train_steps: 3500 +mixed_precision: bf16 +mode_scale: 1.29 +model_name_or_path: memoavatar/memo +noise_scheduler_kwargs: + num_train_timesteps: 1000 +num_train_epochs: 350 +output_dir: outputs/finetune +prefetch_factor: 4 +resume_from_checkpoint: null +robust_training: true +scale_lr: false +seed: 42 +start_ratio: 0.05 +tracker_project_name: memo +train_audio_proj: false +train_batch_size: 1 +train_diffusion_net: true +train_image_proj: false +train_reference_net: false +trainable_modules: +- motion_modules +- audio_modules +uncond_audio_ratio: 0.05 +uncond_img_ratio: 0.05 +use_8bit_adam: true +use_ema: false +vae: stabilityai/sd-vae-ft-mse +weighting_scheme: logit_normal diff --git a/logs/memo/1741199250.1532586/events.out.tfevents.1741199250.a4f5499e5c53.9131.2 b/logs/memo/1741199250.1532586/events.out.tfevents.1741199250.a4f5499e5c53.9131.2 new file mode 100644 index 0000000000000000000000000000000000000000..21f6b1b057c50bce3db2651f8dd5a1f23f68c6d4 --- /dev/null +++ b/logs/memo/1741199250.1532586/events.out.tfevents.1741199250.a4f5499e5c53.9131.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eacae07a4bb38bc80c79d8ed96e7116a18701eaef7df4baba0e16aa57ab95743 +size 516 diff --git a/logs/memo/1741199250.154769/hparams.yml b/logs/memo/1741199250.154769/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..5bbb2dfe843252444202a8e4a2c31c2e0ca588fa --- /dev/null +++ b/logs/memo/1741199250.154769/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 10 +num_train_epochs: 1 +train_batch_size: 1 diff --git a/logs/memo/1741199250.155282/events.out.tfevents.1741199250.a4f5499e5c53.9131.3 b/logs/memo/1741199250.155282/events.out.tfevents.1741199250.a4f5499e5c53.9131.3 new file mode 100644 index 0000000000000000000000000000000000000000..6737ae8c60ce5c8b8bec0f9ac8cc7c84411d40d9 --- /dev/null +++ b/logs/memo/1741199250.155282/events.out.tfevents.1741199250.a4f5499e5c53.9131.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e9349ffa47cb939f8ba5874fd51009c8006ec0a4b9a9ebd7c3123b4d3b61495 +size 516 diff --git a/logs/memo/1741199250.1561742/hparams.yml b/logs/memo/1741199250.1561742/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..5bbb2dfe843252444202a8e4a2c31c2e0ca588fa --- /dev/null +++ b/logs/memo/1741199250.1561742/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 10 +num_train_epochs: 1 +train_batch_size: 1 diff --git a/logs/memo/1741199336.9286091/events.out.tfevents.1741199336.a4f5499e5c53.10747.2 b/logs/memo/1741199336.9286091/events.out.tfevents.1741199336.a4f5499e5c53.10747.2 new file mode 100644 index 0000000000000000000000000000000000000000..378effd49496ed02e748b12b56071b723f8af8da --- /dev/null +++ b/logs/memo/1741199336.9286091/events.out.tfevents.1741199336.a4f5499e5c53.10747.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b62497d23ff43a5e4402b7a3ea5914328d6d4c42d72894e00726eb28d15676 +size 516 diff --git a/logs/memo/1741199336.9300776/hparams.yml b/logs/memo/1741199336.9300776/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..65f98afc264a21ce3a52d37c96668bd62c05bed4 --- /dev/null +++ b/logs/memo/1741199336.9300776/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 3500 +num_train_epochs: 700 +train_batch_size: 2 diff --git a/logs/memo/1741199336.9306138/events.out.tfevents.1741199336.a4f5499e5c53.10747.3 b/logs/memo/1741199336.9306138/events.out.tfevents.1741199336.a4f5499e5c53.10747.3 new file mode 100644 index 0000000000000000000000000000000000000000..d3d300062a584812611e4a8dfce792ec464ce71f --- /dev/null +++ b/logs/memo/1741199336.9306138/events.out.tfevents.1741199336.a4f5499e5c53.10747.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ce8bfea557aea1b703f7322e2dea3fd0cc8b4fb5400c7a46ed8e8bd69ae11a +size 516 diff --git a/logs/memo/1741199336.9314003/hparams.yml b/logs/memo/1741199336.9314003/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..65f98afc264a21ce3a52d37c96668bd62c05bed4 --- /dev/null +++ b/logs/memo/1741199336.9314003/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 3500 +num_train_epochs: 700 +train_batch_size: 2 diff --git a/logs/memo/1741219597.3638191/events.out.tfevents.1741219597.a4f5499e5c53.205096.2 b/logs/memo/1741219597.3638191/events.out.tfevents.1741219597.a4f5499e5c53.205096.2 new file mode 100644 index 0000000000000000000000000000000000000000..d62e4b4530a3b18fdc3603777ef29b2e35225e1a --- /dev/null +++ b/logs/memo/1741219597.3638191/events.out.tfevents.1741219597.a4f5499e5c53.205096.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b768e39ef2b009c22438103469b11393a7f66ca413404bd0a3faf6ec1489cdc +size 516 diff --git a/logs/memo/1741219597.3651204/hparams.yml b/logs/memo/1741219597.3651204/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..65f98afc264a21ce3a52d37c96668bd62c05bed4 --- /dev/null +++ b/logs/memo/1741219597.3651204/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 3500 +num_train_epochs: 700 +train_batch_size: 2 diff --git a/logs/memo/1741219597.3656578/events.out.tfevents.1741219597.a4f5499e5c53.205096.3 b/logs/memo/1741219597.3656578/events.out.tfevents.1741219597.a4f5499e5c53.205096.3 new file mode 100644 index 0000000000000000000000000000000000000000..6f9012fff20d3cd22c2698e73988dd2983fa08d7 --- /dev/null +++ b/logs/memo/1741219597.3656578/events.out.tfevents.1741219597.a4f5499e5c53.205096.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05d67c2e18dc198b808523a8bd77d9028bd86739ff976a6debc1cc43aa5fee7a +size 516 diff --git a/logs/memo/1741219597.367057/hparams.yml b/logs/memo/1741219597.367057/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..65f98afc264a21ce3a52d37c96668bd62c05bed4 --- /dev/null +++ b/logs/memo/1741219597.367057/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 3500 +num_train_epochs: 700 +train_batch_size: 2 diff --git a/logs/memo/1741219809.924625/events.out.tfevents.1741219809.a4f5499e5c53.207262.2 b/logs/memo/1741219809.924625/events.out.tfevents.1741219809.a4f5499e5c53.207262.2 new file mode 100644 index 0000000000000000000000000000000000000000..42106dd3106765051dfc0fc53925840048b59760 --- /dev/null +++ b/logs/memo/1741219809.924625/events.out.tfevents.1741219809.a4f5499e5c53.207262.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc0079d2839a1233538a54a049224492a1ac9589b22e1ea5307299ca559c0ada +size 516 diff --git a/logs/memo/1741219809.9256084/hparams.yml b/logs/memo/1741219809.9256084/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..65f98afc264a21ce3a52d37c96668bd62c05bed4 --- /dev/null +++ b/logs/memo/1741219809.9256084/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 3500 +num_train_epochs: 700 +train_batch_size: 2 diff --git a/logs/memo/1741219809.926121/events.out.tfevents.1741219809.a4f5499e5c53.207262.3 b/logs/memo/1741219809.926121/events.out.tfevents.1741219809.a4f5499e5c53.207262.3 new file mode 100644 index 0000000000000000000000000000000000000000..10c211394a788b2041a73e837853add346ecb6c5 --- /dev/null +++ b/logs/memo/1741219809.926121/events.out.tfevents.1741219809.a4f5499e5c53.207262.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7f2beed5aa152576583981b9b12c4e583fed66ef5162683fbc536b054144ba5 +size 516 diff --git a/logs/memo/1741219809.927274/hparams.yml b/logs/memo/1741219809.927274/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..65f98afc264a21ce3a52d37c96668bd62c05bed4 --- /dev/null +++ b/logs/memo/1741219809.927274/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 3500 +num_train_epochs: 700 +train_batch_size: 2 diff --git a/logs/memo/1741220040.6413944/events.out.tfevents.1741220040.a4f5499e5c53.212374.2 b/logs/memo/1741220040.6413944/events.out.tfevents.1741220040.a4f5499e5c53.212374.2 new file mode 100644 index 0000000000000000000000000000000000000000..05a868c14a5ebcb86294abd86828cc9cc139fd9d --- /dev/null +++ b/logs/memo/1741220040.6413944/events.out.tfevents.1741220040.a4f5499e5c53.212374.2 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:881dd83989710a0ca14d8592a222a7c7663abf01feee2c6bfc4d7d28305d6d20 +size 516 diff --git a/logs/memo/1741220040.6428657/hparams.yml b/logs/memo/1741220040.6428657/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..e5642c52005416cd4d690ee5d78758e5addf49c6 --- /dev/null +++ b/logs/memo/1741220040.6428657/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 3500 +num_train_epochs: 350 +train_batch_size: 1 diff --git a/logs/memo/1741220040.6434078/events.out.tfevents.1741220040.a4f5499e5c53.212374.3 b/logs/memo/1741220040.6434078/events.out.tfevents.1741220040.a4f5499e5c53.212374.3 new file mode 100644 index 0000000000000000000000000000000000000000..4385a673e5c3e5eeba62495ffbed04409f9a3592 --- /dev/null +++ b/logs/memo/1741220040.6434078/events.out.tfevents.1741220040.a4f5499e5c53.212374.3 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21ba2203003af45b2bcf9badf9f88c75b508c2cf5d7044ab2b6a730df4632ad7 +size 516 diff --git a/logs/memo/1741220040.644948/hparams.yml b/logs/memo/1741220040.644948/hparams.yml new file mode 100644 index 0000000000000000000000000000000000000000..e5642c52005416cd4d690ee5d78758e5addf49c6 --- /dev/null +++ b/logs/memo/1741220040.644948/hparams.yml @@ -0,0 +1,4 @@ +learning_rate: 1.0e-05 +max_train_steps: 3500 +num_train_epochs: 350 +train_batch_size: 1 diff --git a/logs/memo/events.out.tfevents.1741022678.3c52c6a06e3b b/logs/memo/events.out.tfevents.1741022678.3c52c6a06e3b new file mode 100644 index 0000000000000000000000000000000000000000..189f5306bcaf71913a339bbaa93fd5c4181111df --- /dev/null +++ b/logs/memo/events.out.tfevents.1741022678.3c52c6a06e3b @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:634edd0d46439b57037d51e95825d2a55a2bc65e9fad28a7442e85edf3358b78 +size 186798 diff --git a/logs/memo/events.out.tfevents.1741046967.369f90aa7051 b/logs/memo/events.out.tfevents.1741046967.369f90aa7051 new file mode 100644 index 0000000000000000000000000000000000000000..6d3201777b05029b638cf8d1779ea03ace59c314 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741046967.369f90aa7051 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b0e22e72970d95bf8215c0e219e80f630c559f1a6b62cd00dedb7e7b5dbba0f +size 202185 diff --git a/logs/memo/events.out.tfevents.1741060237.369f90aa7051 b/logs/memo/events.out.tfevents.1741060237.369f90aa7051 new file mode 100644 index 0000000000000000000000000000000000000000..6bb256ce3b926b32c645510cae20394ed34f27cf --- /dev/null +++ b/logs/memo/events.out.tfevents.1741060237.369f90aa7051 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ba23232218d9820f3f39bcf4fdf99cedbe43d42d1c61a8be2ea8ebe741d7b5 +size 978 diff --git a/logs/memo/events.out.tfevents.1741060310.369f90aa7051 b/logs/memo/events.out.tfevents.1741060310.369f90aa7051 new file mode 100644 index 0000000000000000000000000000000000000000..4ab84e1dfacb3ba652652c30ea86ed9135ae7b58 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741060310.369f90aa7051 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c70732385fae2a61402fac2559b405fb8154cfa2050a8258b66cae0f43a4b622 +size 81 diff --git a/logs/memo/events.out.tfevents.1741060338.369f90aa7051 b/logs/memo/events.out.tfevents.1741060338.369f90aa7051 new file mode 100644 index 0000000000000000000000000000000000000000..7da36910b92efb943ae2fa61bd6d22af89b80207 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741060338.369f90aa7051 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4af4645f861db61c065c21d2f09683764ebafe22c4eeb3a9d6e8bbe4c77ec04e +size 9069 diff --git a/logs/memo/events.out.tfevents.1741145698.16e2a27e51cb b/logs/memo/events.out.tfevents.1741145698.16e2a27e51cb new file mode 100644 index 0000000000000000000000000000000000000000..d4bc3691dbfa12ac64df56e4972f375fcad82635 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741145698.16e2a27e51cb @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7454da4500601bf693706b2b8713eeca1d97972a376bd5a8d8b45ee8c5eefc7 +size 186798 diff --git a/logs/memo/events.out.tfevents.1741199140.a4f5499e5c53.8865.0 b/logs/memo/events.out.tfevents.1741199140.a4f5499e5c53.8865.0 new file mode 100644 index 0000000000000000000000000000000000000000..c4923f5bf81e4766703eeea6720157c94a1804d2 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741199140.a4f5499e5c53.8865.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f04fd080b4974d869ab788807cb5490ea96f0f161444011c6215ca1c48427a0 +size 88 diff --git a/logs/memo/events.out.tfevents.1741199250.a4f5499e5c53.9131.0 b/logs/memo/events.out.tfevents.1741199250.a4f5499e5c53.9131.0 new file mode 100644 index 0000000000000000000000000000000000000000..b3a3d6948d32ef286338afec8333900789e30078 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741199250.a4f5499e5c53.9131.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0590b60b8082995dbd83b38d089301684a81178e14368467f915c9e3cf94cb13 +size 609 diff --git a/logs/memo/events.out.tfevents.1741199250.a4f5499e5c53.9131.1 b/logs/memo/events.out.tfevents.1741199250.a4f5499e5c53.9131.1 new file mode 100644 index 0000000000000000000000000000000000000000..de7690b0ff120e85b32ce818b5b3d0691ac4ed44 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741199250.a4f5499e5c53.9131.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:436e1e603c528a6eed230673fa4738516d1de093f3c64f4b17b9d1f11aeb18be +size 609 diff --git a/logs/memo/events.out.tfevents.1741199336.a4f5499e5c53.10747.0 b/logs/memo/events.out.tfevents.1741199336.a4f5499e5c53.10747.0 new file mode 100644 index 0000000000000000000000000000000000000000..d216f768d64b8846ee1e7d81cedd26cb3d722747 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741199336.a4f5499e5c53.10747.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55b5458412fcc4a2e426cbea50b5e38f1ac3e5c20d6527be252935f6806a4580 +size 202233 diff --git a/logs/memo/events.out.tfevents.1741199336.a4f5499e5c53.10747.1 b/logs/memo/events.out.tfevents.1741199336.a4f5499e5c53.10747.1 new file mode 100644 index 0000000000000000000000000000000000000000..b1eeefb2c5540633e33358fde35afafdcb205a09 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741199336.a4f5499e5c53.10747.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:843bf195a113a8665705228a54e9ce65ea3d980bc9fece2674c1a4fe2e5ef533 +size 202233 diff --git a/logs/memo/events.out.tfevents.1741219597.a4f5499e5c53.205096.0 b/logs/memo/events.out.tfevents.1741219597.a4f5499e5c53.205096.0 new file mode 100644 index 0000000000000000000000000000000000000000..00d91b0fe1eedd828d8f6a541f4887baf8ca5da6 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741219597.a4f5499e5c53.205096.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8fec8a10443f203fe8ec7f5d6c712bb716273e5cae76fe7b490a1ef64bcff3e +size 743 diff --git a/logs/memo/events.out.tfevents.1741219597.a4f5499e5c53.205096.1 b/logs/memo/events.out.tfevents.1741219597.a4f5499e5c53.205096.1 new file mode 100644 index 0000000000000000000000000000000000000000..f76a8e0344ccddc85b80d525dd335e7b3fd8b1b0 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741219597.a4f5499e5c53.205096.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:951be82426b4ed9196b274e6f3f00380ec764112e032ceb34433e9debe743121 +size 743 diff --git a/logs/memo/events.out.tfevents.1741219809.a4f5499e5c53.207262.0 b/logs/memo/events.out.tfevents.1741219809.a4f5499e5c53.207262.0 new file mode 100644 index 0000000000000000000000000000000000000000..4d27312d708b0d102ca05b7eb9a8e9592e3d29cc --- /dev/null +++ b/logs/memo/events.out.tfevents.1741219809.a4f5499e5c53.207262.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c70c7ab7aeb7d7d26bac7bcaccf53225f7a623447ae0d08e324d6e7e03e68ccd +size 3808 diff --git a/logs/memo/events.out.tfevents.1741219809.a4f5499e5c53.207262.1 b/logs/memo/events.out.tfevents.1741219809.a4f5499e5c53.207262.1 new file mode 100644 index 0000000000000000000000000000000000000000..d469f2ac5ae4ca8824384862c583000fc4dcce3e --- /dev/null +++ b/logs/memo/events.out.tfevents.1741219809.a4f5499e5c53.207262.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fbc5589891a2b524e38b05f470e2925b8164571272a528a35909d917b2865f2 +size 3808 diff --git a/logs/memo/events.out.tfevents.1741220040.a4f5499e5c53.212374.0 b/logs/memo/events.out.tfevents.1741220040.a4f5499e5c53.212374.0 new file mode 100644 index 0000000000000000000000000000000000000000..943befe5c404ecf3b2589e449756ed5ca384e989 --- /dev/null +++ b/logs/memo/events.out.tfevents.1741220040.a4f5499e5c53.212374.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:655e13c50919a76151720019eb41fb55f799dd9d9fa39ab6e95659280cd85d49 +size 186846 diff --git a/logs/memo/events.out.tfevents.1741220040.a4f5499e5c53.212374.1 b/logs/memo/events.out.tfevents.1741220040.a4f5499e5c53.212374.1 new file mode 100644 index 0000000000000000000000000000000000000000..a7ac2348fdedd016c460fc1401dc0248e5b9608f --- /dev/null +++ b/logs/memo/events.out.tfevents.1741220040.a4f5499e5c53.212374.1 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c692e88835998bf12f4a2414545970cb72548061e9d89202c1cf3831982925e +size 186846