diff --git a/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/checkpoint.pt b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/checkpoint.pt new file mode 100644 index 0000000000000000000000000000000000000000..b41404445070c99cc0f667e7eca2a98ded55a471 --- /dev/null +++ b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/checkpoint.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ac9c7fbb85c3cb5c319220b4824a5aa2722ae71c4b0c0a9f7e3e6b58345a7d +size 10798884178 diff --git a/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/checkpoint_.pt b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/checkpoint_.pt new file mode 100644 index 0000000000000000000000000000000000000000..b41404445070c99cc0f667e7eca2a98ded55a471 --- /dev/null +++ b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/checkpoint_.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02ac9c7fbb85c3cb5c319220b4824a5aa2722ae71c4b0c0a9f7e3e6b58345a7d +size 10798884178 diff --git a/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/config.yaml b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/config.yaml new file mode 100644 index 0000000000000000000000000000000000000000..2f02444eb3435942880024349954163166145fcb --- /dev/null +++ b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/config.yaml @@ -0,0 +1,271 @@ +run_dir: exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs +seed: 0 +allow_tf32: true +timeout: null +resolution: 256 +amp: bf16 +cfg_scale: 1.0 +evaluate_split: test +eval_dir_name: null +num_save_images: 64 +save_all_images: false +save_image_format: jpg +save_images_at_all_procs: false +save_latent_samples: false +latent_samples_dir: null +evaluate_dataset: sample_class +sample_class: + name: SampleClass + batch_size: 128 + n_worker: 8 + drop_last: false + seed: 0 + shuffle: false + num_classes: 1000 + num_samples: 50000 +autoencoder: + num_settings: 1 + name: dc-ae-f32c32-in-1.0-256px + scaling_factor: 0.3285 + latent_channels: null +autoencoder_dtype: fp32 +eval_autoencoder_setting_list: null +model: fp8coat_dit +dit: + name: DiT + in_channels: 32 + input_size: 8 + cfg_channels: null + pretrained_path: null + pretrained_source: dc-ae + train_scheduler: SiTSampler + eval_scheduler: ODE_heun2 + num_inference_steps: 30 + flow_shift: 3.0 + reverse_time: false + use_cads: false + cads_noise_scale: 0.1 + cads_mixing_factor: 1.0 + cads_tau_min: 0.2 + cads_tau_max: 0.9 + use_guidance_interval: false + guidance_t_min: 0.2 + guidance_t_max: 0.8 + count_nfe: false + patch_size: 1 + hidden_size: 1152 + depth: 28 + num_heads: 16 + mlp_ratio: 4.0 + post_norm: false + class_dropout_prob: 0.1 + num_classes: 1000 + learn_sigma: false + unconditional: false + use_checkpoint: true + adaptive_channel: false + adaptive_channel_share_weights: true + only_load_backbone: false + freeze_backbone: false +uvit: + name: UViT + in_channels: 4 + input_size: 32 + cfg_channels: null + pretrained_path: null + pretrained_source: dc-ae + train_scheduler: DPM_Solver + eval_scheduler: DPM_Solver + num_inference_steps: 30 + flow_shift: 3.0 + reverse_time: false + use_cads: false + cads_noise_scale: 0.1 + cads_mixing_factor: 1.0 + cads_tau_min: 0.2 + cads_tau_max: 0.9 + use_guidance_interval: false + guidance_t_min: 0.2 + guidance_t_max: 0.8 + count_nfe: false + patch_size: 2 + hidden_size: 1152 + depth: 28 + num_heads: 16 + mlp_ratio: 4.0 + mlp_time_embed: false + qkv_bias: false + act_layer: gelu + use_checkpoint: true + class_dropout_prob: 0.1 + num_classes: 1000 + attn_mode: null +sana_cls: + name: SanaCls + in_channels: 4 + input_size: 32 + cfg_channels: null + pretrained_path: null + pretrained_source: dc-ae + train_scheduler: SanaScheduler + eval_scheduler: SanaScheduler + num_inference_steps: 250 + flow_shift: 3.0 + reverse_time: false + use_cads: false + cads_noise_scale: 0.1 + cads_mixing_factor: 1.0 + cads_tau_min: 0.2 + cads_tau_max: 0.9 + use_guidance_interval: false + guidance_t_min: 0.2 + guidance_t_max: 0.8 + count_nfe: false + patch_size: 2 + hidden_size: 1152 + depth: 28 + num_heads: 16 + mlp_ratio: 4.0 + post_norm: false + class_dropout_prob: 0.1 + num_classes: 1000 + unconditional: false + use_checkpoint: true + only_load_backbone: false + freeze_backbone: false + learn_sigma: false +usana_cls: + name: USanaCls + in_channels: 4 + input_size: 32 + cfg_channels: null + pretrained_path: null + pretrained_source: dc-ae + train_scheduler: DPM_Solver + eval_scheduler: DPM_Solver + num_inference_steps: 30 + flow_shift: 3.0 + reverse_time: false + use_cads: false + cads_noise_scale: 0.1 + cads_mixing_factor: 1.0 + cads_tau_min: 0.2 + cads_tau_max: 0.9 + use_guidance_interval: false + guidance_t_min: 0.2 + guidance_t_max: 0.8 + count_nfe: false + patch_size: 2 + hidden_size: 1152 + depth: 28 + num_heads: 16 + mlp_ratio: 4.0 + mlp_time_embed: false + qkv_bias: false + act_layer: gelu + use_checkpoint: true + class_dropout_prob: 0.1 + num_classes: 1000 + num_training_steps: 1000 +fp8: + name: FP8DiT +fp8coat: + name: FP8COATDiT + qchoice: linear + symm: true + row_blocksize: -1 + col_blocksize: -1 + linear_row_blocksize: 1 + linear_col_blocksize: 32 + min_blockunit_row: -1 + min_blockunit_col: -1 + fabit: MXE2M1 + fwbit: MXE2M1 + babit: MXE2M1 + bwbit: MXE2M1 + bobit: MXE2M1 + epsilon: 1.0e-08 +compute_fid: true +fid: + save_path: null + ref_path: assets/data/fid/imagenet_train_256.npz + precision_recall_ref_path: assets/data/precision_recall/VIRTUAL_imagenet256.npy +compute_inception_score: true +inception_score: {} +compute_cmmd: true +cmmd: + save_path: null + ref_path: assets/data/cmmd/VIRTUAL_imagenet256.npy +verbose: false +train_dataset: latent_imagenet +latent_imagenet: + name: LatentImageNet + batch_size: 128 + n_worker: 8 + drop_last: true + seed: 0 + shuffle: true + data_dir: assets/data/latent/dc_ae_f32c32_in_1.0_256px/imagenet_256 +latent_mjhq: + name: LatentMJHQ + batch_size: 32 + n_worker: 8 + drop_last: true + seed: 0 + shuffle: true + data_dir: assets/data/latent/dc_ae_f32c32/mjhq_1024 +latent_ffhq: + name: LatentFFHQ + batch_size: 32 + n_worker: 8 + drop_last: true + seed: 0 + shuffle: true + data_dir: assets/data/latent/dc_ae_f32c32/ffhq_1024 +latent_mapillary_vistas: + name: LatentMapillaryVistas + batch_size: 32 + n_worker: 8 + drop_last: true + seed: 0 + shuffle: true + data_dir: assets/data/latent/dc_ae_f32c32/mapillary_vistas_2048 +latent_multiple_channel_imagenet: + name: LatentMultipleChannelImageNet + batch_size: 32 + n_worker: 8 + drop_last: true + seed: 0 + shuffle: true + dataset_sample_ratio: null + num_channels_list: null + data_dirs: + - assets/data/latent/dc_ae_f32c32/imagenet_512 +resume: true +resume_path: null +resume_schedule: true +num_epochs: null +max_steps: 500000 +clip_grad: null +num_store_images: 64 +save_checkpoint_steps: 1000 +eval_steps: 5000 +save_eval_checkpoint_steps: 100000 +optimizer: + name: adamw + lr: 0.0001 + warmup_lr: 0.0 + weight_decay: 0.0 + no_wd_keys: [] + betas: + - 0.9 + - 0.999 +lr_scheduler: + name: constant + warmup_steps: 1000 +log: true +wandb_entity: han2024 +wandb_project: dc_ae_diffusion +ema_decay: 0.9999 +ema_warmup_steps: 2000 +eval_ema: true diff --git a/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/eval_results.csv b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/eval_results.csv new file mode 100644 index 0000000000000000000000000000000000000000..c6451d3f75aca9a0749ae49d4a342cab171024f3 --- /dev/null +++ b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/eval_results.csv @@ -0,0 +1,69 @@ +,fid,precision,recall,inception_score_mean,inception_score_std,cmmd +step_100000_autoencoder_setting_0_cfg_1.0,27.46606584701101,0.61735999584198,0.5893999934196472,46.54857947447967,1.3332273204939689,0.685572624206543 +step_10000_autoencoder_setting_0_cfg_1.0,77.05727446679134,0.3295599818229675,0.4676999747753143,15.565048888106762,0.268597983349972,1.496434211730957 +step_105000_autoencoder_setting_0_cfg_1.0,27.715464220831564,0.6100999712944031,0.5995999574661255,45.302445631410805,1.2576683673143063,0.690460205078125 +step_110000_autoencoder_setting_0_cfg_1.0,27.141188774822467,0.6067799925804138,0.6047999858856201,45.71671888649294,1.074692222450376,0.6685256958007812 +step_115000_autoencoder_setting_0_cfg_1.0,29.350415158731263,0.5864599943161011,0.5963999629020691,43.579235183056014,1.2193228974808052,0.7292032241821289 +step_120000_autoencoder_setting_0_cfg_1.0,27.38260828210184,0.6115800142288208,0.598800003528595,47.638758831764754,1.2527766028282552,0.7010698318481445 +step_125000_autoencoder_setting_0_cfg_1.0,83.55567058324493,0.2736199796199798,0.4508000016212463,18.344966937487577,0.389236454215938,1.780986785888672 +step_130000_autoencoder_setting_0_cfg_1.0,114.60912176227862,0.1869200021028518,0.2345999926328659,13.028534859800804,0.23888282689829,2.300500869750977 +step_135000_autoencoder_setting_0_cfg_1.0,97.17474583044005,0.2395999878644943,0.3242000043392181,16.750898003550397,0.2424382515054995,1.890420913696289 +step_140000_autoencoder_setting_0_cfg_1.0,62.01676963957283,0.3773399889469147,0.5047999620437622,24.835525419780133,0.5307866202988152,1.2725591659545898 +step_145000_autoencoder_setting_0_cfg_1.0,44.22959053359051,0.4382599890232086,0.5212999582290649,35.67310203500692,0.5913120500560604,1.043081283569336 +step_150000_autoencoder_setting_0_cfg_1.0,32.55213508177684,0.537559986114502,0.5720999836921692,40.40690785039882,1.132214501737283,0.7479190826416016 +step_15000_autoencoder_setting_0_cfg_1.0,64.88207396149625,0.3858200013637543,0.5281000137329102,18.014370533263538,0.3676093952837374,1.2459754943847656 +step_155000_autoencoder_setting_0_cfg_1.0,40.266173895939176,0.5103999972343445,0.585599958896637,28.388441572318595,0.4970437606726969,0.7547140121459961 +step_160000_autoencoder_setting_0_cfg_1.0,36.156868500368944,0.5500999689102173,0.5920000076293945,33.231766280420786,0.6152553127261183,0.6874799728393555 +step_165000_autoencoder_setting_0_cfg_1.0,38.89370050754872,0.5418199896812439,0.5845000147819519,30.68981609633452,0.4129188269920643,0.6977319717407227 +step_170000_autoencoder_setting_0_cfg_1.0,30.694090357101345,0.5943799614906311,0.5412999987602234,39.55446709901744,0.745065321938258,0.5748271942138672 +step_175000_autoencoder_setting_0_cfg_1.0,37.083586034121424,0.5604400038719177,0.4668999910354614,34.84011334894741,0.8153509818257131,0.64849853515625 +step_180000_autoencoder_setting_0_cfg_1.0,27.748739835219794,0.6278799772262573,0.5295000076293945,45.49423802870099,1.0167031906161783,0.5700588226318359 +step_185000_autoencoder_setting_0_cfg_1.0,25.23685241176776,0.6418399810791016,0.5458999872207642,49.39908635955667,0.8054656414757482,0.5505084991455078 +step_190000_autoencoder_setting_0_cfg_1.0,23.13110201175607,0.6460599899291992,0.5361999869346619,55.5172910005238,1.4440970382251597,0.540614128112793 +step_195000_autoencoder_setting_0_cfg_1.0,23.538359742343346,0.6541399955749512,0.5478999614715576,56.7474705741029,1.2274480853058574,0.598907470703125 +step_200000_autoencoder_setting_0_cfg_1.0,23.92483618921034,0.6505599617958069,0.561199963092804,54.45099339865616,1.093298317638356,0.5929470062255859 +step_20000_autoencoder_setting_0_cfg_1.0,58.60705841394633,0.4182599782943725,0.5557000041007996,19.6572384893356,0.3906942602501593,1.1314153671264648 +step_205000_autoencoder_setting_0_cfg_1.0,26.66331853579948,0.6324999928474426,0.5630999803543091,48.94374481668279,0.7540630131991589,0.6198883056640625 +step_210000_autoencoder_setting_0_cfg_1.0,27.182584950619287,0.6284199953079224,0.5674999952316284,47.74365201665509,0.8291473491519269,0.6200075149536133 +step_215000_autoencoder_setting_0_cfg_1.0,27.06325435066248,0.6215599775314331,0.5681999921798706,47.31741172494515,1.0237269085835967,0.6133317947387695 +step_220000_autoencoder_setting_0_cfg_1.0,27.20068400837704,0.6174600124359131,0.5679000020027161,46.26930037428583,0.9438617752214088,0.5998611450195312 +step_225000_autoencoder_setting_0_cfg_1.0,30.37256821875951,0.5977399945259094,0.5534999966621399,41.23860861317935,0.7901778911911452,0.6161928176879883 +step_230000_autoencoder_setting_0_cfg_1.0,34.054256909763865,0.5787599682807922,0.5667999982833862,37.56948925905199,0.855416136230482,0.6885528564453125 +step_235000_autoencoder_setting_0_cfg_1.0,37.78871189972301,0.5626999735832214,0.5475000143051147,36.7783688249036,0.8235595865583547,0.7672309875488281 +step_240000_autoencoder_setting_0_cfg_1.0,34.93812927402263,0.5778799653053284,0.5565999746322632,39.86825228223786,0.7340756105042252,0.7361173629760742 +step_245000_autoencoder_setting_0_cfg_1.0,36.087229732776905,0.5704999566078186,0.5575000047683716,38.57220970973545,0.914182454177906,0.7581710815429688 +step_250000_autoencoder_setting_0_cfg_1.0,45.18380360504688,0.5283399820327759,0.5587999820709229,31.677529143387662,0.8310292837008046,0.9241104125976562 +step_25000_autoencoder_setting_0_cfg_1.0,54.78462564683889,0.4369199872016907,0.560699999332428,20.89925753264752,0.4969876692833168,1.0616779327392578 +step_255000_autoencoder_setting_0_cfg_1.0,45.76596311543864,0.5237799882888794,0.5626999735832214,31.552457359973697,0.7716041779496106,0.9648799896240234 +step_260000_autoencoder_setting_0_cfg_1.0,47.279312671421735,0.5155199766159058,0.5676000118255615,30.325805138480234,0.6582780217704692,0.9881258010864258 +step_265000_autoencoder_setting_0_cfg_1.0,44.83983435376615,0.5292800068855286,0.5715999603271484,31.390541326123003,0.8134063420420725,0.9305477142333984 +step_270000_autoencoder_setting_0_cfg_1.0,38.73975484264247,0.5501999855041504,0.5708000063896179,35.52544017242904,0.8652260562194196,0.8199214935302734 +step_275000_autoencoder_setting_0_cfg_1.0,38.77210438903603,0.5509999990463257,0.5715999603271484,35.44527252818729,1.0544389007409831,0.7992982864379883 +step_280000_autoencoder_setting_0_cfg_1.0,33.48746168703428,0.5824999809265137,0.5663999915122986,40.810818631937806,1.2478690465740545,0.7320642471313477 +step_285000_autoencoder_setting_0_cfg_1.0,36.32169918558572,0.5613799691200256,0.5709999799728394,38.53071838412784,0.913512937325494,0.8158683776855469 +step_290000_autoencoder_setting_0_cfg_1.0,46.39197448834176,0.5216599702835083,0.5680999755859375,29.67758757261446,0.6341125924727178,0.912189483642578 +step_295000_autoencoder_setting_0_cfg_1.0,45.04938679619204,0.5299599766731262,0.5613999962806702,30.68297905279561,0.6612615131016247,0.9065866470336914 +step_300000_autoencoder_setting_0_cfg_1.0,52.62663548825503,0.5005399584770203,0.5475999712944031,27.40174913093044,0.5743170027896177,1.0752677917480469 +step_30000_autoencoder_setting_0_cfg_1.0,51.11758756774248,0.4611199796199798,0.5708000063896179,22.615113190655308,0.5158982480242132,1.0036230087280271 +step_305000_autoencoder_setting_0_cfg_1.0,45.67455880145883,0.5220999717712402,0.5546999573707581,30.240217515698056,0.5965084969428479,0.9334087371826172 +step_310000_autoencoder_setting_0_cfg_1.0,40.7856380902565,0.531059980392456,0.5634999871253967,33.664514027515104,0.7228171352764384,0.8565187454223633 +step_315000_autoencoder_setting_0_cfg_1.0,36.91062019126514,0.5459200143814087,0.5716999769210815,35.633312098853764,0.7608190318318035,0.7877349853515625 +step_320000_autoencoder_setting_0_cfg_1.0,37.70445902023067,0.544439971446991,0.5766000151634216,35.30922628868343,0.6470175937942215,0.8041858673095703 +step_325000_autoencoder_setting_0_cfg_1.0,40.59112778457501,0.526479959487915,0.5719000101089478,32.94323669682364,0.7779966445993756,0.8525848388671875 +step_330000_autoencoder_setting_0_cfg_1.0,41.36808095788467,0.5224800109863281,0.57669997215271,31.92972678430424,0.8519911306550041,0.8611679077148438 +step_335000_autoencoder_setting_0_cfg_1.0,40.70737066945162,0.5106399655342102,0.5771999955177307,31.90316849544508,0.8207527243075626,0.8548498153686523 +step_340000_autoencoder_setting_0_cfg_1.0,55.28661371068199,0.4687599837779999,0.5615999698638916,24.1637554510839,0.5237266040978577,1.0663270950317383 +step_35000_autoencoder_setting_0_cfg_1.0,47.86400868705658,0.4843999743461609,0.5753999948501587,24.44938966535462,0.4740879065412466,0.9522438049316406 +step_40000_autoencoder_setting_0_cfg_1.0,44.9806935532348,0.5034399628639221,0.5691999793052673,26.29743248955851,0.5344097675106841,0.9119510650634766 +step_45000_autoencoder_setting_0_cfg_1.0,42.565378047629565,0.5239599943161011,0.5755000114440918,28.31337645810432,0.7533079439820995,0.8807182312011719 +step_50000_autoencoder_setting_0_cfg_1.0,40.306019801100376,0.5388399958610535,0.5862999558448792,30.31891718660548,0.8627970481147651,0.8524656295776367 +step_5000_autoencoder_setting_0_cfg_1.0,94.56607537638756,0.2631199955940246,0.3899999856948852,12.82565688732519,0.2361612010165683,1.894235610961914 +step_55000_autoencoder_setting_0_cfg_1.0,37.902322258016966,0.5573999881744385,0.5845000147819519,32.649221478044026,0.935466874893832,0.8213520050048828 +step_60000_autoencoder_setting_0_cfg_1.0,35.683201608006414,0.5734800100326538,0.5792999863624573,35.13069249041864,1.0521529429123773,0.7933378219604492 +step_65000_autoencoder_setting_0_cfg_1.0,33.64241122812501,0.5882200002670288,0.5812000036239624,37.57651136185181,1.069450384565616,0.7615089416503906 +step_70000_autoencoder_setting_0_cfg_1.0,32.061544728339015,0.5981799960136414,0.5773999691009521,39.65159192976438,1.0475217356430864,0.7382631301879883 +step_75000_autoencoder_setting_0_cfg_1.0,30.8947741839886,0.6048799753189087,0.5803999900817871,41.48548670094574,1.1469000012472177,0.7206201553344727 +step_80000_autoencoder_setting_0_cfg_1.0,29.825967575364075,0.6105200052261353,0.5796999931335449,42.90583151384847,0.9982311615890564,0.7059574127197266 +step_85000_autoencoder_setting_0_cfg_1.0,28.89284787860163,0.616159975528717,0.5788999795913696,44.170102925623326,1.238303746466466,0.6911754608154297 +step_90000_autoencoder_setting_0_cfg_1.0,28.134619316356066,0.6207000017166138,0.5791999697685242,45.48569601232439,1.263262369188022,0.6834268569946289 +step_95000_autoencoder_setting_0_cfg_1.0,27.76390992589802,0.6223999857902527,0.5803999900817871,46.33348094756814,1.1956481347018857,0.6825923919677734 diff --git a/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/log.txt b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/log.txt new file mode 100644 index 0000000000000000000000000000000000000000..1bef265c798992d80580c0856e79b3fca2f0c784 --- /dev/null +++ b/exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cs/log.txt @@ -0,0 +1,3740 @@ +run_dir: exp_hcai/latent_diffusion/imagenet_256/dc_ae_f32c32_in_1.0_256px/dit_xl_1/SiTSampler_ODE_heun2_30/mxfp4_e2m1_cscan not find a checkpoint, will train from scratch + Train Epoch #1: 0%| | 0/1251 [00:00