wwppdemo / training_log.json
KimJY's picture
Upload 3 files
6bccabd verified
raw
history blame contribute delete
460 Bytes
{
"base_model_name": "maywell_Synatra-10.7B-v0.4",
"base_model_class": "LlamaForCausalLM",
"base_loaded_in_4bit": true,
"base_loaded_in_8bit": false,
"projections": "q, v",
"loss": 1.5643,
"learning_rate": 8.935678962196381e-10,
"epoch": 2.99,
"current_steps": 7627,
"train_runtime": 47144.0886,
"train_samples_per_second": 2.6,
"train_steps_per_second": 0.01,
"total_flos": 1.991968191814828e+18,
"train_loss": 1.6426315012717896
}