optimass committed
Commit e325feb · verified · 1 Parent(s): 0488c63

Add checkpoint

.DS_Store ADDED
Binary file (6.15 kB).
 
checkpoints/.DS_Store ADDED
Binary file (6.15 kB).
 
checkpoints/adapter_0.pt ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:25f2958901b6bc000cdb9c068f22a22e8b66fd5ba8892eb04216cb95cfcb5a49
+size 390897466
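
Each `.pt` entry in this commit is a Git LFS pointer file: the repository stores only this three-line stub (spec version, SHA-256 object ID, byte size) while the ~391 MB payload lives in LFS storage. As a minimal sketch, a fetched file can be checked against its pointer like this; the path and values are the ones from the hunk above, and it assumes you have already run `git lfs pull` so the file holds the real weights rather than the stub:

```python
import hashlib

# Values copied from the adapter_0.pt pointer above.
EXPECTED_OID = "25f2958901b6bc000cdb9c068f22a22e8b66fd5ba8892eb04216cb95cfcb5a49"
EXPECTED_SIZE = 390897466

def verify_lfs_object(path: str, oid: str, size: int) -> bool:
    """Compare a local file's SHA-256 digest and byte count against an LFS pointer."""
    digest = hashlib.sha256()
    total = 0
    with open(path, "rb") as f:
        for chunk in iter(lambda: f.read(1 << 20), b""):  # read in 1 MiB chunks
            digest.update(chunk)
            total += len(chunk)
    return total == size and digest.hexdigest() == oid

print(verify_lfs_object("checkpoints/adapter_0.pt", EXPECTED_OID, EXPECTED_SIZE))
```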
checkpoints/adapter_100.pt ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:79a893207acafb3fdd8c4d596c9d467ec54d98540e6e782907a1cc3ab9056c88
+size 390899394
checkpoints/adapter_150.pt ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:e40a0db738400da4c4c45973e4377cda971636d3efc7eeb8f33c464461173de4
+size 390899394
checkpoints/adapter_200.pt ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ed94936f01ef38d6cab5244ef6a740545be04d8cc8b2bd2d2a7f55c5bba3da69
+size 390899394
checkpoints/adapter_250.pt ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:71c421e784271fb97884553f9322e14aa22795155ebb26015c64489d7a03f3f1
+size 390899394
checkpoints/adapter_50.pt ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:00af12026e03b98e88b75c678070b1907c9ebd3eb21d9cd0d607fab765d39dd8
+size 390898430
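
The step-numbered filenames (adapter_0 through adapter_250, at 50-step intervals) suggest periodic training snapshots. Assuming each `.pt` file is a flat state dict of LoRA adapter tensors saved with `torch.save` (an assumption; this diff shows only the LFS pointers, not the contents), a quick inspection sketch:

```python
import torch

# Assumption: the checkpoint is a flat {name: tensor} state dict. If the
# training code wrapped it (e.g. {"step": ..., "model": ...}), unwrap first.
state = torch.load("checkpoints/adapter_200.pt", map_location="cpu")
for name, tensor in list(state.items())[:5]:
    print(name, tuple(tensor.shape), tensor.dtype)
```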
checkpoints/adapter_config.json ADDED
@@ -0,0 +1 @@
+{"r": 16, "lora_alpha": 32, "target_modules": ["q_proj", "v_proj", "o_proj", "gate_proj", "down_proj", "up_proj"], "peft_type": "LORA"}
checkpoints/adapter_model.bin ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:b07f94053888f401e731f3aac684fc01a8c2f2e4b8bd878be1b043b66228f1aa
+size 390928074
checkpoints/config.json ADDED
@@ -0,0 +1 @@
+{"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 128, "hidden_act": "silu", "hidden_size": 8192, "initializer_range": 0.02, "intermediate_size": 28672, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "num_attention_heads": 64, "num_hidden_layers": 80, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 8.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "transformers_version": "4.47.0.dev0", "use_cache": true, "vocab_size": 128256}