optimass committed
Commit 41daab6 · verified · 1 Parent(s): d244be6

Add checkpoint

.DS_Store ADDED
Binary file (6.15 kB)
 
checkpoints/.DS_Store ADDED
Binary file (6.15 kB)
 
checkpoints/adapter_0.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:02a8e220cbd35058bbe7d8e4be0bc52675dba967a834400454ded709c1604e8e
+ size 390897466
checkpoints/adapter_100.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:b408a270269e0a9b997e36f3c8f16c32d8826fd4a3613c73d4d1e7f3109f17a3
+ size 390899394
checkpoints/adapter_150.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:09331973effa78d5ef5aeeb91c43ff72881031a1f44c8f0a82c2d72f9e2ce495
+ size 390899394
checkpoints/adapter_200.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:f40e04992c3cf601dec7cab216b87918cba68f099320bd45b914c94784b1ad44
+ size 390899394
checkpoints/adapter_250.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:54c7dd36c26425b5b7941ea2899cb7cdcef8c1ff3713a93dd480b30cf7f48553
+ size 390899394
checkpoints/adapter_50.pt ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:0e44ec24eda06f3b2d329906df387ff9ce2b5bb3e1cd4edf80b48dc879f76405
+ size 390898430
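The adapter_*.pt entries above are Git LFS pointer files: each three-line stub records the SHA-256 oid and byte size of the real ~391 MB checkpoint that `git lfs pull` fetches in its place. A minimal stdlib-only sketch of parsing and verifying such a pointer (the helper names are illustrative, not part of this repo):

import hashlib
from pathlib import Path

def parse_lfs_pointer(text):
    """Parse LFS pointer text (version/oid/size lines) into a dict."""
    fields = dict(line.split(" ", 1) for line in text.splitlines() if line)
    return {
        "oid": fields["oid"].removeprefix("sha256:"),
        "size": int(fields["size"]),
    }

def verify_blob(blob_path, pointer):
    """Check a fetched blob against the pointer's byte size and SHA-256 oid."""
    data = Path(blob_path).read_bytes()
    return (len(data) == pointer["size"]
            and hashlib.sha256(data).hexdigest() == pointer["oid"])

Note that after `git lfs pull` the working-tree path holds the binary blob itself; the pointer text can still be read from the commit, e.g. via `git show HEAD:checkpoints/adapter_0.pt`, and passed to parse_lfs_pointer.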
checkpoints/adapter_config.json ADDED
@@ -0,0 +1 @@
+ {"r": 16, "lora_alpha": 32, "target_modules": ["q_proj", "v_proj", "o_proj", "gate_proj", "down_proj", "up_proj"], "peft_type": "LORA"}
checkpoints/adapter_model.bin ADDED
@@ -0,0 +1,3 @@
+ version https://git-lfs.github.com/spec/v1
+ oid sha256:cc10c303acbfb128715096f9573051062bcc21d43123145c04d7c5c99db16d53
+ size 390928074
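adapter_model.bin is another LFS pointer to a ~391 MB file. Assuming it is a plain tensor state dict (the commit does not identify the framework that produced it), a quick inspection sketch once the blob is pulled:

import torch

# Assumption: the file deserializes to a dict of tensors; key names are
# unknown until printed.
state_dict = torch.load("checkpoints/adapter_model.bin", map_location="cpu")
for name, tensor in list(state_dict.items())[:5]:
    print(name, tuple(tensor.shape), tensor.dtype)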
checkpoints/config.json ADDED
@@ -0,0 +1 @@
+ {"architectures": ["LlamaForCausalLM"], "attention_bias": false, "attention_dropout": 0.0, "bos_token_id": 128000, "eos_token_id": [128001, 128008, 128009], "head_dim": 128, "hidden_act": "silu", "hidden_size": 8192, "initializer_range": 0.02, "intermediate_size": 28672, "max_position_embeddings": 131072, "mlp_bias": false, "model_type": "llama", "num_attention_heads": 64, "num_hidden_layers": 80, "num_key_value_heads": 8, "pretraining_tp": 1, "rms_norm_eps": 1e-05, "rope_scaling": {"factor": 8.0, "high_freq_factor": 4.0, "low_freq_factor": 1.0, "original_max_position_embeddings": 8192, "rope_type": "llama3"}, "rope_theta": 500000.0, "tie_word_embeddings": false, "torch_dtype": "bfloat16", "transformers_version": "4.47.0.dev0", "use_cache": true, "vocab_size": 128256}