mtasic85 committed on
Commit
63b45b9
·
1 Parent(s): 9f5b8d0

pretrain-core-0

Browse files
Files changed (1) hide show
  1. scripts/pretrain_core_model_0.yaml +1 -1
scripts/pretrain_core_model_0.yaml CHANGED
@@ -20,7 +20,7 @@ model_config:
20
  mlp_class_name: "LLaMAMLP"
21
  intermediate_size: 2048 # n_embd * 4
22
  norm_eps: 1e-5
23
- rope_base: 10000
24
  head_size: 128 # n_embd / n_head
25
 
26
  # Directory in which to save checkpoints and logs. If running in a Lightning Studio Job, look for it in
 
20
  mlp_class_name: "LLaMAMLP"
21
  intermediate_size: 2048 # n_embd * 4
22
  norm_eps: 1e-5
23
+ rope_base: 4300 # https://arxiv.org/pdf/2405.14591
24
  head_size: 128 # n_embd / n_head
25
 
26
  # Directory in which to save checkpoints and logs. If running in a Lightning Studio Job, look for it in