WSX committed on
Commit
28f17b3
·
verified ·
1 Parent(s): b4502f7

Training in progress, step 10

Browse files
Files changed (3) hide show
  1. config.json +3 -3
  2. model.safetensors +1 -1
  3. training_args.bin +2 -2
config.json CHANGED
@@ -1,5 +1,5 @@
1
  {
2
- "_name_or_path": "/opt/tiger/sLLM_sft_llama/output/FC_toolace_500_r1_presft_1.5B/checkpoint-132",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
@@ -19,11 +19,11 @@
19
  "rms_norm_eps": 1e-06,
20
  "rope_scaling": null,
21
  "rope_theta": 1000000.0,
22
- "sliding_window": null,
23
  "tie_word_embeddings": true,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.50.0.dev0",
26
- "use_cache": true,
27
  "use_sliding_window": false,
28
  "vocab_size": 151936
29
  }
 
1
  {
2
+ "_name_or_path": "Qwen/Qwen2.5-1.5B-Instruct",
3
  "architectures": [
4
  "Qwen2ForCausalLM"
5
  ],
 
19
  "rms_norm_eps": 1e-06,
20
  "rope_scaling": null,
21
  "rope_theta": 1000000.0,
22
+ "sliding_window": 32768,
23
  "tie_word_embeddings": true,
24
  "torch_dtype": "bfloat16",
25
  "transformers_version": "4.50.0.dev0",
26
+ "use_cache": false,
27
  "use_sliding_window": false,
28
  "vocab_size": 151936
29
  }
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5f3f7272c4f62f903b3c37acaecf9e9ad3aa6c60889af6714715005289206ead
3
  size 3087467144
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:931c3db5ee21a47882036f969294e36507b5f3ab3c257c0c4f3a51d9206ca2fd
3
  size 3087467144
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:82fa3cfe463ed10fa91da65c1aa74b5d4f72df7f463db4a129f35d14641a067c
3
- size 7672
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:8710efd089dcd2bd97fcccbea40ac8c0c35b5cd1c88abbbcfc4a06a0879c261f
3
+ size 7736