SihyunPark committed
Commit a21eaa9 · verified · Parent: d9bff4a

Upload folder using huggingface_hub
.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
config.json CHANGED
@@ -1,12 +1,17 @@
 {
-  "_name_or_path": "wisenut-nlp-team/wisenut-llama-3.1-8B-0.8-Instruct",
+  "_name_or_path": "",
   "architectures": [
     "LlamaForCausalLM"
   ],
   "attention_bias": false,
   "attention_dropout": 0.0,
   "bos_token_id": 128000,
-  "eos_token_id": 128001,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
+  "head_dim": 128,
   "hidden_act": "silu",
   "hidden_size": 4096,
   "initializer_range": 0.02,
@@ -29,7 +34,7 @@
   "rope_theta": 500000.0,
   "tie_word_embeddings": false,
   "torch_dtype": "bfloat16",
-  "transformers_version": "4.44.1",
+  "transformers_version": "4.46.1",
   "use_cache": false,
   "vocab_size": 128256
 }
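The substantive change here is `eos_token_id`: a single ID becomes the list used by the Llama 3.1 chat models, so generation stops at whichever of `<|end_of_text|>` (128001), `<|eom_id|>` (128008), or `<|eot_id|>` (128009) appears first. A minimal sketch to verify the mapping; the repo id below is only illustrative, taken from the old `_name_or_path` in this diff:

```python
from transformers import AutoTokenizer

# Illustrative repo id (the old "_name_or_path" from this diff); point this
# at wherever the checkpoint actually lives.
tok = AutoTokenizer.from_pretrained("wisenut-nlp-team/wisenut-llama-3.1-8B-0.8-Instruct")

# Each entry in the new "eos_token_id" list should correspond to one of the
# Llama 3.1 terminator tokens.
for token in ("<|end_of_text|>", "<|eom_id|>", "<|eot_id|>"):
    print(token, tok.convert_tokens_to_ids(token))
# Expected with the Llama 3.1 vocabulary: 128001, 128008, 128009
```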
generation_config.json CHANGED
@@ -1,6 +1,12 @@
 {
-  "_from_model_config": true,
   "bos_token_id": 128000,
-  "eos_token_id": 128001,
-  "transformers_version": "4.44.1"
+  "do_sample": true,
+  "eos_token_id": [
+    128001,
+    128008,
+    128009
+  ],
+  "temperature": 0.6,
+  "top_p": 0.9,
+  "transformers_version": "4.46.1"
 }
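With `do_sample`, `temperature`, and `top_p` now set, `generate()` defaults to nucleus sampling rather than greedy decoding. A sketch of the equivalent explicit call, assuming a placeholder repo id:

```python
import torch
from transformers import AutoModelForCausalLM, AutoTokenizer

model_id = "your-org/your-checkpoint"  # placeholder, not a real repo id
tok = AutoTokenizer.from_pretrained(model_id)
model = AutoModelForCausalLM.from_pretrained(model_id, torch_dtype=torch.bfloat16)

inputs = tok("Hello, how are you?", return_tensors="pt")
# Spelling out what the new generation_config.json defaults already imply:
out = model.generate(
    **inputs,
    do_sample=True,          # sample instead of greedy decoding
    temperature=0.6,
    top_p=0.9,
    eos_token_id=[128001, 128008, 128009],
    max_new_tokens=64,
)
print(tok.decode(out[0], skip_special_tokens=True))
```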
model-00001-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8f4e509f033bf075608afb95f0f9151fe588d63fc4475ccb93e9646891c5f309
+oid sha256:07a83b6b0d94816db2324287ed369234c678c5fa702ec0858f4f57a406db2e5c
 size 4976698672
model-00002-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:8ea8ba7a85ab333ef13fe8df5f6bc5df8e9d3a32018f17f443039e4162063c12
+oid sha256:2a94561cbc4f23eb62674b886dd2c73cbe62ad52332a6d78d6503d8629503575
 size 4999802720
model-00003-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:ff44caafe528f5092192b02b121e04d690008b65a6a625c9263f682f3436b3b5
+oid sha256:ed00238eae1ef58c668228dae5db8e575046efee1cf4dbbc7c4ca977d8d2a820
 size 4915916176
model-00004-of-00004.safetensors CHANGED
@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:68dfaed99a9ba51c91d51aab516ddeee1c5ca45a44445604188c8607dbec1d59
+oid sha256:7f8ce5f205b970997e08d3b2596bb29cd0dda975a4125914915c60448c95601d
 size 1168138808
special_tokens_map.json CHANGED
@@ -1,4 +1,20 @@
 {
+  "additional_special_tokens": [
+    {
+      "content": "<|eot_id|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    },
+    {
+      "content": "<|eom_id|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false
+    }
+  ],
   "bos_token": {
     "content": "<|begin_of_text|>",
     "lstrip": false,
tokenizer.json CHANGED
The diff for this file is too large to render. See raw diff
 
tokenizer_config.json CHANGED
@@ -2049,6 +2049,10 @@
       "special": true
     }
   },
+  "additional_special_tokens": [
+    "<|eot_id|>",
+    "<|eom_id|>"
+  ],
   "bos_token": "<|begin_of_text|>",
   "chat_template": "{% set loop_messages = messages %}{% for message in loop_messages %}{% set content = '<|start_header_id|>' + message['role'] + '<|end_header_id|>\n\n'+ message['content'] | trim + '<|eot_id|>' %}{% if loop.index0 == 0 %}{% set content = bos_token + content %}{% endif %}{{ content }}{% endfor %}{{ '<|start_header_id|>assistant<|end_header_id|>\n\n' }}",
   "clean_up_tokenization_spaces": true,
train_results.json ADDED
@@ -0,0 +1,8 @@
+{
+  "epoch": 0.9171974522292994,
+  "total_flos": 1.4450769654710272e+17,
+  "train_loss": 0.8373564614189996,
+  "train_runtime": 1015.8196,
+  "train_samples_per_second": 4.922,
+  "train_steps_per_second": 0.009
+}
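As a consistency check on these figures: 1015.8196 s × 4.922 samples/s ≈ 5,000 samples processed, and 1015.8196 s × 0.009 steps/s ≈ 9 optimizer steps, matching the 9-of-9-step entry (elapsed 0:16:55 ≈ 1016 s) in trainer_log.jsonl below.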
trainer_log.jsonl ADDED
@@ -0,0 +1 @@
+{"current_steps": 9, "total_steps": 9, "epoch": 0.9171974522292994, "percentage": 100.0, "elapsed_time": "0:16:55", "remaining_time": "0:00:00"}
trainer_state.json ADDED
@@ -0,0 +1,42 @@
+{
+  "best_metric": null,
+  "best_model_checkpoint": null,
+  "epoch": 0.9171974522292994,
+  "eval_steps": 500,
+  "global_step": 9,
+  "is_hyper_param_search": false,
+  "is_local_process_zero": true,
+  "is_world_process_zero": true,
+  "log_history": [
+    {
+      "epoch": 0.9171974522292994,
+      "step": 9,
+      "total_flos": 1.4450769654710272e+17,
+      "train_loss": 0.8373564614189996,
+      "train_runtime": 1015.8196,
+      "train_samples_per_second": 4.922,
+      "train_steps_per_second": 0.009
+    }
+  ],
+  "logging_steps": 50,
+  "max_steps": 9,
+  "num_input_tokens_seen": 0,
+  "num_train_epochs": 1,
+  "save_steps": 500,
+  "stateful_callbacks": {
+    "TrainerControl": {
+      "args": {
+        "should_epoch_stop": false,
+        "should_evaluate": false,
+        "should_log": false,
+        "should_save": true,
+        "should_training_stop": true
+      },
+      "attributes": {}
+    }
+  },
+  "total_flos": 1.4450769654710272e+17,
+  "train_batch_size": 8,
+  "trial_name": null,
+  "trial_params": null
+}
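Reading the state together with train_results.json: roughly 5,000 samples over 9 optimizer steps works out to about 555 samples per global step, and with `train_batch_size` of 8 per device the remaining factor of roughly 69 is some mix of data parallelism and gradient accumulation that the rounded throughput figures do not pin down exactly. Training stopped at `max_steps` 9 (`should_training_stop` true), i.e. after 0.917 of one epoch.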
training_args.bin ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:ab11a0cd03349979f1b78bc9d8fee772181424455035a997df669482c4927edc
+size 5368