yihanwang617 committed on
Commit
bc70ba6
·
verified ·
1 Parent(s): c644a73

Training in progress, step 100

Browse files
adapter_config.json ADDED
@@ -0,0 +1,34 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "alpha_pattern": {},
3
+ "auto_mapping": null,
4
+ "base_model_name_or_path": "meta-llama/Llama-2-7b-hf",
5
+ "bias": "none",
6
+ "fan_in_fan_out": false,
7
+ "inference_mode": true,
8
+ "init_lora_weights": true,
9
+ "layer_replication": null,
10
+ "layers_pattern": null,
11
+ "layers_to_transform": null,
12
+ "loftq_config": {},
13
+ "lora_alpha": 16,
14
+ "lora_dropout": 0.05,
15
+ "megatron_config": null,
16
+ "megatron_core": "megatron.core",
17
+ "modules_to_save": null,
18
+ "peft_type": "LORA",
19
+ "r": 16,
20
+ "rank_pattern": {},
21
+ "revision": null,
22
+ "target_modules": [
23
+ "down_proj",
24
+ "gate_proj",
25
+ "q_proj",
26
+ "o_proj",
27
+ "k_proj",
28
+ "v_proj",
29
+ "up_proj"
30
+ ],
31
+ "task_type": "CAUSAL_LM",
32
+ "use_dora": false,
33
+ "use_rslora": false
34
+ }
adapter_model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5480e99448d62d3aef9421c59de2d4d3f99636cf4cc6b72bbca7a59cab9dc34b
3
  size 604336032
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:f7ba3c5e08ce28df3c22b3052a6fcfef58080400248c79e61855235985a5f0ab
3
  size 604336032
runs/Sep13_22-50-43_nova.cs.ucla.edu/events.out.tfevents.1726293206.nova.cs.ucla.edu.4131116.0 ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:74ea999b117d76d4aefa815348f2f093fa82f8adc430329ff58590764e9431a6
3
+ size 9282
tokenizer.json CHANGED
@@ -1,6 +1,11 @@
1
  {
2
  "version": "1.0",
3
- "truncation": null,
 
 
 
 
 
4
  "padding": null,
5
  "added_tokens": [
6
  {
 
1
  {
2
  "version": "1.0",
3
+ "truncation": {
4
+ "direction": "Right",
5
+ "max_length": 4096,
6
+ "strategy": "LongestFirst",
7
+ "stride": 0
8
+ },
9
  "padding": null,
10
  "added_tokens": [
11
  {
tokenizer_config.json CHANGED
@@ -44,11 +44,11 @@
44
  }
45
  },
46
  "bos_token": "<s>",
 
47
  "clean_up_tokenization_spaces": false,
48
  "eos_token": "</s>",
49
- "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
50
  "legacy": false,
51
- "model_max_length": 1000000000000000019884624838656,
52
  "pad_token": "[PAD]",
53
  "padding_side": "right",
54
  "sp_model_kwargs": {},
 
44
  }
45
  },
46
  "bos_token": "<s>",
47
+ "chat_template": "{% for message in messages %}\n{% if message['role'] == 'user' %}\n{{ '<|user|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'system' %}\n{{ '<|system|>\n' + message['content'] + eos_token }}\n{% elif message['role'] == 'assistant' %}\n{{ '<|assistant|>\n' + message['content'] + eos_token }}\n{% endif %}\n{% if loop.last and add_generation_prompt %}\n{{ '<|assistant|>' }}\n{% endif %}\n{% endfor %}",
48
  "clean_up_tokenization_spaces": false,
49
  "eos_token": "</s>",
 
50
  "legacy": false,
51
+ "model_max_length": 2048,
52
  "pad_token": "[PAD]",
53
  "padding_side": "right",
54
  "sp_model_kwargs": {},
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:5555f9c2068c149dfe2b8c77b1be13bc97b3f0d9cdb50a8ee993d4e9d1ddfef7
3
  size 6264
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:014bd8984dfb9a98eb33f1f35833635f9bf883602306424c8f027b580992a080
3
  size 6264