minpeter committed on
Commit
6d91d45
·
verified ·
1 Parent(s): c03e3f8

Training in progress, step 79

Browse files
Files changed (3) hide show
  1. config.json +2 -2
  2. model.safetensors +2 -2
  3. training_args.bin +1 -1
config.json CHANGED
@@ -6,7 +6,7 @@
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 32001,
9
- "head_dim": 32,
10
  "hidden_act": "silu",
11
  "hidden_size": 256,
12
  "initializer_range": 0.02,
@@ -14,7 +14,7 @@
14
  "max_position_embeddings": 8192,
15
  "mlp_bias": false,
16
  "model_type": "llama",
17
- "num_attention_heads": 8,
18
  "num_hidden_layers": 12,
19
  "num_key_value_heads": 2,
20
  "pad_token_id": 32003,
 
6
  "attention_dropout": 0.0,
7
  "bos_token_id": 1,
8
  "eos_token_id": 32001,
9
+ "head_dim": 64,
10
  "hidden_act": "silu",
11
  "hidden_size": 256,
12
  "initializer_range": 0.02,
 
14
  "max_position_embeddings": 8192,
15
  "mlp_bias": false,
16
  "model_type": "llama",
17
+ "num_attention_heads": 4,
18
  "num_hidden_layers": 12,
19
  "num_key_value_heads": 2,
20
  "pad_token_id": 32003,
model.safetensors CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:ff1d14cd1d5f44e9b8dfe13e9d202139047e63db16a82a2fb9b48be1b8ea1af0
3
- size 39224640
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0ee1c8d83e940e24cfa7591f45f58216088eb308d1e2e847923734ea2eff34aa
3
+ size 40011096
training_args.bin CHANGED
@@ -1,3 +1,3 @@
1
  version https://git-lfs.github.com/spec/v1
2
- oid sha256:459adac6056a53d252a2866812c7720bb793bdfbda1dedc840d1c974a68aa043
3
  size 5777
 
1
  version https://git-lfs.github.com/spec/v1
2
+ oid sha256:afdf64f4d775a1ccf498b20cd081ad67c4be050cb9d17c39bf8ce8997b041645
3
  size 5777