wejoncy committed on
Commit
fed455b
·
1 Parent(s): a887be4

update config

Browse files
Files changed (1) hide show
  1. config.json +19 -18
config.json CHANGED
@@ -22,7 +22,21 @@
22
  "num_hidden_layers": 126,
23
  "num_key_value_heads": 8,
24
  "pretraining_tp": 1,
25
- "quant_config": {
 
 
 
 
 
 
 
 
 
 
 
 
 
 
26
  "model.layers.0.mlp.down_proj": {
27
  "bias": null,
28
  "enable_norm": true,
@@ -21190,20 +21204,7 @@
21190
  -1,
21191
  8
21192
  ]
21193
- }
21194
- },
21195
- "rms_norm_eps": 1e-05,
21196
- "rope_scaling": {
21197
- "factor": 8.0,
21198
- "high_freq_factor": 4.0,
21199
- "low_freq_factor": 1.0,
21200
- "original_max_position_embeddings": 8192,
21201
- "rope_type": "llama3"
21202
- },
21203
- "rope_theta": 500000.0,
21204
- "tie_word_embeddings": false,
21205
- "torch_dtype": "bfloat16",
21206
- "transformers_version": "4.45.1",
21207
- "use_cache": true,
21208
- "vocab_size": 128256
21209
- }
 
22
  "num_hidden_layers": 126,
23
  "num_key_value_heads": 8,
24
  "pretraining_tp": 1,
25
+ "rms_norm_eps": 1e-05,
26
+ "rope_scaling": {
27
+ "factor": 8.0,
28
+ "high_freq_factor": 4.0,
29
+ "low_freq_factor": 1.0,
30
+ "original_max_position_embeddings": 8192,
31
+ "rope_type": "llama3"
32
+ },
33
+ "rope_theta": 500000.0,
34
+ "tie_word_embeddings": false,
35
+ "torch_dtype": "bfloat16",
36
+ "transformers_version": "4.45.1",
37
+ "use_cache": true,
38
+ "vocab_size": 128256,
39
+ "quantization_config": {
40
  "model.layers.0.mlp.down_proj": {
41
  "bias": null,
42
  "enable_norm": true,
 
21204
  -1,
21205
  8
21206
  ]
21207
+ },
21208
+ "quant_method": "vptq"
21209
+ }
21210
+ }