zx-modelcloud committed on
Commit a44aa3f · verified · 1 Parent(s): 8e69f4c

Upload 10 files

.gitattributes CHANGED
@@ -33,3 +33,4 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text
 *.zip filter=lfs diff=lfs merge=lfs -text
 *.zst filter=lfs diff=lfs merge=lfs -text
 *tfevents* filter=lfs diff=lfs merge=lfs -text
+tokenizer.json filter=lfs diff=lfs merge=lfs -text
added_tokens.json ADDED
@@ -0,0 +1,5 @@
+{
+  "<|endoftext|>": 151643,
+  "<|im_end|>": 151645,
+  "<|im_start|>": 151644
+}
config.json ADDED
@@ -0,0 +1,66 @@
+{
+  "_attn_implementation_autoset": true,
+  "_name_or_path": "/root/.cache/huggingface/hub/models--Qwen--Qwen1.5-1.8B-Chat/snapshots/e482ee3f73c375a627a16fdf66fd0c8279743ca6",
+  "architectures": [
+    "Qwen2ForCausalLM"
+  ],
+  "attention_dropout": 0.0,
+  "bos_token_id": 151643,
+  "eos_token_id": 151645,
+  "hidden_act": "silu",
+  "hidden_size": 2048,
+  "initializer_range": 0.02,
+  "intermediate_size": 5504,
+  "max_position_embeddings": 32768,
+  "max_window_layers": 21,
+  "model_type": "qwen2",
+  "num_attention_heads": 16,
+  "num_hidden_layers": 24,
+  "num_key_value_heads": 16,
+  "quantization_config": {
+    "bits": 4,
+    "checkpoint_format": "gptq",
+    "desc_act": true,
+    "dynamic": {
+      "-:model\\.layers\\.([2-9]\\d*|[1-9]\\d+)\\..*": {},
+      ".*\\.1\\..*": {
+        "bits": 8,
+        "desc_act": false,
+        "group_size": 32
+      },
+      "lm_head": {
+        "bits": 8,
+        "desc_act": false,
+        "group_size": 32,
+        "mse": 2.4,
+        "sym": true
+      }
+    },
+    "group_size": 128,
+    "lm_head": true,
+    "meta": {
+      "damp_auto_increment": 0.0025,
+      "damp_percent": 0.01,
+      "mse": 0.0,
+      "quantizer": [
+        "gptqmodel:1.8.0-dev"
+      ],
+      "static_groups": false,
+      "true_sequential": true,
+      "uri": "https://github.com/modelcloud/gptqmodel"
+    },
+    "pack_dtype": "int32",
+    "quant_method": "gptq",
+    "sym": true
+  },
+  "rms_norm_eps": 1e-06,
+  "rope_scaling": null,
+  "rope_theta": 1000000.0,
+  "sliding_window": null,
+  "tie_word_embeddings": false,
+  "torch_dtype": "bfloat16",
+  "transformers_version": "4.48.2",
+  "use_cache": true,
+  "use_sliding_window": false,
+  "vocab_size": 151936
+}
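Note the `quantization_config.dynamic` block: its keys are regexes matched against module names. The `-:`-prefixed pattern excludes `model.layers.2` through `model.layers.23` from quantization entirely, `.*\.1\..*` re-quantizes layer 1 at 8 bits with group size 32, and `lm_head` gets its own 8-bit recipe (enabled by `"lm_head": true`). A minimal loading sketch; `GPTQModel.load`/`generate` follow the gptqmodel project README, but the repo id is a placeholder and the exact API should be verified against the pinned `gptqmodel:1.8.0-dev`:

```python
# Sketch: load this mixed-precision GPTQ checkpoint with gptqmodel
# (https://github.com/modelcloud/gptqmodel). The per-module "dynamic"
# overrides in config.json are applied automatically at load time.
from gptqmodel import GPTQModel

model = GPTQModel.load("ModelCloud/Qwen1.5-1.8B-Chat-gptq")  # placeholder repo id

result = model.generate("Explain GPTQ quantization in one sentence.")[0]
print(model.tokenizer.decode(result))
```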
merges.txt ADDED
The diff for this file is too large to render. See raw diff
 
model.safetensors ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:26554734410865a68f3771a55ca6b89c2c4321cacc79125336b3392638aa1835
+size 3271099656
quant_log.csv ADDED
@@ -0,0 +1,16 @@
+layer,module,loss,damp,time
+0,self_attn.k_proj,0.38340,0.01000,0.985
+0,self_attn.v_proj,0.00899,0.01000,0.332
+0,self_attn.q_proj,0.52614,0.01000,0.327
+0,self_attn.o_proj,0.00033,0.01000,0.326
+0,mlp.up_proj,1.90171,0.01000,0.348
+0,mlp.gate_proj,1.81718,0.01000,0.366
+0,mlp.down_proj,0.04200,0.01000,0.950
+1,self_attn.k_proj,0.00821,0.01000,0.338
+1,self_attn.v_proj,0.00108,0.01000,0.329
+1,self_attn.q_proj,0.00811,0.01000,0.329
+1,self_attn.o_proj,0.00003,0.01000,0.347
+1,mlp.up_proj,0.00614,0.01000,0.370
+1,mlp.gate_proj,0.00698,0.01000,0.383
+1,mlp.down_proj,0.00040,0.01000,0.944
+24,lm_head,23.30706,0.01000,4.334
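Only layers 0 and 1 (plus `lm_head`, logged as layer 24) appear in the log, consistent with the `dynamic` exclusion regex above that skips layers 2–23. A stdlib-only snippet to rank modules by recorded quantization loss:

```python
import csv

# Rank the quantized modules by GPTQ reconstruction loss, worst first.
with open("quant_log.csv", newline="") as f:
    rows = list(csv.DictReader(f))

for r in sorted(rows, key=lambda r: float(r["loss"]), reverse=True)[:5]:
    print(f"layer {r['layer']:>2}  {r['module']:<18}  loss={r['loss']}  {r['time']}s")
```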
quantize_config.json ADDED
@@ -0,0 +1,36 @@
+{
+  "bits": 4,
+  "dynamic": {
+    "-:model\\.layers\\.([2-9]\\d*|[1-9]\\d+)\\..*": {},
+    ".*\\.1\\..*": {
+      "bits": 8,
+      "desc_act": false,
+      "group_size": 32
+    },
+    "lm_head": {
+      "bits": 8,
+      "group_size": 32,
+      "sym": true,
+      "desc_act": false,
+      "mse": 2.4
+    }
+  },
+  "group_size": 128,
+  "desc_act": true,
+  "sym": true,
+  "lm_head": true,
+  "quant_method": "gptq",
+  "checkpoint_format": "gptq",
+  "pack_dtype": "int32",
+  "meta": {
+    "quantizer": [
+      "gptqmodel:1.8.0-dev"
+    ],
+    "uri": "https://github.com/modelcloud/gptqmodel",
+    "damp_percent": 0.01,
+    "damp_auto_increment": 0.0025,
+    "static_groups": false,
+    "true_sequential": true,
+    "mse": 0.0
+  }
+}
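This file records the recipe GPTQModel used at quantize time; the top-level keys are the defaults, and each `dynamic` entry overrides them for matching modules. A hedged reconstruction of how such a recipe could be declared (`QuantizeConfig`, `quantize`, and `save` follow the project README; signatures may differ in the `1.8.0-dev` build pinned under `meta.quantizer`):

```python
# Hedged sketch of the quantize-time call behind quantize_config.json.
# API names per https://github.com/modelcloud/gptqmodel; verify locally.
from gptqmodel import GPTQModel, QuantizeConfig

quant_config = QuantizeConfig(
    bits=4,
    group_size=128,
    desc_act=True,
    sym=True,
    lm_head=True,  # quantize the output head as well
    dynamic={
        # "-:" prefix means exclude: layers 2..23 stay unquantized.
        r"-:model\.layers\.([2-9]\d*|[1-9]\d+)\..*": {},
        # Layer 1 modules: 8 bits with finer 32-wide groups.
        r".*\.1\..*": {"bits": 8, "desc_act": False, "group_size": 32},
        # lm_head: 8 bits, 32-wide groups, MSE-tuned clipping.
        "lm_head": {"bits": 8, "group_size": 32, "sym": True,
                    "desc_act": False, "mse": 2.4},
    },
)

# A real run needs a few hundred calibration samples, not one.
calibration_dataset = ["gptqmodel is an easy-to-use llm quantization library."]

model = GPTQModel.load("Qwen/Qwen1.5-1.8B-Chat", quant_config)
model.quantize(calibration_dataset)
model.save("Qwen1.5-1.8B-Chat-gptq-4bit")
```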
special_tokens_map.json ADDED
@@ -0,0 +1,14 @@
+{
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>"
+  ],
+  "eos_token": {
+    "content": "<|im_end|>",
+    "lstrip": false,
+    "normalized": false,
+    "rstrip": false,
+    "single_word": false
+  },
+  "pad_token": "<unk>"
+}
tokenizer.json ADDED
@@ -0,0 +1,3 @@
+version https://git-lfs.github.com/spec/v1
+oid sha256:bcfe42da0a4497e8b2b172c1f9f4ec423a46dc12907f4349c55025f670422ba9
+size 11418266
tokenizer_config.json ADDED
@@ -0,0 +1,45 @@
+{
+  "add_prefix_space": false,
+  "added_tokens_decoder": {
+    "151643": {
+      "content": "<|endoftext|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151644": {
+      "content": "<|im_start|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    },
+    "151645": {
+      "content": "<|im_end|>",
+      "lstrip": false,
+      "normalized": false,
+      "rstrip": false,
+      "single_word": false,
+      "special": true
+    }
+  },
+  "additional_special_tokens": [
+    "<|im_start|>",
+    "<|im_end|>"
+  ],
+  "bos_token": null,
+  "chat_template": "{% for message in messages %}{% if loop.first and messages[0]['role'] != 'system' %}{{ '<|im_start|>system\nYou are a helpful assistant.<|im_end|>\n' }}{% endif %}{{'<|im_start|>' + message['role'] + '\n' + message['content'] + '<|im_end|>' + '\n'}}{% endfor %}{% if add_generation_prompt %}{{ '<|im_start|>assistant\n' }}{% endif %}",
+  "clean_up_tokenization_spaces": false,
+  "eos_token": "<|im_end|>",
+  "errors": "replace",
+  "extra_special_tokens": {},
+  "model_max_length": 32768,
+  "pad_token": "<unk>",
+  "split_special_tokens": false,
+  "tokenizer_class": "Qwen2TokenizerFast",
+  "unk_token": null,
+  "_commit_hash": null
+}
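The `chat_template` above is standard ChatML, and it prepends the default `You are a helpful assistant.` system message when the conversation does not start with one. Rendering it goes through the regular Transformers API (the repo id is again a placeholder):

```python
from transformers import AutoTokenizer

tokenizer = AutoTokenizer.from_pretrained("ModelCloud/Qwen1.5-1.8B-Chat-gptq")  # placeholder

messages = [{"role": "user", "content": "What does GPTQ do?"}]
prompt = tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
print(prompt)
# <|im_start|>system
# You are a helpful assistant.<|im_end|>
# <|im_start|>user
# What does GPTQ do?<|im_end|>
# <|im_start|>assistant
```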
vocab.json ADDED
The diff for this file is too large to render. See raw diff