satreysa committed on
Commit
bc2d4b5
·
verified ·
1 Parent(s): d03d57f

Update genai_config.json

Browse files
Files changed (1) hide show
  1. genai_config.json +51 -51
genai_config.json CHANGED
@@ -1,52 +1,52 @@
1
- {
2
- "model": {
3
- "bos_token_id": 1,
4
- "context_length": 8192,
5
- "decoder": {
6
- "session_options": {
7
- "log_id": "onnxruntime-genai",
8
- "custom_ops_library": "//path//to//onnx_custom_ops.dll",
9
- "external_data_file": "chatglm3_v4_npu_jit.pb.bin",
10
- "custom_allocator": "shared_d3d_xrt",
11
- "provider_options": []
12
- },
13
- "filename": "chatglm3_v4_npu_jit.onnx",
14
- "head_size": 128,
15
- "hidden_size": 4096,
16
- "inputs": {
17
- "input_ids": "input_ids",
18
- "attention_mask": "attention_mask",
19
- "past_key_names": "past_key_values.%d.key",
20
- "past_value_names": "past_key_values.%d.value"
21
- },
22
- "outputs": {
23
- "logits": "logits",
24
- "present_key_names": "present.%d.key",
25
- "present_value_names": "present.%d.value"
26
- },
27
- "num_attention_heads": 32,
28
- "num_hidden_layers": 28,
29
- "num_key_value_heads": 2
30
- },
31
- "eos_token_id": 2,
32
- "pad_token_id": 0,
33
- "type": "chatglm",
34
- "vocab_size": 65024
35
- },
36
- "search": {
37
- "diversity_penalty": 0.0,
38
- "do_sample": false,
39
- "early_stopping": true,
40
- "length_penalty": 1.0,
41
- "max_length": 8192,
42
- "min_length": 0,
43
- "no_repeat_ngram_size": 0,
44
- "num_beams": 1,
45
- "num_return_sequences": 1,
46
- "past_present_share_buffer": true,
47
- "repetition_penalty": 1.0,
48
- "temperature": 1.0,
49
- "top_k": 1,
50
- "top_p": 1.0
51
- }
52
  }
 
1
+ {
2
+ "model": {
3
+ "bos_token_id": 1,
4
+ "context_length": 8192,
5
+ "decoder": {
6
+ "session_options": {
7
+ "log_id": "onnxruntime-genai",
8
+ "custom_ops_library": "onnx_custom_ops.dll",
9
+ "external_data_file": "chatglm3_v4_npu_jit.pb.bin",
10
+ "custom_allocator": "shared_d3d_xrt",
11
+ "provider_options": []
12
+ },
13
+ "filename": "chatglm3_v4_npu_jit.onnx",
14
+ "head_size": 128,
15
+ "hidden_size": 4096,
16
+ "inputs": {
17
+ "input_ids": "input_ids",
18
+ "attention_mask": "attention_mask",
19
+ "past_key_names": "past_key_values.%d.key",
20
+ "past_value_names": "past_key_values.%d.value"
21
+ },
22
+ "outputs": {
23
+ "logits": "logits",
24
+ "present_key_names": "present.%d.key",
25
+ "present_value_names": "present.%d.value"
26
+ },
27
+ "num_attention_heads": 32,
28
+ "num_hidden_layers": 28,
29
+ "num_key_value_heads": 2
30
+ },
31
+ "eos_token_id": 2,
32
+ "pad_token_id": 0,
33
+ "type": "chatglm",
34
+ "vocab_size": 65024
35
+ },
36
+ "search": {
37
+ "diversity_penalty": 0.0,
38
+ "do_sample": false,
39
+ "early_stopping": true,
40
+ "length_penalty": 1.0,
41
+ "max_length": 8192,
42
+ "min_length": 0,
43
+ "no_repeat_ngram_size": 0,
44
+ "num_beams": 1,
45
+ "num_return_sequences": 1,
46
+ "past_present_share_buffer": true,
47
+ "repetition_penalty": 1.0,
48
+ "temperature": 1.0,
49
+ "top_k": 1,
50
+ "top_p": 1.0
51
+ }
52
  }