Transformers
Inference Endpoints
qqc1989 committed on
Commit
738a450
·
verified ·
1 Parent(s): 8b50404

Upload 2 files

Browse files
Files changed (3) hide show
  1. .gitattributes +1 -0
  2. main_prefill_postprocess +3 -0
  3. post_config.json +14 -0
.gitattributes CHANGED
@@ -63,3 +63,4 @@ deepseek-r1-7b-ax650/qwen2_p128_l25_together.axmodel filter=lfs diff=lfs merge=l
63
  deepseek-r1-7b-ax650/qwen2_p128_l26_together.axmodel filter=lfs diff=lfs merge=lfs -text
64
  deepseek-r1-7b-ax650/qwen2_p128_l27_together.axmodel filter=lfs diff=lfs merge=lfs -text
65
  deepseek-r1-7b-ax650/qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
 
 
63
  deepseek-r1-7b-ax650/qwen2_p128_l26_together.axmodel filter=lfs diff=lfs merge=lfs -text
64
  deepseek-r1-7b-ax650/qwen2_p128_l27_together.axmodel filter=lfs diff=lfs merge=lfs -text
65
  deepseek-r1-7b-ax650/qwen2_post.axmodel filter=lfs diff=lfs merge=lfs -text
66
+ main_prefill_postprocess filter=lfs diff=lfs merge=lfs -text
main_prefill_postprocess ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:7661c63bcc2d2f6ca557ec81cad9371b1a196b0f9f171b6b91069e87a9ae9619
3
+ size 3055912
post_config.json ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "enable_temperature" : true,
3
+ "temperature" : 0.9,
4
+
5
+ "enable_repetition_penalty" : false,
6
+ "repetition_penalty" : 1.2,
7
+ "penalty_window" : 20,
8
+
9
+ "enable_top_p_sampling" : false,
10
+ "top_p" : 0.8,
11
+
12
+ "enable_top_k_sampling" : true,
13
+ "top_k" : 10
14
+ }