Sakalti committed on
Commit
58f08c5
·
verified ·
1 Parent(s): b9a7371

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +12 -10
app.py CHANGED
@@ -1,11 +1,11 @@
1
  import gradio as gr
2
  from huggingface_hub import InferenceClient
 
3
 
4
  """
5
- For more information on `huggingface_hub` Inference API support, please check the docs: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
6
  """
7
- client = InferenceClient("Sakalti/qwen2.5")
8
-
9
 
10
  def respond(
11
  message,
@@ -26,34 +26,36 @@ def respond(
26
  messages.append({"role": "user", "content": message})
27
 
28
  # ストリーミングを無効にして、単一の応答を取得
 
29
  response = client.chat_completion(
30
  messages,
31
  max_tokens=max_tokens,
32
  temperature=temperature,
33
  top_p=top_p,
34
  )
 
35
 
36
- return response.choices[0].message.content
37
 
38
  """
39
- For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
40
  """
41
  demo = gr.ChatInterface(
42
  respond,
43
  additional_inputs=[
44
- gr.Textbox(value="ユーザーの質問や依頼にのみ答えてください。ポジティブに答えてください", label="System message"),
45
- gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
46
- gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
47
  gr.Slider(
48
  minimum=0.1,
49
  maximum=1.0,
50
  value=0.95,
51
  step=0.05,
52
- label="Top-p (nucleus sampling)",
53
  ),
54
  ],
 
55
  )
56
 
57
-
58
  if __name__ == "__main__":
59
  demo.launch()
 
1
  import gradio as gr
2
  from huggingface_hub import InferenceClient
3
+ import time
4
 
5
  """
6
+ `huggingface_hub` の推論 API サポートについての詳細は、ドキュメントを確認してください: https://huggingface.co/docs/huggingface_hub/v0.22.2/en/guides/inference
7
  """
8
+ client = InferenceClient("Qwen/Qwen2.5-3b-Instruct")
 
9
 
10
  def respond(
11
  message,
 
26
  messages.append({"role": "user", "content": message})
27
 
28
  # ストリーミングを無効にして、単一の応答を取得
29
+ start_time = time.time() # 予測時間計測開始
30
  response = client.chat_completion(
31
  messages,
32
  max_tokens=max_tokens,
33
  temperature=temperature,
34
  top_p=top_p,
35
  )
36
+ elapsed_time = time.time() - start_time # 予測時間計測終了
37
 
38
+ return response.choices[0].message.content, f"予測時間: {elapsed_time:.2f}秒"
39
 
40
  """
41
+ ChatInterfaceのカスタマイズ方法については、gradioのドキュメントを確認してください: https://www.gradio.app/docs/chatinterface
42
  """
43
  demo = gr.ChatInterface(
44
  respond,
45
  additional_inputs=[
46
+ gr.Textbox(value="ユーザーの質問や依頼にのみ答えてください。ポジティブに答えてください", label="システムメッセージ"),
47
+ gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="最大新規トークン"),
48
+ gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="温度"),
49
  gr.Slider(
50
  minimum=0.1,
51
  maximum=1.0,
52
  value=0.95,
53
  step=0.05,
54
+ label="Top-p (核サンプリング)",
55
  ),
56
  ],
57
+ theme=gr.themes.BaseTheme(primary_color="#212121") # 背景色を設定
58
  )
59
 
 
60
  if __name__ == "__main__":
61
  demo.launch()