MadsGalsgaard committed on
Commit fa89eeb · verified · 1 Parent(s): 9ca7283

Update app.py
Files changed (1)
1. app.py  +65 -17
app.py CHANGED
@@ -7,7 +7,62 @@ For more information on `huggingface_hub` Inference API support, please check th
 """
 client = InferenceClient("meta-llama/Meta-Llama-3-8B",token=os.getenv('HF_API_TOKEN'))
 
-## None type
+# ## None type
+# def respond(
+#     message: str,
+#     history: list[tuple[str, str]],  # This will not be used
+#     system_message: str,
+#     max_tokens: int,
+#     temperature: float,
+#     top_p: float,
+# ):
+#     messages = [{"role": "system", "content": system_message}]
+
+#     # Append only the latest user message
+#     messages.append({"role": "user", "content": message})
+
+#     response = ""
+
+#     try:
+#         # Generate response from the model
+#         for message in client.chat_completion(
+#             messages,
+#             max_tokens=max_tokens,
+#             stream=True,
+#             temperature=temperature,
+#             top_p=top_p,
+#         ):
+#             if message.choices[0].delta.content is not None:
+#                 token = message.choices[0].delta.content
+#                 response += token
+#             yield response
+#     except Exception as e:
+#         yield f"An error occurred: {e}"
+
+# """
+# For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
+# """
+# demo = gr.ChatInterface(
+#     respond,
+#     additional_inputs=[
+#         gr.Textbox(value="You are a friendly Chatbot.", label="System message"),
+#         gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max new tokens"),
+#         gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
+#         gr.Slider(
+#             minimum=0.1,
+#             maximum=1.0,
+#             value=0.95,
+#             step=0.05,
+#             label="Top-p (nucleus sampling)",
+#         ),
+#     ],
+# )
+
+# if __name__ == "__main__":
+#     demo.launch()
+
+
+####19
 def respond(
     message: str,
     history: list[tuple[str, str]],  # This will not be used
@@ -16,32 +71,26 @@ def respond(
     temperature: float,
     top_p: float,
 ):
-    messages = [{"role": "system", "content": system_message}]
-
-    # Append only the latest user message
-    messages.append({"role": "user", "content": message})
+    # Combine the system message and user input into a single prompt
+    prompt = f"{system_message}\n{message}"
 
     response = ""
 
     try:
-        # Generate response from the model
-        for message in client.chat_completion(
-            messages,
-            max_tokens=max_tokens,
-            stream=True,
+        # Generate response from the model using text generation method
+        for message in client.text_generation(
+            prompt=prompt,
+            max_new_tokens=max_tokens,
             temperature=temperature,
             top_p=top_p,
         ):
-            if message.choices[0].delta.content is not None:
-                token = message.choices[0].delta.content
-                response += token
+            if message.token is not None:
+                response += message.token
             yield response
     except Exception as e:
         yield f"An error occurred: {e}"
 
-"""
-For information on how to customize the ChatInterface, peruse the gradio docs: https://www.gradio.app/docs/chatinterface
-"""
+    # Define the Gradio interface
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
@@ -61,7 +110,6 @@ demo = gr.ChatInterface(
 if __name__ == "__main__":
     demo.launch()
 
-
 # import os
 # import gradio as gr
 # from huggingface_hub import InferenceClient
 
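Note on the new streaming loop: `InferenceClient.text_generation` only yields incrementally when called with `stream=True`. As committed, the call returns a single string, so the `for` loop iterates over characters and `message.token` raises an `AttributeError`, which the `except` branch then surfaces as the chat reply. A minimal working sketch of the intended streaming variant, reusing the module-level `client` and assuming `huggingface_hub`'s streaming API with `details=False`, where each yielded item is a plain string token:

def respond(
    message: str,
    history: list[tuple[str, str]],  # This will not be used
    system_message: str,
    max_tokens: int,
    temperature: float,
    top_p: float,
):
    # Combine the system message and user input into a single prompt
    prompt = f"{system_message}\n{message}"
    response = ""
    try:
        # stream=True makes text_generation yield tokens as they are generated
        for token in client.text_generation(
            prompt=prompt,
            max_new_tokens=max_tokens,
            stream=True,
            temperature=temperature,
            top_p=top_p,
        ):
            response += token  # each item is a str when details=False
            yield response
    except Exception as e:
        yield f"An error occurred: {e}"

With `details=True` instead, each yielded item is a stream-details object whose token text lives at `message.token.text`, which is the shape the committed `message.token` access appears to expect.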