richardkimsm89 commited on
Commit
12fb4a0
·
verified ·
1 Parent(s): 8dbe12b

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +55 -1
app.py CHANGED
@@ -3,6 +3,61 @@
3
  import gradio as gr
4
  from huggingface_hub import InferenceClient
5
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6
  model = "google/gemma-2-27b-it"
7
  #model = "google/gemma-2-9b-it"
8
  #model = "google/gemma-2-2b-it"
@@ -58,7 +113,6 @@ app = gr.ChatInterface(
58
  if __name__ == "__main__":
59
  app.launch()
60
 
61
- """
62
  # Pipeline
63
 
64
  import gradio as gr
 
3
  import gradio as gr
4
  from huggingface_hub import InferenceClient
5
 
6
# Model served through the Hugging Face Inference API, and the client bound to it.
model = "google/gemma-2-27b-it"
client = InferenceClient(model)
8
+
9
def fn_text(
    prompt,
    history,
    #system_prompt,
    max_tokens,
    temperature,
    top_p,
):
    """Stream a chat completion for *prompt* given the running *history*.

    Parameters
    ----------
    prompt : str
        The user's newest message.
    history : list[dict]
        Prior turns in OpenAI ``{"role", "content"}`` message format
        (Gradio ``type="messages"`` convention — assumed; confirm against the
        ChatInterface wiring).
    max_tokens, temperature, top_p :
        Sampling controls forwarded verbatim to the inference endpoint.

    Yields
    ------
    str
        The cumulative assistant response so far, one yield per stream chunk.
    """
    # Build the message list without mutating the history object Gradio owns;
    # the original appended in place, which leaks the user turn back into
    # Gradio's copy of the conversation state.
    messages = history + [{"role": "user", "content": prompt}]

    stream = client.chat.completions.create(
        model=model,
        messages=messages,
        max_tokens=max_tokens,
        temperature=temperature,
        top_p=top_p,
        stream=True,
    )

    response = ""
    for chunk in stream:
        # Some providers emit keep-alive chunks with no choices; skip them.
        if not chunk.choices:
            continue
        # delta.content is None on role/stop chunks — coalesce to "".
        response += chunk.choices[0].delta.content or ""
        yield response
33
+
34
# Chat tab: streams completions from fn_text; sliders expose the sampling knobs.
app_text = gr.ChatInterface(
    fn=fn_text,
    type="messages",
    additional_inputs=[
        #gr.Textbox(value="You are a helpful assistant.", label="System Prompt"),
        gr.Slider(minimum=1, maximum=2048, value=512, step=1, label="Max Tokens"),
        gr.Slider(minimum=0.1, maximum=4.0, value=0.7, step=0.1, label="Temperature"),
        gr.Slider(minimum=0.1, maximum=1.0, value=0.95, step=0.05, label="Top-P"),
    ],
    title="Google Gemma",
    description=model,
)
46
+
47
# Bind `app` to the interface itself, not to the return value of .launch()
# as before — that binding made the name useless for a later
# `if __name__ == "__main__": app.launch()` guard (which had to be commented
# out). Launching at module import is kept, as Hugging Face Spaces expects it.
app = gr.TabbedInterface(
    [app_text],
    ["Text"],
)
app.launch()
54
+
55
+ """
56
+ # Inference
57
+
58
+ import gradio as gr
59
+ from huggingface_hub import InferenceClient
60
+
61
  model = "google/gemma-2-27b-it"
62
  #model = "google/gemma-2-9b-it"
63
  #model = "google/gemma-2-2b-it"
 
113
  if __name__ == "__main__":
114
  app.launch()
115
 
 
116
  # Pipeline
117
 
118
  import gradio as gr