Spaces:

richardskimco
/

google-gemma

Sleeping

richardkimsm89 committed on Dec 18, 2024

Commit

4c8c277

verified ·

1 Parent(s): 18160e9

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -15,7 +15,7 @@ app = gr.load(
     ]
 ).launch()
 """
 # Pipeline
 import gradio as gr
@@ -39,4 +39,25 @@ app = gr.Interface(
     examples = [
         ["Hello, World."]
     ]
-).launch()

     ]
 ).launch()
 """
+"""
 # Pipeline
 import gradio as gr
     examples = [
         ["Hello, World."]
     ]
+).launch()
+"""
+from huggingface_hub import InferenceClient
+#client = InferenceClient(api_key="YOUR_HF_TOKEN")
+messages = [
+	{ "role": "user", "content": "Tell me a story" }
+]
+stream = client.chat.completions.create(
+    model="google/gemma-2-2b-it",
+	messages=messages,
+	temperature=0.5,
+	max_tokens=2048,
+	top_p=0.7,
+	stream=True
+)
+for chunk in stream:
+    print(chunk.choices[0].delta.content)