Update app.py
app.py CHANGED
@@ -10,7 +10,6 @@ if not hf_token:
 # Initialize InferenceClient
 client = InferenceClient(model="huihui-ai/Llama-3.3-70B-Instruct-abliterated", token=hf_token)
 
-
 def respond(
     message,
     history: list[tuple[str, str]],
@@ -33,9 +32,10 @@ def respond(
     response = ""
 
     try:
+        # Use 'messages' instead of 'inputs'
         for message in client.chat_completion(
             model="huihui-ai/Llama-3.3-70B-Instruct-abliterated",
-
+            messages=messages,  # Correct argument
             parameters={
                 "max_tokens": max_tokens,
                 "temperature": temperature,
@@ -47,10 +47,8 @@ def respond(
                 response += token
                 yield response
     except Exception as e:
-            yield f"Error: {str(e)}"
-
+        yield f"Error: {str(e)}"
 
-# Gradio Chat Interface
 demo = gr.ChatInterface(
     respond,
     additional_inputs=[
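For context, the corrected call might look like the sketch below. This is a minimal sketch, not the Space's actual code: it assumes the app reads HF_TOKEN from the environment, that the ChatInterface supplies system_message, max_tokens, and temperature as additional inputs, and that messages is built from the tuple-style history. Note also that huggingface_hub's InferenceClient.chat_completion takes max_tokens and temperature as direct keyword arguments rather than a parameters dict, so the parameters={...} block kept by this commit would still need to be flattened:

import os

import gradio as gr
from huggingface_hub import InferenceClient

# Assumption: the token is exposed to the Space as the HF_TOKEN secret
hf_token = os.environ.get("HF_TOKEN")
client = InferenceClient(model="huihui-ai/Llama-3.3-70B-Instruct-abliterated", token=hf_token)

def respond(message, history: list[tuple[str, str]], system_message, max_tokens, temperature):
    # Flatten the Gradio tuple-style history into OpenAI-style chat messages
    messages = [{"role": "system", "content": system_message}]
    for user_msg, bot_msg in history:
        if user_msg:
            messages.append({"role": "user", "content": user_msg})
        if bot_msg:
            messages.append({"role": "assistant", "content": bot_msg})
    messages.append({"role": "user", "content": message})

    response = ""
    try:
        # Sampling options are direct keyword arguments, not a nested 'parameters' dict
        for chunk in client.chat_completion(
            messages=messages,
            max_tokens=max_tokens,
            temperature=temperature,
            stream=True,
        ):
            # Streamed chunks carry the new text in choices[0].delta.content
            token = chunk.choices[0].delta.content or ""
            response += token
            yield response
    except Exception as e:
        yield f"Error: {str(e)}"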