Spaces:

artificialguybr
/

LLAMA-2-70B-FREE-DEMO

Paused

App Files Community

artificialguybr committed on Mar 9, 2024

Commit

b6ff2ee

verified ·

1 Parent(s): a414401

Update app.py

Browse files

Files changed (1) hide show

app.py +3 -8

app.py CHANGED Viewed

@@ -16,12 +16,6 @@ headers = {
 # Base system message
 BASE_SYSTEM_MESSAGE = "I carefully provide accurate, factual, thoughtful, nuanced answers and am brilliant at reasoning."
-def clear_chat():
-    """Clears the chat history and message state."""
-    print("Clearing chat...")
-    chat_history_state.value = []
-    chatbot.textbox.value = ""
 def call_nvidia_api(history, system_message, max_tokens, temperature, top_p):
     """Calls the NVIDIA API to generate a response."""
     messages = [{"role": "system", "content": system_message}]
@@ -34,7 +28,7 @@ def call_nvidia_api(history, system_message, max_tokens, temperature, top_p):
         "max_tokens": max_tokens,
         "stream": False
     }
-    print(f"Payload enviado: {payload}")
     session = requests.Session()
     response = session.post(INVOKE_URL, headers=headers, json=payload)
     while response.status_code == 202:
@@ -43,7 +37,7 @@ def call_nvidia_api(history, system_message, max_tokens, temperature, top_p):
         response = session.get(fetch_url, headers=headers)
         response.raise_for_status()
     response_body = response.json()
-    print(f"Payload recebido: {response_body}")
     if response_body.get("choices"):
         assistant_message = response_body["choices"][0]["message"]["content"]
         return assistant_message
@@ -70,6 +64,7 @@ system_msg = gr.Textbox(BASE_SYSTEM_MESSAGE, label="System Message", placeholder
 max_tokens = gr.Slider(20, 1024, label="Max Tokens", step=20, value=1024)
 temperature = gr.Slider(0.0, 1.0, label="Temperature", step=0.1, value=0.2)
 top_p = gr.Slider(0.0, 1.0, label="Top P", step=0.05, value=0.7)
 with gr.Blocks() as demo:
     chat_history_state = gr.State([])
     chatbot = gr.ChatInterface(

 # Base system message
 BASE_SYSTEM_MESSAGE = "I carefully provide accurate, factual, thoughtful, nuanced answers and am brilliant at reasoning."
 def call_nvidia_api(history, system_message, max_tokens, temperature, top_p):
     """Calls the NVIDIA API to generate a response."""
     messages = [{"role": "system", "content": system_message}]
         "max_tokens": max_tokens,
         "stream": False
     }
+    print(f"Payload enviado: {json.dumps(payload, indent=2)}")
     session = requests.Session()
     response = session.post(INVOKE_URL, headers=headers, json=payload)
     while response.status_code == 202:
         response = session.get(fetch_url, headers=headers)
         response.raise_for_status()
     response_body = response.json()
+    print(f"Payload recebido: {json.dumps(response_body, indent=2)}")
     if response_body.get("choices"):
         assistant_message = response_body["choices"][0]["message"]["content"]
         return assistant_message
 max_tokens = gr.Slider(20, 1024, label="Max Tokens", step=20, value=1024)
 temperature = gr.Slider(0.0, 1.0, label="Temperature", step=0.1, value=0.2)
 top_p = gr.Slider(0.0, 1.0, label="Top P", step=0.05, value=0.7)
 with gr.Blocks() as demo:
     chat_history_state = gr.State([])
     chatbot = gr.ChatInterface(