Sentinel-AI-Beta-Test

Sleeping

Shreyas094 committed on Sep 1, 2024

Commit

996270e

verified ·

1 Parent(s): 5ed09d4

Update app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -541,7 +541,7 @@ def get_response_from_llama(query, model, selected_docs, file_type, num_calls=1,
             # Generate content with streaming enabled
             for response in client.chat_completion(
                 messages=messages,  # Pass messages in the required format
-                max_tokens=2048,  # Reduced to ensure we stay within token limits
                 temperature=temperature,
                 stream=True,
                 top_p=0.9,

             # Generate content with streaming enabled
             for response in client.chat_completion(
                 messages=messages,  # Pass messages in the required format
+                max_tokens=3000,  # Reduced to ensure we stay within token limits
                 temperature=temperature,
                 stream=True,
                 top_p=0.9,