import gradio as gr
import requests
import subprocess
import time

# Start the Ollama server in the background and give it time to come up.
subprocess.Popen(['bash', 'run_ollama.sh'])
time.sleep(10)  # Adjust sleep time based on how long it takes Ollama to start

# Read the server URL written by run_ollama.sh (e.g. http://localhost:11434)
with open('ollama_url.txt', 'r') as file:
    OLLAMA_URL = file.read().strip()

console_output = []


def call_ollama_api(prompt):
    # Ollama's generation endpoint is /api/generate and expects a model name;
    # "llama3" is a placeholder -- use whichever model run_ollama.sh pulls.
    # "stream": False makes Ollama return a single JSON object instead of a
    # streamed response, so response.json() parses cleanly.
    response = requests.post(
        f'{OLLAMA_URL}/api/generate',
        json={"model": "llama3", "prompt": prompt, "stream": False}
    )
    if response.status_code == 200:
        result = response.json()
        # The generated text is returned in the "response" field.
        output = result.get('response', '')
        console_output.append(f"Prompt: {prompt}\nResponse: {output}")
        return output
    else:
        error_message = f"Error: {response.status_code} - {response.text}"
        console_output.append(error_message)
        return error_message


def chat(prompt):
    return call_ollama_api(prompt)


def show_console_output():
    return "\n\n".join(console_output)


iface = gr.Interface(
    fn=chat,
    inputs="text",
    outputs="text",
    title="Ollama Chat",
    description="Chat with the Ollama API and see the responses."
)

console_iface = gr.Interface(
    fn=show_console_output,
    inputs=None,
    outputs="text",
    title="Console Output",
    description="See the console outputs here."
)

gr.TabbedInterface([iface, console_iface], ["Chat", "Console"]).launch()
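
# Optional: instead of the fixed time.sleep(10) above, the startup wait could
# poll the server until it answers. This is a minimal sketch, not part of the
# original script; it assumes the URL in ollama_url.txt is the server's base
# URL (Ollama responds on its root path once it is running).
def wait_for_ollama(url, timeout=60, interval=1):
    """Poll the Ollama base URL until it responds or the timeout expires."""
    deadline = time.time() + timeout
    while time.time() < deadline:
        try:
            if requests.get(url, timeout=2).ok:
                return True
        except requests.exceptions.ConnectionError:
            pass
        time.sleep(interval)
    return False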