Spaces:

MrSimple07
/

RuSimulBench_arena

Sleeping

RuSimulBench_arena / app.py

Update app.py

d9f7b70 verified 6 months ago

1.59 kB

	import gradio as gr
	import pandas as pd


	#Models:
	# IlyaGusev/saiga_llama3_8b
	# Vikhrmodels/Vikhr-Nemo-12B-Instruct-R-21-09-24
	# TinyLlama
	# Google-gemma-2-27b-it
	# mistralai/Mistral-Nemo-Instruct-2407
	# Vikhrmodels/Vikhr-Qwen-2.5-0.5b-Instruct


	# Benchmark results stored column-wise. Index i of every list refers to the
	# same model, in this order: LLaMA3, Vikhr, TinyLLaMA, Mistral, Qwen.
	# Each 'Average Score' entry equals the mean of that model's Creativity,
	# Diversity and Relevance scores, rounded to two decimals.
	benchmark_data = {
	    'Model': [
	        'TheBloke/llama3-13b',
	        'Vikhrmodels/Vikhr-Nemo-12B',
	        'TinyLLaMA/TinyLlama-1.1B',
	        'mistralai/Mistral-7B-instruct',
	        'Qwen/Qwen-7B',
	    ],
	    'Creativity Score': [37.75, 46.00, 6.50, 23.75, 8.25],
	    'Diversity Score': [49.50, 52.00, 14.50, 38.50, 15.55],
	    'Relevance Score': [79.25, 87.50, 18.50, 76.75, 34.25],
	    'Average Score': [55.50, 61.83, 13.17, 46.33, 19.35],
	}
	def display_results():
	    """Return the module-level ``benchmark_data`` as a pandas DataFrame.

	    A new DataFrame is built on every call; its columns follow the key
	    order of ``benchmark_data``.
	    """
	    return pd.DataFrame(benchmark_data)

	# Create the interface
	with gr.Blocks() as demo:
	    gr.Markdown("# Model Benchmark Results")

	    # Show the benchmark table. The component is populated from
	    # display_results() so it is not rendered empty, and the headers are
	    # taken from benchmark_data's keys so they always match the real
	    # columns (the previous hard-coded list named a non-existent
	    # "Coherence Score" and omitted "Relevance Score" / "Average Score").
	    output = gr.Dataframe(
	        value=display_results(),
	        headers=list(benchmark_data),
	        interactive=True,
	    )

	# Start the Gradio server only when this file is executed as a script,
	# not when it is imported as a module.
	if __name__ == "__main__":
	    demo.launch()