Spaces:
Sleeping
Sleeping
import gradio as gr | |
import pandas as pd | |
#Models: | |
# IlyaGusev/saiga_llama3_8b | |
# Vikhrmodels/Vikhr-Nemo-12B-Instruct-R-21-09-24 | |
# TinyLlama | |
# Google-gemma-2-27b-it | |
# mistralai/Mistral-Nemo-Instruct-2407 | |
# Vikhrmodels/Vikhr-Qwen-2.5-0.5b-Instruct | |
benchmark_data = { | |
'Model': [ | |
'TheBloke/llama3-13b', # LLaMA3 | |
'Vikhrmodels/Vikhr-Nemo-12B', # Vikhr | |
'TinyLLaMA/TinyLlama-1.1B', # TinyLLaMA | |
'mistralai/Mistral-7B-instruct', # Mistral | |
'Qwen/Qwen-7B' # Qwen | |
], | |
'Creativity Score': [ | |
37.75, # LLaMA3 | |
46.00, # Vikhr | |
6.50, # TinyLLaMA | |
23.75, # Mistral | |
8.25 # Qwen | |
], | |
'Diversity Score': [ | |
49.50, # LLaMA3 | |
52.00, # Vikhr | |
14.50, # TinyLLaMA | |
38.50, # Mistral | |
15.55 # Qwen | |
], | |
'Relevance Score': [ | |
79.25, # LLaMA3 | |
87.50, # Vikhr | |
18.50, # TinyLLaMA | |
76.75, # Mistral | |
34.25 # Qwen | |
], | |
'Average Score': [ | |
55.50, # LLaMA3 | |
61.83, # Vikhr | |
13.17, # TinyLLaMA | |
46.33, # Mistral | |
19.35 # Qwen | |
] | |
} | |
def display_results(): | |
df = pd.DataFrame(benchmark_data) | |
return df | |
# Create the interface | |
with gr.Blocks() as demo: | |
gr.Markdown("# Model Benchmark Results") | |
# Display results in a DataFrame | |
output = gr.Dataframe( | |
headers=["Model", "Creativity Score", "Coherence Score", "Diversity Score"], | |
interactive=True | |
) | |
if __name__ == "__main__": | |
demo.launch() |