File size: 1,796 Bytes
6b85865
22725f7
 
ffdb8d3
3a8762c
6b85865
df074bd
 
 
3a8762c
903d653
 
 
 
df074bd
 
 
 
 
6b85865
df074bd
 
 
ffdb8d3
df074bd
903d653
 
 
 
 
 
df074bd
 
903d653
22725f7
cee6ea9
 
 
22725f7
 
 
 
 
 
 
 
cee6ea9
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
import gradio as gr
import pandas as pd
import numpy as np
import json
import requests

# URLs for the two JSON files
FILE_URL_1 = "https://raw.githubusercontent.com/EleutherAI/lm-evaluation-harness/master/results/llama/llama-30B/llama-30B_mmlu_5-shot.json"
FILE_URL_2 = "https://raw.githubusercontent.com/EleutherAI/lm-evaluation-harness/master/results/llama/llama-13B/llama-13B_mmlu_5-shot.json"

# Derive column names from the URLs
column_name_1 = FILE_URL_1.split('/')[-1].split('_')[0]  # 'llama-30B'
column_name_2 = FILE_URL_2.split('/')[-1].split('_')[0]  # 'llama-13B'

# Load data from both URLs
response1 = requests.get(FILE_URL_1)
data1 = response1.json()
response2 = requests.get(FILE_URL_2)
data2 = response2.json()

# Convert data from both URLs into DataFrames
data1_df = pd.DataFrame(data1['results']).T
data2_df = pd.DataFrame(data2['results']).T

# Rename 'acc' column to respective file names
data1_df = data1_df.rename(columns={'acc': column_name_1})
data2_df = data2_df.rename(columns={'acc': column_name_2})

# Remove 'hendrycksTest-' from the index of both dataframes
data1_df.index = data1_df.index.str.replace('hendrycksTest-', '')
data2_df.index = data2_df.index.str.replace('hendrycksTest-', '')

# Merge the dataframes on index (Here index is the sub-test names)
data = pd.merge(data1_df[column_name_1], data2_df[column_name_2], left_index=True, right_index=True)

# Transpose the dataframe to swap rows and columns
data = data.transpose()

def show_leaderboard():
    # Convert dataframe to html so that it can be displayed properly in Gradio
    return data.to_html()

iface = gr.Interface(fn=show_leaderboard, inputs=[], outputs="html")

# Run the interface. 
# Note: you don't need to use .launch() in Hugging Face Spaces, this is for local testing.
iface.launch()