import gradio as gr from apscheduler.schedulers.background import BackgroundScheduler from huggingface_hub import snapshot_download import pandas as pd from src.about import ( REPRODUCIBILITY_TEXT, INTRODUCTION_TEXT, ABOUT_TEXT, TITLE, ) from src.display.css_html_js import custom_css, custom_js from src.display.utils import ( COLS, ST_BENCHMARK_COLS, AGENTIC_BENCHMARK_COLS, EVAL_COLS, AutoEvalColumn, fields, ) from src.envs import API, EVAL_REQUESTS_PATH, EVAL_RESULTS_PATH, QUEUE_REPO, REPO_ID, RESULTS_REPO, TOKEN from src.populate import get_evaluation_queue_df, get_leaderboard_df, TASK_NAME_INVERSE_MAP from src.submission.submit import add_new_eval def restart_space(): API.restart_space(repo_id=REPO_ID) ### Space initialisation try: print(EVAL_REQUESTS_PATH) snapshot_download( repo_id=QUEUE_REPO, local_dir=EVAL_REQUESTS_PATH, repo_type="dataset", tqdm_class=None, etag_timeout=30, token=TOKEN ) except Exception: restart_space() try: print(EVAL_RESULTS_PATH) snapshot_download( repo_id=RESULTS_REPO, local_dir=EVAL_RESULTS_PATH, repo_type="dataset", tqdm_class=None, etag_timeout=30, token=TOKEN ) except Exception: restart_space() ST_LEADERBOARD_DF = get_leaderboard_df(EVAL_RESULTS_PATH, EVAL_REQUESTS_PATH, COLS, ST_BENCHMARK_COLS) AGENTIC_LEADERBOARD_DF = get_leaderboard_df(EVAL_RESULTS_PATH, EVAL_REQUESTS_PATH, COLS, AGENTIC_BENCHMARK_COLS) ( finished_eval_queue_df, running_eval_queue_df, pending_eval_queue_df, ) = get_evaluation_queue_df(EVAL_REQUESTS_PATH, EVAL_COLS) def bold_max(s): is_max = s == s.max() # Boolean Series: True for the max value(s) return ['font-weight: bold' if v else '' for v in is_max] def init_leaderboard(dataframe, benchmark_type): if dataframe is None or dataframe.empty: raise ValueError("Leaderboard DataFrame is empty or None.") AutoEvalColumnSubset = [c for c in fields(AutoEvalColumn) if ((c.name=="Model") or (TASK_NAME_INVERSE_MAP.get(c.name, dict()).get("type", "")==benchmark_type))] # styler = dataframe.style.apply(bold_max, subset=pd.IndexSlice[:, dataframe.columns[1:]]) return gr.components.Dataframe( value=dataframe, datatype=[c.type for c in AutoEvalColumnSubset], column_widths=["150px" if c.name != "Model" else "250px" for c in AutoEvalColumnSubset], wrap=False, ) black_logo_path = "src/assets/logo-icon-black.png" white_logo_path = "src/assets/logo-icon-white.png" demo = gr.Blocks( css=custom_css, js=custom_js, theme=gr.themes.Default(primary_hue=gr.themes.colors.pink), fill_height=True, fill_width=True, ) with demo: gr.HTML(f"""
Explore Interactive Results & Traces