|
|
""" |
|
|
MUSEval Leaderboard - Local Demo |
|
|
Imports the interface builder from app.py to ensure identical functionality, then launches it as a local demo leaderboard.
|
|
""" |
|
|
|
|
|
import gradio as gr |
|
|
import pandas as pd |
|
|
import json |
|
|
import os |
|
|
from datetime import datetime |
|
|
from typing import Dict, List, Any |
|
|
import numpy as np |
|
|
|
|
|
|
|
|
from src.load_results import ( |
|
|
load_results_with_metadata, |
|
|
create_overall_table, |
|
|
get_filter_options, |
|
|
get_model_metadata, |
|
|
create_model_metadata_display, |
|
|
get_overall_summary |
|
|
) |
|
|
|
|
|
|
|
|
from app import create_leaderboard_interface |
|
|
|
|
|
|
|
|
# Build the interface once at import time so that `demo` exists as a
# module-level name whether this file is run as a script or imported.
demo = create_leaderboard_interface()


if __name__ == "__main__":
    # Script entry point: report how many results are available, then launch
    # the interface that was already built above.
    print("🎨 MUSEval Leaderboard Local Demo")
    print("=" * 50)

    try:
        print("📊 Loading data...")
        # The results are loaded here only to report their count; they are
        # not passed to the interface.
        results = load_results_with_metadata()
        print(f"✅ Loaded {len(results)} results")

        # NOTE: `demo` was constructed at module level, so this message is
        # purely informational.
        print("🏗️ Creating interface...")
        print("🚀 Starting local leaderboard...")
        print("🌐 Access at: http://localhost:7860")
        print("🛑 Press Ctrl+C to stop")

        demo.launch(
            # 0.0.0.0 binds every network interface, so the app is reachable
            # from other hosts as well as through the localhost URL above.
            server_name="0.0.0.0",
            server_port=7860,
            share=False,
            show_error=True,
            quiet=False,
        )
    except Exception as e:
        # Top-level boundary: show the failure in full, then exit with a
        # non-zero status so callers (shells, CI) can detect that start-up
        # did not succeed.
        print(f"❌ Error: {e}")
        import traceback

        traceback.print_exc()
        raise SystemExit(1)
|
|
|