Spaces:
Running
Running
| from dataclasses import dataclass, make_dataclass | |
| import pandas as pd | |
| def fields(raw_class): | |
| return [v for k, v in raw_class.__dict__.items() if k[:2] != "__" and k[-2:] != "__"] | |
| # These classes are for user facing column names, | |
| # to avoid having to change them all around the code | |
| # when a modif is needed | |
| class ColumnContent: | |
| name: str | |
| type: str | |
| displayed_by_default: bool | |
| hidden: bool = False | |
| never_hidden: bool = False | |
| ## Leaderboard columns | |
| auto_eval_column_dict = [] | |
| # 'Model', 'NCR', 'HTU', 'TCU', 'NED', 'PVI', 'KQA', 'TII', 'MTA', 'BRI', 'Overall', 'Agentic Framework'] | |
| # Init | |
| auto_eval_column_dict.append( | |
| ["model", ColumnContent, ColumnContent("Model", "markdown", True, never_hidden=True)] | |
| ) | |
| # Agentic Framework | |
| auto_eval_column_dict.append( | |
| ["agentic_framework", ColumnContent, ColumnContent("Agentic Framework", "markdown", True, never_hidden=True)] | |
| ) | |
| # NCR | |
| auto_eval_column_dict.append( | |
| ["ncr", ColumnContent, ColumnContent("NCR", "markdown", True)] | |
| ) | |
| # HTU | |
| auto_eval_column_dict.append( | |
| ["htu", ColumnContent, ColumnContent("HTU", "markdown", True)] | |
| ) | |
| # TCU | |
| auto_eval_column_dict.append( | |
| ["tcu", ColumnContent, ColumnContent("TCU", "markdown", True)] | |
| ) | |
| # NED | |
| auto_eval_column_dict.append( | |
| ["ned", ColumnContent, ColumnContent("NED", "markdown", True)] | |
| ) | |
| # PVI | |
| auto_eval_column_dict.append( | |
| ["pvi", ColumnContent, ColumnContent("PVI", "markdown", True)] | |
| ) | |
| # KQA | |
| auto_eval_column_dict.append( | |
| ["kqa", ColumnContent, ColumnContent("KQA", "markdown", True)] | |
| ) | |
| # TII | |
| auto_eval_column_dict.append( | |
| ["tii", ColumnContent, ColumnContent("TII", "markdown", True)] | |
| ) | |
| # MTA | |
| auto_eval_column_dict.append( | |
| ["mta", ColumnContent, ColumnContent("MTA", "markdown", True)] | |
| ) | |
| # BRI | |
| auto_eval_column_dict.append( | |
| ["bri", ColumnContent, ColumnContent("BRI", "markdown", True)] | |
| ) | |
| # Overall | |
| auto_eval_column_dict.append( | |
| ["overall", ColumnContent, ColumnContent("Overall ⬆️", "markdown", True, never_hidden=True)] | |
| ) | |
| # Create AutoEvalColumn class | |
| AutoEvalColumn = make_dataclass("AutoEvalColumn", auto_eval_column_dict) | |
| # Column selection | |
| COLS = [c.name for c in fields(AutoEvalColumn) if not c.hidden] | |
| TYPES = [c.type for c in fields(AutoEvalColumn) if not c.hidden] | |
| COLS_LITE = [c.name for c in fields(AutoEvalColumn) if c.displayed_by_default and not c.hidden] | |
| TYPES_LITE = [c.type for c in fields(AutoEvalColumn) if c.displayed_by_default and not c.hidden] | |
| # BENCHMARK_COLS = [t.value.col_name for t in Tasks] | |
| NUMERIC_INTERVALS = { | |
| "?": pd.Interval(-1, 0, closed="right"), | |
| "~1.5": pd.Interval(0, 2, closed="right"), | |
| "~3": pd.Interval(2, 4, closed="right"), | |
| "~7": pd.Interval(4, 9, closed="right"), | |
| "~13": pd.Interval(9, 20, closed="right"), | |
| "~35": pd.Interval(20, 45, closed="right"), | |
| "~60": pd.Interval(45, 70, closed="right"), | |
| "70+": pd.Interval(70, 10000, closed="right"), | |
| } | |