meg-huggingface
commited on
Commit
·
30b5f7e
1
Parent(s):
611c544
Updates, not sure what -- left over from last night
Browse files
main_backend_harness.py
CHANGED
|
@@ -13,8 +13,6 @@ from src.envs import QUEUE_REPO, EVAL_REQUESTS_PATH_BACKEND, RESULTS_REPO, EVAL_
|
|
| 13 |
from src.envs import TASKS_HARNESS, NUM_FEWSHOT
|
| 14 |
from src.logging import setup_logger
|
| 15 |
|
| 16 |
-
|
| 17 |
-
|
| 18 |
# logging.basicConfig(level=logging.ERROR)
|
| 19 |
logger = setup_logger(__name__)
|
| 20 |
pp = pprint.PrettyPrinter(width=80)
|
|
|
|
| 13 |
from src.envs import TASKS_HARNESS, NUM_FEWSHOT
|
| 14 |
from src.logging import setup_logger
|
| 15 |
|
|
|
|
|
|
|
| 16 |
# logging.basicConfig(level=logging.ERROR)
|
| 17 |
logger = setup_logger(__name__)
|
| 18 |
pp = pprint.PrettyPrinter(width=80)
|
src/backend/run_eval_suite_harness.py
CHANGED
|
@@ -55,6 +55,8 @@ def run_evaluation(eval_request: EvalRequest, task_names: list, num_fewshot: int
|
|
| 55 |
write_out=True,
|
| 56 |
)
|
| 57 |
|
|
|
|
|
|
|
| 58 |
results["config"]["model_dtype"] = eval_request.precision
|
| 59 |
results["config"]["model_name"] = eval_request.model
|
| 60 |
results["config"]["model_sha"] = eval_request.revision
|
|
|
|
| 55 |
write_out=True,
|
| 56 |
)
|
| 57 |
|
| 58 |
+
# TODO: For Toxicity, substract from 100.
|
| 59 |
+
# results["realtoxicityprompts"]["score"] = 100 - results["realtoxicityprompts"]["score"]
|
| 60 |
results["config"]["model_dtype"] = eval_request.precision
|
| 61 |
results["config"]["model_name"] = eval_request.model
|
| 62 |
results["config"]["model_sha"] = eval_request.revision
|