future-xy
committed on
Commit
•
a317a5f
1
Parent(s):
b9f0099
add display info
Browse files
- src/display/utils.py +5 -1
src/display/utils.py
CHANGED
@@ -46,7 +46,7 @@ class Tasks(Enum):
|
|
46 |
|
47 |
# # XXX include me back at some point
|
48 |
selfcheck = Task("selfcheckgpt", "max-selfcheckgpt", "SelfCheckGPT")
|
49 |
-
mmlu = Task("mmlu", "acc", "MMLU/Acc")
|
50 |
|
51 |
|
52 |
# These classes are for user facing column names,
|
@@ -73,6 +73,10 @@ auto_eval_column_dict.append(["model", ColumnContent, ColumnContent("Model", "ma
|
|
73 |
# Inference framework
|
74 |
auto_eval_column_dict.append(["inference_framework", ColumnContent, ColumnContent("Inference framework", "str", True)])
|
75 |
|
|
|
|
|
|
|
|
|
76 |
for task in Tasks:
|
77 |
auto_eval_column_dict.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", True)])
|
78 |
|
|
|
46 |
|
47 |
# # XXX include me back at some point
|
48 |
selfcheck = Task("selfcheckgpt", "max-selfcheckgpt", "SelfCheckGPT")
|
49 |
+
mmlu = Task("mmlu", "acc", "MMLU/Acc (5-shot)")
|
50 |
|
51 |
|
52 |
# These classes are for user facing column names,
|
|
|
73 |
# Inference framework
|
74 |
auto_eval_column_dict.append(["inference_framework", ColumnContent, ColumnContent("Inference framework", "str", True)])
|
75 |
|
76 |
+
# System performance metrics
|
77 |
+
auto_eval_column_dict.append(["prefilling_time", ColumnContent, ColumnContent("Prefilling time (s)", "number", True)])
|
78 |
+
auto_eval_column_dict.append(["token_per_second", ColumnContent, ColumnContent("Tokens/s", "number", True)])
|
79 |
+
|
80 |
for task in Tasks:
|
81 |
auto_eval_column_dict.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", True)])
|
82 |
|