Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
pminervini
committed on
Commit
•
5a94e04
1
Parent(s):
b3ee622
update
Browse files
- cli/analysis-cli.py +4 -1
- cli/submit-cli.py +1 -1
cli/analysis-cli.py
CHANGED
@@ -54,11 +54,14 @@ for path in result_path_lst:
|
|
54 |
|
55 |
if ',' in metric_name and '_stderr' not in metric_name \
|
56 |
and 'f1' not in metric_name \
|
57 |
-
and 'selfcheckgpt' not in dataset_name \
|
58 |
and model_name_to_model_map[model_name]["likes"] > 256:
|
59 |
|
60 |
to_add = True
|
61 |
|
|
|
|
|
|
|
|
|
62 |
if 'nq_open' in dataset_name or 'triviaqa' in dataset_name:
|
63 |
to_add = False
|
64 |
# pass
|
|
|
54 |
|
55 |
if ',' in metric_name and '_stderr' not in metric_name \
|
56 |
and 'f1' not in metric_name \
|
|
|
57 |
and model_name_to_model_map[model_name]["likes"] > 256:
|
58 |
|
59 |
to_add = True
|
60 |
|
61 |
+
if 'selfcheck' in dataset_name:
|
62 |
+
if 'max' not in metric_name:
|
63 |
+
to_add = False
|
64 |
+
|
65 |
if 'nq_open' in dataset_name or 'triviaqa' in dataset_name:
|
66 |
to_add = False
|
67 |
# pass
|
cli/submit-cli.py
CHANGED
@@ -141,7 +141,7 @@ def main():
|
|
141 |
|
142 |
requested_model_names = {e.model for e in eval_requests}
|
143 |
|
144 |
-
breakpoint()
|
145 |
|
146 |
for i in range(min(200, len(filtered_model_lst))):
|
147 |
model = filtered_model_lst[i]
|
|
|
141 |
|
142 |
requested_model_names = {e.model for e in eval_requests}
|
143 |
|
144 |
+
# breakpoint()
|
145 |
|
146 |
for i in range(min(200, len(filtered_model_lst))):
|
147 |
model = filtered_model_lst[i]
|