Spaces:
Running
Running
lixuejing
committed on
Commit
·
70172bf
1
Parent(s):
ff262aa
update
Browse files
src/leaderboard/read_evals.py
CHANGED
|
@@ -92,12 +92,13 @@ class EvalResult:
|
|
| 92 |
for k, v in data["results"].items():
|
| 93 |
print("k,v,benchmark,metic",k,v, task.benchmark,task.metric)
|
| 94 |
if task.benchmark == k:
|
| 95 |
-
print(v.get(task.metric, None))
|
| 96 |
print("accs", accs)
|
| 97 |
if accs.size == 0 or any([acc is None for acc in accs]):
|
| 98 |
continue
|
| 99 |
|
| 100 |
mean_acc = np.mean(accs) if len(accs) > 0 else 0
|
|
|
|
| 101 |
results[task.metric] = mean_acc
|
| 102 |
|
| 103 |
return self(
|
|
@@ -183,14 +184,14 @@ class EvalResult:
|
|
| 183 |
data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.benchmark, 0)
|
| 184 |
|
| 185 |
for task in Quotas:
|
| 186 |
-
#data_dict[task.value.col_name] = self.results.get(task.value.
|
| 187 |
if task.value.col_name != "CLCC-H":
|
| 188 |
-
data_dict[task.value.col_name] = self.results.get(task.value.
|
| 189 |
else:
|
| 190 |
if self.results.get(task.value.metric, 0) == 0:
|
| 191 |
data_dict[task.value.col_name] = "-"
|
| 192 |
else:
|
| 193 |
-
data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.
|
| 194 |
|
| 195 |
return data_dict
|
| 196 |
|
|
|
|
| 92 |
for k, v in data["results"].items():
|
| 93 |
print("k,v,benchmark,metic",k,v, task.benchmark,task.metric)
|
| 94 |
if task.benchmark == k:
|
| 95 |
+
print("task.benchmark == k get metic",v.get(task.metric, None))
|
| 96 |
print("accs", accs)
|
| 97 |
if accs.size == 0 or any([acc is None for acc in accs]):
|
| 98 |
continue
|
| 99 |
|
| 100 |
mean_acc = np.mean(accs) if len(accs) > 0 else 0
|
| 101 |
+
print("mean_acc", task.metric, mean_acc)
|
| 102 |
results[task.metric] = mean_acc
|
| 103 |
|
| 104 |
return self(
|
|
|
|
| 184 |
data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.benchmark, 0)
|
| 185 |
|
| 186 |
for task in Quotas:
|
| 187 |
+
#data_dict[task.value.col_name] = self.results.get(task.value.metric, 0)
|
| 188 |
if task.value.col_name != "CLCC-H":
|
| 189 |
+
data_dict[task.value.col_name] = self.results.get(task.value.metric, 0)
|
| 190 |
else:
|
| 191 |
if self.results.get(task.value.metric, 0) == 0:
|
| 192 |
data_dict[task.value.col_name] = "-"
|
| 193 |
else:
|
| 194 |
+
data_dict[task.value.col_name] = "%.2f" % self.results.get(task.value.metric, 0)
|
| 195 |
|
| 196 |
return data_dict
|
| 197 |
|