Spaces:
Runtime error
Runtime error
Commit
·
84b824e
1
Parent(s):
7253275
new charts
Browse files
- evals/.zeno_cache_country-area/reports.pickle +1 -1
- evals/.zeno_cache_crossword/reports.pickle +1 -1
- evals/.zeno_cache_med-mcqa/PREDISTILLsubject.pickle +3 -0
- evals/.zeno_cache_med-mcqa/folders.pickle +2 -2
- evals/.zeno_cache_med-mcqa/reports.pickle +2 -2
- evals/.zeno_cache_med-mcqa/slices.pickle +3 -0
- evals/evals.yaml +1 -0
- evals/medmcqa/med_fns.py +14 -0
- zeno-evals-hub/main.py +0 -1
evals/.zeno_cache_country-area/reports.pickle
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 3880
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:ebe923fd1e82b53bd95580dff84cfae8e0c37824c57186e218e921a01c397b1c
|
| 3 |
size 3880
|
evals/.zeno_cache_crossword/reports.pickle
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 6586
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:4335d3a1a4a7ce47c4c9ee39811c090bdeb3a2d565085b411b1e9a471052d705
|
| 3 |
size 6586
|
evals/.zeno_cache_med-mcqa/PREDISTILLsubject.pickle
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:47ada9af3bfaaa3ea9c77bed6774b474d5cf505676302d443c20ace3db98f7a5
|
| 3 |
+
size 11589
|
evals/.zeno_cache_med-mcqa/folders.pickle
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:c21f58777ece01ce867731803c284f07d64ef69d67712eeca9bf9bda7ac4f38b
|
| 3 |
+
size 29
|
evals/.zeno_cache_med-mcqa/reports.pickle
CHANGED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
-
size
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:0150a18fcad53c825bfed305a0a05c6ddc9cc8bd5f8cd70e630ed4d273d51aa4
|
| 3 |
+
size 3033
|
evals/.zeno_cache_med-mcqa/slices.pickle
ADDED
|
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f4b521b1fc398b7bf3b6be870e597b077110fc2fb2ef61b52b4a204e3b5a45f0
|
| 3 |
+
size 2295
|
evals/evals.yaml
CHANGED
|
@@ -13,6 +13,7 @@
|
|
| 13 |
- med-mcqa:
|
| 14 |
results-file: ./medmcqa/med-3.5-turbo.jsonl
|
| 15 |
second-results-file: ./medmcqa/med-4.jsonl
|
|
|
|
| 16 |
link: https://github.com/openai/evals/commit/19b2cf9ff96b08af68f5c3b4d2c90184844a4fe6
|
| 17 |
description: Multiple choice questions from different medical areas.
|
| 18 |
- aba-mrpc:
|
|
|
|
| 13 |
- med-mcqa:
|
| 14 |
results-file: ./medmcqa/med-3.5-turbo.jsonl
|
| 15 |
second-results-file: ./medmcqa/med-4.jsonl
|
| 16 |
+
functions-file: ./medmcqa/med_fns.py
|
| 17 |
link: https://github.com/openai/evals/commit/19b2cf9ff96b08af68f5c3b4d2c90184844a4fe6
|
| 18 |
description: Multiple choice questions from different medical areas.
|
| 19 |
- aba-mrpc:
|
evals/medmcqa/med_fns.py
ADDED
|
@@ -0,0 +1,14 @@
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 1 |
+
import re
|
| 2 |
+
|
| 3 |
+
from zeno import DistillReturn, distill
|
| 4 |
+
|
| 5 |
+
# Regex applied by `subject` via re.search (no flags): group 1 captures
# everything after the literal "Subject:" up to the end of that line,
# including any leading whitespace.
finder = "Subject:(.*)"
|
| 6 |
+
|
| 7 |
+
|
| 8 |
+
@distill
def subject(df, ops):
    """Extract the text following "Subject:" for every entry of the data column.

    For each entry in ``df[ops.data_column]``, the string at
    ``entry[1]["content"]`` is searched with the module-level ``finder``
    pattern and the first capture group is collected.

    Args:
        df: Container indexed by ``ops.data_column`` (presumably a pandas
            DataFrame -- confirm against the caller).
        ops: Options object; only its ``data_column`` attribute is read.

    Returns:
        A ``DistillReturn`` whose ``distill_output`` is a list with one string
        per entry, in input order. Entries whose text does not match
        ``finder`` yield an empty string.
    """
    # NOTE(review): each entry looks like a list of chat messages with the
    # subject line in the second message -- verify against the results file.
    contents = (entry[1]["content"] for entry in df[ops.data_column])
    matches = (re.search(finder, content) for content in contents)

    # re.search returns None when the pattern is absent; fall back to "" so a
    # single row without a "Subject:" marker does not abort the whole distill
    # with an AttributeError.
    ret_subjs = [
        match.group(1) if match is not None else "" for match in matches
    ]

    return DistillReturn(distill_output=ret_subjs)
|
zeno-evals-hub/main.py
CHANGED
|
@@ -88,7 +88,6 @@ def command_line():
|
|
| 88 |
config.editable = False
|
| 89 |
|
| 90 |
zeno_obj = zeno(config)
|
| 91 |
-
print(config.metadata["expected"])
|
| 92 |
if zeno_obj is None:
|
| 93 |
sys.exit(1)
|
| 94 |
server = get_server(zeno_obj)
|
|
|
|
| 88 |
config.editable = False
|
| 89 |
|
| 90 |
zeno_obj = zeno(config)
|
|
|
|
| 91 |
if zeno_obj is None:
|
| 92 |
sys.exit(1)
|
| 93 |
server = get_server(zeno_obj)
|