Spaces:
Runtime error
Runtime error
kmfoda
committed on
Commit
•
e6199cd
0
Parent(s):
Initial Upload
Browse files
This view is limited to 50 files because it contains too many changes.
See raw diff
- .gitattributes +2 -0
- _results/hellaswag.json +3 -0
- _results/zero-shot/hellaswag_results.json +3 -0
- _results/zero-shot/hendrycksTest-abstract_algebra_results.json +3 -0
- _results/zero-shot/hendrycksTest-anatomy_results.json +3 -0
- _results/zero-shot/hendrycksTest-astronomy_results.json +3 -0
- _results/zero-shot/hendrycksTest-business_ethics_results.json +3 -0
- _results/zero-shot/hendrycksTest-clinical_knowledge_results.json +3 -0
- _results/zero-shot/hendrycksTest-college_biology_results.json +3 -0
- _results/zero-shot/hendrycksTest-college_chemistry_results.json +3 -0
- _results/zero-shot/hendrycksTest-college_computer_science_results.json +3 -0
- _results/zero-shot/hendrycksTest-college_mathematics_results.json +3 -0
- _results/zero-shot/hendrycksTest-college_medicine_results.json +3 -0
- _results/zero-shot/hendrycksTest-college_physics_results.json +3 -0
- _results/zero-shot/hendrycksTest-computer_security_results.json +3 -0
- _results/zero-shot/hendrycksTest-conceptual_physics_results.json +3 -0
- _results/zero-shot/hendrycksTest-econometrics_results.json +3 -0
- _results/zero-shot/hendrycksTest-electrical_engineering_results.json +3 -0
- _results/zero-shot/hendrycksTest-elementary_mathematics_results.json +3 -0
- _results/zero-shot/hendrycksTest-formal_logic_results.json +3 -0
- _results/zero-shot/hendrycksTest-global_facts_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_biology_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_chemistry_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_computer_science_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_european_history_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_geography_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_government_and_politics_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_macroeconomics_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_mathematics_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_microeconomics_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_physics_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_psychology_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_statistics_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_us_history_results.json +3 -0
- _results/zero-shot/hendrycksTest-high_school_world_history_results.json +3 -0
- _results/zero-shot/hendrycksTest-human_aging_results.json +3 -0
- _results/zero-shot/hendrycksTest-human_sexuality_results.json +3 -0
- _results/zero-shot/hendrycksTest-international_law_results.json +3 -0
- _results/zero-shot/hendrycksTest-jurisprudence_results.json +3 -0
- _results/zero-shot/hendrycksTest-logical_fallacies_results.json +3 -0
- _results/zero-shot/hendrycksTest-machine_learning_results.json +3 -0
- _results/zero-shot/hendrycksTest-management_results.json +3 -0
- _results/zero-shot/hendrycksTest-marketing_results.json +3 -0
- _results/zero-shot/hendrycksTest-medical_genetics_results.json +3 -0
- _results/zero-shot/hendrycksTest-miscellaneous_results.json +3 -0
- _results/zero-shot/hendrycksTest-moral_disputes_results.json +3 -0
- _results/zero-shot/hendrycksTest-moral_scenarios_results.json +3 -0
- _results/zero-shot/hendrycksTest-nutrition_results.json +3 -0
- _results/zero-shot/hendrycksTest-philosophy_results.json +3 -0
- _results/zero-shot/hendrycksTest-prehistory_results.json +3 -0
.gitattributes
ADDED
@@ -0,0 +1,2 @@
|
|
|
|
|
|
|
1 |
+
*.json filter=lfs diff=lfs merge=lfs -text
|
2 |
+
*.py filter=lfs diff=lfs merge=lfs -text
|
_results/hellaswag.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eb5bfbbbd793bb3700fdd232df51df2bed54e600cff359d66e1ad715c4059dba
|
3 |
+
size 8273334
|
_results/zero-shot/hellaswag_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c473faa1c445e96bfde24cc0f95bcb6b065673ca15a9e2047844e26c24ddc5ee
|
3 |
+
size 17889988
|
_results/zero-shot/hendrycksTest-abstract_algebra_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:98acded413c08949406ad0a3ae51557e358e76c1fd025af5b860e0fced332716
|
3 |
+
size 69709
|
_results/zero-shot/hendrycksTest-anatomy_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4b82c943f9760a478fed6e9b5281ad31df9e1bfb64f436c59478fd0b0976d06a
|
3 |
+
size 124285
|
_results/zero-shot/hendrycksTest-astronomy_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9871011e8711ff1271527b55394ccbabd30a5106fbb059ee9c83826e7d5b8cf2
|
3 |
+
size 168185
|
_results/zero-shot/hendrycksTest-business_ethics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c5373e79ebdad893d1c9333cfcaa0751cdac6cbdb423fec4b75e862fb8f05d80
|
3 |
+
size 114742
|
_results/zero-shot/hendrycksTest-clinical_knowledge_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:5590a21bff7d84df84020d526659cec4167ed88e7852cea7d89fb95f7e299158
|
3 |
+
size 240896
|
_results/zero-shot/hendrycksTest-college_biology_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f6e4e8d90471389e85e91511c9dd3fef144723c265cb6d5f219a9688872d69bb
|
3 |
+
size 158943
|
_results/zero-shot/hendrycksTest-college_chemistry_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:dcee98a3f0c48382c2010bb6b23addeee619be474f7fc5322a4dd817bb4349e9
|
3 |
+
size 84762
|
_results/zero-shot/hendrycksTest-college_computer_science_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:655bf4968460b42b0250257cc24343bf1e8afb39b690819dff280915f2cb1354
|
3 |
+
size 123186
|
_results/zero-shot/hendrycksTest-college_mathematics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:ddb10d0404001fa7edc730192689c0a0c43e074b3f3da7027ba55f1620012e4c
|
3 |
+
size 84530
|
_results/zero-shot/hendrycksTest-college_medicine_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:44cb2aa886452b62be4d0139965412e4348f8b89d397b400a816952a8bfb6ee4
|
3 |
+
size 241110
|
_results/zero-shot/hendrycksTest-college_physics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:99709d05fcc8daa1143eeabb71083c8ce30b941590a6f439d5311ad21d164960
|
3 |
+
size 100570
|
_results/zero-shot/hendrycksTest-computer_security_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:66a348ab3a7b486690305e518f2077c516f2291da364bbd209b8a7889fb53d64
|
3 |
+
size 96212
|
_results/zero-shot/hendrycksTest-conceptual_physics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7765b03f169ed88c57b9afc798c67ded790c89255685b89597d613eb8f326152
|
3 |
+
size 171073
|
_results/zero-shot/hendrycksTest-econometrics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e9944ba50bb59361f9a477d87d25d63a23cfa14abe3c0f02c9add4a7d3825f48
|
3 |
+
size 147528
|
_results/zero-shot/hendrycksTest-electrical_engineering_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:fe6650e62d6e26c953d5e3cc2bd4a8e5686abb6734414faf92c562224fb72789
|
3 |
+
size 105839
|
_results/zero-shot/hendrycksTest-elementary_mathematics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:380aa49b9e75129ff9b7e9e8a7c4f6a62fe49b4257ba4661db0b70c2289a019d
|
3 |
+
size 274513
|
_results/zero-shot/hendrycksTest-formal_logic_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:34584ee156a47809fb48406adb14b0d3f439c0a27f82eadaa9016235a3483f35
|
3 |
+
size 162876
|
_results/zero-shot/hendrycksTest-global_facts_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4ce9696511d5caf333348669dda7f61f6f758b9332308d49d893ba5248f834f9
|
3 |
+
size 72336
|
_results/zero-shot/hendrycksTest-high_school_biology_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:f8d3dda7ae20c1c3fdcf0e47105f75d74273116d34cca803be5a5ade43949b19
|
3 |
+
size 369482
|
_results/zero-shot/hendrycksTest-high_school_chemistry_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:52f243ed1bd3b7207efd3811ed4b08c3a3294cab654394e3df325cd901714fb1
|
3 |
+
size 204979
|
_results/zero-shot/hendrycksTest-high_school_computer_science_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:3b1137235b952d67a6dc259231c41ad6551f8e0389b22a293ee9db24c94d0cdd
|
3 |
+
size 137165
|
_results/zero-shot/hendrycksTest-high_school_european_history_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:86b050f876c76d78cbca1b2c9dd4775adead9432f703f3041d0792fb7d09e82a
|
3 |
+
size 629881
|
_results/zero-shot/hendrycksTest-high_school_geography_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1d9d8f47a9aabf2c9ee9212e660f56909f94a2a299fbdd12933cac666a8fbefa
|
3 |
+
size 163896
|
_results/zero-shot/hendrycksTest-high_school_government_and_politics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:61c7bda180499352381ccd48c85dce6f051124a2784209b17b042197312e2696
|
3 |
+
size 234288
|
_results/zero-shot/hendrycksTest-high_school_macroeconomics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9534222b3a74d63e4de67e0a76a009897c8de4cfc9a1e83210e9b9ef84f99178
|
3 |
+
size 433359
|
_results/zero-shot/hendrycksTest-high_school_mathematics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:a7fbfa0fc18c42ba43d761b8dbf87d53a438a9b4d4a0ea59f4c295924a6acc6d
|
3 |
+
size 203612
|
_results/zero-shot/hendrycksTest-high_school_microeconomics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:819d7cfa653982d386f603922bddfb73958d942c17156dbd5fe149aff39f5ccb
|
3 |
+
size 273665
|
_results/zero-shot/hendrycksTest-high_school_physics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:8b8f052f34e0032fad387e588180a5bef57f671ba749f947d347116e358a1f2d
|
3 |
+
size 192460
|
_results/zero-shot/hendrycksTest-high_school_psychology_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:00a62dbf77aefd2412ba0397895bca9a6aca3cf8c7e3675d670e25c27ce6ead5
|
3 |
+
size 556908
|
_results/zero-shot/hendrycksTest-high_school_statistics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e5c8024f2690315351ae4a5ad4ee1c96fca15f7457253b8983b97b0fe25c6b03
|
3 |
+
size 336971
|
_results/zero-shot/hendrycksTest-high_school_us_history_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e636e9b44272e8b4f0b4e7aa6f459ae9d5c484d228006eb521cc739dce6d07c5
|
3 |
+
size 701743
|
_results/zero-shot/hendrycksTest-high_school_world_history_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e683851839408a56477d17b1c33196284039a154f117fc3aae74af824985231e
|
3 |
+
size 890481
|
_results/zero-shot/hendrycksTest-human_aging_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:e06c4ab3a3cb2abf96b5e85a8e50588e6751778fb016b442449388f026ff6340
|
3 |
+
size 183283
|
_results/zero-shot/hendrycksTest-human_sexuality_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:02288d8bd3f50e71eb6cf1e0f9fe0b2b3c70d0667a85bffd7dd1fb7f300f72df
|
3 |
+
size 118875
|
_results/zero-shot/hendrycksTest-international_law_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:1cef928a14964215c1020d2f7c535d6034ae42a2280286a39a707e8eaa11a0b7
|
3 |
+
size 187345
|
_results/zero-shot/hendrycksTest-jurisprudence_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7543a007643582d91243cc984cd5caf2abaac31823592011df31901adf518eab
|
3 |
+
size 119374
|
_results/zero-shot/hendrycksTest-logical_fallacies_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:d6fe83292819eebfda3e72297bddc5a6e2f2388ac0a85141989aa780dbc91862
|
3 |
+
size 178321
|
_results/zero-shot/hendrycksTest-machine_learning_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c290f7e099185477b3ffe7d24e89a431b5b8eac1577ba94aeb98b01a4b15edfc
|
3 |
+
size 112250
|
_results/zero-shot/hendrycksTest-management_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:0a4fe6ac71f0e80cee0fe778263b28ae2a6704891ed1c6cb1d267ac0d7072597
|
3 |
+
size 85855
|
_results/zero-shot/hendrycksTest-marketing_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:9cf8bd38144b0d86359c8d6370d3b0097d961e41ad0b9abd597f63c47b986a1e
|
3 |
+
size 224231
|
_results/zero-shot/hendrycksTest-medical_genetics_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:4e7563e2c79dd68d017bf012d47912db27c1c0c052d4859beaafc461bb9f6bbb
|
3 |
+
size 82048
|
_results/zero-shot/hendrycksTest-miscellaneous_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7dd91682d51c87b8442517dde66ffabe60d9a902b424dc5fa5418bf558030209
|
3 |
+
size 580654
|
_results/zero-shot/hendrycksTest-moral_disputes_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:c593327785f85859f438f9ba95b22cad8a749696de0814a48e33b91a72554e40
|
3 |
+
size 382625
|
_results/zero-shot/hendrycksTest-moral_scenarios_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:7230d4d58548b0b4ea02840154667c598b5a36b087cf8b0245925c2a2ff714b4
|
3 |
+
size 1097787
|
_results/zero-shot/hendrycksTest-nutrition_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:6c9ddeaafecb01d2b3a6a98ee73265b759dfcb4ee7050a379315d2b51b5aa88f
|
3 |
+
size 335204
|
_results/zero-shot/hendrycksTest-philosophy_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:96c0937b73d8a810b6c3055296337f0ca5e37b2013d4674d15ca48ce33f53b93
|
3 |
+
size 302736
|
_results/zero-shot/hendrycksTest-prehistory_results.json
ADDED
@@ -0,0 +1,3 @@
|
|
|
|
|
|
|
|
|
1 |
+
version https://git-lfs.github.com/spec/v1
|
2 |
+
oid sha256:eea9a4922a1d8a5367a25edbd7edfd626e919e0c2b1ff4b193a07761cd8e69da
|
3 |
+
size 327560
|