Spaces:
Sleeping
Sleeping
Upload folder using huggingface_hub
Browse files
results/cultural_reasoning/zero_shot/sg_eval_v2_mcq.csv
CHANGED
|
@@ -17,6 +17,7 @@ cross_openhermes_llama3_8b_2048_inst,0.7781818181818182
|
|
| 17 |
gemma-2-2b-it,0.7163636363636363
|
| 18 |
cross_openhermes_llama3_8b_12288_inst,0.7890909090909091
|
| 19 |
Qwen2_5_0_5B_Instruct,0.5727272727272728
|
|
|
|
| 20 |
cross_openhermes_llama3_8b_8192_inst,0.78
|
| 21 |
cross_openhermes_llama3_70b_4096_inst,0.8381818181818181
|
| 22 |
cross_openhermes_llama3_8b_4096_2_inst,0.7654545454545455
|
|
|
|
| 17 |
gemma-2-2b-it,0.7163636363636363
|
| 18 |
cross_openhermes_llama3_8b_12288_inst,0.7890909090909091
|
| 19 |
Qwen2_5_0_5B_Instruct,0.5727272727272728
|
| 20 |
+
GPT4o_0513,0.8709090909090909
|
| 21 |
cross_openhermes_llama3_8b_8192_inst,0.78
|
| 22 |
cross_openhermes_llama3_70b_4096_inst,0.8381818181818181
|
| 23 |
cross_openhermes_llama3_8b_4096_2_inst,0.7654545454545455
|
results/cultural_reasoning/zero_shot/sg_eval_v2_open.csv
CHANGED
|
@@ -17,6 +17,7 @@ cross_openhermes_llama3_8b_2048_inst,52.24
|
|
| 17 |
gemma-2-2b-it,52.08
|
| 18 |
cross_openhermes_llama3_8b_12288_inst,52.480000000000004
|
| 19 |
Qwen2_5_0_5B_Instruct,35.28
|
|
|
|
| 20 |
cross_openhermes_llama3_8b_8192_inst,53.0
|
| 21 |
cross_openhermes_llama3_70b_4096_inst,53.2
|
| 22 |
cross_openhermes_llama3_8b_4096_2_inst,52.28
|
|
|
|
| 17 |
gemma-2-2b-it,52.08
|
| 18 |
cross_openhermes_llama3_8b_12288_inst,52.480000000000004
|
| 19 |
Qwen2_5_0_5B_Instruct,35.28
|
| 20 |
+
GPT4o_0513,57.28
|
| 21 |
cross_openhermes_llama3_8b_8192_inst,53.0
|
| 22 |
cross_openhermes_llama3_70b_4096_inst,53.2
|
| 23 |
cross_openhermes_llama3_8b_4096_2_inst,52.28
|
results/general_reasoning/zero_shot/zbench.csv
CHANGED
|
@@ -23,6 +23,7 @@ gemma-2-2b-it,0.24242424242424243
|
|
| 23 |
llama3-8b-cpt-sea-lionv2-instruct,0.30303030303030304
|
| 24 |
cross_openhermes_llama3_8b_12288_inst,0.42424242424242425
|
| 25 |
Qwen2_5_0_5B_Instruct,0.36363636363636365
|
|
|
|
| 26 |
cross_openhermes_llama3_8b_8192_inst,0.45454545454545453
|
| 27 |
cross_openhermes_llama3_70b_4096_inst,0.42424242424242425
|
| 28 |
cross_openhermes_llama3_8b_4096_2_inst,0.45454545454545453
|
|
|
|
| 23 |
llama3-8b-cpt-sea-lionv2-instruct,0.30303030303030304
|
| 24 |
cross_openhermes_llama3_8b_12288_inst,0.42424242424242425
|
| 25 |
Qwen2_5_0_5B_Instruct,0.36363636363636365
|
| 26 |
+
GPT4o_0513,0.696969696969697
|
| 27 |
cross_openhermes_llama3_8b_8192_inst,0.45454545454545453
|
| 28 |
cross_openhermes_llama3_70b_4096_inst,0.42424242424242425
|
| 29 |
cross_openhermes_llama3_8b_4096_2_inst,0.45454545454545453
|