zhuohan-7 committed on
Commit
98c8a71
·
verified ·
1 Parent(s): 01ee931

Upload folder using huggingface_hub

Browse files
results/cultural_reasoning/zero_shot/sg_eval_v2_mcq.csv CHANGED
@@ -17,6 +17,7 @@ cross_openhermes_llama3_8b_2048_inst,0.7781818181818182
17
  gemma-2-2b-it,0.7163636363636363
18
  cross_openhermes_llama3_8b_12288_inst,0.7890909090909091
19
  Qwen2_5_0_5B_Instruct,0.5727272727272728
 
20
  cross_openhermes_llama3_8b_8192_inst,0.78
21
  cross_openhermes_llama3_70b_4096_inst,0.8381818181818181
22
  cross_openhermes_llama3_8b_4096_2_inst,0.7654545454545455
 
17
  gemma-2-2b-it,0.7163636363636363
18
  cross_openhermes_llama3_8b_12288_inst,0.7890909090909091
19
  Qwen2_5_0_5B_Instruct,0.5727272727272728
20
+ GPT4o_0513,0.8709090909090909
21
  cross_openhermes_llama3_8b_8192_inst,0.78
22
  cross_openhermes_llama3_70b_4096_inst,0.8381818181818181
23
  cross_openhermes_llama3_8b_4096_2_inst,0.7654545454545455
results/cultural_reasoning/zero_shot/sg_eval_v2_open.csv CHANGED
@@ -17,6 +17,7 @@ cross_openhermes_llama3_8b_2048_inst,52.24
17
  gemma-2-2b-it,52.08
18
  cross_openhermes_llama3_8b_12288_inst,52.480000000000004
19
  Qwen2_5_0_5B_Instruct,35.28
 
20
  cross_openhermes_llama3_8b_8192_inst,53.0
21
  cross_openhermes_llama3_70b_4096_inst,53.2
22
  cross_openhermes_llama3_8b_4096_2_inst,52.28
 
17
  gemma-2-2b-it,52.08
18
  cross_openhermes_llama3_8b_12288_inst,52.480000000000004
19
  Qwen2_5_0_5B_Instruct,35.28
20
+ GPT4o_0513,57.28
21
  cross_openhermes_llama3_8b_8192_inst,53.0
22
  cross_openhermes_llama3_70b_4096_inst,53.2
23
  cross_openhermes_llama3_8b_4096_2_inst,52.28
results/general_reasoning/zero_shot/zbench.csv CHANGED
@@ -23,6 +23,7 @@ gemma-2-2b-it,0.24242424242424243
23
  llama3-8b-cpt-sea-lionv2-instruct,0.30303030303030304
24
  cross_openhermes_llama3_8b_12288_inst,0.42424242424242425
25
  Qwen2_5_0_5B_Instruct,0.36363636363636365
 
26
  cross_openhermes_llama3_8b_8192_inst,0.45454545454545453
27
  cross_openhermes_llama3_70b_4096_inst,0.42424242424242425
28
  cross_openhermes_llama3_8b_4096_2_inst,0.45454545454545453
 
23
  llama3-8b-cpt-sea-lionv2-instruct,0.30303030303030304
24
  cross_openhermes_llama3_8b_12288_inst,0.42424242424242425
25
  Qwen2_5_0_5B_Instruct,0.36363636363636365
26
+ GPT4o_0513,0.696969696969697
27
  cross_openhermes_llama3_8b_8192_inst,0.45454545454545453
28
  cross_openhermes_llama3_70b_4096_inst,0.42424242424242425
29
  cross_openhermes_llama3_8b_4096_2_inst,0.45454545454545453