weichiang committed on
Commit
cfcc840
•
1 Parent(s): d949fbc
Files changed (1) hide show
  1. leaderboard_table_20231206.csv +6 -6
leaderboard_table_20231206.csv CHANGED
@@ -22,22 +22,22 @@ Calude-2.1,8.18,1118,-,Proprietary,https://www.anthropic.com/index/claude-2-1
22
  GPT-3.5-turbo-0613,8.39,1112,-,Proprietary,https://platform.openai.com/docs/models/gpt-3-5
23
  Claude-instant-1,7.85,1109,0.734,Proprietary,https://www.anthropic.com/index/introducing-claude
24
  GPT-3.5-turbo-0314,7.94,1105,0.700,Proprietary,https://platform.openai.com/docs/models/gpt-3-5
25
- Tulu-2-dpo-70b,7.89,1105,-,AI2 ImpACT Low-risk,https://huggingface.co/allenai/tulu-2-dpo-70b
26
- Yi-34b-chat,-,1102,0.735,Yi License,https://huggingface.co/01-ai/Yi-34B-Chat
27
  WizardLM-70b-v1.0,7.71,1097,0.637,Llama 2 Community,https://huggingface.co/WizardLM/WizardLM-70B-V1.0
28
  Vicuna-33B,7.12,1093,0.592,Non-commercial,https://huggingface.co/lmsys/vicuna-33b-v1.3
29
- starling-lm-7b-alpha,8.09,1083,0.639,CC-BY-NC-4.0,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha
30
  pplx-70b-online,-,1080,-,Proprietary,https://blog.perplexity.ai/blog/introducing-pplx-online-llms
31
  OpenChat-3.5,7.81,1077,0.643,Apache-2.0,https://huggingface.co/openchat/openchat_3.5
32
- openhermes-2.5-mistral-7b,-,1075,-,Apache-2.0,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B
33
  GPT-3.5-Turbo-1106,8.32,1074,-,Proprietary,https://platform.openai.com/docs/models/gpt-3-5
34
  Llama-2-70b-chat,6.86,1069,0.630,Llama 2 Community,https://huggingface.co/meta-llama/Llama-2-70b-chat-hf
35
  WizardLM-13b-v1.2,7.20,1053,0.527,Llama 2 Community,https://huggingface.co/WizardLM/WizardLM-13B-V1.2
36
- zephyr-7b-beta,7.34,1045,0.614,MIT,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta
37
  MPT-30B-chat,6.39,1039,0.504,CC-BY-NC-SA-4.0,https://huggingface.co/mosaicml/mpt-30b-chat
38
  Vicuna-13B,6.57,1039,0.558,Llama 2 Community,https://huggingface.co/lmsys/vicuna-13b-v1.5
39
  QWen-Chat-14B,6.96,1039,0.665,Qianwen LICENSE,https://huggingface.co/Qwen/Qwen-14B-Chat
40
- zephyr-7b-alpha,6.88,1034,-,MIT,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha
41
  CodeLlama-34B-instruct,-,1032,0.537,Llama 2 Community,https://huggingface.co/codellama/CodeLlama-34b-Instruct-hf
42
  falcon-180b-chat,-,1031,0.680,Falcon-180B TII License,https://huggingface.co/tiiuae/falcon-180B-chat
43
  Guanaco-33B,6.53,1029,0.576,Non-commercial,https://huggingface.co/timdettmers/guanaco-33b-merged
 
22
  GPT-3.5-turbo-0613,8.39,1112,-,Proprietary,https://platform.openai.com/docs/models/gpt-3-5
23
  Claude-instant-1,7.85,1109,0.734,Proprietary,https://www.anthropic.com/index/introducing-claude
24
  GPT-3.5-turbo-0314,7.94,1105,0.700,Proprietary,https://platform.openai.com/docs/models/gpt-3-5
25
+ Tulu-2-DPO-70B,7.89,1105,-,AI2 ImpACT Low-risk,https://huggingface.co/allenai/tulu-2-dpo-70b
26
+ Yi-34B-chat,-,1102,0.735,Yi License,https://huggingface.co/01-ai/Yi-34B-Chat
27
  WizardLM-70b-v1.0,7.71,1097,0.637,Llama 2 Community,https://huggingface.co/WizardLM/WizardLM-70B-V1.0
28
  Vicuna-33B,7.12,1093,0.592,Non-commercial,https://huggingface.co/lmsys/vicuna-33b-v1.3
29
+ Starling-lm-7b-alpha,8.09,1083,0.639,CC-BY-NC-4.0,https://huggingface.co/berkeley-nest/Starling-LM-7B-alpha
30
  pplx-70b-online,-,1080,-,Proprietary,https://blog.perplexity.ai/blog/introducing-pplx-online-llms
31
  OpenChat-3.5,7.81,1077,0.643,Apache-2.0,https://huggingface.co/openchat/openchat_3.5
32
+ OpenHermes-2.5-Mistral-7b,-,1075,-,Apache-2.0,https://huggingface.co/teknium/OpenHermes-2.5-Mistral-7B
33
  GPT-3.5-Turbo-1106,8.32,1074,-,Proprietary,https://platform.openai.com/docs/models/gpt-3-5
34
  Llama-2-70b-chat,6.86,1069,0.630,Llama 2 Community,https://huggingface.co/meta-llama/Llama-2-70b-chat-hf
35
  WizardLM-13b-v1.2,7.20,1053,0.527,Llama 2 Community,https://huggingface.co/WizardLM/WizardLM-13B-V1.2
36
+ Zephyr-7b-beta,7.34,1045,0.614,MIT,https://huggingface.co/HuggingFaceH4/zephyr-7b-beta
37
  MPT-30B-chat,6.39,1039,0.504,CC-BY-NC-SA-4.0,https://huggingface.co/mosaicml/mpt-30b-chat
38
  Vicuna-13B,6.57,1039,0.558,Llama 2 Community,https://huggingface.co/lmsys/vicuna-13b-v1.5
39
  QWen-Chat-14B,6.96,1039,0.665,Qianwen LICENSE,https://huggingface.co/Qwen/Qwen-14B-Chat
40
+ Zephyr-7b-alpha,6.88,1034,-,MIT,https://huggingface.co/HuggingFaceH4/zephyr-7b-alpha
41
  CodeLlama-34B-instruct,-,1032,0.537,Llama 2 Community,https://huggingface.co/codellama/CodeLlama-34b-Instruct-hf
42
  falcon-180b-chat,-,1031,0.680,Falcon-180B TII License,https://huggingface.co/tiiuae/falcon-180B-chat
43
  Guanaco-33B,6.53,1029,0.576,Non-commercial,https://huggingface.co/timdettmers/guanaco-33b-merged