azureml-assets/assets/evaluation_results
..
amazonpolarityclassification_cohere-embed-v3-english_classification
amazonpolarityclassification_cohere-embed-v3-multilingual_classification
amazonpolarityclassification_text-embedding-3-large_classification
amazonpolarityclassification_text-embedding-3-small_classification
amazonpolarityclassification_text-embedding-ada-002_classification
arguana_cohere-embed-v3-english_retrieval
arguana_cohere-embed-v3-multilingual_retrieval
arguana_text-embedding-3-large_retrieval
arguana_text-embedding-3-small_retrieval
arguana_text-embedding-ada-002_retrieval
arxivclusteringp2p.v2_cohere-embed-v3-english_clustering
arxivclusteringp2p.v2_cohere-embed-v3-multilingual_clustering
arxivclusteringp2p.v2_text-embedding-3-large_clustering
arxivclusteringp2p.v2_text-embedding-3-small_clustering
arxivclusteringp2p.v2_text-embedding-ada-002_clustering
arxivclusterings2s_cohere-embed-v3-english_clustering
arxivclusterings2s_cohere-embed-v3-multilingual_clustering
arxivclusterings2s_text-embedding-3-large_clustering
arxivclusterings2s_text-embedding-3-small_clustering
arxivclusterings2s_text-embedding-ada-002_clustering
banking77classification_cohere-embed-v3-english_classification
banking77classification_cohere-embed-v3-multilingual_classification
banking77classification_text-embedding-3-large_classification
banking77classification_text-embedding-3-small_classification
banking77classification_text-embedding-ada-002_classification
boolq__gpt-4-0125-preview__question_answering
boolq__meta-llama-3_1-8b-instruct__question_answering
boolq__meta-llama-3_1-70b-instruct__question_answering
boolq_cohere_command_r_plus_question_answering
boolq_cohere_command_r_question_answering
boolq_databricks-dbrx-base_question_answering
boolq_databricks-dbrx-instruct_question_answering
boolq_gpt-4-turbo-2024-04-09_chat_completion
boolq_gpt-4o_question_answering
boolq_gpt_4_32k_0314_question_answering
boolq_gpt_4_32k_0613_question_answering
boolq_gpt_4_0314_question_answering
boolq_gpt_4_0613_question_answering
boolq_gpt_35_turbo_0301_question_answering
boolq_gpt_35_turbo_0613_question_answering
boolq_llama_2_7b_chat_question_answering
boolq_llama_2_7b_question_answering
boolq_llama_2_13b_chat_question_answering
boolq_llama_2_13b_question_answering
boolq_llama_2_70b_chat_question_answering
boolq_llama_2_70b_question_answering
boolq_meta-llama-3-8b-instruct_question_answering
boolq_meta-llama-3-8b_question_answering
boolq_meta-llama-3-70b-instruct_question_answering
boolq_meta-llama-3-70b_question_answering
boolq_meta-llama-3_1-405b-instruct_question_answering
boolq_microsoft_phi_2_question_answering
boolq_mistral-community-mixtral-8x22b-v0-1_question_answering
boolq_mistral_7b_instruct_v01_question_answering
boolq_mistral_7b_v01_question_answering
boolq_mistral_large_question_answering
boolq_mistralai-mistral-7b-instruct-v0-2_question_answering
boolq_mistralai-mixtral-8x7b-instruct-v01_question_answering
boolq_mistralai-mixtral-8x7b-v01_question_answering
boolq_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
boolq_mistralai-mixtral-8x22b-v0-1_question_answering
boolq_phi-3-medium-4k-instruct_question_answering
boolq_phi-3-medium-128k-instruct_question_answering
boolq_phi-3-mini-4k-instruct_chat_completion
boolq_phi-3-mini-128k-instruct_chat_completion
boolq_phi-3-small-8k-instruct_question_answering
boolq_phi-3-small-128k-instruct_question_answering
bucc_cohere-embed-v3-english_bitext_mining
bucc_cohere-embed-v3-multilingual_bitext_mining
bucc_text-embedding-3-large_bitext_mining
bucc_text-embedding-3-small_bitext_mining
bucc_text-embedding-ada-002_bitext_mining
emotionclassification_cohere-embed-v3-english_classification
emotionclassification_cohere-embed-v3-multilingual_classification
emotionclassification_text-embedding-3-large_classification
emotionclassification_text-embedding-3-small_classification
emotionclassification_text-embedding-ada-002_classification
gsm8k__gpt-4-0125-preview__question_answering
gsm8k__meta-llama-3_1-8b-instruct__question_answering
gsm8k__meta-llama-3_1-70b-instruct__question_answering
gsm8k_cohere_command_r_plus_question_answering
gsm8k_cohere_command_r_question_answering
gsm8k_databricks-dbrx-base_question_answering
gsm8k_databricks-dbrx-instruct_question_answering
gsm8k_gpt-4-turbo-2024-04-09_chat_completion
gsm8k_gpt-4o_question_answering
gsm8k_gpt_4_32k_0314_question_answering
gsm8k_gpt_4_32k_0613_question_answering
gsm8k_gpt_4_0314_question_answering
gsm8k_gpt_4_0613_question_answering
gsm8k_gpt_35_turbo_0301_question_answering
gsm8k_gpt_35_turbo_0613_question_answering
gsm8k_llama_2_7b_chat_question_answering
gsm8k_llama_2_7b_question_answering
gsm8k_llama_2_13b_chat_question_answering
gsm8k_llama_2_13b_question_answering
gsm8k_llama_2_70b_chat_question_answering
gsm8k_llama_2_70b_question_answering
gsm8k_meta-llama-3-8b-instruct_question_answering
gsm8k_meta-llama-3-8b_question_answering
gsm8k_meta-llama-3-70b-instruct_question_answering
gsm8k_meta-llama-3-70b_question_answering
gsm8k_meta-llama-3_1-405b-instruct_question_answering
gsm8k_microsoft_phi_2_question_answering
gsm8k_mistral-community-mixtral-8x22b-v0-1_question_answering
gsm8k_mistral_7b_instruct_v01_question_answering
gsm8k_mistral_7b_v01_question_answering
gsm8k_mistral_large_question_answering
gsm8k_mistralai-mistral-7b-instruct-v0-2_question_answering
gsm8k_mistralai-mixtral-8x7b-instruct-v01_question_answering
gsm8k_mistralai-mixtral-8x7b-v01_question_answering
gsm8k_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
gsm8k_mistralai-mixtral-8x22b-v0-1_question_answering
gsm8k_phi-3-medium-4k-instruct_question_answering
gsm8k_phi-3-medium-128k-instruct_question_answering
gsm8k_phi-3-mini-4k-instruct_chat_completion
gsm8k_phi-3-mini-128k-instruct_chat_completion
gsm8k_phi-3-small-8k-instruct_question_answering
gsm8k_phi-3-small-128k-instruct_question_answering
hellaswag__gpt-4-0125-preview__question_answering
hellaswag__meta-llama-3_1-8b-instruct__question_answering
hellaswag__meta-llama-3_1-70b-instruct__question_answering
hellaswag_cohere_command_r_plus_question_answering
hellaswag_cohere_command_r_question_answering
hellaswag_databricks-dbrx-base_question_answering
hellaswag_databricks-dbrx-instruct_question_answering
hellaswag_gpt-4-turbo-2024-04-09_chat_completion
hellaswag_gpt-4o_question_answering
hellaswag_gpt_4_32k_0314_question_answering
hellaswag_gpt_4_32k_0613_question_answering
hellaswag_gpt_4_0314_question_answering
hellaswag_gpt_4_0613_question_answering
hellaswag_gpt_35_turbo_0301_question_answering
hellaswag_gpt_35_turbo_0613_question_answering
hellaswag_llama_2_7b_chat_question_answering
hellaswag_llama_2_7b_question_answering
hellaswag_llama_2_13b_chat_question_answering
hellaswag_llama_2_13b_question_answering
hellaswag_llama_2_70b_chat_question_answering
hellaswag_llama_2_70b_question_answering
hellaswag_meta-llama-3-8b-instruct_question_answering
hellaswag_meta-llama-3-8b_question_answering
hellaswag_meta-llama-3-70b-instruct_question_answering
hellaswag_meta-llama-3-70b_question_answering
hellaswag_meta-llama-3_1-405b-instruct_question_answering
hellaswag_microsoft_phi_2_question_answering
hellaswag_mistral-community-mixtral-8x22b-v0-1_question_answering
hellaswag_mistral_7b_instruct_v01_question_answering
hellaswag_mistral_7b_v01_question_answering
hellaswag_mistral_large_question_answering
hellaswag_mistralai-mistral-7b-instruct-v0-2_question_answering
hellaswag_mistralai-mixtral-8x7b-instruct-v01_question_answering
hellaswag_mistralai-mixtral-8x7b-v01_question_answering
hellaswag_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
hellaswag_mistralai-mixtral-8x22b-v0-1_question_answering
hellaswag_phi-3-medium-4k-instruct_question_answering
hellaswag_phi-3-medium-128k-instruct_question_answering
hellaswag_phi-3-mini-4k-instruct_chat_completion
hellaswag_phi-3-mini-128k-instruct_chat_completion
hellaswag_phi-3-small-8k-instruct_question_answering
hellaswag_phi-3-small-128k-instruct_question_answering
human_eval__gpt-4-0125-preview__text_generation
human_eval__meta-llama-3_1-8b-instruct__text_generation
human_eval__meta-llama-3_1-70b-instruct__text_generation
human_eval_codellama_7b_hf_text_generation
human_eval_codellama_7b_instruct_hf_text_generation
human_eval_codellama_7b_python_hf_text_generation
human_eval_codellama_13b_hf_text_generation
human_eval_codellama_13b_instruct_hf_text_generation
human_eval_codellama_13b_python_hf_text_generation
human_eval_codellama_34b_hf_text_generation
human_eval_codellama_34b_instruct_hf_text_generation
human_eval_codellama_34b_python_hf_text_generation
human_eval_cohere_command_r_plus_text_generation
human_eval_cohere_command_r_text_generation
human_eval_databricks-dbrx-base_text_generation
human_eval_databricks-dbrx-instruct_text_generation
human_eval_gpt-4-turbo-2024-04-09_chat_completion
human_eval_gpt-4o_text_generation
human_eval_gpt_4_32k_0314_text_generation
human_eval_gpt_4_32k_0613_text_generation
human_eval_gpt_4_0314_text_generation
human_eval_gpt_4_0613_text_generation
human_eval_gpt_35_turbo_0301_text_generation
human_eval_gpt_35_turbo_0613_text_generation
human_eval_llama_2_7b_text_generation
human_eval_llama_2_13b_text_generation
human_eval_llama_2_70b_text_generation
human_eval_meta-llama-3-8b-instruct_text_generation
human_eval_meta-llama-3-8b_text_generation
human_eval_meta-llama-3-70b-instruct_text_generation
human_eval_meta-llama-3-70b_text_generation
human_eval_meta-llama-3_1-405b-instruct_text_generation
human_eval_microsoft_phi_2_text_generation
human_eval_mistral_7b_v01_text_generation
human_eval_mistral_large_text_generation
human_eval_mistralai-mistral-7b-instruct-v0-2_text_generation
human_eval_mistralai-mixtral-8x7b-instruct-v01_text_generation
human_eval_mistralai-mixtral-8x7b-v01_text_generation
human_eval_mistralai-mixtral-8x22b-instruct-v0-1_text_generation
human_eval_mistralai-mixtral-8x22b-v0-1_text_generation
human_eval_phi-3-medium-4k-instruct_text_generation
human_eval_phi-3-medium-128k-instruct_text_generation
human_eval_phi-3-mini-4k-instruct_chat_completion
human_eval_phi-3-mini-128k-instruct_chat_completion
human_eval_phi-3-small-8k-instruct_text_generation
human_eval_phi-3-small-128k-instruct_text_generation
lccsentimentclassification_cohere-embed-v3-english_classification
lccsentimentclassification_cohere-embed-v3-multilingual_classification
lccsentimentclassification_text-embedding-3-large_classification
lccsentimentclassification_text-embedding-3-small_classification
lccsentimentclassification_text-embedding-ada-002_classification
legalbenchpc_cohere-embed-v3-english_pair_classification
legalbenchpc_cohere-embed-v3-multilingual_pair_classification
legalbenchpc_text-embedding-3-large_pair_classification
legalbenchpc_text-embedding-3-small_pair_classification
legalbenchpc_text-embedding-ada-002_pair_classification
mmlu_humanities__gpt-4-0125-preview__question_answering
mmlu_humanities__meta-llama-3_1-8b-instruct__question_answering
mmlu_humanities__meta-llama-3_1-70b-instruct__question_answering
mmlu_humanities_cohere_command_r_plus_question_answering
mmlu_humanities_cohere_command_r_question_answering
mmlu_humanities_databricks-dbrx-base_question_answering
mmlu_humanities_databricks-dbrx-instruct_question_answering
mmlu_humanities_gpt-4-turbo-2024-04-09_chat_completion
mmlu_humanities_gpt-4o_question_answering
mmlu_humanities_gpt_4_32k_0314_question_answering
mmlu_humanities_gpt_4_32k_0613_question_answering
mmlu_humanities_gpt_4_0314_question_answering
mmlu_humanities_gpt_4_0613_question_answering
mmlu_humanities_gpt_35_turbo_0301_question_answering
mmlu_humanities_gpt_35_turbo_0613_question_answering
mmlu_humanities_llama_2_7b_chat_question_answering
mmlu_humanities_llama_2_7b_question_answering
mmlu_humanities_llama_2_13b_chat_question_answering
mmlu_humanities_llama_2_13b_question_answering
mmlu_humanities_llama_2_70b_chat_question_answering
mmlu_humanities_llama_2_70b_question_answering
mmlu_humanities_meta-llama-3-8b-instruct_question_answering
mmlu_humanities_meta-llama-3-8b_question_answering
mmlu_humanities_meta-llama-3-70b-instruct_question_answering
mmlu_humanities_meta-llama-3-70b_question_answering
mmlu_humanities_meta-llama-3_1-405b-instruct_question_answering
mmlu_humanities_microsoft_phi_2_question_answering
mmlu_humanities_mistral-community-mixtral-8x22b-v0-1_question_answering
mmlu_humanities_mistral_7b_instruct_v01_question_answering
mmlu_humanities_mistral_7b_v01_question_answering
mmlu_humanities_mistral_large_question_answering
mmlu_humanities_mistralai-mistral-7b-instruct-v0-2_question_answering
mmlu_humanities_mistralai-mixtral-8x7b-instruct-v01_question_answering
mmlu_humanities_mistralai-mixtral-8x7b-v01_question_answering
mmlu_humanities_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
mmlu_humanities_mistralai-mixtral-8x22b-v0-1_question_answering
mmlu_humanities_phi-3-medium-4k-instruct_question_answering
mmlu_humanities_phi-3-medium-128k-instruct_question_answering
mmlu_humanities_phi-3-mini-4k-instruct_chat_completion
mmlu_humanities_phi-3-mini-128k-instruct_chat_completion
mmlu_humanities_phi-3-small-8k-instruct_question_answering
mmlu_humanities_phi-3-small-128k-instruct_question_answering
mmlu_other__gpt-4-0125-preview__question_answering
mmlu_other__meta-llama-3_1-8b-instruct__question_answering
mmlu_other__meta-llama-3_1-70b-instruct__question_answering
mmlu_other_cohere_command_r_plus_question_answering
mmlu_other_cohere_command_r_question_answering
mmlu_other_databricks-dbrx-base_question_answering
mmlu_other_databricks-dbrx-instruct_question_answering
mmlu_other_gpt-4-turbo-2024-04-09_chat_completion
mmlu_other_gpt-4o_question_answering
mmlu_other_gpt_4_32k_0314_question_answering
mmlu_other_gpt_4_32k_0613_question_answering
mmlu_other_gpt_4_0314_question_answering
mmlu_other_gpt_4_0613_question_answering
mmlu_other_gpt_35_turbo_0301_question_answering
mmlu_other_gpt_35_turbo_0613_question_answering
mmlu_other_llama_2_7b_chat_question_answering
mmlu_other_llama_2_7b_question_answering
mmlu_other_llama_2_13b_chat_question_answering
mmlu_other_llama_2_13b_question_answering
mmlu_other_llama_2_70b_chat_question_answering
mmlu_other_llama_2_70b_question_answering
mmlu_other_meta-llama-3-8b-instruct_question_answering
mmlu_other_meta-llama-3-8b_question_answering
mmlu_other_meta-llama-3-70b-instruct_question_answering
mmlu_other_meta-llama-3-70b_question_answering
mmlu_other_meta-llama-3_1-405b-instruct_question_answering
mmlu_other_microsoft_phi_2_question_answering
mmlu_other_mistral-community-mixtral-8x22b-v0-1_question_answering
mmlu_other_mistral_7b_instruct_v01_question_answering
mmlu_other_mistral_7b_v01_question_answering
mmlu_other_mistral_large_question_answering
mmlu_other_mistralai-mistral-7b-instruct-v0-2_question_answering
mmlu_other_mistralai-mixtral-8x7b-instruct-v01_question_answering
mmlu_other_mistralai-mixtral-8x7b-v01_question_answering
mmlu_other_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
mmlu_other_mistralai-mixtral-8x22b-v0-1_question_answering
mmlu_other_phi-3-medium-4k-instruct_question_answering
mmlu_other_phi-3-medium-128k-instruct_question_answering
mmlu_other_phi-3-mini-4k-instruct_chat_completion
mmlu_other_phi-3-mini-128k-instruct_chat_completion
mmlu_other_phi-3-small-8k-instruct_question_answering
mmlu_other_phi-3-small-128k-instruct_question_answering
mmlu_social_sciences__gpt-4-0125-preview__question_answering
mmlu_social_sciences__meta-llama-3_1-8b-instruct__question_answering
mmlu_social_sciences__meta-llama-3_1-70b-instruct__question_answering
mmlu_social_sciences_cohere_command_r_plus_question_answering
mmlu_social_sciences_cohere_command_r_question_answering
mmlu_social_sciences_databricks-dbrx-base_question_answering
mmlu_social_sciences_databricks-dbrx-instruct_question_answering
mmlu_social_sciences_gpt-4-turbo-2024-04-09_chat_completion
mmlu_social_sciences_gpt-4o_question_answering
mmlu_social_sciences_gpt_4_32k_0314_question_answering
mmlu_social_sciences_gpt_4_32k_0613_question_answering
mmlu_social_sciences_gpt_4_0314_question_answering
mmlu_social_sciences_gpt_4_0613_question_answering
mmlu_social_sciences_gpt_35_turbo_0301_question_answering
mmlu_social_sciences_gpt_35_turbo_0613_question_answering
mmlu_social_sciences_llama_2_7b_chat_question_answering
mmlu_social_sciences_llama_2_7b_question_answering
mmlu_social_sciences_llama_2_13b_chat_question_answering
mmlu_social_sciences_llama_2_13b_question_answering
mmlu_social_sciences_llama_2_70b_chat_question_answering
mmlu_social_sciences_llama_2_70b_question_answering
mmlu_social_sciences_meta-llama-3-8b-instruct_question_answering
mmlu_social_sciences_meta-llama-3-8b_question_answering
mmlu_social_sciences_meta-llama-3-70b-instruct_question_answering
mmlu_social_sciences_meta-llama-3-70b_question_answering
mmlu_social_sciences_meta-llama-3_1-405b-instruct_question_answering
mmlu_social_sciences_microsoft_phi_2_question_answering
mmlu_social_sciences_mistral-community-mixtral-8x22b-v0-1_question_answering
mmlu_social_sciences_mistral_7b_instruct_v01_question_answering
mmlu_social_sciences_mistral_7b_v01_question_answering
mmlu_social_sciences_mistral_large_question_answering
mmlu_social_sciences_mistralai-mistral-7b-instruct-v0-2_question_answering
mmlu_social_sciences_mistralai-mixtral-8x7b-instruct-v01_question_answering
mmlu_social_sciences_mistralai-mixtral-8x7b-v01_question_answering
mmlu_social_sciences_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
mmlu_social_sciences_mistralai-mixtral-8x22b-v0-1_question_answering
mmlu_social_sciences_phi-3-medium-4k-instruct_question_answering
mmlu_social_sciences_phi-3-medium-128k-instruct_question_answering
mmlu_social_sciences_phi-3-mini-4k-instruct_chat_completion
mmlu_social_sciences_phi-3-mini-128k-instruct_chat_completion
mmlu_social_sciences_phi-3-small-8k-instruct_question_answering
mmlu_social_sciences_phi-3-small-128k-instruct_question_answering
mmlu_stem__gpt-4-0125-preview__question_answering
mmlu_stem__meta-llama-3_1-8b-instruct__question_answering
mmlu_stem__meta-llama-3_1-70b-instruct__question_answering
mmlu_stem_cohere_command_r_plus_question_answering
mmlu_stem_cohere_command_r_question_answering
mmlu_stem_databricks-dbrx-base_question_answering
mmlu_stem_databricks-dbrx-instruct_question_answering
mmlu_stem_gpt-4-turbo-2024-04-09_chat_completion
mmlu_stem_gpt-4o_question_answering
mmlu_stem_gpt_4_32k_0314_question_answering
mmlu_stem_gpt_4_32k_0613_question_answering
mmlu_stem_gpt_4_0314_question_answering
mmlu_stem_gpt_4_0613_question_answering
mmlu_stem_gpt_35_turbo_0301_question_answering
mmlu_stem_gpt_35_turbo_0613_question_answering
mmlu_stem_llama_2_7b_chat_question_answering
mmlu_stem_llama_2_7b_question_answering
mmlu_stem_llama_2_13b_chat_question_answering
mmlu_stem_llama_2_13b_question_answering
mmlu_stem_llama_2_70b_chat_question_answering
mmlu_stem_llama_2_70b_question_answering
mmlu_stem_meta-llama-3-8b-instruct_question_answering
mmlu_stem_meta-llama-3-8b_question_answering
mmlu_stem_meta-llama-3-70b-instruct_question_answering
mmlu_stem_meta-llama-3-70b_question_answering
mmlu_stem_meta-llama-3_1-405b-instruct_question_answering
mmlu_stem_microsoft_phi_2_question_answering
mmlu_stem_mistral-community-mixtral-8x22b-v0-1_question_answering
mmlu_stem_mistral_7b_instruct_v01_question_answering
mmlu_stem_mistral_7b_v01_question_answering
mmlu_stem_mistral_large_question_answering
mmlu_stem_mistralai-mistral-7b-instruct-v0-2_question_answering
mmlu_stem_mistralai-mixtral-8x7b-instruct-v01_question_answering
mmlu_stem_mistralai-mixtral-8x7b-v01_question_answering
mmlu_stem_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
mmlu_stem_mistralai-mixtral-8x22b-v0-1_question_answering
mmlu_stem_phi-3-medium-4k-instruct_question_answering
mmlu_stem_phi-3-medium-128k-instruct_question_answering
mmlu_stem_phi-3-mini-4k-instruct_chat_completion
mmlu_stem_phi-3-mini-128k-instruct_chat_completion
mmlu_stem_phi-3-small-8k-instruct_question_answering
mmlu_stem_phi-3-small-128k-instruct_question_answering
mscoco__stabilityai-stable-diffusion-2-1__image_generation
openbookqa__gpt-4-0125-preview__question_answering
openbookqa__meta-llama-3_1-8b-instruct__question_answering
openbookqa__meta-llama-3_1-70b-instruct__question_answering
openbookqa_cohere_command_r_plus_question_answering
openbookqa_cohere_command_r_question_answering
openbookqa_databricks-dbrx-base_question_answering
openbookqa_databricks-dbrx-instruct_question_answering
openbookqa_gpt-4-turbo-2024-04-09_chat_completion
openbookqa_gpt-4o_question_answering
openbookqa_gpt_4_32k_0314_question_answering
openbookqa_gpt_4_32k_0613_question_answering
openbookqa_gpt_4_0314_question_answering
openbookqa_gpt_4_0613_question_answering
openbookqa_gpt_35_turbo_0301_question_answering
openbookqa_gpt_35_turbo_0613_question_answering
openbookqa_llama_2_7b_chat_question_answering
openbookqa_llama_2_7b_question_answering
openbookqa_llama_2_13b_chat_question_answering
openbookqa_llama_2_13b_question_answering
openbookqa_llama_2_70b_chat_question_answering
openbookqa_llama_2_70b_question_answering
openbookqa_meta-llama-3-8b-instruct_question_answering
openbookqa_meta-llama-3-8b_question_answering
openbookqa_meta-llama-3-70b-instruct_question_answering
openbookqa_meta-llama-3-70b_question_answering
openbookqa_meta-llama-3_1-405b-instruct_question_answering
openbookqa_microsoft_phi_2_question_answering
openbookqa_mistral-community-mixtral-8x22b-v0-1_question_answering
openbookqa_mistral_7b_instruct_v01_question_answering
openbookqa_mistral_7b_v01_question_answering
openbookqa_mistral_large_question_answering
openbookqa_mistralai-mistral-7b-instruct-v0-2_question_answering
openbookqa_mistralai-mixtral-8x7b-instruct-v01_question_answering
openbookqa_mistralai-mixtral-8x7b-v01_question_answering
openbookqa_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
openbookqa_mistralai-mixtral-8x22b-v0-1_question_answering
openbookqa_phi-3-medium-4k-instruct_question_answering
openbookqa_phi-3-medium-128k-instruct_question_answering
openbookqa_phi-3-mini-4k-instruct_chat_completion
openbookqa_phi-3-mini-128k-instruct_chat_completion
openbookqa_phi-3-small-8k-instruct_question_answering
openbookqa_phi-3-small-128k-instruct_question_answering
piqa__gpt-4-0125-preview__question_answering
piqa__meta-llama-3_1-8b-instruct__question_answering
piqa__meta-llama-3_1-70b-instruct__question_answering
piqa_cohere_command_r_plus_question_answering
piqa_cohere_command_r_question_answering
piqa_databricks-dbrx-base_question_answering
piqa_databricks-dbrx-instruct_question_answering
piqa_gpt-4-turbo-2024-04-09_chat_completion
piqa_gpt-4o_question_answering
piqa_gpt_4_32k_0314_question_answering
piqa_gpt_4_32k_0613_question_answering
piqa_gpt_4_0314_question_answering
piqa_gpt_4_0613_question_answering
piqa_gpt_35_turbo_0301_question_answering
piqa_gpt_35_turbo_0613_question_answering
piqa_llama_2_7b_chat_question_answering
piqa_llama_2_7b_question_answering
piqa_llama_2_13b_chat_question_answering
piqa_llama_2_13b_question_answering
piqa_llama_2_70b_chat_question_answering
piqa_llama_2_70b_question_answering
piqa_meta-llama-3-8b-instruct_question_answering
piqa_meta-llama-3-8b_question_answering
piqa_meta-llama-3-70b-instruct_question_answering
piqa_meta-llama-3-70b_question_answering
piqa_meta-llama-3_1-405b-instruct_question_answering
piqa_microsoft_phi_2_question_answering
piqa_mistral-community-mixtral-8x22b-v0-1_question_answering
piqa_mistral_7b_instruct_v01_question_answering
piqa_mistral_7b_v01_question_answering
piqa_mistral_large_question_answering
piqa_mistralai-mistral-7b-instruct-v0-2_question_answering
piqa_mistralai-mixtral-8x7b-instruct-v01_question_answering
piqa_mistralai-mixtral-8x7b-v01_question_answering
piqa_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
piqa_mistralai-mixtral-8x22b-v0-1_question_answering
piqa_phi-3-medium-4k-instruct_question_answering
piqa_phi-3-medium-128k-instruct_question_answering
piqa_phi-3-mini-4k-instruct_chat_completion
piqa_phi-3-mini-128k-instruct_chat_completion
piqa_phi-3-small-8k-instruct_question_answering
piqa_phi-3-small-128k-instruct_question_answering
scidocsrr_cohere-embed-v3-english_reranking
scidocsrr_cohere-embed-v3-multilingual_reranking
scidocsrr_text-embedding-3-large_reranking
scidocsrr_text-embedding-3-small_reranking
scidocsrr_text-embedding-ada-002_reranking
scifact-pl_cohere-embed-v3-english_retrieval
scifact-pl_cohere-embed-v3-multilingual_retrieval
scifact-pl_text-embedding-3-large_retrieval
scifact-pl_text-embedding-3-small_retrieval
scifact-pl_text-embedding-ada-002_retrieval
scifact_cohere-embed-v3-english_retrieval
scifact_cohere-embed-v3-multilingual_retrieval
scifact_text-embedding-3-large_retrieval
scifact_text-embedding-3-small_retrieval
scifact_text-embedding-ada-002_retrieval
social_iqa__gpt-4-0125-preview__question_answering
social_iqa__meta-llama-3_1-8b-instruct__question_answering
social_iqa__meta-llama-3_1-70b-instruct__question_answering
social_iqa_cohere_command_r_plus_question_answering
social_iqa_cohere_command_r_question_answering
social_iqa_databricks-dbrx-base_question_answering
social_iqa_databricks-dbrx-instruct_question_answering
social_iqa_gpt-4-turbo-2024-04-09_chat_completion
social_iqa_gpt-4o_question_answering
social_iqa_gpt_4_32k_0314_question_answering
social_iqa_gpt_4_32k_0613_question_answering
social_iqa_gpt_4_0314_question_answering
social_iqa_gpt_4_0613_question_answering
social_iqa_gpt_35_turbo_0301_question_answering
social_iqa_gpt_35_turbo_0613_question_answering
social_iqa_llama_2_7b_chat_question_answering
social_iqa_llama_2_7b_question_answering
social_iqa_llama_2_13b_chat_question_answering
social_iqa_llama_2_13b_question_answering
social_iqa_llama_2_70b_chat_question_answering
social_iqa_llama_2_70b_question_answering
social_iqa_meta-llama-3-8b-instruct_question_answering
social_iqa_meta-llama-3-8b_question_answering
social_iqa_meta-llama-3-70b-instruct_question_answering
social_iqa_meta-llama-3-70b_question_answering
social_iqa_meta-llama-3_1-405b-instruct_question_answering
social_iqa_microsoft_phi_2_question_answering
social_iqa_mistral-community-mixtral-8x22b-v0-1_question_answering
social_iqa_mistral_7b_instruct_v01_question_answering
social_iqa_mistral_7b_v01_question_answering
social_iqa_mistral_large_question_answering
social_iqa_mistralai-mistral-7b-instruct-v0-2_question_answering
social_iqa_mistralai-mixtral-8x7b-instruct-v01_question_answering
social_iqa_mistralai-mixtral-8x7b-v01_question_answering
social_iqa_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
social_iqa_mistralai-mixtral-8x22b-v0-1_question_answering
social_iqa_phi-3-medium-4k-instruct_question_answering
social_iqa_phi-3-medium-128k-instruct_question_answering
social_iqa_phi-3-mini-4k-instruct_chat_completion
social_iqa_phi-3-mini-128k-instruct_chat_completion
social_iqa_phi-3-small-8k-instruct_question_answering
social_iqa_phi-3-small-128k-instruct_question_answering
squad_v2__gpt-4-0125-preview__question_answering
squad_v2__meta-llama-3_1-8b-instruct__question_answering
squad_v2__meta-llama-3_1-70b-instruct__question_answering
squad_v2_cohere-command-r-plus_question_answering
squad_v2_cohere-command-r_question_answering
squad_v2_databricks-dbrx-base_question_answering
squad_v2_databricks-dbrx-instruct_question_answering
squad_v2_gpt-4-32k-0314_question_answering
squad_v2_gpt-4-32k-0613_question_answering
squad_v2_gpt-4-0314_question_answering
squad_v2_gpt-4-0613_question_answering
squad_v2_gpt-4-turbo-2024-04-09_chat_completion
squad_v2_gpt-4o_question_answering
squad_v2_gpt-35-turbo-0301_question_answering
squad_v2_gpt-35-turbo-0613_question_answering
squad_v2_llama-2-7b-chat_question_answering
squad_v2_llama-2-7b_question_answering
squad_v2_llama-2-13b-chat_question_answering
squad_v2_llama-2-13b_question_answering
squad_v2_llama-2-70b-chat_question_answering
squad_v2_llama-2-70b_question_answering
squad_v2_meta-llama-3-8b-instruct_question_answering
squad_v2_meta-llama-3-70b-instruct_question_answering
squad_v2_meta-llama-3_1-405b-instruct_question_answering
squad_v2_microsoft-phi-2_question_answering
squad_v2_mistral-community-mixtral-8x22b-v0-1_question_answering
squad_v2_mistral-large_question_answering
squad_v2_mistralai-mistral-7b-v01_question_answering
squad_v2_mistralai-mixtral-8x7b-instruct-v01_question_answering
squad_v2_mistralai-mixtral-8x7b-v01_question_answering
squad_v2_mistralai-mixtral-8x22b-v0-1_question_answering
squad_v2_mistralaimistral7binstruct_question_answering
squad_v2_mixtral8x22binstructv01_question_answering
squad_v2_phi-3-medium-4k-instruct_question_answering
squad_v2_phi-3-medium-128k-instruct_question_answering
squad_v2_phi-3-small-8k-instruct_question_answering
squad_v2_phi-3-small-128k-instruct_question_answering
squad_v2_phi3-mini-4k-instruct_chat_completion
squad_v2_phi3-mini-128k-instruct_chat_completion
stsbenchmark_cohere-embed-v3-english_sts
stsbenchmark_cohere-embed-v3-multilingual_sts
stsbenchmark_text-embedding-3-large_sts
stsbenchmark_text-embedding-3-small_sts
stsbenchmark_text-embedding-ada-002_sts
summeval_cohere-embed-v3-english_summarization
summeval_cohere-embed-v3-multilingual_summarization
summeval_text-embedding-3-large_summarization
summeval_text-embedding-3-small_summarization
summeval_text-embedding-ada-002_summarization
tatoeba_cohere-embed-v3-english_bitext_mining
tatoeba_cohere-embed-v3-multilingual_bitext_mining
tatoeba_text-embedding-3-large_bitext_mining
tatoeba_text-embedding-3-small_bitext_mining
tatoeba_text-embedding-ada-002_bitext_mining
toxicconversationsclassification_cohere-embed-v3-english_classification
toxicconversationsclassification_cohere-embed-v3-multilingual_classification
toxicconversationsclassification_text-embedding-3-large_classification
toxicconversationsclassification_text-embedding-3-small_classification
toxicconversationsclassification_text-embedding-ada-002_classification
truthfulqa_generation__gpt-4-0125-preview__question_answering
truthfulqa_generation__meta-llama-3_1-8b-instruct__question_answering
truthfulqa_generation__meta-llama-3_1-70b-instruct__question_answering
truthfulqa_generation_cohere-command-r-plus_question_answering
truthfulqa_generation_cohere-command-r_question_answering
truthfulqa_generation_communitymixtral8x22bv01_question_answering
truthfulqa_generation_databricks-dbrx-base_question_answering
truthfulqa_generation_databricks-dbrx-instruct_question_answering
truthfulqa_generation_gpt-4-32k-0314_question_answering
truthfulqa_generation_gpt-4-32k-0613_question_answering
truthfulqa_generation_gpt-4-0314_question_answering
truthfulqa_generation_gpt-4-0613_question_answering
truthfulqa_generation_gpt-4-turbo-2024-04-09_chat_completion
truthfulqa_generation_gpt-4o_question_answering
truthfulqa_generation_gpt-35-turbo-0301_question_answering
truthfulqa_generation_gpt-35-turbo-0613_question_answering
truthfulqa_generation_llama-2-7b-chat_question_answering
truthfulqa_generation_llama-2-7b_question_answering
truthfulqa_generation_llama-2-13b-chat_question_answering
truthfulqa_generation_llama-2-13b_question_answering
truthfulqa_generation_llama-2-70b-chat_question_answering
truthfulqa_generation_llama-2-70b_question_answering
truthfulqa_generation_meta-llama-3-8b-instruct_question_answering
truthfulqa_generation_meta-llama-3-70b-instruct_question_answering
truthfulqa_generation_meta-llama-3_1-405b-instruct_question_answering
truthfulqa_generation_microsoft-phi-2_question_answering
truthfulqa_generation_microsoft_phi_2_question_answering
truthfulqa_generation_mistral-large_question_answering
truthfulqa_generation_mistral_7b_instruct_v01_question_answering
truthfulqa_generation_mistral_7b_v01_question_answering
truthfulqa_generation_mistralai-mistral-7b-instruct-v0-2_question_answering
truthfulqa_generation_mistralai-mistral-7b-v01_question_answering
truthfulqa_generation_mistralai-mixtral-8x7b-instruct-v01_question_answering
truthfulqa_generation_mistralai-mixtral-8x7b-v01_question_answering
truthfulqa_generation_mistralai-mixtral-8x22b-v0-1_question_answering
truthfulqa_generation_mistralaimistral7binstruct_question_answering
truthfulqa_generation_mixtral8x7binstructv01_question_answering
truthfulqa_generation_mixtral8x22binstructv01_question_answering
truthfulqa_generation_phi-3-medium-4k-instruct_question_answering
truthfulqa_generation_phi-3-medium-128k-instruct_question_answering
truthfulqa_generation_phi-3-small-8k-instruct_question_answering
truthfulqa_generation_phi-3-small-128k-instruct_question_answering
truthfulqa_generation_phi3-mini-4k-instruct_chat_completion
truthfulqa_generation_phi3-mini-128k-instruct_chat_completion
truthfulqa_mc1__gpt-4-0125-preview__question_answering
truthfulqa_mc1__meta-llama-3_1-8b-instruct__question_answering
truthfulqa_mc1__meta-llama-3_1-70b-instruct__question_answering
truthfulqa_mc1_cohere_command_r_plus_question_answering
truthfulqa_mc1_cohere_command_r_question_answering
truthfulqa_mc1_databricks-dbrx-base_question_answering
truthfulqa_mc1_databricks-dbrx-instruct_question_answering
truthfulqa_mc1_gpt-4-turbo-2024-04-09_chat_completion
truthfulqa_mc1_gpt-4o_question_answering
truthfulqa_mc1_gpt_4_32k_0314_question_answering
truthfulqa_mc1_gpt_4_32k_0613_question_answering
truthfulqa_mc1_gpt_4_0314_question_answering
truthfulqa_mc1_gpt_4_0613_question_answering
truthfulqa_mc1_gpt_35_turbo_0301_question_answering
truthfulqa_mc1_gpt_35_turbo_0613_question_answering
truthfulqa_mc1_llama_2_7b_chat_question_answering
truthfulqa_mc1_llama_2_7b_question_answering
truthfulqa_mc1_llama_2_13b_chat_question_answering
truthfulqa_mc1_llama_2_13b_question_answering
truthfulqa_mc1_llama_2_70b_chat_question_answering
truthfulqa_mc1_llama_2_70b_question_answering
truthfulqa_mc1_meta-llama-3-8b-instruct_question_answering
truthfulqa_mc1_meta-llama-3-8b_question_answering
truthfulqa_mc1_meta-llama-3-70b-instruct_question_answering
truthfulqa_mc1_meta-llama-3-70b_question_answering
truthfulqa_mc1_meta-llama-3_1-405b-instruct_question_answering
truthfulqa_mc1_microsoft_phi_2_question_answering
truthfulqa_mc1_mistral-community-mixtral-8x22b-v0-1_question_answering
truthfulqa_mc1_mistral_7b_instruct_v01_question_answering
truthfulqa_mc1_mistral_7b_v01_question_answering
truthfulqa_mc1_mistral_large_question_answering
truthfulqa_mc1_mistralai-mistral-7b-instruct-v0-2_question_answering
truthfulqa_mc1_mistralai-mixtral-8x7b-instruct-v01_question_answering
truthfulqa_mc1_mistralai-mixtral-8x7b-v01_question_answering
truthfulqa_mc1_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
truthfulqa_mc1_mistralai-mixtral-8x22b-v0-1_question_answering
truthfulqa_mc1_phi-3-medium-4k-instruct_question_answering
truthfulqa_mc1_phi-3-medium-128k-instruct_question_answering
truthfulqa_mc1_phi-3-mini-4k-instruct_chat_completion
truthfulqa_mc1_phi-3-mini-128k-instruct_chat_completion
truthfulqa_mc1_phi-3-small-8k-instruct_question_answering
truthfulqa_mc1_phi-3-small-128k-instruct_question_answering
tweetsentimentextractionclassification_cohere-embed-v3-english_classification
tweetsentimentextractionclassification_cohere-embed-v3-multilingual_classification
tweetsentimentextractionclassification_text-embedding-3-large_classification
tweetsentimentextractionclassification_text-embedding-3-small_classification
tweetsentimentextractionclassification_text-embedding-ada-002_classification
twentynewsgroupsclustering.v2_cohere-embed-v3-english_clustering
twentynewsgroupsclustering.v2_cohere-embed-v3-multilingual_clustering
twentynewsgroupsclustering.v2_text-embedding-3-large_clustering
twentynewsgroupsclustering.v2_text-embedding-3-small_clustering
twentynewsgroupsclustering.v2_text-embedding-ada-002_clustering
winogrande__gpt-4-0125-preview__question_answering
winogrande__meta-llama-3_1-8b-instruct__question_answering
winogrande__meta-llama-3_1-70b-instruct__question_answering
winogrande_cohere_command_r_plus_question_answering
winogrande_cohere_command_r_question_answering
winogrande_databricks-dbrx-base_question_answering
winogrande_databricks-dbrx-instruct_question_answering
winogrande_gpt-4-turbo-2024-04-09_chat_completion
winogrande_gpt-4o_question_answering
winogrande_gpt_4_32k_0314_question_answering
winogrande_gpt_4_32k_0613_question_answering
winogrande_gpt_4_0314_question_answering
winogrande_gpt_4_0613_question_answering
winogrande_gpt_35_turbo_0301_question_answering
winogrande_gpt_35_turbo_0613_question_answering
winogrande_llama_2_7b_chat_question_answering
winogrande_llama_2_7b_question_answering
winogrande_llama_2_13b_chat_question_answering
winogrande_llama_2_13b_question_answering
winogrande_llama_2_70b_chat_question_answering
winogrande_llama_2_70b_question_answering
winogrande_meta-llama-3-8b-instruct_question_answering
winogrande_meta-llama-3-8b_question_answering
winogrande_meta-llama-3-70b-instruct_question_answering
winogrande_meta-llama-3-70b_question_answering
winogrande_meta-llama-3_1-405b-instruct_question_answering
winogrande_microsoft_phi_2_question_answering
winogrande_mistral-community-mixtral-8x22b-v0-1_question_answering
winogrande_mistral_7b_instruct_v01_question_answering
winogrande_mistral_7b_v01_question_answering
winogrande_mistral_large_question_answering
winogrande_mistralai-mistral-7b-instruct-v0-2_question_answering
winogrande_mistralai-mixtral-8x7b-instruct-v01_question_answering
winogrande_mistralai-mixtral-8x7b-v01_question_answering
winogrande_mistralai-mixtral-8x22b-instruct-v0-1_question_answering
winogrande_mistralai-mixtral-8x22b-v0-1_question_answering
winogrande_phi-3-medium-4k-instruct_question_answering
winogrande_phi-3-medium-128k-instruct_question_answering
winogrande_phi-3-mini-4k-instruct_chat_completion
winogrande_phi-3-mini-128k-instruct_chat_completion
winogrande_phi-3-small-8k-instruct_question_answering
winogrande_phi-3-small-128k-instruct_question_answering