Index of /helm/benchmark_output/runs/mmlu

[ICO]NameLast modifiedSizeDescription

[DIR]Parent Directory  -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=openai_gpt-4-0613/04-Mar-2024 13:07 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=anthropic_claude-2.1/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=google_text-unicorn@001/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=meta_llama-2-70b/04-Mar-2024 13:47 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_abstract_algebra/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_abstract_algebra/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_abstract_algebra/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_abstract_algebra/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_abstract_algebra/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_abstract_algebra/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_abstract_algebra/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_anatomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_anatomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_anatomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_anatomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_anatomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_anatomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_anatomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_astronomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_astronomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_astronomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_astronomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_astronomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_astronomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_astronomy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_business_ethics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_business_ethics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_business_ethics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_business_ethics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_business_ethics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_business_ethics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_business_ethics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_clinical_knowledge/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_clinical_knowledge/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_clinical_knowledge/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_clinical_knowledge/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_clinical_knowledge/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_clinical_knowledge/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_clinical_knowledge/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_college_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_college_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_college_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_college_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_college_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_college_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_college_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_college_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_college_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_college_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_college_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_college_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_college_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_college_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_college_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_college_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_college_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_college_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_college_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_college_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_college_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_college_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_college_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_college_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_college_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_college_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_college_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_college_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_college_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_college_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_college_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_college_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_college_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_college_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_college_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_college_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_college_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_college_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_college_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_college_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_computer_security/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_college_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_computer_security/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_college_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_computer_security/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_computer_security/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_computer_security/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_computer_security/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_conceptual_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_computer_security/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_conceptual_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_conceptual_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_conceptual_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_conceptual_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_conceptual_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_conceptual_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_econometrics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_econometrics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_econometrics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_econometrics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_electrical_engineering/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_econometrics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_econometrics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_econometrics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_electrical_engineering/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_electrical_engineering/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_electrical_engineering/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_electrical_engineering/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_elementary_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_electrical_engineering/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_elementary_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_electrical_engineering/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_elementary_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_elementary_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_elementary_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_elementary_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_formal_logic/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_elementary_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_formal_logic/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_formal_logic/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_formal_logic/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_formal_logic/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_global_facts/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_formal_logic/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_global_facts/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_formal_logic/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_global_facts/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_global_facts/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_global_facts/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_global_facts/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_global_facts/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_biology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_chemistry/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_computer_science/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_european_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_european_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_european_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_european_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_european_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_european_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_european_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_geography/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_geography/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_geography/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_geography/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_geography/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_geography/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_government_and_politics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_government_and_politics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_geography/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_government_and_politics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_government_and_politics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_government_and_politics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_government_and_politics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_macroeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_government_and_politics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_macroeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_macroeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_macroeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_macroeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_macroeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_macroeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_microeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_mathematics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_microeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_microeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_microeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_microeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_microeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_microeconomics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_physics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_statistics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_statistics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_statistics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_statistics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_statistics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_statistics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_statistics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_us_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_us_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_us_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_us_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_us_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_us_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_us_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_high_school_world_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_high_school_world_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_high_school_world_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_high_school_world_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_high_school_world_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_high_school_world_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_human_aging/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_high_school_world_history/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_human_aging/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_human_aging/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_human_aging/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_human_aging/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_human_aging/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_human_aging/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_human_sexuality/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_human_sexuality/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_human_sexuality/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_human_sexuality/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_human_sexuality/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_human_sexuality/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_international_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_human_sexuality/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_international_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_international_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_international_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_international_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_international_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_international_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_jurisprudence/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_jurisprudence/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_jurisprudence/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_jurisprudence/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_jurisprudence/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_logical_fallacies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_jurisprudence/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_jurisprudence/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_logical_fallacies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_logical_fallacies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_logical_fallacies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_logical_fallacies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_logical_fallacies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_machine_learning/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_machine_learning/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_logical_fallacies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_machine_learning/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_machine_learning/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_machine_learning/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_machine_learning/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_machine_learning/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_management/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_management/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_management/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_management/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_management/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_management/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_management/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_marketing/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_marketing/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_marketing/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_marketing/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_marketing/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_marketing/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_marketing/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_medical_genetics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_medical_genetics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_medical_genetics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_medical_genetics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_medical_genetics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_medical_genetics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_miscellaneous/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_medical_genetics/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_miscellaneous/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_miscellaneous/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_miscellaneous/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_miscellaneous/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_miscellaneous/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_miscellaneous/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_moral_disputes/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_moral_disputes/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_moral_disputes/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_moral_disputes/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_moral_disputes/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_moral_disputes/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_moral_disputes/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_moral_scenarios/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_moral_scenarios/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_moral_scenarios/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_moral_scenarios/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_nutrition/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_moral_scenarios/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_moral_scenarios/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_moral_scenarios/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_nutrition/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_nutrition/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_nutrition/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_nutrition/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_nutrition/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_philosophy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_philosophy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_nutrition/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_philosophy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_philosophy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_philosophy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_philosophy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_philosophy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_prehistory/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_prehistory/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_prehistory/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_prehistory/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_prehistory/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_prehistory/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_prehistory/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_professional_accounting/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_professional_accounting/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_professional_accounting/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_professional_accounting/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_professional_accounting/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_professional_accounting/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_professional_accounting/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_professional_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_professional_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_professional_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_professional_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_professional_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_professional_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_professional_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_professional_law/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_professional_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_professional_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_professional_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_professional_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_professional_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_professional_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_professional_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_professional_medicine/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_professional_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_professional_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_professional_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_professional_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_professional_psychology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_public_relations/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_public_relations/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_public_relations/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_public_relations/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_public_relations/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_public_relations/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_security_studies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_public_relations/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_security_studies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_security_studies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_security_studies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_security_studies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_security_studies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_sociology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_security_studies/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_sociology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_sociology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_sociology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_sociology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_sociology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_us_foreign_policy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_sociology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_us_foreign_policy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_us_foreign_policy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_us_foreign_policy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_us_foreign_policy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_us_foreign_policy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_us_foreign_policy/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_virology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_virology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_virology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_virology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_virology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_virology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_virology/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=google_text-unicorn@001,groups=mmlu_world_religions/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=anthropic_claude-2.1,groups=mmlu_world_religions/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=meta_llama-2-70b,groups=mmlu_world_religions/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=meta_llama-2-13b,groups=mmlu_world_religions/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=meta_llama-2-7b,groups=mmlu_world_religions/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=microsoft_phi-2,groups=mmlu_world_religions/11-Mar-2024 11:47 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=openai_gpt-4-0613,groups=mmlu_world_religions/11-Mar-2024 11:47 -  
[DIR]eval_cache/22-Mar-2024 19:39 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=anthropic_claude-instant-1.2,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=01-ai_yi-6b,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=google_text-bison@001,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=anthropic_claude-2.1,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=google_gemini-pro,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=meta_llama-2-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=microsoft_phi-2,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=openai_gpt-3.5-turbo-0613,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=openai_gpt-4-1106-preview,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=01-ai_yi-6b,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=anthropic_claude-instant-1.2,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=anthropic_claude-2.1,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=qwen_qwen1.5-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=google_gemini-pro,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=meta_llama-2-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=microsoft_phi-2,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=google_text-bison@001,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=openai_gpt-4-1106-preview,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=openai_gpt-3.5-turbo-0613,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=qwen_qwen1.5-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=01-ai_yi-6b,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=anthropic_claude-2.1,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=anthropic_claude-instant-1.2,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=google_gemini-pro,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=google_text-bison@001,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=microsoft_phi-2,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=qwen_qwen1.5-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=openai_gpt-4-1106-preview,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=meta_llama-2-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=openai_gpt-3.5-turbo-0613,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=01-ai_yi-6b,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=anthropic_claude-instant-1.2,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=anthropic_claude-2.1,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=google_text-bison@001,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=google_gemini-pro,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=meta_llama-2-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=microsoft_phi-2,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=openai_gpt-3.5-turbo-0613,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=openai_gpt-4-1106-preview,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=01-ai_yi-6b,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=qwen_qwen1.5-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=anthropic_claude-2.1,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=anthropic_claude-instant-1.2,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=google_gemini-pro,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=google_text-bison@001,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=meta_llama-2-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=microsoft_phi-2,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=openai_gpt-3.5-turbo-0613,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=openai_gpt-4-1106-preview,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=mistralai_mixtral-8x7b-32kseqlen,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=qwen_qwen1.5-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:04 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=google_gemma-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:09 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=google_gemma-7b-it,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/22-Mar-2024 20:09 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=google_gemma-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:09 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=google_gemma-7b-it,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/22-Mar-2024 20:09 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=google_gemma-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:09 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=google_gemma-7b-it,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/22-Mar-2024 20:09 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=google_gemma-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:09 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=google_gemma-7b-it,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/22-Mar-2024 20:09 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=google_gemma-7b,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:09 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=google_gemma-7b-it,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/22-Mar-2024 20:09 -  
[DIR]narrative_qa:model=google_gemini-pro,additional_instructions=narrative_qa/26-Mar-2024 14:49 -  
[DIR]natural_qa:mode=openbook_longans,model=anthropic_claude-instant-1.2,additional_instructions=natural_qa_openbook/26-Mar-2024 14:54 -  
[DIR]natural_qa:mode=openbook_longans,model=anthropic_claude-2.1,additional_instructions=natural_qa_openbook/26-Mar-2024 14:57 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=anthropic_claude-3-sonnet-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/26-Mar-2024 15:08 -  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=anthropic_claude-3-opus-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_abstract_algebra/26-Mar-2024 15:08 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=anthropic_claude-3-opus-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/26-Mar-2024 15:08 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=anthropic_claude-3-sonnet-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_college_chemistry/26-Mar-2024 15:08 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=anthropic_claude-3-opus-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/26-Mar-2024 15:08 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=anthropic_claude-3-sonnet-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_computer_security/26-Mar-2024 15:08 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=anthropic_claude-3-opus-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/26-Mar-2024 15:08 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=anthropic_claude-3-sonnet-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_econometrics/26-Mar-2024 15:08 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=anthropic_claude-3-opus-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/26-Mar-2024 15:08 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=anthropic_claude-3-sonnet-20240229,eval_split=test,additional_instructions=yifan,groups=mmlu_us_foreign_policy/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=anthropic_claude-2.1,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=01-ai_yi-6b,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=google_gemma-7b-it,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=anthropic_claude-instant-1.2,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=google_gemma-7b,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=google_text-bison@001,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=google_text-unicorn@001,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=meta_llama-2-7b,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=microsoft_phi-2,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=openai_gpt-3.5-turbo-0613,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=mistralai_mixtral-8x7b-32kseqlen,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=qwen_qwen1.5-7b,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]narrative_qa:model=openai_gpt-4-1106-preview,additional_instructions=narrative_qa/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=anthropic_claude-instant-1.2,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=01-ai_yi-6b,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=anthropic_claude-2.1,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=google_gemma-7b,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=google_gemma-7b-it,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=google_text-bison@001,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=meta_llama-2-7b,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=google_text-unicorn@001,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=openai_gpt-3.5-turbo-0613,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=openai_gpt-4-1106-preview,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=mistralai_mixtral-8x7b-32kseqlen,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=microsoft_phi-2,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=closedbook,model=qwen_qwen1.5-7b,additional_instructions=natural_qa_closedbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=01-ai_yi-6b,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=google_text-bison@001,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=google_gemma-7b,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=google_gemma-7b-it,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=meta_llama-2-7b,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=google_text-unicorn@001,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=microsoft_phi-2,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=mistralai_mixtral-8x7b-32kseqlen,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=openai_gpt-3.5-turbo-0613,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=qwen_qwen1.5-7b,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]natural_qa:mode=openbook_longans,model=openai_gpt-4-1106-preview,additional_instructions=natural_qa_openbook/26-Mar-2024 15:08 -  
[DIR]groups/26-Mar-2024 15:08 -  
[   ]schema.json26-Mar-2024 15:12 55K 
[   ]summary.json26-Mar-2024 15:12 87  
[   ]runs.json26-Mar-2024 15:12 4.1M 
[   ]run_specs.json26-Mar-2024 15:12 259K 
[   ]runs_to_run_suites.json26-Mar-2024 15:12 18K 
[   ]groups.json26-Mar-2024 15:12 12K 
[   ]groups_metadata.json26-Mar-2024 15:12 4.9K 
[   ]costs.json26-Mar-2024 15:12 2  
[DIR]mmlu:subject=abstract_algebra,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_abstract_algebra/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=astronomy,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_astronomy/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=anatomy,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_anatomy/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=business_ethics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_business_ethics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=clinical_knowledge,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_clinical_knowledge/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=college_biology,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_college_biology/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=college_chemistry,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_college_chemistry/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=college_computer_science,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_college_computer_science/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=college_mathematics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_college_mathematics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=college_physics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_college_physics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=college_medicine,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_college_medicine/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=computer_security,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_computer_security/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=econometrics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_econometrics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=conceptual_physics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_conceptual_physics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=electrical_engineering,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_electrical_engineering/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=formal_logic,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_formal_logic/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=elementary_mathematics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_elementary_mathematics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=global_facts,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_global_facts/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_chemistry,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_chemistry/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_biology,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_biology/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_computer_science,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_computer_science/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_european_history,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_european_history/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_geography,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_geography/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_government_and_politics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_government_and_politics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_macroeconomics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_macroeconomics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_mathematics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_mathematics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_microeconomics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_microeconomics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_physics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_physics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_statistics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_statistics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_psychology,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_psychology/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_us_history,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_us_history/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=high_school_world_history,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_high_school_world_history/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=human_aging,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_human_aging/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=human_sexuality,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_human_sexuality/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=international_law,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_international_law/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=jurisprudence,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_jurisprudence/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=machine_learning,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_machine_learning/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=logical_fallacies,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_logical_fallacies/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=management,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_management/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=medical_genetics,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_medical_genetics/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=marketing,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_marketing/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=anthropic_claude-2.1/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=moral_disputes,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_moral_disputes/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=nutrition,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_nutrition/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=miscellaneous,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_miscellaneous/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=moral_scenarios,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_moral_scenarios/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=philosophy,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_philosophy/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=prehistory,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_prehistory/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=professional_accounting,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_professional_accounting/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=professional_medicine,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_professional_medicine/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=public_relations,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_public_relations/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=professional_psychology,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_professional_psychology/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=security_studies,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_security_studies/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=professional_law,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_professional_law/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=sociology,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_sociology/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=us_foreign_policy,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_us_foreign_policy/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=virology,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_virology/27-Mar-2024 21:38 -  
[DIR]mmlu:subject=world_religions,method=multiple_choice_joint,model=google_text-unicorn@001,eval_split=test,groups=mmlu_world_religions/27-Mar-2024 21:38 -  

Apache/2.2.15 (CentOS) Server at nlp.stanford.edu Port 443