Index of /helm/finance/benchmark_output/runs/v1.0.0
Name
Last modified
Size
Description
Parent Directory
-
banking77:model=google_gemini-1.5-flash-001/
30-Sep-2024 21:00
-
banking77:model=anthropic_claude-3-sonnet-20240229/
30-Sep-2024 21:00
-
banking77:model=anthropic_claude-3-opus-20240229/
30-Sep-2024 21:00
-
banking77:model=google_gemini-1.0-pro-002/
30-Sep-2024 21:00
-
banking77:model=anthropic_claude-3-5-sonnet-20240620/
30-Sep-2024 21:00
-
banking77:model=meta_llama-3-70b-chat/
30-Sep-2024 21:00
-
banking77:model=meta_llama-3.1-8b-instruct-turbo/
30-Sep-2024 21:01
-
banking77:model=meta_llama-3.1-405b-instruct-turbo/
30-Sep-2024 21:01
-
banking77:model=meta_llama-3-8b-chat/
30-Sep-2024 21:01
-
banking77:model=meta_llama-3.1-70b-instruct-turbo/
30-Sep-2024 21:01
-
banking77:model=meta_llama-3.2-11b-vision-instruct-turbo/
30-Sep-2024 21:01
-
banking77:model=meta_llama-3.2-3b-instruct-turbo/
30-Sep-2024 21:01
-
banking77:model=mistralai_mistral-7b-instruct-v0.3/
30-Sep-2024 21:01
-
banking77:model=meta_llama-3.2-90b-vision-instruct-turbo/
30-Sep-2024 21:01
-
banking77:model=mistralai_mixtral-8x22b-instruct-v0.1/
30-Sep-2024 21:01
-
banking77:model=mistralai_mixtral-8x7b-instruct-v0.1/
30-Sep-2024 21:01
-
banking77:model=openai_gpt-3.5-turbo-0125/
30-Sep-2024 21:01
-
banking77:model=qwen_qwen1.5-72b-chat/
30-Sep-2024 21:01
-
banking77:model=openai_gpt-4o-mini-2024-07-18/
30-Sep-2024 21:01
-
banking77:model=openai_gpt-4o-2024-05-13/
30-Sep-2024 21:01
-
banking77:model=qwen_qwen2-72b-instruct/
30-Sep-2024 21:01
-
fin_qa:model=anthropic_claude-3-5-sonnet-20240620/
30-Sep-2024 21:01
-
fin_qa:model=google_gemini-1.0-pro-002/
30-Sep-2024 21:01
-
fin_qa:model=google_gemini-1.5-flash-001/
30-Sep-2024 21:01
-
fin_qa:model=meta_llama-3-70b-chat/
30-Sep-2024 21:01
-
fin_qa:model=anthropic_claude-3-opus-20240229/
30-Sep-2024 21:01
-
fin_qa:model=meta_llama-3-8b-chat/
30-Sep-2024 21:01
-
fin_qa:model=anthropic_claude-3-sonnet-20240229/
30-Sep-2024 21:01
-
fin_qa:model=meta_llama-3.2-11b-vision-instruct-turbo/
30-Sep-2024 21:01
-
fin_qa:model=meta_llama-3.2-90b-vision-instruct-turbo/
30-Sep-2024 21:01
-
fin_qa:model=meta_llama-3.2-3b-instruct-turbo/
30-Sep-2024 21:01
-
fin_qa:model=meta_llama-3.1-70b-instruct-turbo/
30-Sep-2024 21:01
-
fin_qa:model=meta_llama-3.1-405b-instruct-turbo/
30-Sep-2024 21:01
-
fin_qa:model=meta_llama-3.1-8b-instruct-turbo/
30-Sep-2024 21:01
-
fin_qa:model=mistralai_mixtral-8x22b-instruct-v0.1/
30-Sep-2024 21:01
-
fin_qa:model=mistralai_mistral-7b-instruct-v0.3/
30-Sep-2024 21:01
-
financebench:model=anthropic_claude-3-5-sonnet-20240620/
30-Sep-2024 21:01
-
fin_qa:model=mistralai_mixtral-8x7b-instruct-v0.1/
30-Sep-2024 21:01
-
fin_qa:model=openai_gpt-4o-mini-2024-07-18/
30-Sep-2024 21:01
-
financebench:model=anthropic_claude-3-opus-20240229/
30-Sep-2024 21:01
-
fin_qa:model=qwen_qwen1.5-72b-chat/
30-Sep-2024 21:01
-
fin_qa:model=openai_gpt-4o-2024-05-13/
30-Sep-2024 21:01
-
financebench:model=anthropic_claude-3-sonnet-20240229/
30-Sep-2024 21:01
-
fin_qa:model=qwen_qwen2-72b-instruct/
30-Sep-2024 21:01
-
financebench:model=google_gemini-1.0-pro-002/
30-Sep-2024 21:01
-
financebench:model=google_gemini-1.5-flash-001/
30-Sep-2024 21:01
-
financebench:model=meta_llama-3-70b-chat/
30-Sep-2024 21:01
-
fin_qa:model=openai_gpt-3.5-turbo-0125/
30-Sep-2024 21:01
-
financebench:model=meta_llama-3-8b-chat/
30-Sep-2024 21:02
-
financebench:model=meta_llama-3.1-70b-instruct-turbo/
30-Sep-2024 21:02
-
financebench:model=meta_llama-3.1-405b-instruct-turbo/
30-Sep-2024 21:02
-
financebench:model=meta_llama-3.2-11b-vision-instruct-turbo/
30-Sep-2024 21:02
-
financebench:model=meta_llama-3.1-8b-instruct-turbo/
30-Sep-2024 21:02
-
financebench:model=meta_llama-3.2-3b-instruct-turbo/
30-Sep-2024 21:02
-
financebench:model=meta_llama-3.2-90b-vision-instruct-turbo/
30-Sep-2024 21:02
-
financebench:model=mistralai_mistral-7b-instruct-v0.3/
30-Sep-2024 21:02
-
financebench:model=mistralai_mixtral-8x22b-instruct-v0.1/
30-Sep-2024 21:02
-
financebench:model=mistralai_mixtral-8x7b-instruct-v0.1/
30-Sep-2024 21:02
-
financebench:model=openai_gpt-3.5-turbo-0125/
30-Sep-2024 21:02
-
financebench:model=openai_gpt-4o-2024-05-13/
30-Sep-2024 21:02
-
financebench:model=openai_gpt-4o-mini-2024-07-18/
30-Sep-2024 21:02
-
financebench:model=qwen_qwen1.5-72b-chat/
30-Sep-2024 21:02
-
financebench:model=qwen_qwen2-72b-instruct/
30-Sep-2024 21:02
-
banking77:model=google_gemini-1.5-pro-002/
01-Oct-2024 09:07
-
financebench:model=google_gemini-1.5-pro-002/
01-Oct-2024 09:07
-
fin_qa:model=google_gemini-1.5-pro-002/
01-Oct-2024 09:07
-
fin_qa:model=writer_palmyra-fin-32k/
29-Oct-2024 10:16
-
financebench:model=writer_palmyra-fin-32k/
29-Oct-2024 10:27
-
banking77:model=writer_palmyra-fin-32k/
29-Oct-2024 10:32
-
banking77:model=writer_palmyra-fin-32k,stop=none/
31-Oct-2024 13:38
-
financebench:model=writer_palmyra-fin-32k,stop=none/
31-Oct-2024 13:38
-
fin_qa:model=writer_palmyra-fin-32k,stop=none/
31-Oct-2024 13:38
-
eval_cache/
25-Mar-2025 14:13
-
financebench:model=writer_palmyra-fin/
26-Mar-2025 17:44
-
banking77:model=writer_palmyra-fin/
26-Mar-2025 17:44
-
fin_qa:model=writer_palmyra-fin/
26-Mar-2025 17:44
-
banking77:model=writer_palmyra-x-004/
26-Mar-2025 18:00
-
fin_qa:model=writer_palmyra-x-004/
26-Mar-2025 18:00
-
financebench:model=writer_palmyra-x-004/
26-Mar-2025 18:00
-
banking77:model=anthropic_claude-3-5-haiku-20241022/
27-Mar-2025 08:47
-
banking77:model=anthropic_claude-3-7-sonnet-20250219/
27-Mar-2025 08:47
-
banking77:model=qwen_qwen2.5-7b-instruct-turbo/
27-Mar-2025 08:47
-
banking77:model=qwen_qwen2.5-72b-instruct-turbo/
27-Mar-2025 08:47
-
banking77:model=google_gemini-2.0-flash-lite-preview-02-05/
27-Mar-2025 08:47
-
banking77:model=google_gemini-2.0-flash-001/
27-Mar-2025 08:47
-
banking77:model=deepseek-ai_deepseek-v3/
27-Mar-2025 08:47
-
fin_qa:model=anthropic_claude-3-5-haiku-20241022/
27-Mar-2025 08:47
-
financebench:model=anthropic_claude-3-5-haiku-20241022/
27-Mar-2025 08:47
-
financebench:model=anthropic_claude-3-7-sonnet-20250219/
27-Mar-2025 08:47
-
fin_qa:model=anthropic_claude-3-7-sonnet-20250219/
27-Mar-2025 08:48
-
fin_qa:model=google_gemini-2.0-flash-lite-preview-02-05/
27-Mar-2025 08:48
-
financebench:model=deepseek-ai_deepseek-v3/
27-Mar-2025 08:48
-
fin_qa:model=deepseek-ai_deepseek-v3/
27-Mar-2025 08:48
-
financebench:model=google_gemini-2.0-flash-001/
27-Mar-2025 08:48
-
fin_qa:model=qwen_qwen2.5-7b-instruct-turbo/
27-Mar-2025 08:48
-
fin_qa:model=qwen_qwen2.5-72b-instruct-turbo/
27-Mar-2025 08:48
-
fin_qa:model=google_gemini-2.0-flash-001/
27-Mar-2025 08:48
-
financebench:model=qwen_qwen2.5-72b-instruct-turbo/
27-Mar-2025 08:48
-
financebench:model=google_gemini-2.0-flash-lite-preview-02-05/
27-Mar-2025 08:48
-
financebench:model=qwen_qwen2.5-7b-instruct-turbo/
27-Mar-2025 08:48
-
Apache/2.2.15 (CentOS) Server at nlp.stanford.edu Port 443