# Git LFS tracking rules. gitattributes is line-oriented: each line is one
# path pattern followed by the attributes applied to matching paths, so every
# rule must sit on its own line.
# Every rule below sets the filter, diff and merge drivers to "lfs" and unsets
# the "text" attribute.

# Archive, model-weight and serialized-data patterns.
*.7z filter=lfs diff=lfs merge=lfs -text
*.arrow filter=lfs diff=lfs merge=lfs -text
*.bin filter=lfs diff=lfs merge=lfs -text
*.bz2 filter=lfs diff=lfs merge=lfs -text
*.ckpt filter=lfs diff=lfs merge=lfs -text
*.ftz filter=lfs diff=lfs merge=lfs -text
*.gz filter=lfs diff=lfs merge=lfs -text
*.h5 filter=lfs diff=lfs merge=lfs -text
*.joblib filter=lfs diff=lfs merge=lfs -text
*.lfs.* filter=lfs diff=lfs merge=lfs -text
*.mlmodel filter=lfs diff=lfs merge=lfs -text
*.model filter=lfs diff=lfs merge=lfs -text
*.msgpack filter=lfs diff=lfs merge=lfs -text
*.npy filter=lfs diff=lfs merge=lfs -text
*.npz filter=lfs diff=lfs merge=lfs -text
*.onnx filter=lfs diff=lfs merge=lfs -text
*.ot filter=lfs diff=lfs merge=lfs -text
*.parquet filter=lfs diff=lfs merge=lfs -text
*.pb filter=lfs diff=lfs merge=lfs -text
*.pickle filter=lfs diff=lfs merge=lfs -text
*.pkl filter=lfs diff=lfs merge=lfs -text
*.pt filter=lfs diff=lfs merge=lfs -text
*.pth filter=lfs diff=lfs merge=lfs -text
*.rar filter=lfs diff=lfs merge=lfs -text
*.safetensors filter=lfs diff=lfs merge=lfs -text
saved_model/**/* filter=lfs diff=lfs merge=lfs -text
*.tar.* filter=lfs diff=lfs merge=lfs -text
*.tar filter=lfs diff=lfs merge=lfs -text
*.tflite filter=lfs diff=lfs merge=lfs -text
*.tgz filter=lfs diff=lfs merge=lfs -text
*.wasm filter=lfs diff=lfs merge=lfs -text
*.xz filter=lfs diff=lfs merge=lfs -text
*.zip filter=lfs diff=lfs merge=lfs -text
*.zst filter=lfs diff=lfs merge=lfs -text
*tfevents* filter=lfs diff=lfs merge=lfs -text

# Individually tracked CSV files under results/.
results/GPT-4-0125-preview.csv filter=lfs diff=lfs merge=lfs -text
results/Llama-2-70b-chat-hf.csv filter=lfs diff=lfs merge=lfs -text
results/Llama-2-70B.csv filter=lfs diff=lfs merge=lfs -text
results/Mistral-7B-Instruct-v0.2.csv filter=lfs diff=lfs merge=lfs -text
results/StripedHyena-Nous-7B.csv filter=lfs diff=lfs merge=lfs -text
results/Claude-3-Opus.csv filter=lfs diff=lfs merge=lfs -text
results/GPT-3.5-Turbo.csv filter=lfs diff=lfs merge=lfs -text
# Individually tracked files under results/ (one rule per line; each rule sets
# the lfs filter/diff/merge drivers and unsets "text").
results/Qwen1.5-72B-Chat.csv filter=lfs diff=lfs merge=lfs -text
results/Claude-3-Haiku.csv filter=lfs diff=lfs merge=lfs -text
results/Mixtral-8x7B-Instruct-0.1.csv filter=lfs diff=lfs merge=lfs -text
results/CodeLlama-70B.csv filter=lfs diff=lfs merge=lfs -text
results/Gemma-7B.csv filter=lfs diff=lfs merge=lfs -text
results/Yi-34B-Chat.csv filter=lfs diff=lfs merge=lfs -text
results/Claude-3-Haiku.jpg filter=lfs diff=lfs merge=lfs -text
results/Gemma-7B.pkl filter=lfs diff=lfs merge=lfs -text
results/Llama-2-70b-chat-hf.pkl filter=lfs diff=lfs merge=lfs -text
results/Mistral-7B-Instruct-v0.2.png filter=lfs diff=lfs merge=lfs -text
results/Mixtral-8x7B-Instruct-0.1.png filter=lfs diff=lfs merge=lfs -text
results/Claude-3-Opus.jpg filter=lfs diff=lfs merge=lfs -text
results/CodeLlama-70B.pkl filter=lfs diff=lfs merge=lfs -text
results/Gemma-7B.jpg filter=lfs diff=lfs merge=lfs -text
results/Mistral-7B-Instruct-v0.2.pkl filter=lfs diff=lfs merge=lfs -text
results/Mixtral-8x7B-Instruct-0.1.jpg filter=lfs diff=lfs merge=lfs -text
results/Claude-3-Haiku.png filter=lfs diff=lfs merge=lfs -text
results/GPT-3.5-Turbo.jpg filter=lfs diff=lfs merge=lfs -text
results/GPT-3.5-Turbo.pkl filter=lfs diff=lfs merge=lfs -text
results/Qwen1.5-72B-Chat.jpg filter=lfs diff=lfs merge=lfs -text
results/StripedHyena-Nous-7B.pkl filter=lfs diff=lfs merge=lfs -text
results/Yi-34B-Chat.png filter=lfs diff=lfs merge=lfs -text
results/CodeLlama-70B.png filter=lfs diff=lfs merge=lfs -text
results/GPT-3.5-Turbo.png filter=lfs diff=lfs merge=lfs -text
results/Llama-2-70b-chat-hf.jpg filter=lfs diff=lfs merge=lfs -text
results/StripedHyena-Nous-7B.png filter=lfs diff=lfs merge=lfs -text
results/Llama-2-70b-chat-hf.png filter=lfs diff=lfs merge=lfs -text
results/Mistral-7B-Instruct-v0.2.jpg filter=lfs diff=lfs merge=lfs -text
results/StripedHyena-Nous-7B.jpg filter=lfs diff=lfs merge=lfs -text
results/Qwen1.5-72B-Chat.png filter=lfs diff=lfs merge=lfs -text
results/Yi-34B-Chat.pkl filter=lfs diff=lfs merge=lfs -text
results/CodeLlama-70B.jpg filter=lfs diff=lfs merge=lfs -text
results/GPT-4-0125-preview.jpg filter=lfs diff=lfs merge=lfs -text
results/Mixtral-8x7B-Instruct-0.1.pkl filter=lfs diff=lfs merge=lfs -text
results/Yi-34B-Chat.jpg filter=lfs diff=lfs merge=lfs -text
results/Claude-3-Haiku.pkl filter=lfs diff=lfs merge=lfs -text
results/Gemma-7B.png filter=lfs diff=lfs merge=lfs -text
results/Qwen1.5-72B-Chat.pkl filter=lfs diff=lfs merge=lfs -text
results/Claude-3-Opus.pkl filter=lfs diff=lfs merge=lfs -text
results/Claude-3-Opus.png filter=lfs diff=lfs merge=lfs -text
results/GPT-4-0125-preview.png filter=lfs diff=lfs merge=lfs -text
results/GPT-4-0125-preview.pkl filter=lfs diff=lfs merge=lfs -text

# Individually tracked files under results-vision/.
results-vision/gpt-4v-vision-preview.png filter=lfs diff=lfs merge=lfs -text
results-vision/gpt-4v-vision-preview.jpg filter=lfs diff=lfs merge=lfs -text
results-vision/gpt-4v-vision-preview.pkl filter=lfs diff=lfs merge=lfs -text
results-vision/claude-3-opus-vision.pkl filter=lfs diff=lfs merge=lfs -text
results-vision/claude-3-opus-vision.jpg filter=lfs diff=lfs merge=lfs -text
results-vision/gemini-pro-vision-CoT.csv filter=lfs diff=lfs merge=lfs -text
results-vision/gemini-pro-vision.png filter=lfs diff=lfs merge=lfs -text
results-vision/gpt-4v-CoT.csv filter=lfs diff=lfs merge=lfs -text
results-vision/gpt-4v-CoT.jpg filter=lfs diff=lfs merge=lfs -text
results-vision/gpt-4v.pkl filter=lfs diff=lfs merge=lfs -text
results-vision/gemini-pro-vision-CoT.png filter=lfs diff=lfs merge=lfs -text
results-vision/gemini-pro-vision.jpg filter=lfs diff=lfs merge=lfs -text
results-vision/gemini-pro-vision-CoT.pkl filter=lfs diff=lfs merge=lfs -text
results-vision/gemini-pro-vision.csv filter=lfs diff=lfs merge=lfs -text
results-vision/gpt-4v-CoT.pkl filter=lfs diff=lfs merge=lfs -text
results-vision/gpt-4v.jpg filter=lfs diff=lfs merge=lfs -text
results-vision/gpt-4v.png filter=lfs diff=lfs merge=lfs -text
results-vision/claude-3-opus-vision.png filter=lfs diff=lfs merge=lfs -text
results-vision/gemini-pro-vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
results-vision/gemini-pro-vision.pkl filter=lfs diff=lfs merge=lfs -text
results-vision/gpt-4v-CoT.png filter=lfs diff=lfs merge=lfs -text

# Individually tracked files under results-cot/, results-vision-CoT/ and
# results/ (original interleaved order kept).
results-cot/gpt-3.5-CoT.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-4v-CoT-Azure.jpg filter=lfs diff=lfs merge=lfs -text
results-vision-CoT/gemini-pro-vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-3.5-CoT.png filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-4v-CoT-Azure.png filter=lfs diff=lfs merge=lfs -text
results-vision-CoT/gemini-pro-vision-CoT.png filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-3.5-CoT.pkl filter=lfs diff=lfs merge=lfs -text
results-vision-CoT/gemini-pro-vision-CoT.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-4v-CoT-Azure.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-4v-CoT-Azure.csv filter=lfs diff=lfs merge=lfs -text
results-vision-CoT/gemini-pro-vision-CoT.csv filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-3.5-CoT.csv filter=lfs diff=lfs merge=lfs -text
results/claude-3-haiku-20240307.csv filter=lfs diff=lfs merge=lfs -text
results/claude-3-opus-20240229.csv filter=lfs diff=lfs merge=lfs -text
results-cot/gemma-7b-it.csv filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-3.5-turbo-0125.csv filter=lfs diff=lfs merge=lfs -text
results/gpt-3.5-turbo-0125.csv filter=lfs diff=lfs merge=lfs -text
results-cot/Mixtral-8x7B-Instruct-v0.1.csv filter=lfs diff=lfs merge=lfs -text
results/gemma-7b-it.csv filter=lfs diff=lfs merge=lfs -text
results-cot/Qwen1.5-72B-Chat.csv filter=lfs diff=lfs merge=lfs -text
results/CodeLlama-70b-Instruct-hf.csv filter=lfs diff=lfs merge=lfs -text
results/Mixtral-8x7B-Instruct-v0.1.csv filter=lfs diff=lfs merge=lfs -text
results-cot/gemma-7b-it.pkl filter=lfs diff=lfs merge=lfs -text
results/claude-3-haiku-20240307.pkl filter=lfs diff=lfs merge=lfs -text
results/gemma-7b-it.pkl filter=lfs diff=lfs merge=lfs -text
# Individually tracked files under results/ and results-cot/ (one rule per
# line; each rule sets the lfs filter/diff/merge drivers and unsets "text").
results-cot/gpt-3.5-turbo-0125.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/Mixtral-8x7B-Instruct-v0.1.pkl filter=lfs diff=lfs merge=lfs -text
results/Mixtral-8x7B-Instruct-v0.1.pkl filter=lfs diff=lfs merge=lfs -text
results/claude-3-opus-20240229.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/Qwen1.5-72B-Chat.pkl filter=lfs diff=lfs merge=lfs -text
results/CodeLlama-70b-Instruct-hf.pkl filter=lfs diff=lfs merge=lfs -text
results/gpt-3.5-turbo-0125.pkl filter=lfs diff=lfs merge=lfs -text
results/claude-3-haiku-20240307.jpg filter=lfs diff=lfs merge=lfs -text
results/claude-3-opus-20240229.jpg filter=lfs diff=lfs merge=lfs -text
results/gpt-3.5-turbo-0125.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-3.5-turbo-0125.jpg filter=lfs diff=lfs merge=lfs -text
results/Mixtral-8x7B-Instruct-v0.1.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/Qwen1.5-72B-Chat.jpg filter=lfs diff=lfs merge=lfs -text
results/gemma-7b-it.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/Mixtral-8x7B-Instruct-v0.1.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/gemma-7b-it.jpg filter=lfs diff=lfs merge=lfs -text
results/CodeLlama-70b-Instruct-hf.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/gemma-7b-it.png filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-3.5-turbo-0125.png filter=lfs diff=lfs merge=lfs -text
results/gpt-3.5-turbo-0125.png filter=lfs diff=lfs merge=lfs -text
results/CodeLlama-70b-Instruct-hf.png filter=lfs diff=lfs merge=lfs -text
results/Mixtral-8x7B-Instruct-v0.1.png filter=lfs diff=lfs merge=lfs -text
results/claude-3-opus-20240229.png filter=lfs diff=lfs merge=lfs -text
results-cot/Mixtral-8x7B-Instruct-v0.1.png filter=lfs diff=lfs merge=lfs -text
results-cot/Qwen1.5-72B-Chat.png filter=lfs diff=lfs merge=lfs -text
results/claude-3-haiku-20240307.png filter=lfs diff=lfs merge=lfs -text
results/gemma-7b-it.png filter=lfs diff=lfs merge=lfs -text
results-cot/dbrx-instruct.jpg filter=lfs diff=lfs merge=lfs -text
# Individually tracked files under results-cot/, results/ and results-vision/
# (one rule per line; each rule sets the lfs filter/diff/merge drivers and
# unsets "text").
results-cot/claude-3-sonnet-20240229.png filter=lfs diff=lfs merge=lfs -text
results-cot/deepseek-llm-67b-chat.csv filter=lfs diff=lfs merge=lfs -text
results-cot/dbrx-instruct.csv filter=lfs diff=lfs merge=lfs -text
results-cot/CodeLlama-70b-Instruct-hf.png filter=lfs diff=lfs merge=lfs -text
results-cot/claude-3-sonnet-20240229.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/deepseek-llm-67b-chat.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/CodeLlama-70b-Instruct-hf.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/dbrx-instruct.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/deepseek-llm-67b-chat.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/deepseek-llm-67b-chat.png filter=lfs diff=lfs merge=lfs -text
results-cot/CodeLlama-70b-Instruct-hf.csv filter=lfs diff=lfs merge=lfs -text
results-cot/claude-3-sonnet-20240229.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/CodeLlama-70b-Instruct-hf.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/dbrx-instruct.png filter=lfs diff=lfs merge=lfs -text
results-cot/claude-3-sonnet-20240229.csv filter=lfs diff=lfs merge=lfs -text
results/gpt-4-turbo-2024-04-09.csv filter=lfs diff=lfs merge=lfs -text
results/gpt-4-turbo-2024-04-09.jpg filter=lfs diff=lfs merge=lfs -text
results/gpt-4-turbo-2024-04-09.pkl filter=lfs diff=lfs merge=lfs -text
results/gpt-4-turbo-2024-04-09.png filter=lfs diff=lfs merge=lfs -text
results-cot/gemini-pro.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-4-turbo-2024-04-09.pkl filter=lfs diff=lfs merge=lfs -text
results-cot/gemini-pro.png filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-4-turbo-2024-04-09.png filter=lfs diff=lfs merge=lfs -text
results-cot/gemini-pro.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-4-turbo-2024-04-09.jpg filter=lfs diff=lfs merge=lfs -text
results-cot/gemini-pro.csv filter=lfs diff=lfs merge=lfs -text
results-cot/gpt-4-turbo-2024-04-09.csv filter=lfs diff=lfs merge=lfs -text
results-vision/claude-3-opus-20240229.jpg filter=lfs diff=lfs merge=lfs -text
results/claude-3-sonnet-20240229.png filter=lfs diff=lfs merge=lfs -text
results/deepseek-llm-67b-chat.csv filter=lfs diff=lfs merge=lfs -text
results/deepseek-llm-67b-chat.png filter=lfs diff=lfs merge=lfs -text
results/deepseek-llm-67b-chat.pkl filter=lfs diff=lfs merge=lfs -text
results-vision/claude-3-opus-20240229.pkl filter=lfs diff=lfs merge=lfs -text
results-vision/claude-3-opus-20240229.png filter=lfs diff=lfs merge=lfs -text
results/claude-3-sonnet-20240229.csv filter=lfs diff=lfs merge=lfs -text
results/claude-3-sonnet-20240229.jpg filter=lfs diff=lfs merge=lfs -text
results/claude-3-sonnet-20240229.pkl filter=lfs diff=lfs merge=lfs -text
results/deepseek-llm-67b-chat.jpg filter=lfs diff=lfs merge=lfs -text
results-vision/claude-3-opus-20240229.csv filter=lfs diff=lfs merge=lfs -text

# Individually tracked files under results_qwen/.
results_qwen/CodeLlama-70b-Instruct-hf.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-opus-20240229.png filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4-0125-preview.png filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4-turbo-2024-04-09.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-haiku-20240307.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/gemma-7b-it.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4-0125-preview.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4-0125-preview.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/CodeLlama-70b-Instruct-hf.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/Mixtral-8x7B-Instruct-v0.1.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/deepseek-llm-67b-chat.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/gemma-7b-it.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/gemma-7b-it.png filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-3.5-turbo-0125.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/Mixtral-8x7B-Instruct-v0.1.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4-0125-preview.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4-turbo-2024-04-09.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4-turbo-2024-04-09.png filter=lfs diff=lfs merge=lfs -text
results_qwen/Mixtral-8x7B-Instruct-v0.1.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/Mixtral-8x7B-Instruct-v0.1.png filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-haiku-20240307.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-haiku-20240307.png filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-opus-20240229.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/deepseek-llm-67b-chat.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/CodeLlama-70b-Instruct-hf.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/deepseek-llm-67b-chat.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-3.5-turbo-0125.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-opus-20240229.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-opus-20240229.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/gemma-7b-it.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-3.5-turbo-0125.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-3.5-turbo-0125.png filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4-turbo-2024-04-09.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/CodeLlama-70b-Instruct-hf.png filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-haiku-20240307.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/deepseek-llm-67b-chat.png filter=lfs diff=lfs merge=lfs -text
results_qwen/dbrx-instruct.png filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-35-turbo.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-35-turbo.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/Qwen1.5-72B-Chat.png filter=lfs diff=lfs merge=lfs -text
results_qwen/dbrx-instruct.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/dbrx-instruct.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/Yi-34B-Chat.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-35-turbo.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/Llama-2-70b-chat-hf.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/Llama-2-70b-chat-hf.png filter=lfs diff=lfs merge=lfs -text
results_qwen/Mistral-7B-Instruct-v0.2.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/Mistral-7B-Instruct-v0.2.png filter=lfs diff=lfs merge=lfs -text
results_qwen/Qwen1.5-72B-Chat.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/Mistral-7B-Instruct-v0.2.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/Mistral-7B-Instruct-v0.2.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/Qwen1.5-72B-Chat.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/Yi-34B-Chat.png filter=lfs diff=lfs merge=lfs -text
results_qwen/Llama-2-70b-chat-hf.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/StripedHyena-Nous-7B.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/StripedHyena-Nous-7B.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/StripedHyena-Nous-7B.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/Yi-34B-Chat.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-35-turbo.png filter=lfs diff=lfs merge=lfs -text
results_qwen/Llama-2-70b-chat-hf.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-sonnet-20240229.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-sonnet-20240229.png filter=lfs diff=lfs merge=lfs -text
results_qwen/dbrx-instruct.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/Qwen1.5-72B-Chat.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/StripedHyena-Nous-7B.png filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-sonnet-20240229.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/Yi-34B-Chat.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/claude-3-sonnet-20240229.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/Llama-3-70b-chat-hf.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/Llama-3-70b-chat-hf.png filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4.pkl filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4.png filter=lfs diff=lfs merge=lfs -text
results_qwen/Llama-3-70b-chat-hf.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4.csv filter=lfs diff=lfs merge=lfs -text
results_qwen/gpt-4.jpg filter=lfs diff=lfs merge=lfs -text
results_qwen/Llama-3-70b-chat-hf.pkl filter=lfs diff=lfs merge=lfs -text

# Top-level pickle files and further results/ entries.
all_results.pkl filter=lfs diff=lfs merge=lfs -text
results/Llama-3-70b-chat-hf.png filter=lfs diff=lfs merge=lfs -text
results/dbrx-instruct.png filter=lfs diff=lfs merge=lfs -text
results/gpt-3.5-0613.png filter=lfs diff=lfs merge=lfs -text
results/gpt-4-1106.png filter=lfs diff=lfs merge=lfs -text
results/Llama-3-70b-chat-hf.jpg filter=lfs diff=lfs merge=lfs -text
results/dbrx-instruct.jpg filter=lfs diff=lfs merge=lfs -text
results/gpt-3.5-0613.jpg filter=lfs diff=lfs merge=lfs -text
results/gpt-4-1106.jpg filter=lfs diff=lfs merge=lfs -text
results/gpt-4-1106.pkl filter=lfs diff=lfs merge=lfs -text
results/Llama-3-70b-chat-hf.pkl filter=lfs diff=lfs merge=lfs -text
results/dbrx-instruct.pkl filter=lfs diff=lfs merge=lfs -text
results/gpt-3.5-0613.pkl filter=lfs diff=lfs merge=lfs -text
final_df.pkl filter=lfs diff=lfs merge=lfs -text

# Individually tracked JPEG files under heatmaps/.
heatmaps/claude-3-haiku-20240307_vision.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Mixtral-8x7B-Instruct-v0.1_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-haiku-20240307_vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-1106_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-vision-preview_vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/dbrx-instruct_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Llama-2-70b-chat-hf_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Llama-3-70b-chat-hf_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Llama-3-70b-chat-hf_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Mistral-7B-Instruct-v0.2_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
# Individually tracked JPEG files under heatmaps/ (one rule per line; each
# rule sets the lfs filter/diff/merge drivers and unsets "text").
heatmaps/claude-3-sonnet-20240229_vision.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/CodeLlama-70b-Instruct-hf_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-haiku-20240307_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemma-7b-it_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-0125-preview_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-haiku-20240307_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Mistral-7B-Instruct-v0.2_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Qwen1.5-72B-Chat_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-turbo-0125_1shot.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-sonnet-20240229_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Mixtral-8x7B-Instruct-v0.1_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemma-7b-it_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-0125-preview_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-turbo-2024-04-09_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-haiku-20240307_1shot.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/deepseek-llm-67b-chat_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro_vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-0613_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-vision-preview_vision.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/CodeLlama-70b-Instruct-hf_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Qwen1.5-72B-Chat_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Yi-34B-Chat_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-sonnet-20240229_vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
# Individually tracked JPEG and PNG files under heatmaps/ (one rule per line;
# each rule sets the lfs filter/diff/merge drivers and unsets "text").
heatmaps/dbrx-instruct_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro_vision.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-0613_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-1106_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-turbo-2024-04-09_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Llama-2-70b-chat-hf_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-turbo-0125_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-turbo-0125_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/Yi-34B-Chat_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_vision.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-sonnet-20240229_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/deepseek-llm-67b-chat_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/CodeLlama-70b-Instruct-hf_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Mixtral-8x7B-Instruct-v0.1_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-haiku-20240307_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Yi-34B-Chat_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-sonnet-20240229_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-sonnet-20240229_vision.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro_vision-CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-35-turbo_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Llama-3-70b-chat-hf_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Mistral-7B-Instruct-v0.2_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-haiku-20240307_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/deepseek-llm-67b-chat_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-turbo-2024-04-09_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Qwen1.5-72B-Chat_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/dbrx-instruct_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-haiku-20240307_vision-CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-vision_vision.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-0613_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-turbo-0125_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-35-turbo_1shot.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4_vision-CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-35-turbo_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-1106_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-vision-preview_vision.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-haiku-20240307_vision.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-turbo-2024-04-09_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Mixtral-8x7B-Instruct-v0.1_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemma-7b-it_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-1106_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/CodeLlama-70b-Instruct-hf_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Mistral-7B-Instruct-v0.2_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-sonnet-20240229_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/dbrx-instruct_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-vision_vision-CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemma-7b-it_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Qwen1.5-72B-Chat_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-0125-preview_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_vision-CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_vision.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-sonnet-20240229_vision-CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro_vision.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-turbo-0125_1shot.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-vision-preview_vision-CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Llama-2-70b-chat-hf_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Llama-2-70b-chat-hf_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Yi-34B-Chat_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-turbo-0125_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/Llama-3-70b-chat-hf_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/deepseek-llm-67b-chat_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-3.5-0613_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-0125-preview_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4_vision.png filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-haiku-20240307_1shot.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4_vision.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-vision_vision.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-vision_vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-35-turbo_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-35-turbo_1shot.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-35-turbo_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4_vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-1.0_vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
# Individually tracked JPEG and PNG files under heatmaps/ (one rule per line;
# each rule sets the lfs filter/diff/merge drivers and unsets "text").
heatmaps/gpt-4-turbo-2024-04-09_vision.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-1.0_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-1.0_CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/snowflake-arctic-instruct_Textonly.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-turbo-2024-04-09_vision-CoT.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-1.0_vision.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-turbo-2024-04-09_vision.png filter=lfs diff=lfs merge=lfs -text
heatmaps/snowflake-arctic-instruct_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-1.0_Textonly.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gpt-4-turbo-2024-04-09_vision-CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-1.0_CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-1.0_vision-CoT.png filter=lfs diff=lfs merge=lfs -text
heatmaps/gemini-pro-1.0_vision.png filter=lfs diff=lfs merge=lfs -text
# NOTE(review): this pattern has no dot, so it matches any file name ending in
# "jpg", not only the ".jpg" extension. Kept verbatim; confirm this is intended.
*jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_1shot.jpg filter=lfs diff=lfs merge=lfs -text
heatmaps/claude-3-opus-20240229_1shot.png filter=lfs diff=lfs merge=lfs -text