diff --git a/final_df.pkl b/final_df.pkl index 34113edef440a8f8e9240d72a4b64626e36268ec..cf869955a0c6e0bc459e0f3a5fa2b0a1836ff7d5 100644 --- a/final_df.pkl +++ b/final_df.pkl @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:7b9acd5d65e88a0cc6655be4987086354db2719122a843652e75ba9b5d7b7d7d -size 797916821 +oid sha256:af070cfe995dc7525d87a670f0cb915085ba643ddc23b68e535ffbf9f5d5b4cf +size 812473008 diff --git a/heatmaps/CodeLlama-70b-Instruct-hf_CoT.png b/heatmaps/CodeLlama-70b-Instruct-hf_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..a962fe732de7b69eff1a3dc11e9e7c054576ad71 --- /dev/null +++ b/heatmaps/CodeLlama-70b-Instruct-hf_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4b703d3999364930556cf371142a5bba2110b71783cb88fa8909ae85d714671 +size 1015783 diff --git a/heatmaps/CodeLlama-70b-Instruct-hf_Textonly.png b/heatmaps/CodeLlama-70b-Instruct-hf_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..5af44bb22cbbe91217d8568f74060df76a6c8c6a --- /dev/null +++ b/heatmaps/CodeLlama-70b-Instruct-hf_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c6ae2fb07adadc075d0aed53c8844721b6adbaf8fd0a7778846c7462907d8a9 +size 1015150 diff --git a/heatmaps/Llama-2-70b-chat-hf_CoT.png b/heatmaps/Llama-2-70b-chat-hf_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..ccfc6455c23e5dcf8b7e0840b0b256069006c3fb --- /dev/null +++ b/heatmaps/Llama-2-70b-chat-hf_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f17dd315ca49a7edbb33f1644a9a9e4c7e65d07d1d2e04071c13794e9b2c78c0 +size 1012562 diff --git a/heatmaps/Llama-2-70b-chat-hf_Textonly.png b/heatmaps/Llama-2-70b-chat-hf_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..8cc0ddea302abfb9078c136adcd2aee28aa5465c --- /dev/null +++ b/heatmaps/Llama-2-70b-chat-hf_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8377077937b29b87238695c35315c51f31c588b210b39fdd582dfad45dbeec1c +size 1012953 diff --git a/heatmaps/Llama-3-70b-chat-hf_CoT.png b/heatmaps/Llama-3-70b-chat-hf_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..2f1412c709685965c7fe25069898f09ed8cb174a --- /dev/null +++ b/heatmaps/Llama-3-70b-chat-hf_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac8d589c5c452688ef8b64a8c97853537cf4c022835536900216a66dbd69f437 +size 1007765 diff --git a/heatmaps/Llama-3-70b-chat-hf_Textonly.png b/heatmaps/Llama-3-70b-chat-hf_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..c76ff9594dcfcb8e8996bf05e891db463e39cac4 --- /dev/null +++ b/heatmaps/Llama-3-70b-chat-hf_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18e2f11ebe5236c6b08725e6b900ab625136c644719d44179c5ab3411e1565ab +size 1007403 diff --git a/heatmaps/Mistral-7B-Instruct-v0.2_CoT.png b/heatmaps/Mistral-7B-Instruct-v0.2_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..a1a8c4db984c6de861d59892b7b1491281ef351c --- /dev/null +++ b/heatmaps/Mistral-7B-Instruct-v0.2_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c4d747f70b2678115568f1f5d0b9508da6ad176c624505d3ea627fb0e15d3a3 +size 1013109 diff --git a/heatmaps/Mistral-7B-Instruct-v0.2_Textonly.png b/heatmaps/Mistral-7B-Instruct-v0.2_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..501ef08432f492d9538277018eef74510203059c --- /dev/null +++ b/heatmaps/Mistral-7B-Instruct-v0.2_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6139f6cbefafdc34b27b58bfd8ce67285166e08363a9d00fcc6a92bffb7943fa +size 1013418 diff --git a/heatmaps/Mixtral-8x7B-Instruct-v0.1_CoT.png b/heatmaps/Mixtral-8x7B-Instruct-v0.1_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..44e172c701b8ddbe9513e789a4fe891638ae2bb9 --- /dev/null +++ b/heatmaps/Mixtral-8x7B-Instruct-v0.1_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53390f5c4a574f3900d4f574545b67acdeae2850085be202e52b0e44ab8a641d +size 1015219 diff --git a/heatmaps/Mixtral-8x7B-Instruct-v0.1_Textonly.png b/heatmaps/Mixtral-8x7B-Instruct-v0.1_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..fe4426bef2706b1f469d923a96e341521ceec8a4 --- /dev/null +++ b/heatmaps/Mixtral-8x7B-Instruct-v0.1_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd489ef12cf2536223105023772f86b43f0d1a2082821a8ee8f650a2f3b11e2c +size 1015193 diff --git a/heatmaps/Qwen1.5-72B-Chat_CoT.png b/heatmaps/Qwen1.5-72B-Chat_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..2914a9def2126560fb2b1a31c0804e40b0a8476e --- /dev/null +++ b/heatmaps/Qwen1.5-72B-Chat_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba485c5af43d1ada5c5aec35135d4412732ccf1b61042307b43bc9fc7de3bb63 +size 1013566 diff --git a/heatmaps/Qwen1.5-72B-Chat_Textonly.png b/heatmaps/Qwen1.5-72B-Chat_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..3754b1a3b3e5c41a4834cffe97c2cba087fd64ad --- /dev/null +++ b/heatmaps/Qwen1.5-72B-Chat_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da6a75456ce2f11d7adda03ab3741d0a4965f23562baf96e0455bd3e6c837fbf +size 1014160 diff --git a/heatmaps/Yi-34B-Chat_CoT.png b/heatmaps/Yi-34B-Chat_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..49b4cee474cc182e59521a877865b301c8f31038 --- /dev/null +++ b/heatmaps/Yi-34B-Chat_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0203cef5e3bd69355f8c6b77c769378dacb3ff6fe518ce162d15ee98b74980f +size 1012364 diff --git a/heatmaps/Yi-34B-Chat_Textonly.png b/heatmaps/Yi-34B-Chat_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..c216dba704094b4ad0b7520888ac9aec8f8a519e --- /dev/null +++ b/heatmaps/Yi-34B-Chat_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1cfa52dc642befaf19311d03498bb53e4d7e633b9c8f15e5819b83502fa74ba +size 1013714 diff --git a/heatmaps/claude-3-haiku-20240307_1shot.png b/heatmaps/claude-3-haiku-20240307_1shot.png new file mode 100644 index 0000000000000000000000000000000000000000..94b419ccc9b4d32bec427031674a266c20bf90da --- /dev/null +++ b/heatmaps/claude-3-haiku-20240307_1shot.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac10f7119f60f0b7fbcc3596fb5e0fc531918e3aaad13efd16b378f5531b6a99 +size 1009478 diff --git a/heatmaps/claude-3-haiku-20240307_CoT.png b/heatmaps/claude-3-haiku-20240307_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..821e55db38e8b0fb15362565c34c8d766627e466 --- /dev/null +++ b/heatmaps/claude-3-haiku-20240307_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58718d439e2b2f3ca2cdf6077fe52c02697171bee292c57d5c0e69c172b558d8 +size 1011446 diff --git a/heatmaps/claude-3-haiku-20240307_Textonly.png b/heatmaps/claude-3-haiku-20240307_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..2983bbe07cbbcfa89c75254abb76d45a00ff9299 --- /dev/null +++ b/heatmaps/claude-3-haiku-20240307_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce63eae77b0bee6126753b0b4dd92e875606c85a2e9053be79a48ea5f3710a9 +size 1013013 diff --git a/heatmaps/claude-3-haiku-20240307_vision-CoT.png b/heatmaps/claude-3-haiku-20240307_vision-CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..38c8df008efa48054be105da7d1853160152c61f --- /dev/null +++ b/heatmaps/claude-3-haiku-20240307_vision-CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:881eb2164cab4b6c725df5876dbb6ac308b27df0aab9cb168e8146af05f7dfe7 +size 1013350 diff --git a/heatmaps/claude-3-haiku-20240307_vision.png b/heatmaps/claude-3-haiku-20240307_vision.png new file mode 100644 index 0000000000000000000000000000000000000000..9761079f47c7a83570eed48195afeefbce734d27 --- /dev/null +++ b/heatmaps/claude-3-haiku-20240307_vision.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7999d05af83274310ab0c5a2bc8c35f55cfbe11741214d92c1540e836b902a8 +size 1013765 diff --git a/heatmaps/claude-3-opus-20240229_CoT.png b/heatmaps/claude-3-opus-20240229_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..0afcd732e774ce823a309264536e8499ffd57136 --- /dev/null +++ b/heatmaps/claude-3-opus-20240229_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b1aa99bd7f3314c5edcd40ad9c8372f249967818bce03c7fb2d35709ce749e +size 1007696 diff --git a/heatmaps/claude-3-opus-20240229_Textonly.png b/heatmaps/claude-3-opus-20240229_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..f80bfbf1d523f2af33230d9fa1edda34be02e731 --- /dev/null +++ b/heatmaps/claude-3-opus-20240229_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afacabca17ef01693140c10014c9bac2be4429511c93bd690f13c135f88565d1 +size 1007456 diff --git a/heatmaps/claude-3-opus-20240229_vision-CoT.png b/heatmaps/claude-3-opus-20240229_vision-CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..bf8704bd5b939037ff9d67a9ee4faadc3f67f550 --- /dev/null +++ b/heatmaps/claude-3-opus-20240229_vision-CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:189329927bf4a5238920c94af0a8981afdd8bcd5ccdc17328a5bb766b391fd5e +size 1013679 diff --git a/heatmaps/claude-3-opus-20240229_vision.png b/heatmaps/claude-3-opus-20240229_vision.png new file mode 100644 index 0000000000000000000000000000000000000000..edda919bf37263d61bdf9f32fed84b2540e08581 --- /dev/null +++ b/heatmaps/claude-3-opus-20240229_vision.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ba0697318c6fe5883b116386c867b45a4e38ad770e3f4250caa57bfa95ceb09 +size 1011910 diff --git a/heatmaps/claude-3-sonnet-20240229_CoT.jpg b/heatmaps/claude-3-sonnet-20240229_CoT.jpg index cfcec38cbfb44c696a3adca6f13275f949c3e454..11b199b920d3f006cc3075d4dedde5bf643ce0b4 100644 --- a/heatmaps/claude-3-sonnet-20240229_CoT.jpg +++ b/heatmaps/claude-3-sonnet-20240229_CoT.jpg @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:97f3fcc436adf32351392db6fe0b36969554ecfef9f5a6be87d6cb73b59d3840 -size 1333230 +oid sha256:ea55e964a1547d4462364c8f41ecbaf870af6cb151589bc45af03bbcc171afad +size 1280445 diff --git a/heatmaps/claude-3-sonnet-20240229_CoT.png b/heatmaps/claude-3-sonnet-20240229_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..77f5c2ac3409a8a9cb3245fbe1daa8519935650f --- /dev/null +++ b/heatmaps/claude-3-sonnet-20240229_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8bb80b9223b84284c4b7b00b43fc352bc083e472cc153252a46f67885ce74c9e +size 1006278 diff --git a/heatmaps/claude-3-sonnet-20240229_Textonly.png b/heatmaps/claude-3-sonnet-20240229_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..6df05ac9a960d4b4bd76877d42ad8ef58f696575 --- /dev/null +++ b/heatmaps/claude-3-sonnet-20240229_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bd38f277f8ab03ff4394b563a72634ddaf7a39044561e25a1b1d9c734695f2d +size 1007373 diff --git a/heatmaps/claude-3-sonnet-20240229_vision-CoT.png b/heatmaps/claude-3-sonnet-20240229_vision-CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..f18fdcd073311bb5056ef03781c6ac214b31575a --- /dev/null +++ b/heatmaps/claude-3-sonnet-20240229_vision-CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a93035f2d36505bb6c6126b541704bb42cc6c3a4aff47b76e79f4221ba9b3c7 +size 1013406 diff --git a/heatmaps/claude-3-sonnet-20240229_vision.jpg b/heatmaps/claude-3-sonnet-20240229_vision.jpg index 11b199b920d3f006cc3075d4dedde5bf643ce0b4..cfcec38cbfb44c696a3adca6f13275f949c3e454 100644 --- a/heatmaps/claude-3-sonnet-20240229_vision.jpg +++ b/heatmaps/claude-3-sonnet-20240229_vision.jpg @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:ea55e964a1547d4462364c8f41ecbaf870af6cb151589bc45af03bbcc171afad -size 1280445 +oid sha256:97f3fcc436adf32351392db6fe0b36969554ecfef9f5a6be87d6cb73b59d3840 +size 1333230 diff --git a/heatmaps/claude-3-sonnet-20240229_vision.png b/heatmaps/claude-3-sonnet-20240229_vision.png new file mode 100644 index 0000000000000000000000000000000000000000..1681f634d223d7565bd290167911f71de0a3ca41 --- /dev/null +++ b/heatmaps/claude-3-sonnet-20240229_vision.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85b53bb356b419260d72c5a1ab4c5c095c759fc3bed9f6023ad9703577211d16 +size 1012448 diff --git a/heatmaps/dbrx-instruct_CoT.png b/heatmaps/dbrx-instruct_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..6d77594f2a985b9a8030975ca0b4c25d9eda4903 --- /dev/null +++ b/heatmaps/dbrx-instruct_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ece339a94f8ffc03a5ddb611e0ef9ebd43716f55bcdfbc1ee72dee3db092c9b +size 1014810 diff --git a/heatmaps/dbrx-instruct_Textonly.png b/heatmaps/dbrx-instruct_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..876a010f5166e7277f2b4b2c95cb025a9daa224d --- /dev/null +++ b/heatmaps/dbrx-instruct_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1b49a0957e72d26093d87055ed1d3547ec5b15cdbea16fc152bce108dd0a089 +size 1016609 diff --git a/heatmaps/deepseek-llm-67b-chat_CoT.png b/heatmaps/deepseek-llm-67b-chat_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..1422a9ac005ec036cd225bed9990ef6882134c64 --- /dev/null +++ b/heatmaps/deepseek-llm-67b-chat_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0019a7d6d2ee430c5f7385da3d7670ca4093714d8adc5efda5e85f1d82abd1e +size 1014990 diff --git a/heatmaps/deepseek-llm-67b-chat_Textonly.png b/heatmaps/deepseek-llm-67b-chat_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..24995410e4ed55031cfe6e149c2d304adf2525a5 --- /dev/null +++ b/heatmaps/deepseek-llm-67b-chat_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13d0ed905e772cd6bac1313c4b2be38b8c94b6805c1619038f2ded2fb1d8c6eb +size 1013928 diff --git a/heatmaps/gemini-pro-vision_vision-CoT.jpg b/heatmaps/gemini-pro-vision_vision-CoT.jpg new file mode 100644 index 0000000000000000000000000000000000000000..397db7b8c1e30301d62da537c35e25b123a0ea78 --- /dev/null +++ b/heatmaps/gemini-pro-vision_vision-CoT.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:116b2a07fb740560e59471347f4c6da6fbb251ef0a6cda7f4c3cd9cf8ef2beac +size 1325582 diff --git a/heatmaps/gemini-pro-vision_vision-CoT.png b/heatmaps/gemini-pro-vision_vision-CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..d2676153e27f606f25e15d000427eeb562bf554c --- /dev/null +++ b/heatmaps/gemini-pro-vision_vision-CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:760d125e5041c0ab84740df1cc1aaa201e4e7b6cdc1957e20be2cdb5642fe969 +size 1013221 diff --git a/heatmaps/gemini-pro-vision_vision.jpg b/heatmaps/gemini-pro-vision_vision.jpg new file mode 100644 index 0000000000000000000000000000000000000000..4a6576b8f66f2de2a334d22f8b76369896afca6f --- /dev/null +++ b/heatmaps/gemini-pro-vision_vision.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36cc139756d58b144d03cffdd23df7a07a71f1a3b77d8544b35d24afbece3a10 +size 1328654 diff --git a/heatmaps/gemini-pro-vision_vision.png b/heatmaps/gemini-pro-vision_vision.png new file mode 100644 index 0000000000000000000000000000000000000000..9f8dc36de96ae337422e66b34047f9b47ad7b315 --- /dev/null +++ b/heatmaps/gemini-pro-vision_vision.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad0d9194c4035d8ce57f7ee9ea4807dc4169349576f1eecc56def274a16cc69a +size 1014396 diff --git a/heatmaps/gemini-pro_CoT.png b/heatmaps/gemini-pro_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..330a67b7bceae11d052f9deb7b4388bc3f8935f0 --- /dev/null +++ b/heatmaps/gemini-pro_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4277a0cd9c8d3289a79c89ff36ffd983e103f781a66879c2dbe136eb08823133 +size 1015461 diff --git a/heatmaps/gemini-pro_vision-CoT.png b/heatmaps/gemini-pro_vision-CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..d2676153e27f606f25e15d000427eeb562bf554c --- /dev/null +++ b/heatmaps/gemini-pro_vision-CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:760d125e5041c0ab84740df1cc1aaa201e4e7b6cdc1957e20be2cdb5642fe969 +size 1013221 diff --git a/heatmaps/gemini-pro_vision.png b/heatmaps/gemini-pro_vision.png new file mode 100644 index 0000000000000000000000000000000000000000..9f8dc36de96ae337422e66b34047f9b47ad7b315 --- /dev/null +++ b/heatmaps/gemini-pro_vision.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad0d9194c4035d8ce57f7ee9ea4807dc4169349576f1eecc56def274a16cc69a +size 1014396 diff --git a/heatmaps/gemma-7b-it_CoT.png b/heatmaps/gemma-7b-it_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..82b851f582926610cfa8bc7597cf3871dd7c86ca --- /dev/null +++ b/heatmaps/gemma-7b-it_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f6d3816f1f9de91e83f3d5d918f59e8498c1ff3b4bf6c67da776c08cafe72c +size 1009568 diff --git a/heatmaps/gemma-7b-it_Textonly.png b/heatmaps/gemma-7b-it_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..8ca94d52c3e0c66e2bcd5d5afe3224af13355e3e --- /dev/null +++ b/heatmaps/gemma-7b-it_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b201026783da62603536971932d37effbdf59151545c82def24af8ab23718678 +size 1011023 diff --git a/heatmaps/gpt-3.5-0613_CoT.png b/heatmaps/gpt-3.5-0613_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..ef71eadaf278a0f00890d1704bea70d5ae00c132 --- /dev/null +++ b/heatmaps/gpt-3.5-0613_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7384d2c201299c3eb1a7fdf82a4430f62a5f5730dbf63aa9bd5f5d878ef0b3 +size 1016934 diff --git a/heatmaps/gpt-3.5-0613_Textonly.png b/heatmaps/gpt-3.5-0613_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..9d2dc6480bd05cb85ee049318e17721a75e1eecb --- /dev/null +++ b/heatmaps/gpt-3.5-0613_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fb1964c888537286beeec01612bd66b620b1c0c94f31b6ad84e54c52475b97a +size 1012686 diff --git a/heatmaps/gpt-3.5-turbo-0125_1shot.png b/heatmaps/gpt-3.5-turbo-0125_1shot.png new file mode 100644 index 0000000000000000000000000000000000000000..6055e4a933f70869e6e4b4357046bc115fbeea81 --- /dev/null +++ b/heatmaps/gpt-3.5-turbo-0125_1shot.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee8bb855f9aeb66f2c695c11cb7b3da4ecae44c4c5f3ac5ef70bc47edf78644b +size 1014525 diff --git a/heatmaps/gpt-3.5-turbo-0125_CoT.png b/heatmaps/gpt-3.5-turbo-0125_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..cf3ae5112a560d604e97e49730212c5f0cfe9182 --- /dev/null +++ b/heatmaps/gpt-3.5-turbo-0125_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c282cd460ba6186cc8eaf7835a34d494a7d7071f9b189033ba2688014d9a55a2 +size 1016223 diff --git a/heatmaps/gpt-3.5-turbo-0125_Textonly.png b/heatmaps/gpt-3.5-turbo-0125_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..0597425aa23f42f36de664029f27005b2b800f39 --- /dev/null +++ b/heatmaps/gpt-3.5-turbo-0125_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acee80e0cbdb9cd65e8b9dd6798e095006df1899ab5de48ec4b7f1698cce5392 +size 1014322 diff --git a/heatmaps/gpt-35-turbo_1shot.jpg b/heatmaps/gpt-35-turbo_1shot.jpg new file mode 100644 index 0000000000000000000000000000000000000000..21eb4858c370c73097a5a05b0c1cf8096c49265f --- /dev/null +++ b/heatmaps/gpt-35-turbo_1shot.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45770b4c8e836e17cccb2ad73ed7894802f070fbfb760c166881a9ada6eccaa5 +size 1316586 diff --git a/heatmaps/gpt-35-turbo_1shot.png b/heatmaps/gpt-35-turbo_1shot.png new file mode 100644 index 0000000000000000000000000000000000000000..6055e4a933f70869e6e4b4357046bc115fbeea81 --- /dev/null +++ b/heatmaps/gpt-35-turbo_1shot.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee8bb855f9aeb66f2c695c11cb7b3da4ecae44c4c5f3ac5ef70bc47edf78644b +size 1014525 diff --git a/heatmaps/gpt-35-turbo_CoT.jpg b/heatmaps/gpt-35-turbo_CoT.jpg new file mode 100644 index 0000000000000000000000000000000000000000..50af6c75507cee4005726e5eacac7809c279aafc --- /dev/null +++ b/heatmaps/gpt-35-turbo_CoT.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e36f991250d11adf955df905756e4abb8313fb2f46a06bb6e4fb1c1f117dd332 +size 1318275 diff --git a/heatmaps/gpt-35-turbo_CoT.png b/heatmaps/gpt-35-turbo_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..ef71eadaf278a0f00890d1704bea70d5ae00c132 --- /dev/null +++ b/heatmaps/gpt-35-turbo_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f7384d2c201299c3eb1a7fdf82a4430f62a5f5730dbf63aa9bd5f5d878ef0b3 +size 1016934 diff --git a/heatmaps/gpt-35-turbo_Textonly.jpg b/heatmaps/gpt-35-turbo_Textonly.jpg new file mode 100644 index 0000000000000000000000000000000000000000..d1c1611e809ca2f99310544e973e10738703dba4 --- /dev/null +++ b/heatmaps/gpt-35-turbo_Textonly.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57cc450248c9ce976f6eb76d148c75ff1087499a585c2dd12fd8c3c27e1f1ce2 +size 1321315 diff --git a/heatmaps/gpt-35-turbo_Textonly.png b/heatmaps/gpt-35-turbo_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..9d2dc6480bd05cb85ee049318e17721a75e1eecb --- /dev/null +++ b/heatmaps/gpt-35-turbo_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fb1964c888537286beeec01612bd66b620b1c0c94f31b6ad84e54c52475b97a +size 1012686 diff --git a/heatmaps/gpt-4-0125-preview_CoT.png b/heatmaps/gpt-4-0125-preview_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..1c69f370cd8b227f275747c2b7cd8fb92dbf2ec1 --- /dev/null +++ b/heatmaps/gpt-4-0125-preview_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e1d8e98b040e2246ad1f83c4e657eb7351230cd31fd9b8ac49381a05b2471d +size 1007898 diff --git a/heatmaps/gpt-4-0125-preview_Textonly.png b/heatmaps/gpt-4-0125-preview_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..8af7c2b6283037ce542d484fa2ea319b2c984ce7 --- /dev/null +++ b/heatmaps/gpt-4-0125-preview_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a9cadfc44d92146e623b120f6d10d078e335330c5844b68de1d728dafe903e8 +size 1007831 diff --git a/heatmaps/gpt-4-1106_CoT.png b/heatmaps/gpt-4-1106_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..09cd0c4b09dce3ff755702a89acb79a3efa0832e --- /dev/null +++ b/heatmaps/gpt-4-1106_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8573a510b1e2fa081ab4d964d70e09ce4b87c7f27b79ff1d3e9c7b635582bcbb +size 1007767 diff --git a/heatmaps/gpt-4-1106_Textonly.png b/heatmaps/gpt-4-1106_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..bcb863549a6160a72dfe7f8fa5b9c73532e642ef --- /dev/null +++ b/heatmaps/gpt-4-1106_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b45f475bb2c3bf1281681a92293ca7f2d069d92ee7ce8149655d899c33654352 +size 1007762 diff --git a/heatmaps/gpt-4-turbo-2024-04-09_CoT.png b/heatmaps/gpt-4-turbo-2024-04-09_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..e17891c3dd69f0b93f12389fdb10554ca9d426f3 --- /dev/null +++ b/heatmaps/gpt-4-turbo-2024-04-09_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4770cb89f7167fc71bb2f13779c229820a523b22e485499882848b5fc8b96689 +size 1007864 diff --git a/heatmaps/gpt-4-turbo-2024-04-09_Textonly.png b/heatmaps/gpt-4-turbo-2024-04-09_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..7ffe3c400f708cab5a7f9ea54451a6e363577424 --- /dev/null +++ b/heatmaps/gpt-4-turbo-2024-04-09_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c212b5d2f5c413940ba464adacef8fcec7d83f1abdacc9548b520879ef4bdf1b +size 1007985 diff --git a/heatmaps/gpt-4-vision-preview_vision-CoT.png b/heatmaps/gpt-4-vision-preview_vision-CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..6155d0f0360fe6ca2e0666100c0e28c2b27e673d --- /dev/null +++ b/heatmaps/gpt-4-vision-preview_vision-CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c64e6429e0a8e0b51f0373196a72e6de2abf8025f833a1eba7808642d6fcfba8 +size 1013704 diff --git a/heatmaps/gpt-4-vision-preview_vision.png b/heatmaps/gpt-4-vision-preview_vision.png new file mode 100644 index 0000000000000000000000000000000000000000..5693c6504f84a1060e77d3eecd34e484636849af --- /dev/null +++ b/heatmaps/gpt-4-vision-preview_vision.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6daaf76f1ceaa9ebe4b8af533325fa48e2e809f251938d9849dfd4d4fa4c98e6 +size 1012341 diff --git a/heatmaps/gpt-4_CoT.jpg b/heatmaps/gpt-4_CoT.jpg new file mode 100644 index 0000000000000000000000000000000000000000..13f44feae78a4bc159822acf85cbb162460fd813 --- /dev/null +++ b/heatmaps/gpt-4_CoT.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa4af344d9bdf4aac858531ac565bc09235774629e0f4a6485f13b01bbb98835 +size 1232100 diff --git a/heatmaps/gpt-4_CoT.png b/heatmaps/gpt-4_CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..1c69f370cd8b227f275747c2b7cd8fb92dbf2ec1 --- /dev/null +++ b/heatmaps/gpt-4_CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1e1d8e98b040e2246ad1f83c4e657eb7351230cd31fd9b8ac49381a05b2471d +size 1007898 diff --git a/heatmaps/gpt-4_Textonly.jpg b/heatmaps/gpt-4_Textonly.jpg new file mode 100644 index 0000000000000000000000000000000000000000..db435d6eb04a68cd455435e1e59ca4a538b5b34c --- /dev/null +++ b/heatmaps/gpt-4_Textonly.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddf8c95dc35b8277b7a2b5e9a08e366f0152af08ee78c398f12bc083a29adb94 +size 1235790 diff --git a/heatmaps/gpt-4_Textonly.png b/heatmaps/gpt-4_Textonly.png new file mode 100644 index 0000000000000000000000000000000000000000..bcb863549a6160a72dfe7f8fa5b9c73532e642ef --- /dev/null +++ b/heatmaps/gpt-4_Textonly.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b45f475bb2c3bf1281681a92293ca7f2d069d92ee7ce8149655d899c33654352 +size 1007762 diff --git a/heatmaps/gpt-4_vision-CoT.jpg b/heatmaps/gpt-4_vision-CoT.jpg new file mode 100644 index 0000000000000000000000000000000000000000..d61b96c4f4c2411ec1cc976b647477bd24fa4859 --- /dev/null +++ b/heatmaps/gpt-4_vision-CoT.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910c2d4820c49249d143e390f500aa149f68ba00a56c3fcb0c61b2485e93d3ab +size 1319084 diff --git a/heatmaps/gpt-4_vision-CoT.png b/heatmaps/gpt-4_vision-CoT.png new file mode 100644 index 0000000000000000000000000000000000000000..6155d0f0360fe6ca2e0666100c0e28c2b27e673d --- /dev/null +++ b/heatmaps/gpt-4_vision-CoT.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c64e6429e0a8e0b51f0373196a72e6de2abf8025f833a1eba7808642d6fcfba8 +size 1013704 diff --git a/heatmaps/gpt-4_vision.jpg b/heatmaps/gpt-4_vision.jpg new file mode 100644 index 0000000000000000000000000000000000000000..7f22eee19e8c3c0088dae371baea2ce5b9964659 --- /dev/null +++ b/heatmaps/gpt-4_vision.jpg @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1cd741abe572de14c59286eaa8ae830bc20ca142035a4adfc39fc9641354379 +size 1321753 diff --git a/heatmaps/gpt-4_vision.png b/heatmaps/gpt-4_vision.png new file mode 100644 index 0000000000000000000000000000000000000000..5693c6504f84a1060e77d3eecd34e484636849af --- /dev/null +++ b/heatmaps/gpt-4_vision.png @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6daaf76f1ceaa9ebe4b8af533325fa48e2e809f251938d9849dfd4d4fa4c98e6 +size 1012341