xhluca commited on
Commit
972a7b5
·
1 Parent(s): 12beee1

add judgments

Browse files
This view is limited to 50 files because it contains too many changes.   See raw diff
Files changed (50) hide show
  1. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.100.json +3 -0
  2. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.126.json +3 -0
  3. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.144.json +3 -0
  4. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.15.json +3 -0
  5. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.153.json +3 -0
  6. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.155.json +3 -0
  7. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.158.json +3 -0
  8. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.164.json +3 -0
  9. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.171.json +3 -0
  10. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.177.json +3 -0
  11. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.185.json +3 -0
  12. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.100.json +3 -0
  13. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.126.json +3 -0
  14. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.144.json +3 -0
  15. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.15.json +3 -0
  16. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.153.json +3 -0
  17. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.155.json +3 -0
  18. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.158.json +3 -0
  19. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.164.json +3 -0
  20. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.171.json +3 -0
  21. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.177.json +3 -0
  22. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.185.json +3 -0
  23. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.100.json +3 -0
  24. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.126.json +3 -0
  25. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.144.json +3 -0
  26. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.15.json +3 -0
  27. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.153.json +3 -0
  28. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.155.json +3 -0
  29. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.158.json +3 -0
  30. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.164.json +3 -0
  31. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.171.json +3 -0
  32. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.177.json +3 -0
  33. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.185.json +3 -0
  34. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.100.json +3 -0
  35. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.126.json +3 -0
  36. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.144.json +3 -0
  37. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.15.json +3 -0
  38. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.153.json +3 -0
  39. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.155.json +3 -0
  40. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.158.json +3 -0
  41. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.164.json +3 -0
  42. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.171.json +3 -0
  43. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.177.json +3 -0
  44. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.185.json +3 -0
  45. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.100.json +3 -0
  46. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.126.json +3 -0
  47. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.144.json +3 -0
  48. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.15.json +3 -0
  49. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.153.json +3 -0
  50. trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.155.json +3 -0
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.100.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:63b2a82161f4b68fcb32f485f89813f780d619c3882535ee6a452185b8e99c68
3
+ size 47415
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.126.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:419232e3a819178471660100cf5c794311043e467fd0aea05365bc57668bf2c1
3
+ size 34388
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.144.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a6802c5690e70af756a7463b8d977a3e4df7f29d251daa58f3c26971b7f22799
3
+ size 52111
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.15.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:66689a2e62f7305a758244ed355a7521f080ae47fa308273bf8d5f5e2f4cf23f
3
+ size 47604
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.153.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cafd053a95899448c6aac9edd061a41e2e910e7d72dceb00bd4d0893285f090e
3
+ size 26670
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.155.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c69cf4da2358038e21de1078f2ae613ea4b591b3db73a9c62114fd1cc565748
3
+ size 27048
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.158.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4cda5a4cbcc2242b81400b83cc28d9964dd76dfab9005aa39f86594481af179f
3
+ size 24302
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.164.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:544ca3636815bebeb7aa874967bf1ccb5dec3d96f7b8115320aa169d336a95f8
3
+ size 16321
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.171.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:25278e4460547e122408af48d9b6389c14e956cc056d3449b988349ae76314e8
3
+ size 48797
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.177.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ffe00146c6d0f61f0df809514c6bb22b51ba9fc837c5cad859b46c60d8d1cddf
3
+ size 20566
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/aer/webarena.185.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:78c4e40bdf4bed219622105a969f999656814871cfde34da1b6f35a3b63022f6
3
+ size 22157
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.100.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6367e1cf9def972f50e4bc7fb52df37d5e9eeec1903b2f2896b091359b46e00a
3
+ size 748694
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.126.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b5ed6211fc4a31655d4b5c05d73ef85355507b61b25ab4ab155ac304490ca48f
3
+ size 1037890
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.144.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:85f927955db0bed35e6aa3543bd0b9bc7e66a8a59e4428f88c1f9fc98e64cb12
3
+ size 296941
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.15.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:757d0555773e91712db6ffa2b8cb9c9108845ad965e07cac8af26aeb5dfbc0ed
3
+ size 216919
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.153.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6e9b5d5ff9e61710ad9a5816c0759b61209e1c1b87138927e2406ec79445d51a
3
+ size 2194032
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.155.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:1a7e20220718a512fda3bab1b79da4ae49aaf9bebe1878dd38f21ed21111089a
3
+ size 3184953
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.158.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:b9bc45767b415cc373df90281a71d5bf572d7fef9cc589d0cba981cb32d9a86b
3
+ size 588903
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.164.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:90276a27bef88ce21d0c964092a3b15468a9bd3d0b83a42b99c4524a9bf2efb4
3
+ size 131137
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.171.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a32416d81341b1cfdfc9b87abcff78e7d9d0fec56775799df5a40e2d70921599
3
+ size 339870
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.177.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4af51dc153b711cee308f4a2cd78d0d808af058999298cd0a254c08c45113e41
3
+ size 438691
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noaxtree/webarena.185.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:65ef5db0461211d3ba0152dbcd98ea42f26ffac45f0ce779fcd219825cec60d8
3
+ size 248905
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.100.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:6c831fc15401ee48f91e5cef1fbd202b0401367b435b4f9f20a6aa2f9a1fdba7
3
+ size 47559
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.126.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0583ed7eb2c938c837777461492c5b013bef8a6039e18fbb7874e99b400485c9
3
+ size 55392
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.144.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3e5320639253c8e59263cc93ebf3f8b87902d3987f82f8aa582b2bd5f2ca597b
3
+ size 67423
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.15.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:da31d1033c6db1acc20ecf29601c5d6cf60660b8d68776aff7ef2aca7cc41001
3
+ size 56459
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.153.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:760bdbb3c2f6ed6b573236d28a1391fb96528957523cfdeecf3dff85b9201c63
3
+ size 36780
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.155.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cfbbf44624da1c64349db6838c737767cfc8d7088849a85cf73466c8421c5c8c
3
+ size 30916
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.158.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:254ddec8dc2fd286a2801fbf1c0cd38fcc5301a111dfa549cc61d01f736e5c6f
3
+ size 41838
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.164.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:69fee036d723e82c079c6039c7f70226ca6dede976df126bacc6bc98e39e0ed9
3
+ size 27201
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.171.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4f4d748e147a88bb3eed8d70543b0a644ab16bfa537dd0f65c3c7fe5f437f4cd
3
+ size 73746
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.177.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:cec7d980641461abc45f9dd7dfe9345d5c527a3738b4ae824c37cb5124600509
3
+ size 40390
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/claude-3.7-sonnet-noscreen/webarena.185.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:a52af140d25f366e498e84fa55682a43cc5185e0728ae8ec6314b98988fa4458
3
+ size 391475
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.100.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0c303a4f8beb1f2a916774b0789ef1ae05f293dc921b4fe7b30ba253e9c70057
3
+ size 3067
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.126.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:085c95dae9600eb2b9910c9a0888cc12e4855f4f5fb92e6a1c580a4d62b51337
3
+ size 3050
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.144.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:73d8ef08c0b47be99c75edcd0e4297f227a7b000f271498be712f8a81ab66f29
3
+ size 3055
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.15.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:251b86dd483ac2cc68f10586c8b426ab79ec994de9d8fdcd37e20803b9a293e7
3
+ size 3069
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.153.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:0534c42febc7808d87cdaa28da89d70c8513cabef8885619612486b56c4c9620
3
+ size 3028
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.155.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:4384601320f5288b7b863eefd748f35fce7949501bd4e98c222f1046f5a4ab3e
3
+ size 3071
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.158.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:ebd98f4cab124dabc5618b379e3a4eda104b8e23fd0d3e964ce7db87c380c22d
3
+ size 3075
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.164.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:2bea721012cc3cf91376d8d401cd665225a68b3ecd33f3c87792a2ec5f4004bb
3
+ size 3047
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.171.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:091650046789f005ab53b35be6a625517a203a4aa07afb4c6e9a6481f5fa0acd
3
+ size 3085
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.177.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:56f655fc31fec6456961ed9d3bf4fe9734771efb94004b070a80e413d5944d91
3
+ size 3070
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/functional/webarena.185.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3245273463770cb8cbb135b19e648d5b7a2f3ddb2842e7c3b184a19bc2eff842
3
+ size 3032
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.100.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:654c771b5ec70dc1b0dc6e879d1d9f49a75e3f52e08e826e99970bf516e8010e
3
+ size 748449
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.126.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:dbf3b5ae2534e1e9cc7f6da174b679905f394bee2771c4823ed5129de49f3bea
3
+ size 1037840
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.144.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:d5b23afb9bed1e9a644f86886b66c8bc1a8af6624f729da1e0dee1cc2aec35d4
3
+ size 296635
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.15.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:3172d4507ad1cc286dd567c155c5a842b28a528ee1ffa5557fccb449cdffcec9
3
+ size 215794
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.153.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:bafc45b30bce312e24dee78070ef407db073751d87c1e854e611fc596d2f15cf
3
+ size 2193796
trajectories/judgments/webarena/GenericAgent-Qwen_Qwen2.5-VL-72B-Instruct/gpt-4o-noaxtree/webarena.155.json ADDED
@@ -0,0 +1,3 @@
 
 
 
 
1
+ version https://git-lfs.github.com/spec/v1
2
+ oid sha256:095400dd4948ada487fb5b9316d0eea2ee66a634106dc33bbd290ac44e92e76a
3
+ size 3184385