[ { "benchmark": "gaia", "score": 40.0, "metric": "accuracy", "cost_per_instance": 0.1206, "average_runtime": 527.0, "full_archive": "https://results.eval.all-hands.dev/gaia/litellm_proxy-converse-nemotron-super-3-120b/24197982616/results.tar.gz", "tags": [ "gaia" ], "agent_version": "v1.16.1", "submission_time": "2026-04-09T21:31:04+00:00", "eval_visualization_page": "https://laminar.sh/shared/evals/83b65b31-9799-4019-844c-815151e4798e" }, { "benchmark": "swe-bench", "score": 62.0, "metric": "accuracy", "cost_per_instance": 0.4663, "average_runtime": 874.0, "full_archive": "https://results.eval.all-hands.dev/swebench/litellm_proxy-converse-nemotron-super-3-120b/24135041475/results.tar.gz", "tags": [ "swe-bench" ], "agent_version": "v1.16.1", "submission_time": "2026-04-09T07:52:01+00:00", "eval_visualization_page": "https://laminar.sh/shared/evals/054f0361-d26c-4466-82ae-042503b93f2e" }, { "benchmark": "swt-bench", "score": 45.7, "metric": "accuracy", "cost_per_instance": 0.3333, "average_runtime": 1027.0, "full_archive": "https://results.eval.all-hands.dev/swtbench/litellm_proxy-converse-nemotron-super-3-120b/24106920313/results.tar.gz", "tags": [ "swt-bench" ], "agent_version": "v1.16.1", "submission_time": "2026-04-09T05:03:09+00:00", "eval_visualization_page": "https://laminar.sh/shared/evals/01e58390-f947-4dcc-8d34-5e8c61bd3788" }, { "benchmark": "swe-bench-multimodal", "score": 20.6, "metric": "solveable_accuracy", "cost_per_instance": 0.7679, "average_runtime": 1311.0, "full_archive": "https://results.eval.all-hands.dev/swebenchmultimodal/litellm_proxy-converse-nemotron-super-3-120b/24197975725/results.tar.gz", "tags": [ "swe-bench-multimodal" ], "agent_version": "v1.16.1", "submission_time": "2026-04-10T01:36:28+00:00", "component_scores": { "solveable_accuracy": 20.6, "unsolveable_accuracy": 0.0, "combined_accuracy": 13.7 }, "eval_visualization_page": "https://laminar.sh/shared/evals/44cc701e-6ecf-4c70-9cca-4246cbd402f4" }, { "benchmark": "commit0", "score": 12.5, "metric": "accuracy", "cost_per_instance": 1.2153, "average_runtime": 2905.0, "full_archive": "https://results.eval.all-hands.dev/commit0/litellm_proxy-converse-nemotron-super-3-120b/24197990049/results.tar.gz", "tags": [ "commit0" ], "agent_version": "v1.16.1", "submission_time": "2026-04-09T23:08:31+00:00", "eval_visualization_page": "https://laminar.sh/shared/evals/ba725a00-2947-484f-9dad-951071d34c3d" } ]