[ { "benchmark": "commit0", "score": 12.5, "metric": "accuracy", "cost_per_instance": 1.64, "average_runtime": 1686.0, "full_archive": "https://results.eval.all-hands.dev/commit0/litellm_proxy-openrouter-z-ai-glm-4-7/25033135919/results.tar.gz", "tags": [ "commit0" ], "agent_version": "v1.17.0", "submission_time": "2026-04-28T08:45:59+00:00", "eval_visualization_page": "https://laminar.sh/shared/evals/84ad9e18-dc52-4085-bc7f-54205df4fae4" }, { "benchmark": "swe-bench-multimodal", "score": 22.1, "metric": "solveable_accuracy", "cost_per_instance": 0.66, "average_runtime": 1519.0, "full_archive": "https://results.eval.all-hands.dev/swebenchmultimodal/litellm_proxy-openrouter-z-ai-glm-4-7/21674056150/results.tar.gz", "tags": [ "swe-bench-multimodal" ], "component_scores": { "solveable_accuracy": 22.1, "unsolveable_accuracy": 0.0, "combined_accuracy": 14.7, "solveable_resolved": 15, "solveable_total": 68, "unsolveable_resolved": 0, "unsolveable_total": 34 }, "agent_version": "v1.10.0", "submission_time": "2026-02-05T03:47:02+00:00" }, { "benchmark": "swe-bench", "score": 73.4, "metric": "accuracy", "cost_per_instance": 0.5596, "average_runtime": 1007.0, "full_archive": "https://results.eval.all-hands.dev/swebench/litellm_proxy-openrouter-z-ai-glm-4-7/21547894190/results.tar.gz", "tags": [ "swe-bench" ], "agent_version": "v1.10.0", "submission_time": "2026-02-01T09:50:58+00:00" }, { "benchmark": "swt-bench", "score": 49.4, "metric": "accuracy", "cost_per_instance": 0.37, "average_runtime": 744.0, "full_archive": "https://results.eval.all-hands.dev/swtbench/litellm_proxy-openrouter-z-ai-glm-4-7/21548136286/results.tar.gz", "tags": [ "swt-bench" ], "agent_version": "v1.10.0", "submission_time": "2026-02-01T04:32:01+00:00" }, { "benchmark": "gaia", "score": 53.9, "metric": "accuracy", "cost_per_instance": 0.15, "average_runtime": 1138.0, "full_archive": "https://results.eval.all-hands.dev/gaia/litellm_proxy-openrouter-z-ai-glm-4-7/21520797407/results.tar.gz", "tags": [ "gaia" ], "agent_version": "v1.10.1", "submission_time": "2026-01-31T02:30:18+00:00" } ]