,"-, clemscore","adventuregame, % Played","adventuregame, Quality Score","all, Average % Played","all, Average Quality Score","clean_up, % Played","clean_up, Quality Score","codenames, % Played","codenames, Quality Score","dond, % Played","dond, Quality Score","guesswhat, % Played","guesswhat, Quality Score","hot_air_balloon, % Played","hot_air_balloon, Quality Score","imagegame, % Played","imagegame, Quality Score","matchit_ascii, % Played","matchit_ascii, Quality Score","privateshared, % Played","privateshared, Quality Score","referencegame, % Played","referencegame, Quality Score","taboo, % Played","taboo, Quality Score","textmapworld, % Played","textmapworld, Quality Score","textmapworld_graphreasoning, % Played","textmapworld_graphreasoning, Quality Score","textmapworld_specificroom, % Played","textmapworld_specificroom, Quality Score","wordle, % Played","wordle, Quality Score","wordle_withclue, % Played","wordle_withclue, Quality Score","wordle_withcritic, % Played","wordle_withcritic, Quality Score" Aya-Expanse-32B-t0.0,16.9,10.0,16.67,36.14,46.76,0.0,,11.54,46.67,2.5,0.0,0.0,,0.0,,0.0,,100.0,92.5,64.0,58.64,100.0,40.0,61.67,51.35,78.0,56.55,73.33,58.83,100.0,53.33,6.67,0.0,3.33,100.0,3.33,33.33 EuroLLM-22B-Instruct-2512-t0.0,13.9,45.0,9.26,30.11,46.17,11.11,2.09,31.54,21.95,2.5,68.75,0.0,,0.0,,0.0,,100.0,80.0,16.0,86.74,100.0,31.11,98.33,12.43,14.0,44.29,26.67,49.11,60.0,94.44,0.0,,3.33,0.0,3.33,100.0 Llama-3.1-70B-Instruct-t0.0,46.8,67.5,64.2,77.2,60.62,77.78,48.92,87.69,39.47,77.5,34.63,91.67,28.48,33.33,51.41,97.5,85.03,82.5,69.7,100.0,88.12,100.0,60.0,88.33,72.64,92.0,71.1,93.33,62.2,100.0,100.0,90.0,8.89,13.33,87.5,20.0,58.33 Llama-3.1-8B-Instruct-t0.0,25.28,37.5,24.44,56.58,44.68,66.67,38.55,43.85,26.32,82.5,2.42,96.67,6.9,0.0,,55.0,43.86,95.0,76.32,66.0,56.25,100.0,42.22,100.0,33.06,22.0,55.91,30.0,51.65,83.33,100.0,60.0,2.78,10.0,83.33,13.33,70.83 Llama-3.3-70B-Instruct-t0.0,50.0,92.5,48.65,82.4,60.68,81.48,35.47,77.69,31.68,65.0,66.0,93.33,43.45,100.0,47.74,87.5,91.89,75.0,80.0,100.0,90.59,100.0,56.67,98.33,62.15,100.0,69.92,70.0,61.24,86.67,100.0,83.33,12.4,46.67,70.83,43.33,62.82 Ministral-3-14B-Reasoning-2512-nothink-t0.0,26.66,35.0,57.14,54.75,48.69,0.0,,33.08,27.91,97.5,19.2,65.0,25.64,5.56,62.8,95.0,71.95,100.0,85.0,84.0,22.61,100.0,56.67,81.67,42.52,74.0,60.14,0.0,,83.33,100.0,33.33,5.0,26.67,43.75,16.67,50.0 Olmo-3.1-32B-Instruct-t0.0,14.63,45.0,0.0,29.5,49.61,0.0,,5.38,0.0,95.0,25.84,0.0,,0.0,,0.0,,67.5,81.48,40.0,12.62,100.0,52.22,76.67,40.22,2.0,33.33,0.0,,50.0,100.0,0.0,,16.67,100.0,3.33,100.0 Qwen2.5-72B-Instruct-t0.0,48.07,45.0,40.74,79.66,60.34,62.96,65.26,71.54,26.88,100.0,70.37,96.67,60.92,97.22,50.1,57.5,85.65,100.0,87.5,100.0,45.26,100.0,70.0,83.33,70.0,100.0,68.82,96.67,63.14,96.67,100.0,83.33,6.8,30.0,64.81,33.33,49.5 Qwen2.5-Coder-32B-Instruct-t0.0,35.32,30.0,50.0,67.63,52.23,51.85,41.82,56.15,39.73,15.0,27.45,96.67,59.2,75.0,44.48,0.0,,85.0,76.47,100.0,49.53,100.0,73.33,96.67,50.0,100.0,68.86,100.0,63.24,73.33,100.0,76.67,12.17,56.67,35.49,36.67,43.94 Qwen3-Next-80B-A3B-Instruct-t0.0,45.24,50.0,33.33,74.41,60.8,74.07,54.51,36.92,37.5,97.5,12.66,100.0,56.67,0.0,,92.5,99.46,100.0,80.0,74.0,50.71,100.0,72.22,100.0,50.28,100.0,74.06,90.0,67.31,93.33,100.0,56.67,16.47,56.67,84.31,43.33,83.33 Teuken-7B-Instruct-v0.4-t0.0,7.02,7.5,0.0,32.12,21.84,0.0,,0.0,,47.5,3.68,25.0,0.0,0.0,,0.0,,100.0,25.0,22.0,25.96,33.33,33.33,96.67,5.17,94.0,55.2,16.67,48.54,100.0,43.33,0.0,,3.33,0.0,0.0, claude-sonnet-4-5-20250929-t1.0,87.42,97.5,97.44,98.28,88.95,100.0,88.77,100.0,60.77,100.0,95.25,100.0,92.22,100.0,85.47,85.0,100.0,100.0,100.0,100.0,98.7,100.0,100.0,98.33,95.76,100.0,86.29,93.33,88.74,100.0,100.0,100.0,64.33,100.0,79.44,96.67,79.02 claude-sonnet-4-5-azure-high-t1.0,90.1,100.0,97.5,98.87,91.13,100.0,93.63,100.0,73.85,100.0,94.34,100.0,88.33,100.0,95.53,92.5,99.81,100.0,100.0,100.0,97.95,100.0,98.89,98.33,96.61,100.0,87.53,90.0,91.93,100.0,100.0,100.0,64.67,100.0,82.5,100.0,86.11 claude-sonnet-4-5-azure-low-t1.0,86.01,97.5,92.31,97.65,88.08,100.0,92.39,99.23,61.24,100.0,94.36,100.0,91.67,100.0,79.74,72.5,100.0,97.5,100.0,100.0,98.47,100.0,100.0,100.0,98.33,100.0,84.95,96.67,89.31,100.0,100.0,100.0,54.33,100.0,80.11,96.67,80.17 deepseek-v3.2-t1.0,59.61,52.5,57.14,86.14,69.2,92.59,73.91,66.15,33.72,100.0,53.4,83.33,60.67,91.67,94.49,12.5,85.4,100.0,90.0,100.0,42.6,98.89,64.04,90.0,87.96,100.0,74.36,100.0,68.47,96.67,100.0,96.67,47.93,90.0,69.14,93.33,73.21 deepseek-v3.2-without-reasoning-t1.0,52.94,62.5,68.0,77.68,68.15,88.89,79.37,62.31,35.8,100.0,56.2,81.67,47.62,33.33,73.93,15.0,89.83,100.0,85.0,100.0,43.4,98.89,70.79,80.0,82.99,98.0,68.51,90.0,67.98,96.67,100.0,73.33,40.91,73.33,73.56,66.67,74.58 gemini-3-flash-t1.0,84.03,87.5,94.29,95.81,87.7,100.0,97.25,90.77,71.19,100.0,82.68,100.0,92.78,100.0,70.69,87.5,100.0,80.0,100.0,100.0,83.26,100.0,100.0,98.33,97.18,98.0,93.21,93.33,89.02,100.0,100.0,100.0,60.0,100.0,80.11,93.33,79.17 glm-4.6-t1.0,63.91,25.0,80.0,81.44,78.48,100.0,83.29,93.08,47.11,100.0,67.36,96.67,82.18,100.0,90.16,92.5,98.76,37.5,86.67,98.0,88.69,96.67,97.7,98.33,72.32,80.0,85.66,70.0,82.03,100.0,100.0,63.33,55.26,83.33,66.47,50.0,50.55 glm-4.7-t1.0,78.05,80.0,98.96,88.71,87.98,100.0,87.06,68.46,66.29,100.0,87.75,96.67,93.1,97.22,93.49,92.5,100.0,87.5,97.14,100.0,91.15,100.0,100.0,95.0,90.35,94.0,87.79,80.0,87.44,96.67,100.0,83.33,67.2,86.67,77.88,50.0,70.0 glm-5-without-reasoning-t1.0,58.68,77.5,70.97,82.19,71.39,96.3,73.12,44.62,31.03,100.0,72.53,16.67,63.33,97.22,77.17,85.0,99.68,70.0,85.71,100.0,57.03,100.0,76.67,100.0,75.83,100.0,81.0,96.67,74.47,100.0,100.0,76.67,31.3,73.33,75.38,63.33,68.42 gpt-5.2-2025-12-11-t1.0,81.66,95.0,93.86,94.73,86.2,100.0,98.24,99.23,72.09,100.0,76.76,100.0,86.11,36.11,93.22,100.0,99.92,100.0,97.5,100.0,93.87,100.0,97.78,100.0,95.56,100.0,82.34,83.33,82.34,100.0,100.0,100.0,62.33,100.0,68.17,96.67,65.23 gpt-5.2-azure-high-t1.0,84.19,100.0,99.17,91.1,92.42,100.0,100.0,95.38,91.94,100.0,99.12,100.0,93.33,58.33,99.53,100.0,99.82,95.0,100.0,100.0,95.7,100.0,100.0,100.0,98.33,100.0,85.01,0.0,,100.0,100.0,100.0,69.0,100.0,77.5,100.0,70.28 gpt-5.2-azure-medium-t1.0,79.61,100.0,97.5,89.95,88.51,100.0,99.94,96.92,75.4,100.0,87.34,100.0,86.67,38.89,94.89,100.0,99.8,100.0,100.0,100.0,94.27,100.0,98.89,100.0,95.83,100.0,84.79,0.0,,100.0,100.0,100.0,53.0,100.0,76.39,93.33,71.43 gpt-5.2-azure-minimal-t1.0,74.27,87.5,90.48,92.33,80.44,96.3,88.96,93.08,52.89,100.0,69.23,98.33,75.14,77.78,67.03,100.0,99.88,100.0,100.0,100.0,91.62,100.0,97.78,100.0,94.17,100.0,78.54,53.33,84.23,100.0,100.0,86.67,46.54,93.33,65.48,83.33,65.47 gpt-oss-120b-t1.0,35.96,27.5,81.82,48.82,73.65,18.52,62.07,3.08,50.0,95.0,47.42,83.33,88.67,63.89,92.57,5.0,100.0,0.0,,8.0,48.97,8.89,100.0,93.33,83.33,70.0,72.51,73.33,79.12,10.0,100.0,73.33,56.82,96.67,64.65,100.0,50.39 gpt-oss-20b-t1.0,41.57,10.0,16.67,67.38,61.7,81.48,43.76,94.62,45.53,90.0,29.29,38.33,66.67,80.56,91.63,67.5,89.63,10.0,50.0,56.0,53.11,100.0,98.89,81.67,68.71,82.0,67.85,63.33,67.5,63.33,100.0,90.0,48.89,76.67,53.91,60.0,56.94 kimi-k2-thinking-t1.0,77.79,77.5,98.92,91.15,85.34,100.0,98.04,78.46,55.88,95.0,66.16,96.67,89.66,94.44,94.52,72.5,99.62,62.5,96.0,94.0,94.48,98.89,98.88,95.0,85.67,98.0,81.44,96.67,87.18,100.0,100.0,100.0,73.0,96.67,72.53,93.33,58.75 kimi-k2.5-without-reasoning-t1.0,60.28,72.5,93.1,76.3,79.0,77.78,79.19,57.69,38.67,100.0,78.59,85.0,72.55,100.0,70.29,5.0,100.0,92.5,86.49,100.0,92.69,40.0,97.22,96.67,78.45,100.0,77.42,96.67,75.68,70.0,100.0,80.0,51.25,73.33,74.77,50.0,76.67 minimax-m2.5-t1.0,55.68,50.0,95.0,75.75,73.51,92.59,80.16,86.92,44.25,92.5,59.72,90.0,62.96,100.0,72.8,62.5,94.36,97.5,79.49,0.0,,86.67,100.0,85.0,86.6,94.0,74.28,86.67,77.59,93.33,100.0,66.67,22.5,73.33,81.06,30.0,45.37 mistral-3-large-2512-t1.0,44.79,77.5,62.37,69.64,64.32,29.63,55.57,30.0,51.28,100.0,38.3,66.67,69.17,36.11,58.47,5.0,100.0,100.0,92.5,100.0,34.38,100.0,84.44,98.33,77.97,94.0,76.29,73.33,71.3,96.67,100.0,86.67,16.54,63.33,47.72,26.67,57.08 qwen3-max-t1.0,59.66,80.0,62.5,82.71,72.13,88.89,81.04,74.62,34.02,97.5,54.16,95.0,69.59,33.33,73.69,17.5,100.0,97.5,87.18,100.0,55.94,100.0,86.67,98.33,77.97,100.0,80.18,100.0,82.32,96.67,100.0,86.67,28.46,73.33,71.59,66.67,80.83