meta_taskLabel RdfConnectionExplainStatic-jsonld RdfConnectionExplainStatic-nt RdfConnectionExplainStatic-turtle RdfConnectionExplainStatic-xml RdfFriendCount-jsonld-1 RdfFriendCount-jsonld-2 RdfFriendCount-nt-1 RdfFriendCount-nt-2 RdfFriendCount-turtle-1 RdfFriendCount-turtle-2 RdfFriendCount-xml-1 RdfFriendCount-xml-2 RdfSyntaxFixList-jsonld RdfSyntaxFixList-nt RdfSyntaxFixList-turtle Sparql2AnswerListOrga-jsonld Sparql2AnswerListOrga-turtle SparqlSyntaxFixingListLcQuad Text2AnswerListOrga-jsonld Text2AnswerListOrga-turtle Text2SparqlExecEvalListBeastiary-turtle-schema Text2SparqlExecEvalListBeastiary-turtle-subgraph Text2SparqlExecEvalListBeastiary-turtle-subschema Text2SparqlExecEvalListCoypuMini Text2SparqlExecEvalListOrgaNumerical Text2SparqlExecEvalListOrganizational
meta_taskId RdfConnectionExplainStatic RdfConnectionExplainStatic RdfConnectionExplainStatic RdfConnectionExplainStatic RdfFriendCount RdfFriendCount RdfFriendCount RdfFriendCount RdfFriendCount RdfFriendCount RdfFriendCount RdfFriendCount RdfSyntaxFixList RdfSyntaxFixList RdfSyntaxFixList Sparql2AnswerListOrganizational Sparql2AnswerListOrganizational SparqlSyntaxFixingListLcQuad Text2AnswerListOrganizational Text2AnswerListOrganizational Text2SparqlExecEvalListBeastiary Text2SparqlExecEvalListBeastiary Text2SparqlExecEvalListBeastiary Text2SparqlExecEvalListCoypuMini Text2SparqlExecEvalListOrgaNumerical Text2SparqlExecEvalListOrganizational
scoreName score_listTrimF1 score_listTrimF1 score_listTrimF1 score_listTrimF1 score_f1 score_f1 score_f1 score_f1 score_f1 score_f1 score_f1 score_f1 score_max_combined score_max_combined score_max_combined score_combinedF1 score_combinedF1 score_max_combined score_combinedF1 score_combinedF1 score_max_combined score_max_combined score_max_combined score_max_combined score_max_combined score_max_combined
meta_modelId
Claude 3.5 Haiku 1.000000 0.902778 0.888889 0.995455 0.000000 0.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.978828 0.996669 0.975132 1.000000 1.000000 1.000000 0.937500 0.850000 0.373434 0.946667 0.306768 0.600000 1.000000 1.000000
Claude 3.5 Sonnet 1.000000 0.972222 1.000000 1.000000 1.000000 1.000000 0.100000 0.300000 0.950000 1.000000 0.550000 1.000000 0.989340 0.997335 0.983773 1.000000 1.000000 1.000000 1.000000 1.000000 0.411429 0.946667 0.426667 0.520000 0.960000 1.000000
Claude Opus 4.6 0.958333 1.000000 1.000000 1.000000 0.095238 0.095238 0.219048 0.203571 1.000000 1.000000 0.149405 0.102976 0.989340 0.999334 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.786667 0.946667 0.666667 0.600000 0.960000 0.840000
Claude Sonnet 4.6 0.456086 0.548158 0.456435 0.893056 0.091558 0.091558 0.052082 0.048173 0.091342 0.091126 0.091558 0.092208 0.989340 0.997335 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.709020 0.946667 0.746667 0.600000 0.840000 0.800000
Deepseek-Chat-v3 0.988667 0.855739 0.895523 0.980000 0.292942 0.395908 0.249684 0.309121 0.543704 0.394131 0.514371 0.533565 0.989340 0.992781 0.991192 0.993333 0.922500 1.000000 0.905000 0.713353 0.456000 0.946667 0.408000 0.520000 0.680000 0.980000
Deepseek-Coder-33B 0.529135 0.240873 0.438351 0.447071 0.203714 0.333853 0.110699 0.171715 0.068297 0.083108 0.348605 0.381844 0.975712 0.828732 0.840765 0.223839 0.313351 0.968000 0.228011 0.220510 0.336762 0.914909 0.399051 0.575253 0.570732 0.751938
Deepseek-R1 0.960000 0.996667 1.000000 0.980000 1.000000 1.000000 1.000000 1.000000 0.980000 1.000000 1.000000 1.000000 0.989340 0.997335 0.986800 0.993333 1.000000 1.000000 0.970000 0.985000 0.442902 0.952000 0.349333 0.520000 0.872000 0.984000
GPT3.5 2024/01 0.901216 0.801072 0.848182 0.813240 0.200000 0.550000 0.000000 0.000000 0.000000 0.000000 0.550000 0.900000 0.989340 0.998001 0.997005 0.500000 0.695833 1.000000 0.506250 0.850000 0.386667 0.946667 0.260606 0.520000 0.600000 0.760000
GPT4o 2024/11 0.850000 0.597792 0.866667 0.844697 1.000000 1.000000 0.000000 0.100000 1.000000 1.000000 0.000000 1.000000 0.989340 0.997335 0.971539 0.950000 0.881250 1.000000 0.950000 0.950000 0.306667 0.946667 0.306667 0.520000 1.000000 1.000000
GPT4o-mini 2024/07 0.833333 0.723275 0.828030 0.752727 0.100000 0.000000 0.000000 0.150000 0.200000 0.250000 1.000000 1.000000 0.979005 0.994671 0.976808 0.758333 0.962500 0.920000 0.775000 0.950000 0.328485 0.946667 0.254545 0.520000 0.640000 1.000000
GPT5.2-chat 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.989340 0.997335 0.999202 1.000000 1.000000 1.000000 1.000000 1.000000 0.586667 0.946667 0.626667 0.560000 1.000000 1.000000
GPT5.4 2026/03 1.000000 0.975000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.989340 0.997335 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.586667 0.946667 0.506667 0.520000 0.680000 0.600000
GPTo1-mini 2024/09 0.983333 0.975000 1.000000 0.983333 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.989340 0.996669 0.989988 0.975000 1.000000 1.000000 1.000000 0.975000 0.386667 0.946667 0.346667 0.520000 0.680000 0.920000
GPTo1-pre 2024/09 0.914286 0.827381 0.925000 0.936310 0.502428 0.498335 0.362820 0.487980 0.531517 0.591626 0.612231 0.779662 0.989340 0.994670 0.991959 1.000000 1.000000 1.000000 1.000000 1.000000 0.466667 0.888000 0.346667 0.720000 0.760000 0.880000
Gemini 1.5 Flash 1.000000 0.976389 1.000000 1.000000 0.000000 1.000000 0.950000 0.850000 1.000000 1.000000 0.050000 0.950000 0.973314 1.000000 0.976641 1.000000 1.000000 0.820000 1.000000 1.000000 0.546667 0.960000 0.234041 0.520000 0.920000 1.000000
Gemini 1.5 Pro 1.000000 0.963889 1.000000 1.000000 1.000000 1.000000 0.000000 0.000000 1.000000 1.000000 1.000000 1.000000 0.919152 1.000000 0.978296 1.000000 1.000000 0.810000 1.000000 1.000000 0.466667 0.973333 0.304762 0.560000 1.000000 1.000000
Gemini 2.0 Flash Exp 1.000000 0.641667 1.000000 0.914286 1.000000 1.000000 0.900000 0.850000 1.000000 1.000000 1.000000 1.000000 0.989340 1.000000 0.974734 1.000000 1.000000 1.000000 1.000000 1.000000 0.306667 0.946667 0.280000 0.520000 0.320000 0.840000
Gemini 3 Flash Preview 1.000000 0.858333 1.000000 0.875000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.989340 0.996003 0.998403 1.000000 1.000000 1.000000 1.000000 1.000000 0.466667 1.000000 0.460588 0.680000 0.840000 0.880000
Llama-3.0-70B 0.990000 0.770466 0.996667 0.970000 0.500000 0.980000 0.020000 0.000000 0.000000 0.000000 0.060000 0.660000 0.986675 1.000000 0.936253 1.000000 1.000000 0.980000 1.000000 1.000000 0.351758 0.946667 0.232970 0.537415 0.568000 0.872000
Llama-3.0-8B 0.352975 0.556408 0.700451 0.584890 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.723188 0.427364 0.744359 0.662667 0.615000 0.076000 0.660000 0.770000 0.216974 0.594296 0.157143 0.511111 0.276000 0.398667
Llama-3.1-70B 0.990000 0.834489 0.993333 0.988182 0.060000 0.060000 0.860000 0.780000 0.020000 0.000000 1.000000 0.980000 0.979462 1.000000 0.938462 0.901667 1.000000 1.000000 1.000000 0.960000 0.417212 0.946667 0.260606 0.516000 0.808000 0.744000
Llama-3.1-8B 0.755913 0.593478 0.693924 0.616798 0.240000 0.340000 0.640000 0.740000 0.000000 0.000000 0.440000 0.780000 0.979443 0.899821 0.864353 0.638333 0.535333 0.476000 0.463929 0.518214 0.228545 0.561158 0.155983 0.393333 0.242667 0.224000
Llama-3.2-1B 0.381925 0.141825 0.371436 0.441697 0.040000 0.040000 0.060000 0.000000 0.053951 0.058710 0.060055 0.020000 0.644124 0.410076 0.179947 0.015706 0.020929 0.032000 0.054496 0.051063 0.004000 0.039040 0.025073 0.016327 0.040000 0.012000
Llama-3.2-3B 0.704686 0.762408 0.684669 0.731665 0.020000 0.020000 0.020000 0.040000 0.180000 0.280000 0.280000 0.380000 0.890835 0.884863 0.541952 0.308333 0.308333 0.093878 0.216667 0.205333 0.094514 0.209901 0.068831 0.177778 0.116279 0.345736
Llama-3.3-70B 1.000000 0.950556 1.000000 1.000000 1.000000 1.000000 0.000000 0.000000 0.000000 0.000000 1.000000 1.000000 0.986675 0.994671 0.952578 1.000000 1.000000 1.000000 1.000000 1.000000 0.450667 0.946667 0.392000 0.536000 0.520000 0.680000
Llama-4-Maverick 1.000000 0.910909 1.000000 0.996667 1.000000 1.000000 0.184254 0.202332 0.140532 0.111463 0.600000 0.600000 0.969855 0.993070 0.960157 0.865000 0.910000 1.000000 0.789842 0.728980 0.401361 0.946667 0.237333 0.696000 0.824000 0.792000
OpenCoder-8B 0.214315 0.062167 0.176923 0.201580 0.169333 0.321414 0.085951 0.049901 0.192603 0.198524 0.036000 0.081714 0.914417 0.683208 0.852135 0.266667 0.400417 0.668000 0.306667 0.340417 0.313045 0.709760 0.282162 0.221333 0.440000 0.666667
Phi-3.0-medium-128k 0.320192 0.651949 0.644859 0.766126 0.000000 0.025000 0.023636 0.046667 0.000000 0.000000 0.000000 0.000000 0.904428 0.843001 0.910894 0.520000 0.625000 0.556000 0.472500 0.580833 0.278606 0.710048 0.204149 0.081633 0.167442 0.579259
Phi-3.0-mini-128k 0.635426 0.415904 0.708862 0.665091 0.040000 0.140000 0.000000 0.000000 0.020000 0.000000 0.000000 0.000000 0.898581 0.503027 0.579395 0.505000 0.428333 0.367111 0.642500 0.556667 0.204874 0.364750 0.220478 0.036735 0.188000 0.391667
Phi-3.0-small-128k 0.836859 0.617538 0.644704 0.730746 0.000000 0.000000 0.000000 0.000000 0.007521 0.000000 0.000000 0.000000 0.352723 0.405366 0.536557 0.486667 0.593333 0.136000 0.625561 0.550584 0.276450 0.529881 0.289697 0.227211 0.152000 0.290667
Phi-3.5-MoE 0.580485 0.528509 0.660508 0.835168 0.903077 0.820000 0.466027 0.311823 0.050003 0.015065 0.020000 0.000000 0.986675 0.621987 0.915424 0.685000 0.688333 0.886667 0.751667 0.702500 0.361055 0.866566 0.312851 0.524000 0.348387 0.854545
Phi-3.5-mini 0.026667 0.300523 0.525426 0.767842 0.120000 0.000000 0.020000 0.000000 0.000000 0.000000 1.000000 1.000000 0.935077 0.392306 0.588416 0.456000 0.450000 0.576000 0.405000 0.435000 0.201818 0.608727 0.276975 0.227273 0.244000 0.320000
Qwen-2.0-0.5B 0.148376 0.040164 0.079012 0.119329 0.116970 0.146159 0.040000 0.000000 0.102115 0.054531 0.060000 0.160000 0.035084 0.160801 0.030990 0.049611 0.040000 0.000000 0.041000 0.053857 0.016000 0.036571 0.020408 0.000000 0.004000 0.000000
Qwen-2.0-1.5B 0.133651 0.247508 0.389646 0.439562 0.453333 0.393333 0.000000 0.000000 0.100000 0.060000 0.000000 0.020000 0.301260 0.039467 0.094499 0.151571 0.153798 0.256000 0.191667 0.159167 0.066951 0.199167 0.121336 0.066667 0.100680 0.092000
Qwen-2.0-57B-A14B 0.710443 0.017000 0.726667 0.769293 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.986675 0.918771 0.889388 0.395000 0.630000 0.800000 0.830000 1.000000 0.328242 0.698101 0.192000 0.528000 0.360000 0.808000
Qwen-2.0-72B 0.797778 0.861761 0.745000 0.986768 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.340000 0.980000 0.973704 0.989630 0.949645 1.000000 1.000000 1.000000 1.000000 1.000000 0.390835 0.866065 0.427879 0.493333 0.394595 1.000000
Qwen-2.0-7B 0.631293 0.511936 0.564206 0.590881 0.000000 0.020000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.749007 0.736985 0.729558 0.485000 0.573333 0.928000 0.790000 0.916667 0.324493 0.550427 0.308970 0.320000 0.174667 0.432000
Qwen-2.5-0.5B 0.164765 0.108828 0.242846 0.307080 0.004000 0.000000 0.000000 0.000000 0.000000 0.000000 0.100000 0.420000 0.097380 0.060112 0.146421 0.046667 0.070833 0.088000 0.088333 0.053333 0.012000 0.053061 0.079167 0.036735 0.072000 0.096000
Qwen-2.5-1.5B 0.592019 0.645727 0.600783 0.565280 0.020000 0.020000 0.100000 0.120000 0.000000 0.000000 0.540000 0.620000 0.783916 0.466752 0.502001 0.153333 0.126667 0.423556 0.140000 0.153333 0.216507 0.271591 0.214173 0.210526 0.184615 0.311111
Qwen-2.5-14B 0.886667 0.662140 1.000000 0.762595 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.962168 0.823599 0.979802 1.000000 0.933333 0.820000 0.960000 1.000000 0.332848 0.866065 0.315394 0.520000 0.584000 0.712000
Qwen-2.5-32B 1.000000 0.325778 1.000000 0.982323 0.000000 0.000000 1.000000 1.000000 0.340000 0.380000 0.000000 0.000000 0.986675 0.992606 0.965763 1.000000 0.800000 1.000000 1.000000 0.960000 0.306667 0.946667 0.306667 0.520000 0.568000 0.568000
Qwen-2.5-3B 0.904444 0.891912 0.888889 0.734714 0.000000 0.000000 0.160000 0.160000 0.000000 0.000000 0.040000 0.820000 0.985887 0.864512 0.720666 0.433333 0.453333 0.691111 0.676667 0.786667 0.327181 0.649255 0.240654 0.493878 0.224000 0.548000
Qwen-2.5-72B 1.000000 0.796879 1.000000 0.966429 0.120000 0.260000 1.000000 1.000000 0.000000 0.000000 1.000000 1.000000 0.986675 0.997601 0.975531 1.000000 1.000000 1.000000 0.800000 1.000000 0.333333 0.946667 0.333333 0.520000 0.840000 0.936000
Qwen-2.5-7B 0.886667 0.719173 0.769444 0.891277 0.020000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.000000 0.962169 1.000000 0.957151 0.360000 0.585833 0.952000 0.520000 0.800000 0.288000 0.914667 0.353400 0.520000 0.376000 0.600000
Qwen-2.5-Coder-32B 1.000000 0.579566 1.000000 0.997778 0.020000 0.020000 0.100000 0.120000 0.420000 0.520000 0.000000 0.000000 0.986675 0.995736 0.989615 1.000000 1.000000 1.000000 1.000000 1.000000 0.332848 0.933576 0.401212 0.530667 0.872000 0.984000
Qwen-3-235B 0.978723 0.950758 1.000000 0.930233 1.000000 1.000000 0.980000 1.000000 0.980000 0.980000 1.000000 1.000000 0.988789 0.997335 0.994349 1.000000 1.000000 1.000000 0.983333 1.000000 0.383333 0.968000 0.404471 0.536000 0.836000 0.912000
Qwen-3.5-397B 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 1.000000 0.989340 0.997335 0.995213 1.000000 1.000000 1.000000 1.000000 1.000000 0.613333 1.000000 0.440000 0.840000 0.920000 1.000000