|
Model,Ordinal (Win rate),Cardinal (Score),RO Stability,Rank Distance,CFI,SRMR,RMSEA,Cronbach alpha |
|
phi-3-mini-128k-instruct,0.258309591642925,0.18707102480796897,0.16880341880341881,0.7264957264957265,0.32478632478632474,0.5555555555555556,0.6239316239316239,0.23076923076923084 |
|
phi-3-medium-128k-instruct,0.28490028490028496,0.18789267301588508,0.26282051282051283,0.7521367521367521,0.2820512820512821,0.7692307692307692,0.7606837606837606,0.5128205128205128 |
|
Mistral-7B-Instruct-v0.1,0.3418803418803419,0.23063750442486428,0.12393162393162394,0.4786324786324786,0.49572649572649574,0.3076923076923077,0.2222222222222222,0.09401709401709403 |
|
Mistral-7B-Instruct-v0.2,0.3342830009496676,0.1747138068267554,0.41666666666666674,0.4358974358974358,0.1282051282051282,0.829059829059829,0.8205128205128205,0.2991452991452992 |
|
Mistral-7B-Instruct-v0.3,0.3133903133903134,0.20131219867252867,0.23504273504273498,0.4273504273504273,0.28205128205128205,0.6324786324786325,0.5897435897435896,0.24786324786324787 |
|
Mixtral-8x7B-Instruct-v0.1,0.43114909781576455,0.2437400779497571,0.5811965811965812,0.641025641025641,0.2136752136752137,0.7863247863247863,0.7521367521367521,0.5213675213675214 |
|
Mixtral-8x22B-Instruct-v0.1,0.29629629629629634,0.18791617935864172,0.37820512820512825,0.6837606837606838,0.1794871794871795,0.9230769230769231,0.9145299145299145,0.49572649572649574 |
|
command_r_plus,0.560303893637227,0.3737946817620246,0.6880341880341879,0.6923076923076923,0.45299145299145294,0.5128205128205128,0.5811965811965811,0.6239316239316239 |
|
llama_3_8b_instruct,0.4691358024691358,0.28828624999947805,0.5747863247863247,0.5470085470085471,0.3162393162393162,0.7008547008547008,0.6923076923076923,0.5470085470085471 |
|
llama_3_70b_instruct,0.7701804368471036,0.5976823900754995,0.9380341880341881,0.7264957264957265,0.8376068376068376,0.4273504273504274,0.49572649572649574,0.9914529914529915 |
|
Qwen2-7B-Instruct,0.5251661918328584,0.3400513233761655,0.5769230769230768,0.5811965811965811,0.4188034188034188,0.45299145299145294,0.4871794871794872,0.5213675213675214 |
|
Qwen2-72B-Instruct,0.5906932573599241,0.42123592516768155,0.9658119658119655,0.5811965811965811,0.07692307692307693,0.9658119658119658,0.9914529914529915,0.9145299145299146 |
|
gpt-3.5-turbo-0125,0.23741690408357075,0.14920836189480854,0.24145299145299137,0.7777777777777778,0.1965811965811966,0.717948717948718,0.7094017094017093,0.1794871794871795 |
|
gpt-4o-0513,0.7340930674264008,0.5383734693976642,0.8482905982905984,0.6666666666666667,0.811965811965812,0.41025641025641024,0.3418803418803419,0.8205128205128205 |
|
|