File size: 4,987 Bytes
1047c44 f505d13 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 |
Model,Ordinal (Win rate),Cardinal (Score),RO Stability,Stress,CFI,SRMR,RMSEA
GLM-4-32B-0414,0.45519713261648753,0.5924102038593776,0.5231398045089577,0.1885053649385876,0.5887694444444445,0.37460555555555564,0.37893611111111114
Qwen3-235B-A22B-FP8,0.6115591397849462,0.7184051653356879,0.679310553271359,0.18145366817771102,0.7192055555555557,0.24603055555555564,0.2617222222222222
Qwen3-32B-A3B,0.6666666666666666,0.748951174933817,0.695394000772024,0.17751938139533974,0.7652638888888889,0.18118611111111127,0.19652499999999995
Qwen3-32B,0.6796594982078853,0.7364185588714854,0.7356392645359847,0.17307803161650182,0.6883833333333335,0.27474999999999994,0.29176388888888893
Qwen3-8B,0.6115591397849462,0.7184453974322014,0.7185440961120562,0.19916042721283456,0.6796805555555555,0.29908055555555557,0.30805277777777773
Qwen3-4B,0.5613799283154122,0.6970544522219364,0.659760116763837,0.2009520715020784,0.6930888888888889,0.27008333333333345,0.28465833333333335
reka-flash-3,0.3853046594982079,0.4899723723251134,0.2885614355228928,0.21908343015733012,0.6356444444444445,0.32448055555555566,0.3265472222222222
Llama-4-Scout-17B-16E-Instruct,0.5094086021505376,0.6180917882104732,0.4967998772578945,0.1945790922366818,0.6979444444444444,0.2716777777777778,0.2741527777777778
Llama-3.3-70B-Instruct,0.8127240143369175,0.7826258982618856,0.8101440811870466,0.15086913865310292,0.7070694444444444,0.2484805555555556,0.2872888888888889
Llama-3.1-70B-Instruct,0.739247311827957,0.7716257197180342,0.7627363693137972,0.1590258306220288,0.7405305555555556,0.2069805555555555,0.2524638888888888
Llama-3.1-Nemotron-70B-Instruct,0.8234767025089607,0.806561245024004,0.7986269216633632,0.15639272646142155,0.7771694444444445,0.1574805555555555,0.2053138888888889
Llama-3.1-8B-Instruct,0.5022401433691756,0.6200396929619997,0.5544135256446929,0.177589336660551,0.6203138888888889,0.3474166666666667,0.3526444444444444
Llama-3.2-3B-Instruct,0.3781362007168459,0.4920203960749596,0.3095420768898777,0.23477458340427637,0.6402583333333334,0.3671361111111112,0.34035277777777784
Llama-3.2-1B-Instruct,0.17338709677419353,0.28494630130657267,0.017845599375419068,0.29245365371576204,0.4570666666666667,0.49829999999999997,0.458125
Mistral-Large-Instruct-2411,0.6563620071684587,0.7334649247049873,0.7061158170869489,0.17181887070789792,0.7237666666666667,0.24669166666666675,0.262
Mistral-Large-Instruct-2407,0.7576164874551972,0.7865403071348558,0.7786865940656633,0.18242669696158476,0.7757583333333334,0.19862499999999994,0.21713055555555572
Mistral-Nemo-Instruct-2407,0.3736559139784947,0.5243749748919985,0.409719354830282,0.21289984240736382,0.565475,0.40046944444444443,0.39598333333333324
Mistral-Small-3.1-24B-Instruct-2503,0.6048387096774194,0.7026337346865648,0.6848141294613206,0.17721164035276304,0.6713749999999999,0.29685555555555565,0.3154944444444444
Mistral-7B-Instruct-v0.2,0.12096774193548386,0.23355028783364112,0.026105642941629623,0.29118693576405585,0.3286527777777778,0.6504444444444444,0.6230416666666667
Mixtral-8x7B-Instruct-v0.1,0.28763440860215056,0.41570329172979925,0.2810231146470137,0.24656890252743824,0.4673222222222222,0.5223027777777778,0.4969166666666667
QwQ-32B,0.7665770609318997,0.7719313363889678,0.8091295835194909,0.1769481985217758,0.6934333333333333,0.27074999999999994,0.30680277777777776
Qwen2.5-VL-72B-Instruct,0.8987455197132618,0.8360251140700989,0.8125460511443046,0.15932218090531514,0.8454611111111111,0.10019722222222227,0.14792499999999997
Qwen2.5-VL-7B-Instruct,0.2594086021505376,0.42422904460473104,0.28582477835186304,0.25948620101404807,0.45279444444444444,0.4787000000000001,0.464075
Qwen2.5-VL-3B-Instruct,0.132168458781362,0.2655381207197522,0.059657867275330144,0.2877042811210807,0.3650055555555556,0.6013444444444445,0.5902833333333335
Qwen2.5-14B-Instruct-1M,0.5882616487455197,0.7022023055217502,0.6551137143166985,0.1785253019816836,0.7130944444444444,0.26870277777777785,0.26870277777777773
phi-4,0.2181899641577061,0.3158767913757621,0.09850602595828868,0.25104588393816885,0.4269,0.5274305555555556,0.5154333333333333
phi-3-medium-128k-instruct,0.1160394265232975,0.22454028939367154,-0.009343401612861558,0.2918818561769593,0.3458111111111111,0.6230527777777779,0.5971805555555556
Dracarys2-72B-Instruct,0.7912186379928315,0.7740958932029343,0.789501612210195,0.15836985877285903,0.7307833333333333,0.2581972222222222,0.27945555555555546
Nautilus-70B-v0.1,0.6424731182795698,0.724110072700376,0.7188870305946458,0.1688175407755762,0.6729305555555555,0.2789694444444444,0.30781111111111104
Cydonia-22B-v1.2,0.418010752688172,0.5660454327134821,0.4926092723062008,0.20778751640583537,0.5617833333333333,0.40446111111111116,0.39160833333333345
Ministrations-8B-v1,0.3387096774193548,0.4918972616356232,0.34889128317469287,0.2302731507248964,0.5484527777777779,0.4000972222222221,0.3784694444444444
dummy,0.11379928315412184,0.2291015386716794,-0.009004148398032956,0.2928877637010999,0.3755222222222222,0.622275,0.5915305555555557
|