{"benchmark_id":"gre_physics_cot","size":75,"models":51,"total_pairs":1222,"close_pairs":1160,"no_solve":0,"tau-":4,"SE(A)":{"count":49.0,"mean":0.0517851107,"std":0.005838125,"min":0.0365316383,"25%":0.0475946562,"50%":0.0539178257,"75%":0.0567492731,"max":0.0576985211},"SE_x(A)":{"count":49.0,"mean":0.0367095296,"std":0.0121328685,"min":0.0107837103,"25%":0.0319379192,"50%":0.0406898221,"75%":0.0452300327,"max":0.0558516554},"SE_pred(A)":{"count":49.0,"mean":0.0333479452,"std":0.0106548275,"min":0.0,"25%":0.0307179059,"50%":0.0348155312,"75%":0.0401421974,"max":0.04877489},"SE(A-B)":{"count":1160.0,"mean":0.0662533615,"std":0.0055094702,"min":0.0421219081,"25%":0.0627976489,"50%":0.067055526,"75%":0.070537026,"max":0.0788352538},"SE_x(A-B)":{"count":1160.0,"mean":0.0422823626,"std":0.01124353,"min":0.0017141983,"25%":0.0355191885,"50%":0.0428230799,"75%":0.0503770891,"max":0.0705533683},"SE_pred(A-B)":{"count":1160.0,"mean":0.0493122403,"std":0.0086079412,"min":0.0,"25%":0.0444213984,"50%":0.050387945,"75%":0.0553645179,"max":0.0666181642},"SE_signtest":{"count":1160.0,"mean":0.0674985815,"std":0.0058259769,"min":0.0421344116,"25%":0.0637191328,"50%":0.068381962,"75%":0.0719076286,"max":0.0793152513},"corr(A,B)":{"count":1160.0,"mean":0.3231317495,"std":0.1986238351,"min":-0.2889849243,"25%":0.2014654251,"50%":0.3373879052,"75%":0.4617182602,"max":0.9023175148},"sum(A!=B)":{"count":1160.0,"mean":25.8185883072,"std":4.2934142203,"min":9.986111111,"25%":22.8382194719,"50%":26.3030303027,"75%":29.0852272722,"max":35.3863636366}}
