{"benchmark_id":"lsat_cot","size":403,"models":45,"total_pairs":1074,"close_pairs":795,"no_solve":1,"tau-":42,"SE(A)":{"count":45.0,"mean":0.0233226225,"std":0.001541183,"min":0.0198975537,"25%":0.0222169552,"50%":0.0235113037,"75%":0.024732828,"max":0.0249053342},"SE_x(A)":{"count":43.0,"mean":0.0178221017,"std":0.004686694,"min":0.003251027,"25%":0.0164095914,"50%":0.0188073586,"75%":0.0205005561,"max":0.0248588034},"SE_pred(A)":{"count":43.0,"mean":0.0133870633,"std":0.0053410933,"min":0.0,"25%":0.0119516897,"50%":0.0139537567,"75%":0.0172287883,"max":0.0198312237},"SE(A-B)":{"count":795.0,"mean":0.0270664893,"std":0.002686942,"min":0.0196491252,"25%":0.0249692232,"50%":0.0275961282,"75%":0.0292748126,"max":0.031540521},"SE_x(A-B)":{"count":723.0,"mean":0.0184255123,"std":0.0037597363,"min":0.0071367882,"25%":0.0161504166,"50%":0.0185618406,"75%":0.0208863865,"max":0.0281672444},"SE_pred(A-B)":{"count":723.0,"mean":0.0196015386,"std":0.0042409947,"min":0.0,"25%":0.0171177917,"50%":0.0191672957,"75%":0.0226316943,"max":0.0278602913},"SE_signtest":{"count":795.0,"mean":0.0273355405,"std":0.0027515612,"min":0.0197082043,"25%":0.0251329217,"50%":0.0279688442,"75%":0.0295825092,"max":0.0325000898},"corr(A,B)":{"count":795.0,"mean":0.4827814836,"std":0.1530887428,"min":-0.0224367614,"25%":0.4364885066,"50%":0.5078754013,"75%":0.5721252675,"max":0.8400331694},"sum(A!=B)":{"count":795.0,"mean":122.5852318088,"std":23.9362433916,"min":63.081818181,"25%":102.5878787875,"50%":127.0454545439,"75%":142.1281565654,"max":171.5454545432}}
