{"benchmark_id":"mbpp","size":500,"models":35,"total_pairs":640,"close_pairs":362,"no_solve":15,"tau-":12,"SE(A)":{"count":34.0,"mean":0.0209263197,"std":0.0019879178,"min":0.0148590624,"25%":0.0206788607,"50%":0.0214989312,"75%":0.0221868253,"max":0.0223555329},"SE_x(A)":{"count":34.0,"mean":0.0173902071,"std":0.0028943045,"min":0.009736158,"25%":0.0164238526,"50%":0.0178582517,"75%":0.0188385594,"max":0.022354239},"SE_pred(A)":{"count":34.0,"mean":0.0107722592,"std":0.0039514801,"min":0.0,"25%":0.0101058726,"50%":0.0119946831,"75%":0.0132733446,"max":0.0146746535},"SE(A-B)":{"count":362.0,"mean":0.0214151409,"std":0.0012455106,"min":0.0166074655,"25%":0.0208429741,"50%":0.0215601607,"75%":0.0222853095,"max":0.0239078738},"SE_x(A-B)":{"count":362.0,"mean":0.0135929872,"std":0.0028955998,"min":0.0052683676,"25%":0.0114329349,"50%":0.0132472573,"75%":0.0159806068,"max":0.0200414375},"SE_pred(A-B)":{"count":362.0,"mean":0.0160424872,"std":0.0031128772,"min":0.0,"25%":0.013758964,"50%":0.0169267584,"75%":0.018358055,"max":0.0206664712},"SE_signtest":{"count":362.0,"mean":0.021595027,"std":0.0012790982,"min":0.0166081958,"25%":0.0210244058,"50%":0.0217384908,"75%":0.0224957909,"max":0.0241600722},"corr(A,B)":{"count":362.0,"mean":0.6924561378,"std":0.0757028602,"min":0.505578694,"25%":0.641235345,"50%":0.7012787924,"75%":0.7438977999,"max":0.8777750514},"sum(A!=B)":{"count":362.0,"mean":116.9941907047,"std":13.4702877963,"min":68.9580419555,"25%":110.5064102553,"50%":118.1404958655,"75%":126.5151515119,"max":145.9272727259}}
