{"val/score-all": 0.7454545454545455, "val/entropy-all": 0.3351094126701355, "val/entropy-time": 58.276182398200035, "val/think_end": 0.7305785123966942, "val/repetition": 0.1780171756360684, "val-aux/math500/reward/mean@1": 0.964, "val-aux/math500/score/mean@1": 0.964, "val-aux/math500/format_score/mean@1": 0.99, "val-core/math500/acc/mean@1": 0.964, "val-aux/math500/length/mean@1": 4445.818, "val-aux/math500/inlength/mean@1": 97.158, "val-aux/math500/index/mean@1": 249.5, "val-aux/aime24/reward/mean@32": 0.7114583333333333, "val-aux/aime24/reward/std@32": 0.19842906583671674, "val-aux/aime24/reward/best@2/mean": 0.7934666666666668, "val-aux/aime24/reward/best@2/std": 0.12876781291203307, "val-aux/aime24/reward/worst@2/mean": 0.6265666666666667, "val-aux/aime24/reward/worst@2/std": 0.20820707003313163, "val-aux/aime24/reward/best@4/mean": 0.8363333333333333, "val-aux/aime24/reward/best@4/std": 0.06148732358623278, "val-aux/aime24/reward/worst@4/mean": 0.5347000000000001, "val-aux/aime24/reward/worst@4/std": 0.186965909349987, "val-aux/aime24/reward/best@8/mean": 0.8561666666666667, "val-aux/aime24/reward/best@8/std": 0.025613249976904808, "val-aux/aime24/reward/worst@8/mean": 0.4532333333333334, "val-aux/aime24/reward/worst@8/std": 0.13640588469771095, "val-aux/aime24/reward/best@16/mean": 0.8646666666666666, "val-aux/aime24/reward/best@16/std": 0.00995046474006298, "val-aux/aime24/reward/worst@16/mean": 0.4033666666666667, "val-aux/aime24/reward/worst@16/std": 0.0783350021046306, "val-aux/aime24/reward/best@32/mean": 0.8666, "val-aux/aime24/reward/best@32/std": 0.0014892205269125785, "val-aux/aime24/reward/worst@32/mean": 0.3806, "val-aux/aime24/reward/worst@32/std": 0.03220936331273987, "val-aux/aime24/score/mean@32": 0.7114583333333333, "val-aux/aime24/score/std@32": 0.19842906583671674, "val-aux/aime24/score/best@2/mean": 0.7934666666666668, "val-aux/aime24/score/best@2/std": 0.12876781291203307, "val-aux/aime24/score/worst@2/mean": 0.6265666666666667, "val-aux/aime24/score/worst@2/std": 0.20820707003313163, "val-aux/aime24/score/best@4/mean": 0.8363333333333333, "val-aux/aime24/score/best@4/std": 0.06148732358623278, "val-aux/aime24/score/worst@4/mean": 0.5347000000000001, "val-aux/aime24/score/worst@4/std": 0.186965909349987, "val-aux/aime24/score/best@8/mean": 0.8561666666666667, "val-aux/aime24/score/best@8/std": 0.025613249976904808, "val-aux/aime24/score/worst@8/mean": 0.4532333333333334, "val-aux/aime24/score/worst@8/std": 0.13640588469771095, "val-aux/aime24/score/best@16/mean": 0.8646666666666666, "val-aux/aime24/score/best@16/std": 0.00995046474006298, "val-aux/aime24/score/worst@16/mean": 0.4033666666666667, "val-aux/aime24/score/worst@16/std": 0.0783350021046306, "val-aux/aime24/score/best@32/mean": 0.8666, "val-aux/aime24/score/best@32/std": 0.0014892205269125785, "val-aux/aime24/score/worst@32/mean": 0.3806, "val-aux/aime24/score/worst@32/std": 0.03220936331273987, "val-aux/aime24/format_score/mean@32": 0.8239583333333333, "val-aux/aime24/format_score/std@32": 0.20469481788574667, "val-aux/aime24/format_score/best@2/mean": 0.9013666666666665, "val-aux/aime24/format_score/best@2/std": 0.1328332162949296, "val-aux/aime24/format_score/worst@2/mean": 0.7432, "val-aux/aime24/format_score/worst@2/std": 0.2111593084687248, "val-aux/aime24/format_score/best@4/mean": 0.9477666666666666, "val-aux/aime24/format_score/best@4/std": 0.07388368982413282, "val-aux/aime24/format_score/worst@4/mean": 0.6582666666666666, "val-aux/aime24/format_score/worst@4/std": 0.19649930748326225, "val-aux/aime24/format_score/best@8/mean": 0.9751666666666667, "val-aux/aime24/format_score/best@8/std": 0.04189823194720929, "val-aux/aime24/format_score/worst@8/mean": 0.5735, "val-aux/aime24/format_score/worst@8/std": 0.16543372321678246, "val-aux/aime24/format_score/best@16/mean": 0.9909666666666667, "val-aux/aime24/format_score/best@16/std": 0.021316484636371133, "val-aux/aime24/format_score/worst@16/mean": 0.5037333333333334, "val-aux/aime24/format_score/worst@16/std": 0.12053265768413927, "val-aux/aime24/format_score/best@32/mean": 0.9984333333333334, "val-aux/aime24/format_score/best@32/std": 0.008399358007455206, "val-aux/aime24/format_score/worst@32/mean": 0.45726666666666665, "val-aux/aime24/format_score/worst@32/std": 0.06192707220170248, "val-core/aime24/acc/mean@32": 0.7114583333333333, "val-aux/aime24/acc/std@32": 0.19842906583671674, "val-aux/aime24/acc/best@2/mean": 0.7934666666666668, "val-aux/aime24/acc/best@2/std": 0.12876781291203307, "val-aux/aime24/acc/worst@2/mean": 0.6265666666666667, "val-aux/aime24/acc/worst@2/std": 0.20820707003313163, "val-aux/aime24/acc/best@4/mean": 0.8363333333333333, "val-aux/aime24/acc/best@4/std": 0.06148732358623278, "val-aux/aime24/acc/worst@4/mean": 0.5347000000000001, "val-aux/aime24/acc/worst@4/std": 0.186965909349987, "val-aux/aime24/acc/best@8/mean": 0.8561666666666667, "val-aux/aime24/acc/best@8/std": 0.025613249976904808, "val-aux/aime24/acc/worst@8/mean": 0.4532333333333334, "val-aux/aime24/acc/worst@8/std": 0.13640588469771095, "val-aux/aime24/acc/best@16/mean": 0.8646666666666666, "val-aux/aime24/acc/best@16/std": 0.00995046474006298, "val-aux/aime24/acc/worst@16/mean": 0.4033666666666667, "val-aux/aime24/acc/worst@16/std": 0.0783350021046306, "val-core/aime24/acc/best@32/mean": 0.8666, "val-core/aime24/acc/best@32/std": 0.0014892205269125785, "val-aux/aime24/acc/worst@32/mean": 0.3806, "val-aux/aime24/acc/worst@32/std": 0.03220936331273987, "val-aux/aime24/length/mean@32": 14858.18125, "val-aux/aime24/length/std@32": 2905.1166997727787, "val-aux/aime24/length/best@2/mean": 16427.038033333334, "val-aux/aime24/length/best@2/std": 2503.588409198355, "val-aux/aime24/length/worst@2/mean": 13359.499866666667, "val-aux/aime24/length/worst@2/std": 2309.2293121383486, "val-aux/aime24/length/best@4/mean": 17741.0144, "val-aux/aime24/length/best@4/std": 1963.256734349599, "val-aux/aime24/length/worst@4/mean": 12144.904933333335, "val-aux/aime24/length/worst@4/std": 1690.60388224146, "val-aux/aime24/length/best@8/mean": 18730.607066666667, "val-aux/aime24/length/best@8/std": 1369.3130504061696, "val-aux/aime24/length/worst@8/mean": 11230.308866666666, "val-aux/aime24/length/worst@8/std": 1260.905686866845, "val-aux/aime24/length/best@16/mean": 19353.1331, "val-aux/aime24/length/best@16/std": 844.147107199464, "val-aux/aime24/length/worst@16/mean": 10550.218533333335, "val-aux/aime24/length/worst@16/std": 895.501569094431, "val-aux/aime24/length/best@32/mean": 19707.38496666667, "val-aux/aime24/length/best@32/std": 501.76750238283444, "val-aux/aime24/length/worst@32/mean": 10106.380666666668, "val-aux/aime24/length/worst@32/std": 548.7481712365875, "val-aux/aime24/inlength/mean@32": 124.96666666666667, "val-aux/aime24/inlength/std@32": 0.0, "val-aux/aime24/inlength/best@2/mean": 124.96666666666667, "val-aux/aime24/inlength/best@2/std": 0.0, "val-aux/aime24/inlength/worst@2/mean": 124.96666666666667, "val-aux/aime24/inlength/worst@2/std": 0.0, "val-aux/aime24/inlength/best@4/mean": 124.96666666666667, "val-aux/aime24/inlength/best@4/std": 0.0, "val-aux/aime24/inlength/worst@4/mean": 124.96666666666667, "val-aux/aime24/inlength/worst@4/std": 0.0, "val-aux/aime24/inlength/best@8/mean": 124.96666666666667, "val-aux/aime24/inlength/best@8/std": 0.0, "val-aux/aime24/inlength/worst@8/mean": 124.96666666666667, "val-aux/aime24/inlength/worst@8/std": 0.0, "val-aux/aime24/inlength/best@16/mean": 124.96666666666667, "val-aux/aime24/inlength/best@16/std": 0.0, "val-aux/aime24/inlength/worst@16/mean": 124.96666666666667, "val-aux/aime24/inlength/worst@16/std": 0.0, "val-aux/aime24/inlength/best@32/mean": 124.96666666666667, "val-aux/aime24/inlength/best@32/std": 0.0, "val-aux/aime24/inlength/worst@32/mean": 124.96666666666667, "val-aux/aime24/inlength/worst@32/std": 0.0, "val-aux/aime24/index/mean@32": 14.5, "val-aux/aime24/index/std@32": 0.0, "val-aux/aime24/index/best@2/mean": 14.5, "val-aux/aime24/index/best@2/std": 0.0, "val-aux/aime24/index/worst@2/mean": 14.5, "val-aux/aime24/index/worst@2/std": 0.0, "val-aux/aime24/index/best@4/mean": 14.5, "val-aux/aime24/index/best@4/std": 0.0, "val-aux/aime24/index/worst@4/mean": 14.5, "val-aux/aime24/index/worst@4/std": 0.0, "val-aux/aime24/index/best@8/mean": 14.5, "val-aux/aime24/index/best@8/std": 0.0, "val-aux/aime24/index/worst@8/mean": 14.5, "val-aux/aime24/index/worst@8/std": 0.0, "val-aux/aime24/index/best@16/mean": 14.5, "val-aux/aime24/index/best@16/std": 0.0, "val-aux/aime24/index/worst@16/mean": 14.5, "val-aux/aime24/index/worst@16/std": 0.0, "val-aux/aime24/index/best@32/mean": 14.5, "val-aux/aime24/index/best@32/std": 0.0, "val-aux/aime24/index/worst@32/mean": 14.5, "val-aux/aime24/index/worst@32/std": 0.0, "val-aux/aime25/reward/mean@32": 0.665625, "val-aux/aime25/reward/std@32": 0.19092645066622296, "val-aux/aime25/reward/best@2/mean": 0.7335333333333334, "val-aux/aime25/reward/best@2/std": 0.11783857412096076, "val-aux/aime25/reward/worst@2/mean": 0.5990666666666667, "val-aux/aime25/reward/worst@2/std": 0.19556630707998857, "val-aux/aime25/reward/best@4/mean": 0.7744666666666666, "val-aux/aime25/reward/best@4/std": 0.07217658428595969, "val-aux/aime25/reward/worst@4/mean": 0.5238666666666667, "val-aux/aime25/reward/worst@4/std": 0.19312839308238022, "val-aux/aime25/reward/best@8/mean": 0.8024, "val-aux/aime25/reward/best@8/std": 0.04576476416691795, "val-aux/aime25/reward/worst@8/mean": 0.4469666666666667, "val-aux/aime25/reward/worst@8/std": 0.17884709304600277, "val-aux/aime25/reward/best@16/mean": 0.8191, "val-aux/aime25/reward/best@16/std": 0.02830918655604679, "val-aux/aime25/reward/worst@16/mean": 0.3713333333333333, "val-aux/aime25/reward/worst@16/std": 0.15475217682134754, "val-aux/aime25/reward/best@32/mean": 0.8288, "val-aux/aime25/reward/best@32/std": 0.01142628548566856, "val-aux/aime25/reward/worst@32/mean": 0.29933333333333334, "val-aux/aime25/reward/worst@32/std": 0.11579645102410158, "val-aux/aime25/score/mean@32": 0.665625, "val-aux/aime25/score/std@32": 0.19092645066622296, "val-aux/aime25/score/best@2/mean": 0.7335333333333334, "val-aux/aime25/score/best@2/std": 0.11783857412096076, "val-aux/aime25/score/worst@2/mean": 0.5990666666666667, "val-aux/aime25/score/worst@2/std": 0.19556630707998857, "val-aux/aime25/score/best@4/mean": 0.7744666666666666, "val-aux/aime25/score/best@4/std": 0.07217658428595969, "val-aux/aime25/score/worst@4/mean": 0.5238666666666667, "val-aux/aime25/score/worst@4/std": 0.19312839308238022, "val-aux/aime25/score/best@8/mean": 0.8024, "val-aux/aime25/score/best@8/std": 0.04576476416691795, "val-aux/aime25/score/worst@8/mean": 0.4469666666666667, "val-aux/aime25/score/worst@8/std": 0.17884709304600277, "val-aux/aime25/score/best@16/mean": 0.8191, "val-aux/aime25/score/best@16/std": 0.02830918655604679, "val-aux/aime25/score/worst@16/mean": 0.3713333333333333, "val-aux/aime25/score/worst@16/std": 0.15475217682134754, "val-aux/aime25/score/best@32/mean": 0.8288, "val-aux/aime25/score/best@32/std": 0.01142628548566856, "val-aux/aime25/score/worst@32/mean": 0.29933333333333334, "val-aux/aime25/score/worst@32/std": 0.11579645102410158, "val-aux/aime25/format_score/mean@32": 0.7635416666666667, "val-aux/aime25/format_score/std@32": 0.2165096566940471, "val-aux/aime25/format_score/best@2/mean": 0.8420666666666666, "val-aux/aime25/format_score/best@2/std": 0.1654316297838109, "val-aux/aime25/format_score/worst@2/mean": 0.6815, "val-aux/aime25/format_score/worst@2/std": 0.19503293883913705, "val-aux/aime25/format_score/best@4/mean": 0.9093333333333333, "val-aux/aime25/format_score/best@4/std": 0.12168509885349191, "val-aux/aime25/format_score/worst@4/mean": 0.6131333333333334, "val-aux/aime25/format_score/worst@4/std": 0.16864368139000224, "val-aux/aime25/format_score/best@8/mean": 0.9628666666666668, "val-aux/aime25/format_score/best@8/std": 0.07794787309448335, "val-aux/aime25/format_score/worst@8/mean": 0.5479, "val-aux/aime25/format_score/worst@8/std": 0.1551352828485955, "val-aux/aime25/format_score/best@16/mean": 0.9898333333333333, "val-aux/aime25/format_score/best@16/std": 0.033577494179743185, "val-aux/aime25/format_score/worst@16/mean": 0.47923333333333334, "val-aux/aime25/format_score/worst@16/std": 0.13758301346695742, "val-aux/aime25/format_score/best@32/mean": 0.9985333333333334, "val-aux/aime25/format_score/best@32/std": 0.00940853921122379, "val-aux/aime25/format_score/worst@32/mean": 0.41426666666666667, "val-aux/aime25/format_score/worst@32/std": 0.09649442389140475, "val-core/aime25/acc/mean@32": 0.665625, "val-aux/aime25/acc/std@32": 0.19092645066622296, "val-aux/aime25/acc/best@2/mean": 0.7335333333333334, "val-aux/aime25/acc/best@2/std": 0.11783857412096076, "val-aux/aime25/acc/worst@2/mean": 0.5990666666666667, "val-aux/aime25/acc/worst@2/std": 0.19556630707998857, "val-aux/aime25/acc/best@4/mean": 0.7744666666666666, "val-aux/aime25/acc/best@4/std": 0.07217658428595969, "val-aux/aime25/acc/worst@4/mean": 0.5238666666666667, "val-aux/aime25/acc/worst@4/std": 0.19312839308238022, "val-aux/aime25/acc/best@8/mean": 0.8024, "val-aux/aime25/acc/best@8/std": 0.04576476416691795, "val-aux/aime25/acc/worst@8/mean": 0.4469666666666667, "val-aux/aime25/acc/worst@8/std": 0.17884709304600277, "val-aux/aime25/acc/best@16/mean": 0.8191, "val-aux/aime25/acc/best@16/std": 0.02830918655604679, "val-aux/aime25/acc/worst@16/mean": 0.3713333333333333, "val-aux/aime25/acc/worst@16/std": 0.15475217682134754, "val-core/aime25/acc/best@32/mean": 0.8288, "val-core/aime25/acc/best@32/std": 0.01142628548566856, "val-aux/aime25/acc/worst@32/mean": 0.29933333333333334, "val-aux/aime25/acc/worst@32/std": 0.11579645102410158, "val-aux/aime25/length/mean@32": 16455.247916666667, "val-aux/aime25/length/std@32": 2244.507542963066, "val-aux/aime25/length/best@2/mean": 17538.63006666667, "val-aux/aime25/length/best@2/std": 1919.9356662037353, "val-aux/aime25/length/worst@2/mean": 15349.766333333333, "val-aux/aime25/length/worst@2/std": 1748.7152712096306, "val-aux/aime25/length/best@4/mean": 18484.069066666667, "val-aux/aime25/length/best@4/std": 1672.555651538279, "val-aux/aime25/length/worst@4/mean": 14472.231033333335, "val-aux/aime25/length/worst@4/std": 1411.4202783262647, "val-aux/aime25/length/best@8/mean": 19342.317, "val-aux/aime25/length/best@8/std": 1461.6182577717582, "val-aux/aime25/length/worst@8/mean": 13727.427999999998, "val-aux/aime25/length/worst@8/std": 1172.6386288567096, "val-aux/aime25/length/best@16/mean": 20078.772233333333, "val-aux/aime25/length/best@16/std": 1165.3512022128182, "val-aux/aime25/length/worst@16/mean": 13102.596966666666, "val-aux/aime25/length/worst@16/std": 936.4927779880715, "val-aux/aime25/length/best@32/mean": 20668.986133333336, "val-aux/aime25/length/best@32/std": 768.8588547054713, "val-aux/aime25/length/worst@32/mean": 12621.764333333334, "val-aux/aime25/length/worst@32/std": 662.1983919876033, "val-aux/aime25/inlength/mean@32": 144.36666666666667, "val-aux/aime25/inlength/std@32": 0.0, "val-aux/aime25/inlength/best@2/mean": 144.36666666666667, "val-aux/aime25/inlength/best@2/std": 0.0, "val-aux/aime25/inlength/worst@2/mean": 144.36666666666667, "val-aux/aime25/inlength/worst@2/std": 0.0, "val-aux/aime25/inlength/best@4/mean": 144.36666666666667, "val-aux/aime25/inlength/best@4/std": 0.0, "val-aux/aime25/inlength/worst@4/mean": 144.36666666666667, "val-aux/aime25/inlength/worst@4/std": 0.0, "val-aux/aime25/inlength/best@8/mean": 144.36666666666667, "val-aux/aime25/inlength/best@8/std": 0.0, "val-aux/aime25/inlength/worst@8/mean": 144.36666666666667, "val-aux/aime25/inlength/worst@8/std": 0.0, "val-aux/aime25/inlength/best@16/mean": 144.36666666666667, "val-aux/aime25/inlength/best@16/std": 0.0, "val-aux/aime25/inlength/worst@16/mean": 144.36666666666667, "val-aux/aime25/inlength/worst@16/std": 0.0, "val-aux/aime25/inlength/best@32/mean": 144.36666666666667, "val-aux/aime25/inlength/best@32/std": 0.0, "val-aux/aime25/inlength/worst@32/mean": 144.36666666666667, "val-aux/aime25/inlength/worst@32/std": 0.0, "val-aux/aime25/index/mean@32": 14.5, "val-aux/aime25/index/std@32": 0.0, "val-aux/aime25/index/best@2/mean": 14.5, "val-aux/aime25/index/best@2/std": 0.0, "val-aux/aime25/index/worst@2/mean": 14.5, "val-aux/aime25/index/worst@2/std": 0.0, "val-aux/aime25/index/best@4/mean": 14.5, "val-aux/aime25/index/best@4/std": 0.0, "val-aux/aime25/index/worst@4/mean": 14.5, "val-aux/aime25/index/worst@4/std": 0.0, "val-aux/aime25/index/best@8/mean": 14.5, "val-aux/aime25/index/best@8/std": 0.0, "val-aux/aime25/index/worst@8/mean": 14.5, "val-aux/aime25/index/worst@8/std": 0.0, "val-aux/aime25/index/best@16/mean": 14.5, "val-aux/aime25/index/best@16/std": 0.0, "val-aux/aime25/index/worst@16/mean": 14.5, "val-aux/aime25/index/worst@16/std": 0.0, "val-aux/aime25/index/best@32/mean": 14.5, "val-aux/aime25/index/best@32/std": 0.0, "val-aux/aime25/index/worst@32/mean": 14.5, "val-aux/aime25/index/worst@32/std": 0.0, "val_response_length/math500/mean": 4445.818, "val_response_length/aime24/mean": 14858.18125, "val_response_length/aime25/mean": 16455.247916666667, "val_response_length/overall_mean": 13340.413636363637, "val-core/save_overall_score": 0.7803611111111111}