{"database": "grpo-gsm8k-train", "table": "summaries", "is_view": false, "human_description_en": "", "rows": [[1, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_50", 1319, 968, 0.7338893100833965, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_50/actor/huggingface"], [2, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_50", 5000, 2469, 0.4938, 610, "{\"stop:-\": 4467, \"length:-\": 531, \"stop:Problem:\": 2}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_50/actor/huggingface"], [3, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_100", 1319, 980, 0.7429871114480667, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_100/actor/huggingface"], [4, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_100", 5000, 2524, 0.5048, 635, "{\"stop:-\": 4439, \"length:-\": 561}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_100/actor/huggingface"], [5, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_150", 1319, 986, 0.7475360121304018, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_150/actor/huggingface"], [6, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_150", 5000, 2500, 0.5, 635, "{\"stop:-\": 4429, \"length:-\": 570, \"stop:Problem:\": 1}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_150/actor/huggingface"], [7, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_200", 1319, 1003, 0.7604245640636846, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_200/actor/huggingface"], [8, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_200", 5000, 2484, 0.4968, 670, "{\"stop:-\": 4408, \"length:-\": 590, \"stop:Problem:\": 2}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_200/actor/huggingface"], [9, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_250", 1319, 1002, 0.759666413949962, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_250/actor/huggingface"], [10, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_250", 5000, 2508, 0.5016, 636, "{\"stop:-\": 4442, \"length:-\": 557, \"stop:Problem:\": 1}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_250/actor/huggingface"], [11, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_300", 1319, 991, 0.7513267626990144, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_300/actor/huggingface"], [12, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_300", 5000, 2513, 0.5026, 641, "{\"stop:-\": 4436, \"length:-\": 563, \"stop:Problem:\": 1}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_300/actor/huggingface"], [13, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_350", 1319, 989, 0.7498104624715694, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_350/actor/huggingface"], [14, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_350", 5000, 2504, 0.5008, 657, "{\"stop:-\": 4418, \"length:-\": 580, \"stop:Problem:\": 2}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_350/actor/huggingface"], [15, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_400", 1319, 1014, 0.7687642153146323, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_400/actor/huggingface"], [16, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_400", 5000, 2538, 0.5076, 660, "{\"stop:-\": 4417, \"length:-\": 582, \"stop:Problem:\": 1}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_400/actor/huggingface"], [17, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_450", 1319, 1019, 0.7725549658832449, 10, "{\"stop:-\": 1309, \"length:-\": 10}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_450/actor/huggingface"], [18, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_450", 5000, 2539, 0.5078, 656, "{\"stop:-\": 4423, \"length:-\": 575, \"stop:Problem:\": 2}", "2m 35s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_450/actor/huggingface"], [19, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_500", 1319, 1002, 0.759666413949962, 8, "{\"stop:-\": 1311, \"length:-\": 8}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_500/actor/huggingface"], [20, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_500", 5000, 2531, 0.5062, 642, "{\"stop:-\": 4437, \"length:-\": 561, \"stop:Problem:\": 2}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_500/actor/huggingface"], [21, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_550", 1319, 1022, 0.7748294162244125, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_550/actor/huggingface"], [22, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_550", 5000, 2521, 0.5042, 633, "{\"stop:-\": 4458, \"length:-\": 539, \"stop:Problem:\": 3}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_550/actor/huggingface"], [23, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_600", 1319, 1027, 0.778620166793025, 7, "{\"stop:-\": 1312, \"length:-\": 7}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_600/actor/huggingface"], [24, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_600", 5000, 2565, 0.513, 628, "{\"stop:-\": 4443, \"length:-\": 555, \"stop:Problem:\": 2}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_600/actor/huggingface"], [25, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_650", 1319, 1028, 0.7793783169067475, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_650/actor/huggingface"], [26, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_650", 5000, 2557, 0.5114, 628, "{\"stop:-\": 4442, \"length:-\": 557, \"stop:Problem:\": 1}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_650/actor/huggingface"], [27, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_700", 1319, 1027, 0.778620166793025, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_700/actor/huggingface"], [28, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_700", 5000, 2529, 0.5058, 642, "{\"stop:-\": 4428, \"length:-\": 571, \"stop:Problem:\": 1}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_700/actor/huggingface"], [29, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_750", 1319, 1037, 0.7862016679302501, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_750/actor/huggingface"], [30, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_750", 5000, 2539, 0.5078, 609, "{\"stop:-\": 4468, \"length:-\": 530, \"stop:Problem:\": 2}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_750/actor/huggingface"], [31, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_800", 1319, 1041, 0.7892342683851402, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_800/actor/huggingface"], [32, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_800", 5000, 2536, 0.5072, 622, "{\"stop:-\": 4455, \"length:-\": 543, \"stop:Problem:\": 2}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_800/actor/huggingface"], [33, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_850", 1319, 1044, 0.7915087187263078, 1, "{\"stop:-\": 1318, \"length:-\": 1}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_850/actor/huggingface"], [34, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_850", 5000, 2585, 0.517, 620, "{\"stop:-\": 4459, \"length:-\": 539, \"stop:Problem:\": 2}", "2m 31s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_850/actor/huggingface"], [35, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_900", 1319, 1048, 0.7945413191811979, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_900/actor/huggingface"], [36, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_900", 5000, 2568, 0.5136, 635, "{\"stop:-\": 4444, \"length:-\": 553, \"stop:Problem:\": 3}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_900/actor/huggingface"], [37, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_950", 1319, 1051, 0.7968157695223654, 1, "{\"stop:-\": 1318, \"length:-\": 1}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_950/actor/huggingface"], [38, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_950", 5000, 2565, 0.513, 609, "{\"stop:-\": 4461, \"length:-\": 537, \"stop:Problem:\": 2}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_950/actor/huggingface"], [39, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1000", 1319, 1029, 0.78013646702047, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1000/actor/huggingface"], [40, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1000", 5000, 2596, 0.5192, 619, "{\"stop:-\": 4450, \"length:-\": 548, \"stop:Problem:\": 2}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1000/actor/huggingface"], [41, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1050", 1319, 1040, 0.7884761182714177, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1050/actor/huggingface"], [42, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1050", 5000, 2568, 0.5136, 612, "{\"stop:-\": 4460, \"length:-\": 538, \"stop:Problem:\": 2}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1050/actor/huggingface"], [43, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1100", 1319, 1033, 0.7831690674753601, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1100/actor/huggingface"], [44, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1100", 5000, 2575, 0.515, 612, "{\"stop:-\": 4460, \"length:-\": 538, \"stop:Problem:\": 2}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1100/actor/huggingface"], [45, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1150", 1319, 1040, 0.7884761182714177, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1150/actor/huggingface"], [46, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1150", 5000, 2585, 0.517, 631, "{\"stop:-\": 4444, \"length:-\": 555, \"stop:Problem:\": 1}", "2m 35s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1150/actor/huggingface"], [47, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1200", 1319, 1038, 0.7869598180439727, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1200/actor/huggingface"], [48, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1200", 5000, 2570, 0.514, 644, "{\"stop:-\": 4422, \"length:-\": 576, \"stop:Problem:\": 2}", "2m 38s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1200/actor/huggingface"], [49, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1250", 1319, 1039, 0.7877179681576952, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1250/actor/huggingface"], [50, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1250", 5000, 2571, 0.5142, 655, "{\"stop:-\": 4421, \"length:-\": 576, \"stop:Problem:\": 3}", "2m 38s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1250/actor/huggingface"], [51, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1300", 1319, 1041, 0.7892342683851402, 7, "{\"stop:-\": 1312, \"length:-\": 7}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1300/actor/huggingface"], [52, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1300", 5000, 2592, 0.5184, 638, "{\"stop:-\": 4434, \"length:-\": 564, \"stop:Problem:\": 2}", "2m 40s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1300/actor/huggingface"], [53, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1350", 1319, 1049, 0.7952994692949203, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1350/actor/huggingface"], [54, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1350", 5000, 2572, 0.5144, 649, "{\"stop:-\": 4425, \"length:-\": 574, \"stop:Problem:\": 1}", "2m 36s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1350/actor/huggingface"], [55, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1400", 1319, 1054, 0.799090219863533, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1400/actor/huggingface"], [56, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1400", 5000, 2554, 0.5108, 655, "{\"stop:-\": 4420, \"length:-\": 579, \"stop:Problem:\": 1}", "2m 36s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1400/actor/huggingface"], [57, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1450", 1319, 1052, 0.7975739196360879, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1450/actor/huggingface"], [58, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1450", 5000, 2593, 0.5186, 662, "{\"stop:-\": 4411, \"length:-\": 585, \"stop:Problem:\": 4}", "2m 37s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1450/actor/huggingface"], [59, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1500", 1319, 1045, 0.7922668688400303, 7, "{\"stop:-\": 1312, \"length:-\": 7}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1500/actor/huggingface"], [60, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1500", 5000, 2595, 0.519, 634, "{\"stop:-\": 4438, \"length:-\": 559, \"stop:Problem:\": 3}", "2m 38s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1500/actor/huggingface"], [61, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1550", 1319, 1058, 0.8021228203184231, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1550/actor/huggingface"], [62, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1550", 5000, 2590, 0.518, 608, "{\"stop:-\": 4476, \"length:-\": 520, \"stop:Problem:\": 4}", "2m 36s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1550/actor/huggingface"], [63, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1600", 1319, 1051, 0.7968157695223654, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1600/actor/huggingface"], [64, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1600", 5000, 2595, 0.519, 572, "{\"stop:-\": 4498, \"length:-\": 498, \"stop:Problem:\": 4}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1600/actor/huggingface"], [65, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1650", 1319, 1044, 0.7915087187263078, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1650/actor/huggingface"], [66, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1650", 5000, 2573, 0.5146, 564, "{\"stop:-\": 4507, \"length:-\": 491, \"stop:Problem:\": 2}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1650/actor/huggingface"], [67, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1700", 1319, 1058, 0.8021228203184231, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1700/actor/huggingface"], [68, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1700", 5000, 2581, 0.5162, 604, "{\"stop:-\": 4468, \"length:-\": 531, \"stop:Problem:\": 1}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1700/actor/huggingface"], [69, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1750", 1319, 1044, 0.7915087187263078, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1750/actor/huggingface"], [70, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1750", 5000, 2578, 0.5156, 612, "{\"stop:-\": 4458, \"length:-\": 540, \"stop:Problem:\": 2}", "2m 35s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1750/actor/huggingface"], [71, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1800", 1319, 1060, 0.8036391205458681, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1800/actor/huggingface"], [72, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1800", 5000, 2591, 0.5182, 613, "{\"stop:-\": 4470, \"length:-\": 526, \"stop:Problem:\": 4}", "2m 35s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1800/actor/huggingface"], [73, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1850", 1319, 1044, 0.7915087187263078, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1850/actor/huggingface"], [74, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1850", 5000, 2545, 0.509, 585, "{\"stop:-\": 4494, \"length:-\": 504, \"stop:Problem:\": 2}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1850/actor/huggingface"], [75, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1900", 1319, 1049, 0.7952994692949203, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1900/actor/huggingface"], [76, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1900", 5000, 2577, 0.5154, 591, "{\"stop:-\": 4480, \"length:-\": 520}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1900/actor/huggingface"], [77, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_1950", 1319, 1057, 0.8013646702047005, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1950/actor/huggingface"], [78, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_1950", 5000, 2610, 0.522, 572, "{\"stop:-\": 4499, \"length:-\": 501}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1950/actor/huggingface"], [79, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2000", 1319, 1046, 0.7930250189537529, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2000/actor/huggingface"], [80, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2000", 5000, 2603, 0.5206, 573, "{\"stop:-\": 4504, \"length:-\": 496}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2000/actor/huggingface"], [81, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2050", 1319, 1055, 0.7998483699772555, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2050/actor/huggingface"], [82, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2050", 5000, 2576, 0.5152, 584, "{\"stop:-\": 4501, \"length:-\": 498, \"stop:Problem:\": 1}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2050/actor/huggingface"], [83, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2100", 1319, 1063, 0.8059135708870356, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2100/actor/huggingface"], [84, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2100", 5000, 2592, 0.5184, 607, "{\"stop:-\": 4470, \"length:-\": 529, \"stop:Problem:\": 1}", "2m 37s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2100/actor/huggingface"], [85, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2150", 1319, 1060, 0.8036391205458681, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2150/actor/huggingface"], [86, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2150", 5000, 2606, 0.5212, 641, "{\"stop:-\": 4434, \"length:-\": 563, \"stop:Problem:\": 3}", "2m 36s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2150/actor/huggingface"], [87, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2200", 1319, 1069, 0.8104624715693708, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2200/actor/huggingface"], [88, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2200", 5000, 2580, 0.516, 609, "{\"stop:-\": 4462, \"length:-\": 536, \"stop:Problem:\": 2}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2200/actor/huggingface"], [89, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2250", 1319, 1064, 0.8066717210007581, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2250/actor/huggingface"], [90, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2250", 5000, 2584, 0.5168, 580, "{\"stop:-\": 4494, \"length:-\": 504, \"stop:Problem:\": 2}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2250/actor/huggingface"], [91, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2300", 1319, 1063, 0.8059135708870356, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2300/actor/huggingface"], [92, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2300", 5000, 2574, 0.5148, 586, "{\"stop:-\": 4490, \"length:-\": 507, \"stop:Problem:\": 3}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2300/actor/huggingface"], [93, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2350", 1319, 1050, 0.796057619408643, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2350/actor/huggingface"], [94, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2350", 5000, 2595, 0.519, 586, "{\"stop:-\": 4490, \"length:-\": 507, \"stop:Problem:\": 3}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2350/actor/huggingface"], [95, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2400", 1319, 1061, 0.8043972706595905, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2400/actor/huggingface"], [96, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2400", 5000, 2599, 0.5198, 603, "{\"stop:-\": 4468, \"length:-\": 530, \"stop:Problem:\": 2}", "2m 35s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2400/actor/huggingface"], [97, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2450", 1319, 1045, 0.7922668688400303, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2450/actor/huggingface"], [98, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2450", 5000, 2605, 0.521, 542, "{\"stop:-\": 4526, \"length:-\": 472, \"stop:Problem:\": 2}", "2m 30s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2450/actor/huggingface"], [99, "gsm8k_main(0)", "grpo-gsm8k-train-13ep-success_global_step_2500", 1319, 1045, 0.7922668688400303, 7, "{\"stop:-\": 1312, \"length:-\": 7}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2500/actor/huggingface"], [100, "hendrycks_math(0)", "grpo-gsm8k-train-13ep-success_global_step_2500", 5000, 2598, 0.5196, 567, "{\"stop:-\": 4505, \"length:-\": 493, \"stop:Problem:\": 2}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2500/actor/huggingface"]], "truncated": false, "filtered_table_rows_count": 165, "expanded_columns": [], "expandable_columns": [], "columns": ["id", "task_name", "model_tag", "total_examples", "correct", "accuracy", "no_answer_count", "stop_reason_counts", "duration_human", "pass_k", "temperature", "top_p", "max_tokens", "error", "model"], "primary_keys": ["id"], "units": {}, "query": {"sql": "select id, task_name, model_tag, total_examples, correct, accuracy, no_answer_count, stop_reason_counts, duration_human, pass_k, temperature, top_p, max_tokens, error, model from summaries order by id limit 101", "params": {}}, "facet_results": {}, "suggested_facets": [{"name": "task_name", "toggle_url": "http://jayminban-rlvr-vs-sft-qwen2-5-1-5b.hf.space/grpo-gsm8k-train/summaries.json?_facet=task_name"}, {"name": "total_examples", "toggle_url": "http://jayminban-rlvr-vs-sft-qwen2-5-1-5b.hf.space/grpo-gsm8k-train/summaries.json?_facet=total_examples"}, {"name": "duration_human", "toggle_url": "http://jayminban-rlvr-vs-sft-qwen2-5-1-5b.hf.space/grpo-gsm8k-train/summaries.json?_facet=duration_human"}], "next": "100", "next_url": "http://jayminban-rlvr-vs-sft-qwen2-5-1-5b.hf.space/grpo-gsm8k-train/summaries.json?_next=100", "private": false, "allow_execute_sql": true, "query_ms": 15.458233188837767}