{"database": "grpo-one-example", "table": "summaries", "is_view": false, "human_description_en": "", "rows": [[1, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_50", 1319, 945, 0.7164518574677786, 8, "{\"stop:-\": 1313, \"length:-\": 6}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_50/actor/huggingface"], [2, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_50", 5000, 2462, 0.4924, 623, "{\"stop:-\": 4454, \"length:-\": 537, \"stop:Problem:\": 9}", "2m 30s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_50/actor/huggingface"], [3, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_100", 1319, 949, 0.7194844579226687, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_100/actor/huggingface"], [4, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_100", 5000, 2467, 0.4934, 617, "{\"stop:-\": 4457, \"length:-\": 537, \"stop:Problem:\": 6}", "2m 28s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_100/actor/huggingface"], [5, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_150", 1319, 947, 0.7179681576952237, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_150/actor/huggingface"], [6, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_150", 5000, 2477, 0.4954, 644, "{\"stop:-\": 4430, \"length:-\": 564, \"stop:Problem:\": 6}", "2m 28s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_150/actor/huggingface"], [7, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_200", 1319, 967, 0.733131159969674, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_200/actor/huggingface"], [8, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_200", 5000, 2487, 0.4974, 632, "{\"stop:-\": 4453, \"length:-\": 539, \"stop:Problem:\": 8}", "2m 29s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_200/actor/huggingface"], [9, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_250", 1319, 955, 0.7240333586050038, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_250/actor/huggingface"], [10, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_250", 5000, 2466, 0.4932, 617, "{\"stop:-\": 4458, \"length:-\": 537, \"stop:Problem:\": 5}", "2m 28s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_250/actor/huggingface"], [11, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_300", 1319, 949, 0.7194844579226687, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_300/actor/huggingface"], [12, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_300", 5000, 2493, 0.4986, 624, "{\"stop:-\": 4451, \"length:-\": 545, \"stop:Problem:\": 4}", "2m 29s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_300/actor/huggingface"], [13, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_350", 1319, 950, 0.7202426080363912, 1, "{\"stop:-\": 1318, \"length:-\": 1}", "21s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_350/actor/huggingface"], [14, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_350", 5000, 2490, 0.498, 622, "{\"stop:-\": 4450, \"length:-\": 538, \"stop:Problem:\": 12}", "2m 28s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_350/actor/huggingface"], [15, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_400", 1319, 948, 0.7187263078089462, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_400/actor/huggingface"], [16, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_400", 5000, 2482, 0.4964, 623, "{\"stop:-\": 4457, \"length:-\": 532, \"stop:Problem:\": 11}", "2m 29s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_400/actor/huggingface"], [17, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_450", 1319, 965, 0.731614859742229, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_450/actor/huggingface"], [18, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_450", 5000, 2462, 0.4924, 580, "{\"stop:-\": 4490, \"length:-\": 497, \"stop:Problem:\": 13}", "2m 28s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_450/actor/huggingface"], [19, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_500", 1319, 960, 0.7278241091736164, 7, "{\"stop:-\": 1312, \"length:-\": 7}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_500/actor/huggingface"], [20, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_500", 5000, 2428, 0.4856, 613, "{\"stop:-\": 4456, \"length:-\": 531, \"stop:Problem:\": 13}", "2m 28s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_500/actor/huggingface"], [21, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_550", 1319, 948, 0.7187263078089462, 9, "{\"stop:-\": 1310, \"length:-\": 9}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_550/actor/huggingface"], [22, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_550", 5000, 2445, 0.489, 602, "{\"stop:-\": 4474, \"length:-\": 512, \"stop:Problem:\": 14}", "2m 29s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_550/actor/huggingface"], [23, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_600", 1319, 959, 0.7270659590598939, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_600/actor/huggingface"], [24, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_600", 5000, 2485, 0.497, 610, "{\"stop:-\": 4465, \"length:-\": 522, \"stop:Problem:\": 13}", "2m 29s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_600/actor/huggingface"], [25, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_650", 1319, 960, 0.7278241091736164, 7, "{\"stop:-\": 1312, \"length:-\": 7}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_650/actor/huggingface"], [26, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_650", 5000, 2433, 0.4866, 602, "{\"stop:-\": 4480, \"length:-\": 507, \"stop:Problem:\": 13}", "2m 30s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_650/actor/huggingface"], [27, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_700", 1319, 964, 0.7308567096285065, 8, "{\"stop:-\": 1311, \"length:-\": 8}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_700/actor/huggingface"], [28, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_700", 5000, 2431, 0.4862, 625, "{\"stop:-\": 4451, \"length:-\": 534, \"stop:Problem:\": 15}", "2m 30s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_700/actor/huggingface"], [29, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_750", 1319, 960, 0.7278241091736164, 7, "{\"stop:-\": 1312, \"length:-\": 7}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_750/actor/huggingface"], [30, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_750", 5000, 2432, 0.4864, 652, "{\"stop:-\": 4414, \"length:-\": 573, \"stop:Problem:\": 13}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_750/actor/huggingface"], [31, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_800", 1319, 972, 0.7369219105382866, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_800/actor/huggingface"], [32, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_800", 5000, 2419, 0.4838, 623, "{\"stop:-\": 4450, \"length:-\": 533, \"stop:Problem:\": 17}", "2m 30s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_800/actor/huggingface"], [33, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_850", 1319, 967, 0.733131159969674, 10, "{\"stop:-\": 1309, \"length:-\": 10}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_850/actor/huggingface"], [34, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_850", 5000, 2442, 0.4884, 642, "{\"stop:-\": 4432, \"length:-\": 552, \"stop:Problem:\": 16}", "2m 31s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_850/actor/huggingface"], [35, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_900", 1319, 976, 0.7399545109931767, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_900/actor/huggingface"], [36, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_900", 5000, 2439, 0.4878, 599, "{\"stop:-\": 4469, \"length:-\": 516, \"stop:Problem:\": 15}", "2m 30s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_900/actor/huggingface"], [37, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_950", 1319, 971, 0.7361637604245641, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_950/actor/huggingface"], [38, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_950", 5000, 2458, 0.4916, 648, "{\"stop:-\": 4418, \"length:-\": 569, \"stop:Problem:\": 13}", "2m 31s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_950/actor/huggingface"], [39, "gsm8k_main(0)", "dsr-one-example-grpo_global_step_1000", 1319, 979, 0.7422289613343442, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_1000/actor/huggingface"], [40, "hendrycks_math(0)", "dsr-one-example-grpo_global_step_1000", 5000, 2469, 0.4938, 620, "{\"stop:-\": 4455, \"length:-\": 524, \"stop:Problem:\": 21}", "2m 30s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/dsr-one-example-grpo/global_step_1000/actor/huggingface"], [41, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_50", 1319, 962, 0.7293404094010614, 7, "{\"stop:-\": 1312, \"length:-\": 7}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_50/actor/huggingface"], [42, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_50", 5000, 2468, 0.4936, 637, "{\"stop:-\": 4438, \"length:-\": 559, \"stop:Problem:\": 3}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_50/actor/huggingface"], [43, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_100", 1319, 985, 0.7467778620166793, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_100/actor/huggingface"], [44, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_100", 5000, 2480, 0.496, 636, "{\"stop:-\": 4441, \"length:-\": 556, \"stop:Problem:\": 3}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_100/actor/huggingface"], [45, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_150", 1319, 982, 0.7445034116755117, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_150/actor/huggingface"], [46, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_150", 5000, 2499, 0.4998, 633, "{\"stop:-\": 4453, \"length:-\": 545, \"stop:Problem:\": 2}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_150/actor/huggingface"], [47, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_200", 1319, 986, 0.7475360121304018, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_200/actor/huggingface"], [48, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_200", 5000, 2451, 0.4902, 667, "{\"stop:-\": 4416, \"length:-\": 582, \"stop:Problem:\": 2}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_200/actor/huggingface"], [49, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_250", 1319, 969, 0.734647460197119, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "23s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_250/actor/huggingface"], [50, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_250", 5000, 2456, 0.4912, 630, "{\"stop:-\": 4452, \"length:-\": 545, \"stop:Problem:\": 3}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_250/actor/huggingface"], [51, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_300", 1319, 989, 0.7498104624715694, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_300/actor/huggingface"], [52, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_300", 5000, 2502, 0.5004, 620, "{\"stop:-\": 4460, \"length:-\": 537, \"stop:Problem:\": 3}", "2m 31s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_300/actor/huggingface"], [53, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_350", 1319, 974, 0.7384382107657316, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "24s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_350/actor/huggingface"], [54, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_350", 5000, 2493, 0.4986, 651, "{\"stop:-\": 4423, \"length:-\": 572, \"stop:Problem:\": 5}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_350/actor/huggingface"], [55, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_400", 1319, 984, 0.7460197119029568, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_400/actor/huggingface"], [56, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_400", 5000, 2501, 0.5002, 616, "{\"stop:-\": 4457, \"length:-\": 541, \"stop:Problem:\": 2}", "2m 36s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_400/actor/huggingface"], [57, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_450", 1319, 968, 0.7338893100833965, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "27s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_450/actor/huggingface"], [58, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_450", 5000, 2539, 0.5078, 597, "{\"stop:-\": 4481, \"length:-\": 516, \"stop:Problem:\": 3}", "2m 33s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_450/actor/huggingface"], [59, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_500", 1319, 978, 0.7414708112206216, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "27s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_500/actor/huggingface"], [60, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_500", 5000, 2474, 0.4948, 640, "{\"stop:-\": 4441, \"length:-\": 556, \"stop:Problem:\": 3}", "2m 34s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_500/actor/huggingface"], [61, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_550", 1319, 983, 0.7452615617892343, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "26s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_550/actor/huggingface"], [62, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_550", 5000, 2483, 0.4966, 600, "{\"stop:-\": 4480, \"length:-\": 519, \"stop:Problem:\": 1}", "2m 36s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_550/actor/huggingface"], [63, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_600", 1319, 985, 0.7467778620166793, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "26s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_600/actor/huggingface"], [64, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_600", 5000, 2485, 0.497, 618, "{\"stop:-\": 4457, \"length:-\": 539, \"stop:Problem:\": 4}", "2m 35s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_600/actor/huggingface"], [65, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_650", 1319, 971, 0.7361637604245641, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "26s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_650/actor/huggingface"], [66, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_650", 5000, 2463, 0.4926, 605, "{\"stop:-\": 4469, \"length:-\": 528, \"stop:Problem:\": 3}", "2m 35s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_650/actor/huggingface"], [67, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_700", 1319, 977, 0.7407126611068992, 1, "{\"stop:-\": 1318, \"length:-\": 1}", "26s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_700/actor/huggingface"], [68, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_700", 5000, 2473, 0.4946, 651, "{\"stop:-\": 4425, \"length:-\": 568, \"stop:Problem:\": 7}", "2m 37s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_700/actor/huggingface"], [69, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_750", 1319, 976, 0.7399545109931767, 4, "{\"stop:-\": 1315, \"length:-\": 4}", "27s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_750/actor/huggingface"], [70, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_750", 5000, 2457, 0.4914, 632, "{\"stop:-\": 4450, \"length:-\": 547, \"stop:Problem:\": 3}", "2m 35s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_750/actor/huggingface"], [71, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_800", 1319, 980, 0.7429871114480667, 8, "{\"stop:-\": 1311, \"length:-\": 8}", "26s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_800/actor/huggingface"], [72, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_800", 5000, 2471, 0.4942, 621, "{\"stop:-\": 4456, \"length:-\": 542, \"stop:Problem:\": 2}", "2m 36s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_800/actor/huggingface"], [73, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_850", 1319, 975, 0.7391963608794542, 2, "{\"stop:-\": 1317, \"length:-\": 2}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_850/actor/huggingface"], [74, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_850", 5000, 2439, 0.4878, 627, "{\"stop:-\": 4449, \"length:-\": 547, \"stop:Problem:\": 4}", "2m 36s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_850/actor/huggingface"], [75, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_900", 1319, 986, 0.7475360121304018, 5, "{\"stop:-\": 1314, \"length:-\": 5}", "26s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_900/actor/huggingface"], [76, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_900", 5000, 2474, 0.4948, 616, "{\"stop:-\": 4459, \"length:-\": 538, \"stop:Problem:\": 3}", "2m 32s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_900/actor/huggingface"], [77, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_950", 1319, 958, 0.7263078089461713, 6, "{\"stop:-\": 1313, \"length:-\": 6}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_950/actor/huggingface"], [78, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_950", 5000, 2447, 0.4894, 663, "{\"stop:-\": 4420, \"length:-\": 575, \"stop:Problem:\": 5}", "2m 40s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_950/actor/huggingface"], [79, "gsm8k_main(0)", "grpo-one-example-gsm8k_global_step_1000", 1319, 979, 0.7422289613343442, 3, "{\"stop:-\": 1316, \"length:-\": 3}", "25s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_1000/actor/huggingface"], [80, "hendrycks_math(0)", "grpo-one-example-gsm8k_global_step_1000", 5000, 2470, 0.494, 665, "{\"stop:-\": 4414, \"length:-\": 580, \"stop:Problem:\": 6}", "2m 40s", 1, 0.0, 0.95, 1024, null, "/mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-one-example-gsm8k/global_step_1000/actor/huggingface"], [81, "gsm8k_main(0)", "Qwen_Qwen2.5-1.5B-Instruct", 1319, 920, 0.6974981046247157, 44, "{\"stop:-\": 1311, \"length:-\": 8}", "26s", 1, 0.0, 0.95, 1024, null, "/mnt/2data/Documents/safetensors/Qwen_Qwen2.5-1.5B-Instruct"], [82, "hendrycks_math(0)", "Qwen_Qwen2.5-1.5B-Instruct", 5000, 2457, 0.4914, 625, "{\"stop:-\": 4461, \"length:-\": 533, \"stop:Problem:\": 6}", "2m 35s", 1, 0.0, 0.95, 1024, null, "/mnt/2data/Documents/safetensors/Qwen_Qwen2.5-1.5B-Instruct"], [83, "TOTAL", "41 models", 259079, 140807, 0.5434905955326368, 25911, "{}", "2h 06m 20s", 1, 0.0, 0.95, 1024, null, "Models: dsr-one-example-grpo_global_step_50, dsr-one-example-grpo_global_step_100, dsr-one-example-grpo_global_step_150, dsr-one-example-grpo_global_step_200, dsr-one-example-grpo_global_step_250, dsr-one-example-grpo_global_step_300, dsr-one-example-grpo_global_step_350, dsr-one-example-grpo_global_step_400, dsr-one-example-grpo_global_step_450, dsr-one-example-grpo_global_step_500, dsr-one-example-grpo_global_step_550, dsr-one-example-grpo_global_step_600, dsr-one-example-grpo_global_step_650, dsr-one-example-grpo_global_step_700, dsr-one-example-grpo_global_step_750, dsr-one-example-grpo_global_step_800, dsr-one-example-grpo_global_step_850, dsr-one-example-grpo_global_step_900, dsr-one-example-grpo_global_step_950, dsr-one-example-grpo_global_step_1000, grpo-one-example-gsm8k_global_step_50, grpo-one-example-gsm8k_global_step_100, grpo-one-example-gsm8k_global_step_150, grpo-one-example-gsm8k_global_step_200, grpo-one-example-gsm8k_global_step_250, grpo-one-example-gsm8k_global_step_300, grpo-one-example-gsm8k_global_step_350, grpo-one-example-gsm8k_global_step_400, grpo-one-example-gsm8k_global_step_450, grpo-one-example-gsm8k_global_step_500, grpo-one-example-gsm8k_global_step_550, grpo-one-example-gsm8k_global_step_600, grpo-one-example-gsm8k_global_step_650, grpo-one-example-gsm8k_global_step_700, grpo-one-example-gsm8k_global_step_750, grpo-one-example-gsm8k_global_step_800, grpo-one-example-gsm8k_global_step_850, grpo-one-example-gsm8k_global_step_900, grpo-one-example-gsm8k_global_step_950, grpo-one-example-gsm8k_global_step_1000, Qwen_Qwen2.5-1.5B-Instruct | Tasks: gsm8k_main(0), hendrycks_math(0)"]], "truncated": false, "filtered_table_rows_count": 83, "expanded_columns": [], "expandable_columns": [], "columns": ["id", "task_name", "model_tag", "total_examples", "correct", "accuracy", "no_answer_count", "stop_reason_counts", "duration_human", "pass_k", "temperature", "top_p", "max_tokens", "error", "model"], "primary_keys": ["id"], "units": {}, "query": {"sql": "select id, task_name, model_tag, total_examples, correct, accuracy, no_answer_count, stop_reason_counts, duration_human, pass_k, temperature, top_p, max_tokens, error, model from summaries order by id limit 101", "params": {}}, "facet_results": {}, "suggested_facets": [{"name": "task_name", "toggle_url": "http://jayminban-rlvr-vs-sft-qwen2-5-1-5b.hf.space/grpo-one-example/summaries.json?_facet=task_name"}, {"name": "total_examples", "toggle_url": "http://jayminban-rlvr-vs-sft-qwen2-5-1-5b.hf.space/grpo-one-example/summaries.json?_facet=total_examples"}, {"name": "duration_human", "toggle_url": "http://jayminban-rlvr-vs-sft-qwen2-5-1-5b.hf.space/grpo-one-example/summaries.json?_facet=duration_human"}], "next": null, "next_url": null, "private": false, "allow_execute_sql": true, "query_ms": 797.0934701152146}