home / grpo-gsm8k-train

summaries

165 rows

✎ View and edit SQL

This data as json, CSV (advanced)

Suggested facets: task_name, total_examples, duration_human

id ▼ task_name model_tag total_examples correct accuracy no_answer_count stop_reason_counts duration_human pass_k temperature top_p max_tokens error model
1 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_50 1319 968 0.7338893100833965 4 {"stop:-": 1315, "length:-": 4} 25s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_50/actor/huggingface
2 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_50 5000 2469 0.4938 610 {"stop:-": 4467, "length:-": 531, "stop:Problem:": 2} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_50/actor/huggingface
3 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_100 1319 980 0.7429871114480667 4 {"stop:-": 1315, "length:-": 4} 23s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_100/actor/huggingface
4 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_100 5000 2524 0.5048 635 {"stop:-": 4439, "length:-": 561} 2m 32s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_100/actor/huggingface
5 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_150 1319 986 0.7475360121304018 3 {"stop:-": 1316, "length:-": 3} 23s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_150/actor/huggingface
6 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_150 5000 2500 0.5 635 {"stop:-": 4429, "length:-": 570, "stop:Problem:": 1} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_150/actor/huggingface
7 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_200 1319 1003 0.7604245640636846 4 {"stop:-": 1315, "length:-": 4} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_200/actor/huggingface
8 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_200 5000 2484 0.4968 670 {"stop:-": 4408, "length:-": 590, "stop:Problem:": 2} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_200/actor/huggingface
9 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_250 1319 1002 0.759666413949962 4 {"stop:-": 1315, "length:-": 4} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_250/actor/huggingface
10 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_250 5000 2508 0.5016 636 {"stop:-": 4442, "length:-": 557, "stop:Problem:": 1} 2m 32s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_250/actor/huggingface
11 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_300 1319 991 0.7513267626990144 5 {"stop:-": 1314, "length:-": 5} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_300/actor/huggingface
12 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_300 5000 2513 0.5026 641 {"stop:-": 4436, "length:-": 563, "stop:Problem:": 1} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_300/actor/huggingface
13 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_350 1319 989 0.7498104624715694 3 {"stop:-": 1316, "length:-": 3} 25s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_350/actor/huggingface
14 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_350 5000 2504 0.5008 657 {"stop:-": 4418, "length:-": 580, "stop:Problem:": 2} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_350/actor/huggingface
15 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_400 1319 1014 0.7687642153146323 4 {"stop:-": 1315, "length:-": 4} 23s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_400/actor/huggingface
16 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_400 5000 2538 0.5076 660 {"stop:-": 4417, "length:-": 582, "stop:Problem:": 1} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_400/actor/huggingface
17 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_450 1319 1019 0.7725549658832449 10 {"stop:-": 1309, "length:-": 10} 25s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_450/actor/huggingface
18 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_450 5000 2539 0.5078 656 {"stop:-": 4423, "length:-": 575, "stop:Problem:": 2} 2m 35s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_450/actor/huggingface
19 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_500 1319 1002 0.759666413949962 8 {"stop:-": 1311, "length:-": 8} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_500/actor/huggingface
20 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_500 5000 2531 0.5062 642 {"stop:-": 4437, "length:-": 561, "stop:Problem:": 2} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_500/actor/huggingface
21 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_550 1319 1022 0.7748294162244125 4 {"stop:-": 1315, "length:-": 4} 23s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_550/actor/huggingface
22 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_550 5000 2521 0.5042 633 {"stop:-": 4458, "length:-": 539, "stop:Problem:": 3} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_550/actor/huggingface
23 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_600 1319 1027 0.778620166793025 7 {"stop:-": 1312, "length:-": 7} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_600/actor/huggingface
24 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_600 5000 2565 0.513 628 {"stop:-": 4443, "length:-": 555, "stop:Problem:": 2} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_600/actor/huggingface
25 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_650 1319 1028 0.7793783169067475 2 {"stop:-": 1317, "length:-": 2} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_650/actor/huggingface
26 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_650 5000 2557 0.5114 628 {"stop:-": 4442, "length:-": 557, "stop:Problem:": 1} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_650/actor/huggingface
27 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_700 1319 1027 0.778620166793025 6 {"stop:-": 1313, "length:-": 6} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_700/actor/huggingface
28 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_700 5000 2529 0.5058 642 {"stop:-": 4428, "length:-": 571, "stop:Problem:": 1} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_700/actor/huggingface
29 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_750 1319 1037 0.7862016679302501 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_750/actor/huggingface
30 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_750 5000 2539 0.5078 609 {"stop:-": 4468, "length:-": 530, "stop:Problem:": 2} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_750/actor/huggingface
31 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_800 1319 1041 0.7892342683851402 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_800/actor/huggingface
32 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_800 5000 2536 0.5072 622 {"stop:-": 4455, "length:-": 543, "stop:Problem:": 2} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_800/actor/huggingface
33 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_850 1319 1044 0.7915087187263078 1 {"stop:-": 1318, "length:-": 1} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_850/actor/huggingface
34 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_850 5000 2585 0.517 620 {"stop:-": 4459, "length:-": 539, "stop:Problem:": 2} 2m 31s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_850/actor/huggingface
35 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_900 1319 1048 0.7945413191811979 4 {"stop:-": 1315, "length:-": 4} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_900/actor/huggingface
36 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_900 5000 2568 0.5136 635 {"stop:-": 4444, "length:-": 553, "stop:Problem:": 3} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_900/actor/huggingface
37 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_950 1319 1051 0.7968157695223654 1 {"stop:-": 1318, "length:-": 1} 23s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_950/actor/huggingface
38 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_950 5000 2565 0.513 609 {"stop:-": 4461, "length:-": 537, "stop:Problem:": 2} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_950/actor/huggingface
39 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1000 1319 1029 0.78013646702047 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1000/actor/huggingface
40 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1000 5000 2596 0.5192 619 {"stop:-": 4450, "length:-": 548, "stop:Problem:": 2} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1000/actor/huggingface
41 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1050 1319 1040 0.7884761182714177 4 {"stop:-": 1315, "length:-": 4} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1050/actor/huggingface
42 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1050 5000 2568 0.5136 612 {"stop:-": 4460, "length:-": 538, "stop:Problem:": 2} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1050/actor/huggingface
43 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1100 1319 1033 0.7831690674753601 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1100/actor/huggingface
44 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1100 5000 2575 0.515 612 {"stop:-": 4460, "length:-": 538, "stop:Problem:": 2} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1100/actor/huggingface
45 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1150 1319 1040 0.7884761182714177 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1150/actor/huggingface
46 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1150 5000 2585 0.517 631 {"stop:-": 4444, "length:-": 555, "stop:Problem:": 1} 2m 35s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1150/actor/huggingface
47 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1200 1319 1038 0.7869598180439727 2 {"stop:-": 1317, "length:-": 2} 25s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1200/actor/huggingface
48 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1200 5000 2570 0.514 644 {"stop:-": 4422, "length:-": 576, "stop:Problem:": 2} 2m 38s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1200/actor/huggingface
49 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1250 1319 1039 0.7877179681576952 2 {"stop:-": 1317, "length:-": 2} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1250/actor/huggingface
50 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1250 5000 2571 0.5142 655 {"stop:-": 4421, "length:-": 576, "stop:Problem:": 3} 2m 38s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1250/actor/huggingface
51 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1300 1319 1041 0.7892342683851402 7 {"stop:-": 1312, "length:-": 7} 25s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1300/actor/huggingface
52 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1300 5000 2592 0.5184 638 {"stop:-": 4434, "length:-": 564, "stop:Problem:": 2} 2m 40s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1300/actor/huggingface
53 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1350 1319 1049 0.7952994692949203 2 {"stop:-": 1317, "length:-": 2} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1350/actor/huggingface
54 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1350 5000 2572 0.5144 649 {"stop:-": 4425, "length:-": 574, "stop:Problem:": 1} 2m 36s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1350/actor/huggingface
55 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1400 1319 1054 0.799090219863533 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1400/actor/huggingface
56 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1400 5000 2554 0.5108 655 {"stop:-": 4420, "length:-": 579, "stop:Problem:": 1} 2m 36s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1400/actor/huggingface
57 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1450 1319 1052 0.7975739196360879 6 {"stop:-": 1313, "length:-": 6} 25s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1450/actor/huggingface
58 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1450 5000 2593 0.5186 662 {"stop:-": 4411, "length:-": 585, "stop:Problem:": 4} 2m 37s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1450/actor/huggingface
59 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1500 1319 1045 0.7922668688400303 7 {"stop:-": 1312, "length:-": 7} 25s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1500/actor/huggingface
60 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1500 5000 2595 0.519 634 {"stop:-": 4438, "length:-": 559, "stop:Problem:": 3} 2m 38s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1500/actor/huggingface
61 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1550 1319 1058 0.8021228203184231 4 {"stop:-": 1315, "length:-": 4} 25s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1550/actor/huggingface
62 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1550 5000 2590 0.518 608 {"stop:-": 4476, "length:-": 520, "stop:Problem:": 4} 2m 36s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1550/actor/huggingface
63 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1600 1319 1051 0.7968157695223654 5 {"stop:-": 1314, "length:-": 5} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1600/actor/huggingface
64 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1600 5000 2595 0.519 572 {"stop:-": 4498, "length:-": 498, "stop:Problem:": 4} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1600/actor/huggingface
65 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1650 1319 1044 0.7915087187263078 2 {"stop:-": 1317, "length:-": 2} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1650/actor/huggingface
66 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1650 5000 2573 0.5146 564 {"stop:-": 4507, "length:-": 491, "stop:Problem:": 2} 2m 32s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1650/actor/huggingface
67 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1700 1319 1058 0.8021228203184231 2 {"stop:-": 1317, "length:-": 2} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1700/actor/huggingface
68 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1700 5000 2581 0.5162 604 {"stop:-": 4468, "length:-": 531, "stop:Problem:": 1} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1700/actor/huggingface
69 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1750 1319 1044 0.7915087187263078 2 {"stop:-": 1317, "length:-": 2} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1750/actor/huggingface
70 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1750 5000 2578 0.5156 612 {"stop:-": 4458, "length:-": 540, "stop:Problem:": 2} 2m 35s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1750/actor/huggingface
71 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1800 1319 1060 0.8036391205458681 2 {"stop:-": 1317, "length:-": 2} 23s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1800/actor/huggingface
72 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1800 5000 2591 0.5182 613 {"stop:-": 4470, "length:-": 526, "stop:Problem:": 4} 2m 35s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1800/actor/huggingface
73 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1850 1319 1044 0.7915087187263078 2 {"stop:-": 1317, "length:-": 2} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1850/actor/huggingface
74 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1850 5000 2545 0.509 585 {"stop:-": 4494, "length:-": 504, "stop:Problem:": 2} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1850/actor/huggingface
75 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1900 1319 1049 0.7952994692949203 6 {"stop:-": 1313, "length:-": 6} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1900/actor/huggingface
76 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1900 5000 2577 0.5154 591 {"stop:-": 4480, "length:-": 520} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1900/actor/huggingface
77 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_1950 1319 1057 0.8013646702047005 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1950/actor/huggingface
78 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_1950 5000 2610 0.522 572 {"stop:-": 4499, "length:-": 501} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1950/actor/huggingface
79 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2000 1319 1046 0.7930250189537529 5 {"stop:-": 1314, "length:-": 5} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2000/actor/huggingface
80 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2000 5000 2603 0.5206 573 {"stop:-": 4504, "length:-": 496} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2000/actor/huggingface
81 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2050 1319 1055 0.7998483699772555 2 {"stop:-": 1317, "length:-": 2} 23s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2050/actor/huggingface
82 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2050 5000 2576 0.5152 584 {"stop:-": 4501, "length:-": 498, "stop:Problem:": 1} 2m 32s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2050/actor/huggingface
83 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2100 1319 1063 0.8059135708870356 5 {"stop:-": 1314, "length:-": 5} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2100/actor/huggingface
84 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2100 5000 2592 0.5184 607 {"stop:-": 4470, "length:-": 529, "stop:Problem:": 1} 2m 37s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2100/actor/huggingface
85 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2150 1319 1060 0.8036391205458681 5 {"stop:-": 1314, "length:-": 5} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2150/actor/huggingface
86 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2150 5000 2606 0.5212 641 {"stop:-": 4434, "length:-": 563, "stop:Problem:": 3} 2m 36s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2150/actor/huggingface
87 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2200 1319 1069 0.8104624715693708 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2200/actor/huggingface
88 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2200 5000 2580 0.516 609 {"stop:-": 4462, "length:-": 536, "stop:Problem:": 2} 2m 34s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2200/actor/huggingface
89 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2250 1319 1064 0.8066717210007581 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2250/actor/huggingface
90 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2250 5000 2584 0.5168 580 {"stop:-": 4494, "length:-": 504, "stop:Problem:": 2} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2250/actor/huggingface
91 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2300 1319 1063 0.8059135708870356 5 {"stop:-": 1314, "length:-": 5} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2300/actor/huggingface
92 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2300 5000 2574 0.5148 586 {"stop:-": 4490, "length:-": 507, "stop:Problem:": 3} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2300/actor/huggingface
93 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2350 1319 1050 0.796057619408643 6 {"stop:-": 1313, "length:-": 6} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2350/actor/huggingface
94 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2350 5000 2595 0.519 586 {"stop:-": 4490, "length:-": 507, "stop:Problem:": 3} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2350/actor/huggingface
95 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2400 1319 1061 0.8043972706595905 4 {"stop:-": 1315, "length:-": 4} 25s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2400/actor/huggingface
96 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2400 5000 2599 0.5198 603 {"stop:-": 4468, "length:-": 530, "stop:Problem:": 2} 2m 35s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2400/actor/huggingface
97 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2450 1319 1045 0.7922668688400303 3 {"stop:-": 1316, "length:-": 3} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2450/actor/huggingface
98 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2450 5000 2605 0.521 542 {"stop:-": 4526, "length:-": 472, "stop:Problem:": 2} 2m 30s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2450/actor/huggingface
99 gsm8k_main(0) grpo-gsm8k-train-13ep-success_global_step_2500 1319 1045 0.7922668688400303 7 {"stop:-": 1312, "length:-": 7} 24s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2500/actor/huggingface
100 hendrycks_math(0) grpo-gsm8k-train-13ep-success_global_step_2500 5000 2598 0.5196 567 {"stop:-": 4505, "length:-": 493, "stop:Problem:": 2} 2m 33s 1 0.0 0.95 1024   /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2500/actor/huggingface

Next page

Advanced export

JSON shape: default, array, newline-delimited, object

CSV options:

-- summaries: each row records the outcome of one evaluation task run against
-- one model checkpoint (e.g. task 'gsm8k_main(0)' on tag
-- 'grpo-gsm8k-train-13ep-success_global_step_50').
CREATE TABLE summaries (
    -- Surrogate key, assigned by SQLite on insert.
    id INTEGER PRIMARY KEY AUTOINCREMENT,

    -- Benchmark/task label, e.g. 'gsm8k_main(0)' or 'hendrycks_math(0)'.
    task_name TEXT NOT NULL,
    -- Short label for the checkpoint, e.g. '<run-name>_global_step_<N>'.
    model_tag TEXT NOT NULL,

    -- Number of examples scored in the run.
    total_examples INTEGER,
    -- Number of those examples marked correct.
    correct INTEGER,
    -- Equals correct / total_examples in the rows inspected (968 / 1319 = 0.7338...).
    accuracy REAL,
    -- NOTE(review): presumably the count of responses with no extractable
    -- answer -- confirm against the code that writes this table.
    no_answer_count INTEGER,
    -- JSON object stored as text, mapping a stop-reason key to a count,
    -- e.g. {"stop:-": 1315, "length:-": 4}; the counts sum to total_examples
    -- in the rows inspected.
    stop_reason_counts TEXT,
    -- Human-readable wall-clock duration, e.g. '25s' or '2m 34s'.
    duration_human TEXT,

    -- NOTE(review): presumably the k of pass@k; 1 in every row inspected.
    pass_k INTEGER,
    -- Generation settings recorded with the run (0.0 / 0.95 / 1024 in the rows
    -- inspected). NOTE(review): presumably the sampling parameters -- confirm.
    temperature REAL,
    top_p REAL,
    max_tokens INTEGER,

    -- Empty in every row inspected. NOTE(review): presumably a failure message
    -- when a run errors -- confirm against the writer.
    error TEXT,
    -- Model location; a filesystem path to a checkpoint directory in the rows
    -- inspected.
    model TEXT NOT NULL
);
-- Secondary indexes on the two label columns of summaries, so lookups by
-- checkpoint tag or by task name need not scan the whole table.
CREATE INDEX idx_summaries_model
    ON summaries (model_tag);

CREATE INDEX idx_summaries_task
    ON summaries (task_name);
Powered by Datasette · Queries took 29.706ms