summaries
165 rows
This data as json, CSV (advanced)
Suggested facets: task_name, total_examples, duration_human
| id ▼ | task_name | model_tag | total_examples | correct | accuracy | no_answer_count | stop_reason_counts | duration_human | pass_k | temperature | top_p | max_tokens | error | model |
|---|---|---|---|---|---|---|---|---|---|---|---|---|---|---|
| 1 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_50 | 1319 | 968 | 0.7338893100833965 | 4 | {"stop:-": 1315, "length:-": 4} | 25s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_50/actor/huggingface | |
| 2 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_50 | 5000 | 2469 | 0.4938 | 610 | {"stop:-": 4467, "length:-": 531, "stop:Problem:": 2} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_50/actor/huggingface | |
| 3 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_100 | 1319 | 980 | 0.7429871114480667 | 4 | {"stop:-": 1315, "length:-": 4} | 23s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_100/actor/huggingface | |
| 4 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_100 | 5000 | 2524 | 0.5048 | 635 | {"stop:-": 4439, "length:-": 561} | 2m 32s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_100/actor/huggingface | |
| 5 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_150 | 1319 | 986 | 0.7475360121304018 | 3 | {"stop:-": 1316, "length:-": 3} | 23s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_150/actor/huggingface | |
| 6 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_150 | 5000 | 2500 | 0.5 | 635 | {"stop:-": 4429, "length:-": 570, "stop:Problem:": 1} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_150/actor/huggingface | |
| 7 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_200 | 1319 | 1003 | 0.7604245640636846 | 4 | {"stop:-": 1315, "length:-": 4} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_200/actor/huggingface | |
| 8 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_200 | 5000 | 2484 | 0.4968 | 670 | {"stop:-": 4408, "length:-": 590, "stop:Problem:": 2} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_200/actor/huggingface | |
| 9 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_250 | 1319 | 1002 | 0.759666413949962 | 4 | {"stop:-": 1315, "length:-": 4} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_250/actor/huggingface | |
| 10 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_250 | 5000 | 2508 | 0.5016 | 636 | {"stop:-": 4442, "length:-": 557, "stop:Problem:": 1} | 2m 32s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_250/actor/huggingface | |
| 11 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_300 | 1319 | 991 | 0.7513267626990144 | 5 | {"stop:-": 1314, "length:-": 5} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_300/actor/huggingface | |
| 12 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_300 | 5000 | 2513 | 0.5026 | 641 | {"stop:-": 4436, "length:-": 563, "stop:Problem:": 1} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_300/actor/huggingface | |
| 13 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_350 | 1319 | 989 | 0.7498104624715694 | 3 | {"stop:-": 1316, "length:-": 3} | 25s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_350/actor/huggingface | |
| 14 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_350 | 5000 | 2504 | 0.5008 | 657 | {"stop:-": 4418, "length:-": 580, "stop:Problem:": 2} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_350/actor/huggingface | |
| 15 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_400 | 1319 | 1014 | 0.7687642153146323 | 4 | {"stop:-": 1315, "length:-": 4} | 23s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_400/actor/huggingface | |
| 16 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_400 | 5000 | 2538 | 0.5076 | 660 | {"stop:-": 4417, "length:-": 582, "stop:Problem:": 1} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_400/actor/huggingface | |
| 17 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_450 | 1319 | 1019 | 0.7725549658832449 | 10 | {"stop:-": 1309, "length:-": 10} | 25s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_450/actor/huggingface | |
| 18 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_450 | 5000 | 2539 | 0.5078 | 656 | {"stop:-": 4423, "length:-": 575, "stop:Problem:": 2} | 2m 35s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_450/actor/huggingface | |
| 19 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_500 | 1319 | 1002 | 0.759666413949962 | 8 | {"stop:-": 1311, "length:-": 8} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_500/actor/huggingface | |
| 20 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_500 | 5000 | 2531 | 0.5062 | 642 | {"stop:-": 4437, "length:-": 561, "stop:Problem:": 2} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_500/actor/huggingface | |
| 21 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_550 | 1319 | 1022 | 0.7748294162244125 | 4 | {"stop:-": 1315, "length:-": 4} | 23s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_550/actor/huggingface | |
| 22 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_550 | 5000 | 2521 | 0.5042 | 633 | {"stop:-": 4458, "length:-": 539, "stop:Problem:": 3} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_550/actor/huggingface | |
| 23 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_600 | 1319 | 1027 | 0.778620166793025 | 7 | {"stop:-": 1312, "length:-": 7} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_600/actor/huggingface | |
| 24 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_600 | 5000 | 2565 | 0.513 | 628 | {"stop:-": 4443, "length:-": 555, "stop:Problem:": 2} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_600/actor/huggingface | |
| 25 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_650 | 1319 | 1028 | 0.7793783169067475 | 2 | {"stop:-": 1317, "length:-": 2} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_650/actor/huggingface | |
| 26 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_650 | 5000 | 2557 | 0.5114 | 628 | {"stop:-": 4442, "length:-": 557, "stop:Problem:": 1} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_650/actor/huggingface | |
| 27 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_700 | 1319 | 1027 | 0.778620166793025 | 6 | {"stop:-": 1313, "length:-": 6} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_700/actor/huggingface | |
| 28 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_700 | 5000 | 2529 | 0.5058 | 642 | {"stop:-": 4428, "length:-": 571, "stop:Problem:": 1} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_700/actor/huggingface | |
| 29 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_750 | 1319 | 1037 | 0.7862016679302501 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_750/actor/huggingface | |
| 30 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_750 | 5000 | 2539 | 0.5078 | 609 | {"stop:-": 4468, "length:-": 530, "stop:Problem:": 2} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_750/actor/huggingface | |
| 31 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_800 | 1319 | 1041 | 0.7892342683851402 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_800/actor/huggingface | |
| 32 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_800 | 5000 | 2536 | 0.5072 | 622 | {"stop:-": 4455, "length:-": 543, "stop:Problem:": 2} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_800/actor/huggingface | |
| 33 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_850 | 1319 | 1044 | 0.7915087187263078 | 1 | {"stop:-": 1318, "length:-": 1} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_850/actor/huggingface | |
| 34 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_850 | 5000 | 2585 | 0.517 | 620 | {"stop:-": 4459, "length:-": 539, "stop:Problem:": 2} | 2m 31s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_850/actor/huggingface | |
| 35 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_900 | 1319 | 1048 | 0.7945413191811979 | 4 | {"stop:-": 1315, "length:-": 4} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_900/actor/huggingface | |
| 36 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_900 | 5000 | 2568 | 0.5136 | 635 | {"stop:-": 4444, "length:-": 553, "stop:Problem:": 3} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_900/actor/huggingface | |
| 37 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_950 | 1319 | 1051 | 0.7968157695223654 | 1 | {"stop:-": 1318, "length:-": 1} | 23s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_950/actor/huggingface | |
| 38 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_950 | 5000 | 2565 | 0.513 | 609 | {"stop:-": 4461, "length:-": 537, "stop:Problem:": 2} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_950/actor/huggingface | |
| 39 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1000 | 1319 | 1029 | 0.78013646702047 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1000/actor/huggingface | |
| 40 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1000 | 5000 | 2596 | 0.5192 | 619 | {"stop:-": 4450, "length:-": 548, "stop:Problem:": 2} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1000/actor/huggingface | |
| 41 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1050 | 1319 | 1040 | 0.7884761182714177 | 4 | {"stop:-": 1315, "length:-": 4} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1050/actor/huggingface | |
| 42 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1050 | 5000 | 2568 | 0.5136 | 612 | {"stop:-": 4460, "length:-": 538, "stop:Problem:": 2} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1050/actor/huggingface | |
| 43 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1100 | 1319 | 1033 | 0.7831690674753601 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1100/actor/huggingface | |
| 44 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1100 | 5000 | 2575 | 0.515 | 612 | {"stop:-": 4460, "length:-": 538, "stop:Problem:": 2} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1100/actor/huggingface | |
| 45 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1150 | 1319 | 1040 | 0.7884761182714177 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1150/actor/huggingface | |
| 46 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1150 | 5000 | 2585 | 0.517 | 631 | {"stop:-": 4444, "length:-": 555, "stop:Problem:": 1} | 2m 35s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1150/actor/huggingface | |
| 47 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1200 | 1319 | 1038 | 0.7869598180439727 | 2 | {"stop:-": 1317, "length:-": 2} | 25s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1200/actor/huggingface | |
| 48 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1200 | 5000 | 2570 | 0.514 | 644 | {"stop:-": 4422, "length:-": 576, "stop:Problem:": 2} | 2m 38s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1200/actor/huggingface | |
| 49 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1250 | 1319 | 1039 | 0.7877179681576952 | 2 | {"stop:-": 1317, "length:-": 2} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1250/actor/huggingface | |
| 50 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1250 | 5000 | 2571 | 0.5142 | 655 | {"stop:-": 4421, "length:-": 576, "stop:Problem:": 3} | 2m 38s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1250/actor/huggingface | |
| 51 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1300 | 1319 | 1041 | 0.7892342683851402 | 7 | {"stop:-": 1312, "length:-": 7} | 25s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1300/actor/huggingface | |
| 52 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1300 | 5000 | 2592 | 0.5184 | 638 | {"stop:-": 4434, "length:-": 564, "stop:Problem:": 2} | 2m 40s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1300/actor/huggingface | |
| 53 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1350 | 1319 | 1049 | 0.7952994692949203 | 2 | {"stop:-": 1317, "length:-": 2} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1350/actor/huggingface | |
| 54 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1350 | 5000 | 2572 | 0.5144 | 649 | {"stop:-": 4425, "length:-": 574, "stop:Problem:": 1} | 2m 36s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1350/actor/huggingface | |
| 55 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1400 | 1319 | 1054 | 0.799090219863533 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1400/actor/huggingface | |
| 56 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1400 | 5000 | 2554 | 0.5108 | 655 | {"stop:-": 4420, "length:-": 579, "stop:Problem:": 1} | 2m 36s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1400/actor/huggingface | |
| 57 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1450 | 1319 | 1052 | 0.7975739196360879 | 6 | {"stop:-": 1313, "length:-": 6} | 25s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1450/actor/huggingface | |
| 58 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1450 | 5000 | 2593 | 0.5186 | 662 | {"stop:-": 4411, "length:-": 585, "stop:Problem:": 4} | 2m 37s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1450/actor/huggingface | |
| 59 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1500 | 1319 | 1045 | 0.7922668688400303 | 7 | {"stop:-": 1312, "length:-": 7} | 25s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1500/actor/huggingface | |
| 60 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1500 | 5000 | 2595 | 0.519 | 634 | {"stop:-": 4438, "length:-": 559, "stop:Problem:": 3} | 2m 38s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1500/actor/huggingface | |
| 61 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1550 | 1319 | 1058 | 0.8021228203184231 | 4 | {"stop:-": 1315, "length:-": 4} | 25s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1550/actor/huggingface | |
| 62 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1550 | 5000 | 2590 | 0.518 | 608 | {"stop:-": 4476, "length:-": 520, "stop:Problem:": 4} | 2m 36s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1550/actor/huggingface | |
| 63 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1600 | 1319 | 1051 | 0.7968157695223654 | 5 | {"stop:-": 1314, "length:-": 5} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1600/actor/huggingface | |
| 64 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1600 | 5000 | 2595 | 0.519 | 572 | {"stop:-": 4498, "length:-": 498, "stop:Problem:": 4} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1600/actor/huggingface | |
| 65 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1650 | 1319 | 1044 | 0.7915087187263078 | 2 | {"stop:-": 1317, "length:-": 2} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1650/actor/huggingface | |
| 66 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1650 | 5000 | 2573 | 0.5146 | 564 | {"stop:-": 4507, "length:-": 491, "stop:Problem:": 2} | 2m 32s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1650/actor/huggingface | |
| 67 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1700 | 1319 | 1058 | 0.8021228203184231 | 2 | {"stop:-": 1317, "length:-": 2} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1700/actor/huggingface | |
| 68 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1700 | 5000 | 2581 | 0.5162 | 604 | {"stop:-": 4468, "length:-": 531, "stop:Problem:": 1} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1700/actor/huggingface | |
| 69 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1750 | 1319 | 1044 | 0.7915087187263078 | 2 | {"stop:-": 1317, "length:-": 2} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1750/actor/huggingface | |
| 70 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1750 | 5000 | 2578 | 0.5156 | 612 | {"stop:-": 4458, "length:-": 540, "stop:Problem:": 2} | 2m 35s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1750/actor/huggingface | |
| 71 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1800 | 1319 | 1060 | 0.8036391205458681 | 2 | {"stop:-": 1317, "length:-": 2} | 23s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1800/actor/huggingface | |
| 72 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1800 | 5000 | 2591 | 0.5182 | 613 | {"stop:-": 4470, "length:-": 526, "stop:Problem:": 4} | 2m 35s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1800/actor/huggingface | |
| 73 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1850 | 1319 | 1044 | 0.7915087187263078 | 2 | {"stop:-": 1317, "length:-": 2} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1850/actor/huggingface | |
| 74 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1850 | 5000 | 2545 | 0.509 | 585 | {"stop:-": 4494, "length:-": 504, "stop:Problem:": 2} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1850/actor/huggingface | |
| 75 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1900 | 1319 | 1049 | 0.7952994692949203 | 6 | {"stop:-": 1313, "length:-": 6} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1900/actor/huggingface | |
| 76 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1900 | 5000 | 2577 | 0.5154 | 591 | {"stop:-": 4480, "length:-": 520} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1900/actor/huggingface | |
| 77 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_1950 | 1319 | 1057 | 0.8013646702047005 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1950/actor/huggingface | |
| 78 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_1950 | 5000 | 2610 | 0.522 | 572 | {"stop:-": 4499, "length:-": 501} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_1950/actor/huggingface | |
| 79 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2000 | 1319 | 1046 | 0.7930250189537529 | 5 | {"stop:-": 1314, "length:-": 5} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2000/actor/huggingface | |
| 80 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2000 | 5000 | 2603 | 0.5206 | 573 | {"stop:-": 4504, "length:-": 496} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2000/actor/huggingface | |
| 81 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2050 | 1319 | 1055 | 0.7998483699772555 | 2 | {"stop:-": 1317, "length:-": 2} | 23s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2050/actor/huggingface | |
| 82 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2050 | 5000 | 2576 | 0.5152 | 584 | {"stop:-": 4501, "length:-": 498, "stop:Problem:": 1} | 2m 32s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2050/actor/huggingface | |
| 83 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2100 | 1319 | 1063 | 0.8059135708870356 | 5 | {"stop:-": 1314, "length:-": 5} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2100/actor/huggingface | |
| 84 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2100 | 5000 | 2592 | 0.5184 | 607 | {"stop:-": 4470, "length:-": 529, "stop:Problem:": 1} | 2m 37s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2100/actor/huggingface | |
| 85 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2150 | 1319 | 1060 | 0.8036391205458681 | 5 | {"stop:-": 1314, "length:-": 5} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2150/actor/huggingface | |
| 86 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2150 | 5000 | 2606 | 0.5212 | 641 | {"stop:-": 4434, "length:-": 563, "stop:Problem:": 3} | 2m 36s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2150/actor/huggingface | |
| 87 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2200 | 1319 | 1069 | 0.8104624715693708 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2200/actor/huggingface | |
| 88 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2200 | 5000 | 2580 | 0.516 | 609 | {"stop:-": 4462, "length:-": 536, "stop:Problem:": 2} | 2m 34s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2200/actor/huggingface | |
| 89 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2250 | 1319 | 1064 | 0.8066717210007581 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2250/actor/huggingface | |
| 90 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2250 | 5000 | 2584 | 0.5168 | 580 | {"stop:-": 4494, "length:-": 504, "stop:Problem:": 2} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2250/actor/huggingface | |
| 91 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2300 | 1319 | 1063 | 0.8059135708870356 | 5 | {"stop:-": 1314, "length:-": 5} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2300/actor/huggingface | |
| 92 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2300 | 5000 | 2574 | 0.5148 | 586 | {"stop:-": 4490, "length:-": 507, "stop:Problem:": 3} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2300/actor/huggingface | |
| 93 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2350 | 1319 | 1050 | 0.796057619408643 | 6 | {"stop:-": 1313, "length:-": 6} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2350/actor/huggingface | |
| 94 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2350 | 5000 | 2595 | 0.519 | 586 | {"stop:-": 4490, "length:-": 507, "stop:Problem:": 3} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2350/actor/huggingface | |
| 95 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2400 | 1319 | 1061 | 0.8043972706595905 | 4 | {"stop:-": 1315, "length:-": 4} | 25s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2400/actor/huggingface | |
| 96 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2400 | 5000 | 2599 | 0.5198 | 603 | {"stop:-": 4468, "length:-": 530, "stop:Problem:": 2} | 2m 35s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2400/actor/huggingface | |
| 97 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2450 | 1319 | 1045 | 0.7922668688400303 | 3 | {"stop:-": 1316, "length:-": 3} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2450/actor/huggingface | |
| 98 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2450 | 5000 | 2605 | 0.521 | 542 | {"stop:-": 4526, "length:-": 472, "stop:Problem:": 2} | 2m 30s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2450/actor/huggingface | |
| 99 | gsm8k_main(0) | grpo-gsm8k-train-13ep-success_global_step_2500 | 1319 | 1045 | 0.7922668688400303 | 7 | {"stop:-": 1312, "length:-": 7} | 24s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2500/actor/huggingface | |
| 100 | hendrycks_math(0) | grpo-gsm8k-train-13ep-success_global_step_2500 | 5000 | 2598 | 0.5196 | 567 | {"stop:-": 4505, "length:-": 493, "stop:Problem:": 2} | 2m 33s | 1 | 0.0 | 0.95 | 1024 | /mnt/data8tb/Documents/project/rlvr_winter/verl-my-rlvr/finished-models/grpo-gsm8k-train-13ep-success/global_step_2500/actor/huggingface |
Advanced export
JSON shape: default, array, newline-delimited, object
-- One row per (evaluation task, model checkpoint) run summary.
CREATE TABLE summaries (
    -- Surrogate key, assigned by SQLite.
    id                  INTEGER PRIMARY KEY AUTOINCREMENT,

    -- Which run this is.
    task_name           TEXT NOT NULL,   -- e.g. 'gsm8k_main(0)', 'hendrycks_math(0)'
    model_tag           TEXT NOT NULL,   -- e.g. 'grpo-gsm8k-train-13ep-success_global_step_50'

    -- Outcome counters. In the sample rows accuracy = correct / total_examples.
    total_examples      INTEGER,
    correct             INTEGER,
    accuracy            REAL,
    no_answer_count     INTEGER,         -- presumably examples with no extractable answer; TODO confirm
    stop_reason_counts  TEXT,            -- JSON object as text, e.g. {"stop:-": 1315, "length:-": 4}
    duration_human      TEXT,            -- human-readable elapsed time, e.g. '25s', '2m 34s'

    -- Generation settings recorded for the run (sample rows: 1, 0.0, 0.95, 1024).
    pass_k              INTEGER,
    temperature         REAL,
    top_p               REAL,
    max_tokens          INTEGER,

    -- Nullable; presumably a failure message for runs that did not complete; TODO confirm.
    error               TEXT,
    -- Required; presumably the model/checkpoint location; verify against the writer.
    model               TEXT NOT NULL
);
-- Secondary index on summaries.model_tag (lookups of all rows for one model tag).
CREATE INDEX idx_summaries_model
    ON summaries (model_tag);

-- Secondary index on summaries.task_name (lookups of all rows for one task).
CREATE INDEX idx_summaries_task
    ON summaries (task_name);