rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step437 3B • Updated 19 days ago • 36
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2_lr1e-6-constant-warmup_0-bs32-gc1.0-cc0.01-ls0-step150 3B • Updated 19 days ago • 111
rlsamplingJF/Qwen2.5-3B-Instruct-finemath_part1_part2-lr1e-6-constant-warmup_0-bs8-gc1.0-cc0.01-step120 3B • Updated 22 days ago • 35
rlsamplingJF/evolm-4B-160BT-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step180 4B • Updated 23 days ago • 17
rlsamplingJF/Qwen2.5-7B-Instruct-finemath_part1-rm-lr1e-6-constant-warmup_0.05-bs8-gc1.0-cc0.01-ls0.1-step45 7B • Updated 24 days ago • 38
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step375 3B • Updated 25 days ago • 40
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-step345 3B • Updated 26 days ago • 41
rlsamplingJF/evolm-4B-160BT-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-initial 4B • Updated 26 days ago • 20
rlsamplingJF/evolm-4B-160BT-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step120 4B • Updated 26 days ago • 24
rlsamplingJF/Llama-3.2-1B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0.1-step150 1B • Updated 27 days ago • 15
rlsamplingJF/Llama-3.2-1B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0-ls0-initial 1B • Updated 27 days ago • 21
rlsamplingJF/Llama-3.2-1B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0-ls0-step405 1B • Updated 27 days ago • 18
rlsamplingJF/Qwen2.5-7B-Instruct-finemath_part1-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0.1-step30 7B • Updated 27 days ago • 28
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-5-constant-warmup_0.05-bs44-gc1.0-step105 3B • Updated 28 days ago • 17
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs32-gc1.0-step195 3B • Updated 29 days ago • 45
rlsamplingJF/Qwen2.5-7B-Instruct-finemath_part1-rm-lr5e-7-constant-warmup_0.05-bs8-gc1.0-cc0.0-ls0.0-initial 7B • Updated 29 days ago • 97
rlsamplingJF/Qwen2.5-7B-Instruct-finemath_part1-rm-lr5e-7-constant-warmup_0.05-bs8-gc1.0-cc0.0-ls0.0-step105 7B • Updated 29 days ago • 23
rlsamplingJF/Qwen2.5-7B-Instruct-finemath_part1-rm-lr1e-6-constant-warmup_0.05-bs8-gc1.0-step60 7B • Updated 29 days ago • 129
rlsamplingJF/Llama-3.2-3B-finemath_part1-rm-lr1e-6-constant-warmup_0.05-bs32-gc1.0-cc0.01-ls0-initial 3B • Updated 30 days ago • 58
rlsamplingJF/Llama-3.2-3B-finemath_part1-rm-lr1e-6-constant-warmup_0.05-bs32-gc1.0-cc0.01-ls0-step109 3B • Updated 30 days ago • 42
rlsamplingJF/Llama-3.2-3B-finemath_part1-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-initial 3B • Updated about 1 month ago • 17
rlsamplingJF/Llama-3.2-3B-finemath_part1-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-step220 3B • Updated about 1 month ago • 10
rlsamplingJF/Qwen2.5-3B-Instruct-finemath-highquality-part1-seed2028-initial 3B • Updated Nov 30, 2025 • 14
rlsamplingJF/Llama-3.2-3B-finemath-highquality-rm-run2-lr3e-5-cosine-bs32-gc1.0-initial 3B • Updated Nov 1, 2025
rlsamplingJF/Llama-3.2-3B-finemath-highquality-rm-run2-lr3e-5-cosine-bs32-gc1.0 3B • Updated Nov 1, 2025