rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step437 3B • Updated about 24 hours ago • 13
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step437 3B • Updated about 24 hours ago • 13
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2_lr1e-6-constant-warmup_0-bs32-gc1.0-cc0.01-ls0-step150 3B • Updated about 24 hours ago • 21
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2_lr1e-6-constant-warmup_0-bs32-gc1.0-cc0.01-ls0-step150 3B • Updated about 24 hours ago • 21
rlsamplingJF/Qwen2.5-3B-Instruct-finemath_part1_part2-lr1e-6-constant-warmup_0-bs8-gc1.0-cc0.01-step120 3B • Updated 4 days ago • 22
rlsamplingJF/Qwen2.5-3B-Instruct-finemath_part1_part2-lr1e-6-constant-warmup_0-bs8-gc1.0-cc0.01-step120 3B • Updated 4 days ago • 22
rlsamplingJF/evolm-4B-160BT-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step180 4B • Updated 5 days ago • 17
rlsamplingJF/evolm-4B-160BT-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step180 4B • Updated 5 days ago • 17
rlsamplingJF/Qwen2.5-7B-Instruct-finemath_part1-rm-lr1e-6-constant-warmup_0.05-bs8-gc1.0-cc0.01-ls0.1-step45 7B • Updated 6 days ago • 23
rlsamplingJF/Qwen2.5-7B-Instruct-finemath_part1-rm-lr1e-6-constant-warmup_0.05-bs8-gc1.0-cc0.01-ls0.1-step45 7B • Updated 6 days ago • 23
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step375 3B • Updated 7 days ago • 40
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step375 3B • Updated 7 days ago • 40
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-step345 3B • Updated 8 days ago • 19
rlsamplingJF/Llama-3.2-3B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-step345 3B • Updated 8 days ago • 19
rlsamplingJF/evolm-4B-160BT-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-initial 4B • Updated 8 days ago • 20
rlsamplingJF/evolm-4B-160BT-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-initial 4B • Updated 8 days ago • 20
rlsamplingJF/evolm-4B-160BT-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step120 4B • Updated 8 days ago • 24
rlsamplingJF/evolm-4B-160BT-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0-step120 4B • Updated 8 days ago • 24
rlsamplingJF/Llama-3.2-1B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0.1-step150 1B • Updated 9 days ago • 15
rlsamplingJF/Llama-3.2-1B-finemath_part1_part2-rm-lr1e-6-constant-warmup_0.05-bs16-gc1.0-cc0.01-ls0.1-step150 1B • Updated 9 days ago • 15