rghosh8/arc-grpo-nemotron-mini-4b-instruct-seed-42-G-4-REDUCED-modules-layers-beta-0.01-merged 4B • Updated about 8 hours ago
rghosh8/arc-grpo-nemotron-mini-4b-instruct-seed-42-G-4-REDUCED-modules-layers-beta-0.01 Text Generation • Updated about 8 hours ago
rghosh8/arc-grpo-deepseek-llm-7b-chat-rajat-seed-42-G-4-epsilon-high-0.3_merged 7B • Updated about 22 hours ago
rghosh8/arc-grpo-deepseek-llm-7b-chat-rajat-seed-42-G-4-epsilon-high-0.3 Text Generation • Updated about 22 hours ago
rghosh8/arc-grpo-nemotron-mini-4b-instruct-beta-0.01-adapter Text Generation • Updated about 24 hours ago • 12
rghosh8/arc-grpo-nemotron-mini-4b-instruct-rajat-seed-42-G-4-REDUCED-modules_merged 4B • Updated 1 day ago • 32
rghosh8/arc-grpo-nemotron-mini-4b-instruct-rajat-seed-42-G-4-REDUCED-modules Text Generation • Updated 1 day ago • 12
rghosh8/deepseek-llm-7b-chat-opencoder-educational-instruct-seed-42-G-4-REDUCED-LAYERS-new-params_merged 7B • Updated 1 day ago • 49
rghosh8/deepseek-llm-7b-chat-opencoder-educational-instruct-seed-42-G-4-REDUCED-LAYERS-new-params Text Generation • Updated 1 day ago • 13
rghosh8/arc-grpo-deepseek-R1-distill-qwen-1.5b-rajat-seed-3407-G-16 Text Generation • Updated 3 days ago • 14
rghosh8/arc-grpo-deepseek-R1-distill-qwen-1.5b-rajat-seed-3407-G-4 Text Generation • Updated 3 days ago • 17
rghosh8/arc-grpo-deepseek-r1-distill-qwen-1.5b-rajat-seed-42-G-4-baseline Text Generation • Updated 3 days ago • 14
rghosh8/arc-grpo-nemotron-mini-4b-instruct-rajat-seed-42-G-4-REDUCED-LAYERS-2_merged 4B • Updated 4 days ago • 41
rghosh8/arc-grpo-nemotron-mini-4b-instruct-rajat-seed-42-G-4-REDUCED-LAYERS-2 Text Generation • Updated 4 days ago • 15
rghosh8/gsm8k-nemotron-mini-4b-instruct-rajat-seed-42-G-4-REDUCED-LAYERS-2_merged 4B • Updated 4 days ago • 13
rghosh8/gsm8k-nemotron-mini-4b-instruct-rajat-seed-42-G-4-REDUCED-LAYERS-2 Text Generation • Updated 4 days ago • 12
rghosh8/gsm8k-deepseek-r1-distill-qwen-1.5b-rajat-seed-3407-G-4 Text Generation • Updated 5 days ago • 21
rghosh8/gsm8k-deepseek-r1-distill-qwen-1.5b-rajat-seed-42-G-4 Text Generation • Updated 5 days ago • 22
rghosh8/nemotron-mini-4b-opencoder-educational-instruct-seed-42-G-4-REDUCED-LAYERS-new-params_merged 4B • Updated 5 days ago • 40
rghosh8/nemotron-mini-4b-instruct-opencoder-educational-instruct-seed-42-G-4-REDUCED-LAYERS-new-params Text Generation • Updated 5 days ago • 10
rghosh8/arc-grpo-Nemotron-Mini-4B-Instruct-rajat-seed-42-G-4-REDUCED-LAYERS_merged 4B • Updated 6 days ago • 47
rghosh8/arc-grpo-Nemotron-Mini-4B-Instruct-rajat-seed-42-G-4-REDUCED-LAYERS Text Generation • Updated 6 days ago • 11
rghosh8/gsm8k-Nemotron-Mini-4B-Instruct-rajat-seed-42-G-4-REDUCED-LAYERS_merged 4B • Updated 6 days ago • 11
rghosh8/gsm8k-Nemotron-Mini-4B-Instruct-rajat-seed-42-G-4-REDUCED-LAYERS Text Generation • Updated 6 days ago • 12
rghosh8/nemotron-mini-4b-instruct-opencoder-educational-instruct-seed-42-G-4-REDUCED-LAYERS_merged 4B • Updated 6 days ago • 32