- CodeLlama-13b-Python-hf-sft
- CodeLlama-34b-Python-hf-sft
- CodeLlama-7b-Python-hf-sft
- Eurus-7b-sft
- deepseek-coder-33b-sft
- deepseek-math-7b-dpo
- deepseek-math-7b-expo-0.5
- deepseek-math-7b-kto
- deepseek-math-7b-rl-sft
- deepseek-math-7b-rl
- deepseek-math-7b-sft
- internlm-math-20b-sft
- internlm-math-7b-sft
- mistral-7b-sft
- mixtral-47b-sft
- ppo_aimo_vllm_extract_answer_warmup_1e-6_promising
- qwen-14b-sft
- starcoder2-15b-sft
- tora-code-34b-v1.0