# NOTE(review): these keys look like model-card metadata (license, languages,
# base model, pipeline, library, tags) — confirm against the consuming tool.
license: apache-2.0
# Language codes listed for this entry.
language:
- en
- zh
# Upstream model identifier(s) this entry declares as its base.
base_model:
- prithivMLmods/SmolLM2_135M_Grpo_Gsm8k
pipeline_tag: text-generation
library_name: transformers
# Free-form labels; spelling and case are kept exactly as given.
tags:
- Grpo
- text-generation-inference
- Llama
- trl
 | |