# Model metadata. The key names match the Hugging Face Hub model-card
# schema — NOTE(review): confirm against the tool that consumes this file.
license: apache-2.0

# Language codes listed for this model.
language:
  - en
  - zh

# Model(s) listed as the base of this one (repository-style identifiers).
base_model:
  - prithivMLmods/SmolLM2_135M_Grpo_Gsm8k

pipeline_tag: text-generation
library_name: transformers

# Free-form tags; original casing is preserved exactly.
tags:
  - Grpo
  - text-generation-inference
  - Llama
  - trl