# Model metadata: license, languages, base model, pipeline, library, and tags.
# One key per line in block style; list items are indented two spaces.
license: apache-2.0

# Languages covered, as short language codes.
language:
  - en
  - zh

# Model(s) this one is derived from, as `owner/name` repository ids.
base_model:
  - HuggingFaceTB/SmolLM2-360M-Instruct

pipeline_tag: text-generation
library_name: transformers

# Free-form tags; capitalisation is kept exactly as originally written.
tags:
  - Grpo
  - text-generation-inference
  - Llama
  - trl