license: apache-2.0
language:
- en
- zh
base_model:
- HuggingFaceTB/SmolLM2-360M-Instruct
pipeline_tag: text-generation
library_name: transformers
tags:
- Grpo
- text-generation-inference
- Llama
- trl
license: apache-2.0
language:
- en
- zh
base_model:
- HuggingFaceTB/SmolLM2-360M-Instruct
pipeline_tag: text-generation
library_name: transformers
tags:
- Grpo
- text-generation-inference
- Llama
- trl