# Metadata
# Each top-level key appears exactly once; duplicate mapping keys are invalid
# YAML and most parsers silently keep only the last occurrence.
license: apache-2.0
datasets:
- openai/gsm8k
language:
- en
base_model:
- Qwen/Qwen2.5-0.5B-Instruct
pipeline_tag: text-generation
library_name: transformers
tags:
- math
- reasoning
- grpo
- trl
- code