---
# Model metadata: license, datasets, language, evaluation metric, base model,
# and pipeline tag. Every key is declared exactly once -- YAML forbids
# duplicate mapping keys, and most parsers silently keep only the last copy.
license: apache-2.0
datasets:
- hkust-nlp/SimpleRL-Zoo-Data
- agentica-org/DeepScaleR-Preview-Dataset
language:
- en
metrics:
- accuracy
base_model:
- Qwen/Qwen2.5-7B
# NOTE(review): confirm this tag is the intended one for the consuming tool.
pipeline_tag: reinforcement-learning