| # yaml-language-server: $schema=../../config_schema.json | |
| task: question-answering | |
| base_model: /home/praise/PycharmProjects/encoder_playground/ModernBERT-base-nli | |
| data: | |
| path: rajpurkar/squad_v2 | |
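| train_split: train # name of the training split in the dataset at path; the train.csv / train.json form presumably applies only to a local data directory (TODO confirm) | |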
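| test_split: validation # name of the held-out split in the dataset at path; the valid.csv / valid.json form presumably applies only to a local data directory (TODO confirm) | |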
| trainer: | |
| trainer_name: "hf_trainer" | |
| hf_trainer_args: | |
| eval_steps: 200 | |
| save_steps: 200 | |
| logging_steps: 200 | |
| optim: adamw_torch | |
| num_train_epochs: 4 | |
| weight_decay: 0.01 | |
| learning_rate: 3.0E-5 | |
| metric_for_best_model: "f1" | |
| greater_is_better: true | |
| per_device_train_batch_size: 32 | |
| per_device_eval_batch_size: 32 | |
| output_dir: /home/praise/PycharmProjects/encoder_playground/runs/ModernBERT-base-squad2-v0.24 | |
| bf16: true | |
| warmup_ratio: 0.1 | |
| extra_trainer_args: | |
| early_stopping_patience: 20 | |
| early_stopping_threshold: 0.001 | |
| huggingface_hub_username: "Praise2112" | |