File size: 950 Bytes
d0940c3 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 33 34 |
# yaml-language-server: $schema=../../config_schema.json
# Task this configuration is written for.
task: question-answering
# Base model, given as an absolute path on the local filesystem.
# NOTE(review): machine-specific path; confirm it exists wherever this
# config is run.
base_model: /home/praise/PycharmProjects/encoder_playground/ModernBERT-base-nli
# Dataset selection. The child keys are indented so that they belong to the
# `data` mapping instead of becoming separate top-level keys.
# NOTE(review): confirm this layout against config_schema.json.
data:
  # NOTE(review): presumably a Hugging Face Hub dataset id; confirm.
  path: rajpurkar/squad_v2
  # The split values are bare names. An earlier comment here required
  # train.csv/train.json and valid.csv/valid.json; that presumably applies
  # only when `path` points at local files. TODO confirm.
  train_split: train
  test_split: validation
# Trainer selection and its arguments. The child keys are indented so that
# they belong to `trainer` instead of becoming separate top-level keys.
# NOTE(review): placing `hf_trainer_args` and `extra_trainer_args` under
# `trainer` is an assumption; confirm against config_schema.json.
trainer:
  trainer_name: "hf_trainer"
  # NOTE(review): key names match Hugging Face `TrainingArguments` fields;
  # presumably forwarded to it as-is. Confirm against the consumer.
  hf_trainer_args:
    # Evaluation, checkpointing and logging share one 200-step interval.
    eval_steps: 200
    save_steps: 200
    logging_steps: 200
    optim: adamw_torch
    num_train_epochs: 4
    weight_decay: 0.01
    # Keep the decimal point and the signed exponent: some YAML 1.1 loaders
    # read shorter forms such as 3e-5 as a string rather than a float.
    learning_rate: 3.0E-5
    # Higher "f1" counts as the better model.
    metric_for_best_model: "f1"
    greater_is_better: true
    per_device_train_batch_size: 32
    per_device_eval_batch_size: 32
    # NOTE(review): machine-specific absolute path; adjust per environment.
    output_dir: /home/praise/PycharmProjects/encoder_playground/runs/ModernBERT-base-squad2-v0.24
    bf16: true
    warmup_ratio: 0.1
  # NOTE(review): key names match the parameters of transformers'
  # `EarlyStoppingCallback`; presumably passed to it. Confirm.
  extra_trainer_args:
    early_stopping_patience: 20
    early_stopping_threshold: 0.001
# Hugging Face Hub account name.
# NOTE(review): presumably the namespace used when uploading results;
# confirm against the schema.
huggingface_hub_username: "Praise2112"
|