File size: 950 Bytes
d0940c3
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
# yaml-language-server: $schema=../../config_schema.json

# Task type for this run.
task: question-answering
# Starting checkpoint, given as an absolute path on the local filesystem.
# NOTE(review): machine-specific path - presumably has to exist on the host
# that runs training; confirm before reusing this config elsewhere.
base_model: /home/praise/PycharmProjects/encoder_playground/ModernBERT-base-nli

data:
  # Dataset location.
  # NOTE(review): `rajpurkar/squad_v2` looks like a Hugging Face Hub dataset id
  # rather than a local directory - confirm how the loader resolves it.
  path: rajpurkar/squad_v2
  # Split names (`train`, `validation`).
  # NOTE(review): for datasets stored as local files these presumably map to
  # train.csv/train.json and valid.csv/valid.json - confirm against the loader.
  train_split: train # training split name
  test_split: validation  # test split name

trainer:
  # Trainer implementation to use.
  trainer_name: hf_trainer

  # NOTE(review): the key names below match Hugging Face `TrainingArguments`
  # fields; presumably they are forwarded to it unchanged - confirm against
  # the trainer wrapper.
  hf_trainer_args:
    # Output directory for this run (absolute, machine-specific path).
    output_dir: /home/praise/PycharmProjects/encoder_playground/runs/ModernBERT-base-squad2-v0.24

    # Optimisation schedule.
    optim: adamw_torch
    learning_rate: 3.0E-5
    weight_decay: 0.01
    warmup_ratio: 0.1
    num_train_epochs: 4
    bf16: true

    # Per-device batch sizes.
    per_device_train_batch_size: 32
    per_device_eval_batch_size: 32

    # Evaluation, checkpointing and logging all use the same 200-step interval.
    # NOTE(review): no eval/save strategy and no `load_best_model_at_end` are
    # set in this file; presumably the trainer wrapper supplies them - confirm,
    # since the step intervals and early stopping depend on them.
    eval_steps: 200
    save_steps: 200
    logging_steps: 200

    # Best-model metric: f1, where a higher value is better.
    metric_for_best_model: f1
    greater_is_better: true

  # NOTE(review): presumably mapped onto an early-stopping callback, with
  # patience counted in evaluation rounds - confirm.
  extra_trainer_args:
    early_stopping_patience: 20
    early_stopping_threshold: 0.001

# Hugging Face Hub account name.
# NOTE(review): presumably the namespace used when pushing the trained model
# to the Hub - confirm.
huggingface_hub_username: "Praise2112"