activations: Tanh
batch_size: 8
class_identifier: regression_metric
dropout: 0.1
encoder_learning_rate: 1.0e-05
encoder_model: MiniLM
final_activation: null
hidden_sizes:
- 384
keep_embeddings_frozen: true
layer: 12
layerwise_decay: 0.95
learning_rate: 3.1e-05
load_weights_from_checkpoint: lightning_logs/cometinho_part-i/checkpoints/epoch=0-step=899999.ckpt
nr_frozen_epochs: 0.0
optimizer: AdamW
pool: avg
pretrained_model: microsoft/Multilingual-MiniLM-L12-H384
train_data: data/euro-distil.da.part_ii.csv
validation_data: data/2019-da-dev.csv