|
{ |
|
"batching": { |
|
"batch_size": 64, |
|
"max_tokens": 1024, |
|
"sampling_smoothing": 1, |
|
"sort_by_size": true |
|
}, |
|
"decoders": { |
|
"classification": {}, |
|
"default_decoder": { |
|
"layers_to_use": [ |
|
-1 |
|
], |
|
"loss_weight": 1, |
|
"metric": "accuracy", |
|
"topn": 1 |
|
}, |
|
"dependency": { |
|
"arc_representation_dim": 768, |
|
"metric": "las", |
|
"tag_representation_dim": 256 |
|
}, |
|
"mlm": { |
|
"metric": "perplexity" |
|
}, |
|
"multiclas": { |
|
"metric": "multi_acc", |
|
"threshold": 0.7 |
|
}, |
|
"multiseq": { |
|
"metric": "multi_acc", |
|
"threshold": 0.7 |
|
}, |
|
"regression": { |
|
"metric": "avg_dist" |
|
}, |
|
"seq": {}, |
|
"seq_bio": { |
|
"metric": "span_f1" |
|
}, |
|
"string2string": {}, |
|
"tok": { |
|
"pre_split": true |
|
} |
|
}, |
|
"default_dec_dataset_embeds_dim": 12, |
|
"encoder": { |
|
"dropout": 0.2, |
|
"max_input_length": 64, |
|
"update_weights_encoder": true |
|
}, |
|
"random_seed": 8446, |
|
"training": { |
|
"keep_top_n": 1, |
|
"learning_rate_scheduler": { |
|
"cut_frac": 0.3, |
|
"decay_factor": 0.38, |
|
"discriminative_fine_tuning": true, |
|
"gradual_unfreezing": true |
|
}, |
|
"num_epochs": 50, |
|
"optimizer": { |
|
"betas": [ |
|
0.9, |
|
0.99 |
|
], |
|
"correct_bias": false, |
|
"lr": 0.0015, |
|
"weight_decay": 0.01 |
|
} |
|
}, |
|
"transformer_model": "dbmdz/bert-base-italian-xxl-cased" |
|
} |