File size: 766 Bytes
0689246 |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 18 19 20 21 22 23 24 25 26 27 28 29 30 31 32 |
{
"optimizer":"AdamW",
"learning_rate":0.0005,
"adam_epsilon":0.00001,
"warmup_steps":25,
"weight_decay":0,
"train_batch_size":64,
"eval_batch_size":64,
"use_scheduler":true,
"metrics":null,
"model_name_or_path":"allegro/herbert-base-cased",
"num_classes":7,
"finetune_last_n_layers":4,
"config_kwargs":{
"classifier_dropout":0.2
},
"task_model_kwargs":{
"adam_epsilon":0.00001,
"eval_batch_size":64,
"learning_rate":0.0005,
"optimizer":"AdamW",
"train_batch_size":64,
"use_scheduler":true,
"warmup_steps":25,
"weight_decay":0
},
"model_compile_kwargs":null,
"evaluation_mode":"unit",
"tagging_scheme":null,
"ignore_index":-100,
"downstream_model_type":"AutoModelForTokenClassification"
} |