albert-base-v2-STS-B / train_args.json
system's picture
system HF staff
Update train_args.json
8aa0d32
raw
history blame contribute delete
767 Bytes
{
"model": "albert-base-v2",
"dataset": "glue:stsb",
"dataset_train_split": "train",
"dataset_dev_split": "validation",
"tb_writer_step": 1000,
"checkpoint_steps": -1,
"checkpoint_every_epoch": false,
"num_train_epochs": 5,
"early_stopping_epochs": -1,
"batch_size": 32,
"max_length": 128,
"learning_rate": 3e-05,
"grad_accum_steps": 1,
"warmup_proportion": 0.1,
"config_name": "config.json",
"weights_name": "pytorch_model.bin",
"enable_wandb": false,
"output_dir": "/p/qdata/jm8wx/research/text_attacks/textattack/outputs/training/albert-base-v2-glue:stsb-2020-06-29-11:30/",
"num_labels": 1,
"do_regression": true,
"best_eval_score": 0.9064220351504577,
"best_eval_score_epoch": 3,
"epochs_since_best_eval_score": 1
}