roberta-base-relu-sst5 / training_config.json
skytree's picture
Upload training_config.json
ac0a42d verified
{
"model_name": "roberta-base",
"output_dir": "./ckpts/finetune_relu_roberta_from_gelu_sst5",
"learning_rate": 1e-05,
"batch_size": 32,
"num_epochs": 20,
"max_length": 128,
"warmup_steps": 500,
"weight_decay": 0.01,
"seed": 42,
"hidden_act": "relu",
"timestamp": "2025-01-13 19:56:34",
"cuda_available": true,
"cuda_device": "NVIDIA A100 80GB PCIe"
}