apex-seq2seq / config.json
usmankhanic's picture
Publishing model weights bin
3e46063 verified
{
  "architectures": ["Seq2SeqTransformer"],
  "model_type": "encoder-decoder",
  "encoder": {
    "model_type": "bart",
    "num_layers": 3,
    "hidden_size": 256,
    "num_attention_heads": 8,
    "intermediate_size": 512,
    "dropout": 0.1,
    "vocab_size": 318,
    "special_tokens": {
      "pad_token": "<pad>",
      "bos_token": "<bos>",
      "eos_token": "<eos>",
      "unk_token": "<unk>"
    }
  },
  "decoder": {
    "model_type": "bart",
    "num_layers": 3,
    "hidden_size": 256,
    "num_attention_heads": 8,
    "intermediate_size": 512,
    "dropout": 0.1,
    "vocab_size": 318,
    "special_tokens": {
      "pad_token": "<pad>",
      "bos_token": "<bos>",
      "eos_token": "<eos>",
      "unk_token": "<unk>"
    }
  }
}