{
  "architectures": [
    "MCTCTForCTC"
  ],
  "attention_head_dim": 384,
  "attention_probs_dropout_prob": 0.3,
  "bos_token_id": 0,
  "conv_channels": null,
  "conv_dropout": 0.3,
  "conv_glu_dim": 1,
  "conv_kernel": [
    7
  ],
  "conv_stride": [
    3
  ],
  "ctc_loss_reduction": "sum",
  "ctc_zero_infinity": false,
  "eos_token_id": 2,
  "hidden_act": "relu",
  "hidden_dropout_prob": 0.3,
  "hidden_size": 1536,
  "initializer_range": 0.02,
  "input_channels": 1,
  "input_feat_per_channel": 80,
  "intermediate_size": 6144,
  "layer_norm_eps": 1e-05,
  "layerdrop": 0.3,
  "max_position_embeddings": 920,
  "model_type": "mctct",
  "num_attention_heads": 4,
  "num_conv_layers": 1,
  "num_hidden_layers": 36,
  "pad_token_id": 1,
  "position_embedding_type": "relative_key",
  "torch_dtype": "float32",
  "transformers_version": "4.18.0.dev0",
  "use_cache": true,
  "vocab_size": 8065
}
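
A minimal sketch of instantiating a model from this configuration with the Hugging Face transformers library, assuming a transformers version that still exposes the M-CTC-T classes (MCTCTConfig, MCTCTForCTC) and that the JSON above is saved locally as config.json; the file path is illustrative and the model is randomly initialised, not loaded from a checkpoint.

```python
from transformers import MCTCTConfig, MCTCTForCTC

# Parse the configuration shown above (assumed to be saved as ./config.json).
config = MCTCTConfig.from_json_file("config.json")

# Build a randomly initialised MCTCTForCTC model with these hyperparameters:
# 36 encoder layers, hidden size 1536 (4 heads x 384 dims per head), one
# convolutional subsampling layer (kernel 7, stride 3, GLU) over 80-dim
# features, and a CTC head over an 8065-token vocabulary.
model = MCTCTForCTC(config)
print(model.config.num_hidden_layers, model.config.vocab_size)
```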