{
  "architectures": [
    "GazelleForConditionalGeneration"
  ],
  "audio_config": {
    "model_type": "wav2vec2"
  },
  "audio_model_id": "facebook/wav2vec2-base-960h",
  "audio_token_index": 134411,
  "hidden_size": 3072,
  "ignore_index": -100,
  "model_type": "gazelle",
  "projector_type": "mlp",
  "stack_factor": 8,
  "text_config": {
    "model_type": "llama",
    "vocab_size": 134412
  },
  "text_model_id": "amuvarma/1-1-interleaved-text-content-tokens-1mn-samples-finetuned-1",
  "torch_dtype": "bfloat16",
  "transformers_version": "4.46.3",
  "vocab_size": 134412
}