{ "architectures": [ "EmageAudioModel" ], "audio_f": 256, "audio_fps": 16000, "audio_norm": false, "audio_rep": "wave16k", "audio_sr": 16000, "cf": 0, "ch": 1, "cl": 1, "class_name": "EmageAudioModel", "cu": 1, "hidden_size": 768, "joint_mask": null, "lf": 3, "lh": 3, "ll": 3, "lu": 3, "model_type": "emage_audio", "motion_f": 256, "name_pyfile": "models.emage_audio.modeling_emage_audio", "pose_dims": 330, "pose_fps": 30, "pose_length": 64, "pose_rep": "smplx", "seed_frames": 4, "speaker_dims": 1, "speaker_f": 768, "stride": 20, "test_length": 64, "torch_dtype": "float32", "transformers_version": "4.30.2", "vae_codebook_size": 256 }