# Training configuration using ${...} interpolations (Hydra/OmegaConf style).
# NOTE(review): nesting was reconstructed from key order; placements that
# could not be determined unambiguously are flagged inline.

# Filesystem locations. data_dir and log_dir are derived from root_dir;
# output_dir and work_dir are read through the `hydra:` resolver.
paths:
  root_dir: .
  data_dir: ${paths.root_dir}/data/
  log_dir: ${paths.root_dir}/logs/
  output_dir: ${hydra:runtime.output_dir}
  work_dir: ${hydra:runtime.cwd}

# Dataset selection and the record fields holding audio and caption text.
data_config:
  name: mitermix/audiosnippets
  streaming: true
  audio_key: mp3
  caption_key: caption

# Model and tokenizer identifiers.
# NOTE(review): tokenizer_name and name point at whisper-tiny while
# model_name points at whisper-base -- confirm the mismatch is intended.
model_config:
  tokenizer_name: openai/whisper-tiny
  model_name: openai/whisper-base
  attn_implementation: flash_attention_2
  # NOTE(review): `name` is assumed to belong to model_config because it
  # directly follows attn_implementation -- confirm against the consumer.
  name: openai/whisper-tiny

# Trainer settings; presumably forwarded to Hugging Face TrainingArguments
# -- TODO confirm against the training script.
trainer_config:
  tf32: true
  bf16: true
  fp16: false
  dataloader_num_workers: 16
  # Quoted on purpose: a bare `no` is read as boolean false by YAML 1.1
  # loaders.
  eval_strategy: 'no'
  eval_steps: null
  save_strategy: steps
  save_steps: 5000
  save_total_limit: 5
  gradient_checkpointing: false
  gradient_checkpointing_kwargs:
    use_reentrant: false
  ddp_find_unused_parameters: false
  logging_steps: 50
  seed: 998244353
  optim: adamw_torch
  adam_beta1: 0.9
  adam_beta2: 0.98
  max_grad_norm: 1.0
  per_device_train_batch_size: 128
  # Reuses the output directory defined under `paths`.
  output_dir: ${paths.output_dir}
  report_to: tensorboard
  # TensorBoard logs go in a `tb` subdirectory of the trainer output_dir.
  logging_dir: ${trainer_config.output_dir}/tb
  lr_scheduler_type: cosine
  learning_rate: 0.0001
  warmup_steps: 5000
  max_steps: 50000
  label_smoothing_factor: 0.0
  push_to_hub: true
  # NOTE(review): the repo id says "whisper-base" while task_name is
  # "tiny-test" -- confirm this is the intended upload target.
  hub_model_id: seastar105/whisper-base-emo-speech-caption
  dataloader_prefetch_factor: 4

# Run identifier (assumed top-level, not part of trainer_config -- confirm).
task_name: tiny-test