# Training configuration (Hydra / OmegaConf style).
# `${...}` values are interpolations resolved at load time; `${hydra:...}`
# entries are supplied by Hydra's runtime resolver.

# Filesystem locations; the data and log directories are derived from `root_dir`.
paths:
  root_dir: .
  data_dir: ${paths.root_dir}/data/
  log_dir: ${paths.root_dir}/logs/
  output_dir: ${hydra:runtime.output_dir}
  work_dir: ${hydra:runtime.cwd}

# Dataset selection and the record fields holding audio and caption.
data_config:
  name: mitermix/audiosnippets
  streaming: true
  audio_key: mp3
  caption_key: caption

# Model and tokenizer checkpoints.
# NOTE(review): `tokenizer_name` and `name` point at whisper-tiny while
# `model_name` (and `trainer_config.hub_model_id`) point at whisper-base —
# confirm the mixed sizes are intentional.
model_config:
  tokenizer_name: openai/whisper-tiny
  model_name: openai/whisper-base
  attn_implementation: flash_attention_2
  # NOTE(review): nesting was lost in the source; `name` is assumed to belong
  # to `model_config` because it follows its keys — verify against the consumer.
  name: openai/whisper-tiny

# Trainer arguments (key names match Hugging Face `TrainingArguments` fields —
# presumably forwarded to it; confirm in the training script).
trainer_config:
  # Numeric precision: bf16 with TF32 enabled, fp16 disabled.
  tf32: true
  bf16: true
  fp16: false
  dataloader_num_workers: 16
  # Quoted on purpose: a bare `no` is parsed as boolean false by YAML 1.1 loaders.
  eval_strategy: 'no'
  eval_steps: null
  # Checkpointing: save every 5000 steps and keep at most 5 checkpoints.
  save_strategy: steps
  save_steps: 5000
  save_total_limit: 5
  gradient_checkpointing: false
  gradient_checkpointing_kwargs:
    use_reentrant: false
  ddp_find_unused_parameters: false
  logging_steps: 50
  seed: 998244353
  # Optimizer settings.
  optim: adamw_torch
  adam_beta1: 0.9
  adam_beta2: 0.98
  max_grad_norm: 1.0
  per_device_train_batch_size: 128
  # Outputs go to the Hydra run directory; TensorBoard logs to its `tb` subfolder.
  output_dir: ${paths.output_dir}
  report_to: tensorboard
  logging_dir: ${trainer_config.output_dir}/tb
  # Schedule: cosine scheduler, 5000 warmup steps out of 50000 total steps.
  lr_scheduler_type: cosine
  learning_rate: 0.0001
  warmup_steps: 5000
  max_steps: 50000
  label_smoothing_factor: 0.0
  push_to_hub: true
  hub_model_id: seastar105/whisper-base-emo-speech-caption
  dataloader_prefetch_factor: 4

# NOTE(review): assumed to be a top-level key (not a trainer argument) — confirm.
task_name: tiny-test