# Uploaded by: seastar105
# Commit message: "Training in progress, step 5000"
# Commit: 53c24e9 (verified)
# Filesystem locations shared by the other sections via `${paths.*}`.
paths:
  # Base directory that the data and log directories are derived from.
  root_dir: .
  data_dir: ${paths.root_dir}/data/
  log_dir: ${paths.root_dir}/logs/
  # Filled in by Hydra's `hydra:` resolver when the config is composed.
  output_dir: ${hydra:runtime.output_dir}
  work_dir: ${hydra:runtime.cwd}
# Training data source and the record fields to read from it.
data_config:
  # Dataset identifier (looks like a Hub `owner/name` id — TODO confirm).
  name: mitermix/audiosnippets
  streaming: true
  # Field names for the audio payload and its text caption in each record.
  audio_key: mp3
  caption_key: caption
# Model and tokenizer selection.
# NOTE(review): `tokenizer_name` and `name` point at whisper-tiny while
# `model_name` points at whisper-base — confirm this mix is intentional.
model_config:
  tokenizer_name: openai/whisper-tiny
  model_name: openai/whisper-base
  attn_implementation: flash_attention_2
  name: openai/whisper-tiny
# Trainer settings. Key names appear to mirror Hugging Face
# `transformers.TrainingArguments` — TODO confirm against the training script.
trainer_config:
  # Numeric precision: TF32 and bf16 enabled, fp16 disabled.
  tf32: true
  bf16: true
  fp16: false

  dataloader_num_workers: 16

  # Evaluation is disabled. 'no' stays quoted so YAML 1.1 loaders do not
  # turn it into the boolean false.
  eval_strategy: 'no'
  eval_steps: null

  # Checkpointing: step-based, every 5000 steps, limit of 5.
  save_strategy: steps
  save_steps: 5000
  save_total_limit: 5

  gradient_checkpointing: false
  # Nested mapping; kept even though gradient checkpointing is off above.
  gradient_checkpointing_kwargs:
    use_reentrant: false
  ddp_find_unused_parameters: false

  logging_steps: 50
  seed: 998244353

  # Optimizer.
  optim: adamw_torch
  adam_beta1: 0.9
  adam_beta2: 0.98
  max_grad_norm: 1.0
  per_device_train_batch_size: 128

  # Outputs land in the Hydra run directory; TensorBoard logs go in `tb/`
  # beneath it.
  output_dir: ${paths.output_dir}
  report_to: tensorboard
  logging_dir: ${trainer_config.output_dir}/tb

  # Schedule: cosine, with warmup_steps equal to 10% of max_steps.
  lr_scheduler_type: cosine
  learning_rate: 0.0001
  warmup_steps: 5000
  max_steps: 50000
  label_smoothing_factor: 0.0

  # Hub upload target.
  push_to_hub: true
  hub_model_id: seastar105/whisper-base-emo-speech-caption

  dataloader_prefetch_factor: 4
# Top-level label for this run (presumably used to name outputs — the
# consumer is not visible in this file; verify against the Hydra setup).
task_name: tiny-test