nguyenvulebinh committed on
Commit
f1bbf33
·
1 Parent(s): 32440c9

add length for faster training

Browse files
Files changed (1) hide show
  1. main.py +2 -0
main.py CHANGED
@@ -61,6 +61,8 @@ def prepare_dataset(batch, processor):
61
 
62
  batch["input_values"] = processor(batch["speech"], sampling_rate=batch["sampling_rate"][0]).input_values
63
 
 
 
64
  with processor.as_target_processor():
65
  batch["labels"] = processor(batch["target_text"]).input_ids
66
  return batch
 
61
 
62
  batch["input_values"] = processor(batch["speech"], sampling_rate=batch["sampling_rate"][0]).input_values
63
 
64
+ batch["length"] = [len(item) for item in batch["input_values"]]
65
+
66
  with processor.as_target_processor():
67
  batch["labels"] = processor(batch["target_text"]).input_ids
68
  return batch