morkovka1337 committed on
Commit
cda5020
·
1 Parent(s): 42fb614

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +6 -9
app.py CHANGED
@@ -15,6 +15,8 @@ logging.basicConfig(
15
  logger = logging.getLogger(__name__)
16
  logger.setLevel(logging.DEBUG)
17
 
 
 
18
  def run(input_file, history, model_size="300M"):
19
  language = "Russian"
20
  decoding_type = "LM"
@@ -25,18 +27,13 @@ def run(input_file, history, model_size="300M"):
25
  history = []
26
 
27
 
28
- model = {"model_id": "jonatasgrosman/wav2vec2-large-xlsr-53-russian"}
29
- has_lm = True
30
-
31
- model_instance = AutoModelForCTC.from_pretrained(model["model_id"])
32
-
33
  if decoding_type == "LM":
34
- processor = Wav2Vec2ProcessorWithLM.from_pretrained(model["model_id"])
35
- asr = pipeline("automatic-speech-recognition", model=model_instance, tokenizer=processor.tokenizer,
36
  feature_extractor=processor.feature_extractor, decoder=processor.decoder)
37
  else:
38
- processor = Wav2Vec2Processor.from_pretrained(model["model_id"])
39
- asr = pipeline("automatic-speech-recognition", model=model_instance, tokenizer=processor.tokenizer,
40
  feature_extractor=processor.feature_extractor, decoder=None)
41
 
42
  transcription = asr(input_file.name, chunk_length_s=5, stride_length_s=1)["text"]
 
15
  logger = logging.getLogger(__name__)
16
  logger.setLevel(logging.DEBUG)
17
 
18
+ CACHED_MODEL = AutoModelForCTC.from_pretrained("jonatasgrosman/wav2vec2-large-xlsr-53-russian")
19
+
20
  def run(input_file, history, model_size="300M"):
21
  language = "Russian"
22
  decoding_type = "LM"
 
27
  history = []
28
 
29
 
 
 
 
 
 
30
  if decoding_type == "LM":
31
+ processor = Wav2Vec2ProcessorWithLM.from_pretrained("jonatasgrosman/wav2vec2-large-xlsr-53-russian")
32
+ asr = pipeline("automatic-speech-recognition", model=CACHED_MODEL , tokenizer=processor.tokenizer,
33
  feature_extractor=processor.feature_extractor, decoder=processor.decoder)
34
  else:
35
+ processor = Wav2Vec2Processor.from_pretrained("jonatasgrosman/wav2vec2-large-xlsr-53-russian")
36
+ asr = pipeline("automatic-speech-recognition", model=CACHED_MODEL , tokenizer=processor.tokenizer,
37
  feature_extractor=processor.feature_extractor, decoder=None)
38
 
39
  transcription = asr(input_file.name, chunk_length_s=5, stride_length_s=1)["text"]