salomonsky committed on
Commit
4b73d5c
1 Parent(s): 78d8cd5

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +9 -7
app.py CHANGED
@@ -3,20 +3,22 @@ import os
3
  import subprocess
4
  from gtts import gTTS
5
  from pydub import AudioSegment
 
6
  from PIL import Image
7
- from transformers import AlbertTokenizer, AutoModelForCausalLM
8
 
9
- tokenizer = AlbertTokenizer.from_pretrained('dccuchile/bert-base-spanish-wwm-uncased')
10
- model = AutoModelForCausalLM.from_pretrained('dccuchile/bert-base-spanish-wwm-uncased')
11
  os.environ["TOKENIZERS_PARALLELISM"] = "true"
12
 
13
  def generate_output(name, date_of_birth):
14
  welcome = f"Bienvenido {name}:"
15
- input_text = welcome
16
- input_ids = tokenizer.encode(input_text, return_tensors="pt")
17
- output = model.generate(input_ids, max_length=60, num_return_sequences=1)
18
- generated_text = tokenizer.decode(output[0])
19
  generated_text = generated_text.replace(input_text, "").strip()
 
 
20
 
21
  try:
22
  tts = gTTS(generated_text, lang='es')
 
3
  import subprocess
4
  from gtts import gTTS
5
  from pydub import AudioSegment
6
+ from transformers import GPT2LMHeadModel, GPT2Tokenizer, pipeline
7
  from PIL import Image
 
8
 
9
+ generator = pipeline('text-generation', model="checkpoints")
10
+ tokenizer = GPT2Tokenizer.from_pretrained('checkpoints')
11
  os.environ["TOKENIZERS_PARALLELISM"] = "true"
12
 
13
  def generate_output(name, date_of_birth):
14
  welcome = f"Bienvenido {name}:"
15
+ input_tokens = tokenizer.encode(add_special_tokens=True)
16
+ input_text = tokenizer.decode(input_tokens)
17
+ gpt2_output = welcome + generator(input_text, max_length=60, do_sample=True, temperature=0.6)
18
+ generated_text = gpt2_output[0]['generated_text']
19
  generated_text = generated_text.replace(input_text, "").strip()
20
+ if len(gpt2_output) == 0 or 'generated_text' not in gpt2_output[0]:
21
+ return None, "No se pudo generar el texto."
22
 
23
  try:
24
  tts = gTTS(generated_text, lang='es')