CreitinGameplays
committed on
Commit
•
bc4308f
1
Parent(s):
a487b7f
Update app.py
Browse files
app.py
CHANGED
@@ -12,7 +12,7 @@ model = AutoModelForCausalLM.from_pretrained(model_name)
|
|
12 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
13 |
model.to(device)
|
14 |
|
15 |
-
@spaces.GPU(duration=
|
16 |
def generate_text(user_prompt):
|
17 |
"""Generates text using the BLOOM model from Hugging Face Transformers and removes the user prompt."""
|
18 |
# Construct the full prompt with system introduction, user prompt, and assistant role
|
@@ -24,7 +24,7 @@ def generate_text(user_prompt):
|
|
24 |
# Generate text with the complete prompt and limit the maximum length to 256 tokens
|
25 |
output = model.generate(
|
26 |
input_ids=prompt_encoded,
|
27 |
-
max_length=
|
28 |
num_beams=1,
|
29 |
num_return_sequences=1,
|
30 |
do_sample=True,
|
|
|
12 |
device = torch.device("cuda" if torch.cuda.is_available() else "cpu")
|
13 |
model.to(device)
|
14 |
|
15 |
+
@spaces.GPU(duration=90)
|
16 |
def generate_text(user_prompt):
|
17 |
"""Generates text using the BLOOM model from Hugging Face Transformers and removes the user prompt."""
|
18 |
# Construct the full prompt with system introduction, user prompt, and assistant role
|
|
|
24 |
# Generate text with the complete prompt and limit the maximum length to 256 tokens
|
25 |
output = model.generate(
|
26 |
input_ids=prompt_encoded,
|
27 |
+
max_length=1900,
|
28 |
num_beams=1,
|
29 |
num_return_sequences=1,
|
30 |
do_sample=True,
|