Spaces:

Abhijit-192-168-1-1
/

example_LLM2Vec

Sleeping

Abhijit-192-168-1-1 committed on Jul 15, 2024

Commit

77be9aa

1 Parent(s): ffce486

modified app.py

Files changed (1) hide show

app.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import gradio as gr
 from llm2vec import LLM2Vec
 from transformers import AutoTokenizer, AutoModel, AutoConfig
 from peft import PeftModel
 import torch
-import os
 torch.backends.cuda.enable_mem_efficient_sdp(False)
 torch.backends.cuda.enable_flash_sdp(False)
@@ -18,7 +18,6 @@ if not GROQ_API_KEY or not HF_TOKEN:
 os.environ['GROQ_API_KEY'] = GROQ_API_KEY
 os.environ['HF_TOKEN'] = HF_TOKEN
 # Load tokenizer and model
 tokenizer = AutoTokenizer.from_pretrained("McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp")
 config = AutoConfig.from_pretrained("McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp", trust_remote_code=True)
@@ -40,8 +39,8 @@ def encode_text(input_text):
 # Define Gradio interface
 iface = gr.Interface(
     fn=encode_text,
-    inputs=gr.inputs.Textbox(lines=2, placeholder="Enter text here..."),
-    outputs=gr.outputs.JSON()
 )
 # Launch Gradio app

+import os
 import gradio as gr
 from llm2vec import LLM2Vec
 from transformers import AutoTokenizer, AutoModel, AutoConfig
 from peft import PeftModel
 import torch
 torch.backends.cuda.enable_mem_efficient_sdp(False)
 torch.backends.cuda.enable_flash_sdp(False)
 os.environ['GROQ_API_KEY'] = GROQ_API_KEY
 os.environ['HF_TOKEN'] = HF_TOKEN
 # Load tokenizer and model
 tokenizer = AutoTokenizer.from_pretrained("McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp")
 config = AutoConfig.from_pretrained("McGill-NLP/LLM2Vec-Sheared-LLaMA-mntp", trust_remote_code=True)
 # Define Gradio interface
 iface = gr.Interface(
     fn=encode_text,
+    inputs=gr.Textbox(lines=2, placeholder="Enter text here..."),
+    outputs=gr.JSON()
 )
 # Launch Gradio app