vtrv.vls committed
Commit 2375d69 · 1 parent: 57a81f5
Files changed (3)
  1. app.py +5 -7
  2. models.py +18 -14
  3. utils.py +1 -1
app.py CHANGED
@@ -6,7 +6,7 @@ from datetime import datetime
 import pandas as pd
 
 from utils import generate, send_to_s3
-from models import get_tiny_llama, response_tiny_llama
+from models import get_tinyllama, response_tinyllama
 from constants import css, js_code, js_light
 
 MERA_table = None
@@ -16,18 +16,16 @@ S3_SESSION = None
 
 def giga_gen(content, chat_history):
     chat_history.append([content])
-    print(chat_history)
     res = generate(chat_history,'auth_token.json')
     chat_history[-1].append(res)
     send_to_s3(res, f'protobench/giga_{str(datetime.now()).replace(" ", "_")}.json', S3_SESSION)
-    print(chat_history)
     return '', chat_history
 
 def tiny_gen(content, chat_history):
-    res = response_tiny_llama(TINY_LLAMA, content)
-    chat_history.append((content, res))
+    chat_history.append([content])
+    res = response_tinyllama(TINY_LLAMA, content)
+    chat_history[-1].append(res)
     send_to_s3(res, f'protobench/tiny_{str(datetime.now()).replace(" ", "_")}.json', S3_SESSION)
-    print(chat_history)
     return '', chat_history
 
 def tab_arena():
@@ -158,7 +156,7 @@ if __name__ == "__main__":
     # data_load(args.result_file)
     # TYPES = ["number", "markdown", "number"]
 
-    TINY_LLAMA = get_tiny_llama()
+    TINY_LLAMA = get_tinyllama()
 
     try:
         session = boto3.session.Session()
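Net effect in app.py: the debug print(chat_history) calls are dropped, the TinyLlama helpers are renamed to match models.py, and tiny_gen now builds chat history the same way giga_gen does: open a [user] turn, generate, then append the reply to that turn. A minimal sketch of that shared shape, assuming nothing beyond the diff (fake_gen and its echo reply are hypothetical stand-ins; the Gradio wiring and S3 upload are omitted):

def fake_gen(content, chat_history):
    chat_history.append([content])   # open a new [user, assistant] turn
    res = f'echo: {content}'         # stand-in for the model call
    chat_history[-1].append(res)     # close the turn with the reply
    return '', chat_history

_, history = fake_gen('hello', [])
print(history)  # [['hello', 'echo: hello']]

One thing the diff leaves open: tiny_gen still passes the raw content string, while the rewritten response_tinyllama below iterates over [user, assistant] pairs, so passing chat_history instead may have been the intent.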
models.py CHANGED
@@ -1,23 +1,27 @@
 import torch
 from transformers import pipeline
 
-def get_tiny_llama():
-    pipe = pipeline("text-generation", model="TinyLlama/TinyLlama-1.1B-Chat-v1.0", torch_dtype=torch.float16, device_map="auto")
-    return pipe
+def get_tinyllama():
+    tinyllama = pipeline("text-generation", model="TinyLlama/TinyLlama-1.1B-Chat-v1.0", torch_dtype=torch.float16, device_map="auto")
+    return tinyllama
 
-def response_tiny_llama(
-    pipe=None,
-    content="How many helicopters can a human eat in one sitting?"
+def response_tinyllama(
+    model=None,
+    messages=None
 ):
-    # We use the tokenizer's chat template to format each message - see https://huggingface.co/docs/transformers/main/en/chat_templating
-    messages = [
+
+    messages_dict = [
         {
             "role": "system",
-            "content": "You are a friendly chatbot who always responds in the style of a pirate",
-        },
-        {"role": "user", "content": content},
+            "content": "You are a friendly and helpful chatbot",
+        }
     ]
-    prompt = pipe.tokenizer.apply_chat_template(messages, tokenize=False, add_generation_prompt=True)
-    outputs = pipe(prompt, max_new_tokens=32, do_sample=True, temperature=0.7, top_k=50, top_p=0.95)
+    for step in messages:
+        messages_dict.append({'role': 'user', 'content': step[0]})
+        if len(step) >= 2:
+            messages_dict.append({'role': 'assistant', 'content': step[1]})
 
-    return outputs[0]['generated_text'].split('<|assistant|>')[1]
+    prompt = model.tokenizer.apply_chat_template(messages_dict, tokenize=False, add_generation_prompt=True)
+    outputs = model(prompt, max_new_tokens=32, do_sample=True, temperature=0.7, top_k=50, top_p=0.95)
+
+    return outputs[0]['generated_text'].split('<|assistant|>')[1].strip()
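models.py replaces the hard-coded pirate prompt with a history-aware builder: every [user, assistant] pair in messages becomes two chat-template entries, a trailing user-only turn is left open, and add_generation_prompt=True asks the template for the final <|assistant|> cue. A hedged usage sketch, assuming the per-turn list shape used in app.py (the question string is illustrative):

from models import get_tinyllama, response_tinyllama

pipe = get_tinyllama()  # text-generation pipeline over TinyLlama-1.1B-Chat-v1.0

history = [['What is the capital of France?']]  # one open [user] turn
reply = response_tinyllama(pipe, history)       # text after '<|assistant|>'
print(reply)

One caveat worth flagging: split('<|assistant|>')[1] takes the first assistant segment. That is fine for a history with no completed turns, but once earlier [user, assistant] pairs are folded in, the prompt itself already contains <|assistant|> markers (TinyLlama uses a Zephyr-style template), and [1] returns an old reply rather than the new generation; [-1] would not.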
utils.py CHANGED
@@ -57,7 +57,7 @@ def generate(content=None, auth_file=None):
         auth_token = json.load(f)
 
     if datetime.fromtimestamp(auth_token['expires_at']/1000) <= datetime.now() - timedelta(seconds=60):
-        gen_auth_token()
+        gen_auth_token(auth_file)
     with open(auth_file) as f:
         auth_token = json.load(f)
 
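The utils.py fix threads auth_file through to gen_auth_token, so the refreshed token is written to the same file that is re-read two lines later. For reference, a standalone sketch of the refresh condition (token_expired is a hypothetical name; expires_at is assumed to be a Unix timestamp in milliseconds, hence the /1000):

from datetime import datetime, timedelta

def token_expired(expires_at_ms, skew_s=60):
    # Mirrors the diff: true only once the token has already been
    # expired for at least skew_s seconds.
    expires = datetime.fromtimestamp(expires_at_ms / 1000)
    return expires <= datetime.now() - timedelta(seconds=skew_s)

stale_ms = int((datetime.now() - timedelta(minutes=2)).timestamp() * 1000)
print(token_expired(stale_ms))  # True: expired two minutes ago, so refresh

Note the comparison direction: the check only fires once the token has been expired for a full minute; comparing against datetime.now() + timedelta(seconds=60) would refresh shortly before expiry instead, which is the more common use of a 60-second skew, but the commit keeps the original comparison.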