Update app.py
app.py
CHANGED
@@ -1,25 +1,61 @@
-import
-from transformers import AutoModelForCausalLM, AutoTokenizer
import torch

-
-

-def predict(input, history=[]):
-    # tokenize the new input sentence
-    new_user_input_ids = tokenizer.encode(input + tokenizer.eos_token, return_tensors='pt')

-
-    bot_input_ids = torch.cat([torch.LongTensor(history), new_user_input_ids], dim=-1)

-
-    history =

-    # convert the tokens to text, and then split the responses into lines
-    response = tokenizer.decode(history[0]).split("<|endoftext|>")
-    response = [(response[i], response[i+1]) for i in range(0, len(response)-1, 2)]  # convert to tuples of list
-    return response, history

-gr.Interface(
-
-
+from transformers import BlenderbotTokenizer, BlenderbotForConditionalGeneration
import torch

+import gradio as gr
+
+mname = "facebook/blenderbot-400M-distill"
+model = BlenderbotForConditionalGeneration.from_pretrained(mname)
+tokenizer = BlenderbotTokenizer.from_pretrained(mname)
+
+
+def take_last_tokens(inputs, note_history, history):
+    """Filter the last 128 tokens"""
+    if inputs['input_ids'].shape[1] > 128:
+        inputs['input_ids'] = torch.tensor([inputs['input_ids'][0][-128:].tolist()])
+        inputs['attention_mask'] = torch.tensor([inputs['attention_mask'][0][-128:].tolist()])
+        note_history = ['</s> <s>'.join(note_history[0].split('</s> <s>')[2:])]
+        history = history[1:]
+
+    return inputs, note_history, history
+
+
+def add_note_to_history(note, note_history):
+    """Add a note to the historical information"""
+    note_history.append(note)
+    note_history = '</s> <s>'.join(note_history)
+    return [note_history]

+title = "Maintain a conversation with the bot"

+def chatbot(message, history):
+    history = history or []
+    if history:
+        history_useful = ['</s> <s>'.join([str(a[0])+'</s> <s>'+str(a[1]) for a in history])]
+    else:
+        history_useful = []
+
+    history_useful = add_note_to_history(message, history_useful)
+
+    inputs = tokenizer(history_useful, return_tensors="pt")
+    inputs, history_useful, history = take_last_tokens(inputs, history_useful, history)
+
+    reply_ids = model.generate(**inputs)
+    response = tokenizer.batch_decode(reply_ids, skip_special_tokens=True)[0]
+    history_useful = add_note_to_history(response, history_useful)
+
+
+    list_history = history_useful[0].split('</s> <s>')
+    history.append((list_history[-2], list_history[-1]))
+
+    return history, history


+gr.Interface(
+    fn=chatbot,
+    css=".footer {display:none !important}",
+    inputs=["text", "state"],
+    outputs=["chatbot", "state"],
+    title=title,
+    allow_flagging="never",
+).launch(debug=True)
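
For context, a minimal sketch of how the new chatbot() function could be exercised outside the Gradio interface, assuming the model, tokenizer, and helper functions defined in the updated app.py are already loaded; the two user messages below are made-up examples, not part of the commit:

# Illustrative sketch only: simulate two turns against chatbot() defined above.
history = []
history, _ = chatbot("Hello! How are you today?", history)        # hypothetical user message
history, _ = chatbot("What do you like to do on weekends?", history)
for user_msg, bot_msg in history:
    print("User:", user_msg)
    print("Bot: ", bot_msg)

Each call appends one (user, bot) pair to history, which matches the ["chatbot", "state"] outputs declared in the gr.Interface call.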