Spaces:

papayaga
/

homeros_demo

Sleeping

App Files Files Community

papayaga committed on Jul 22, 2023

Commit

49a7070

1 Parent(s): 1f8e954

voice generation and first story working

Browse files

Files changed (10) hide show

README.md +4 -2
__test.py +36 -1
adaptors/llm.py +16 -9
adaptors/voice.py +11 -28
data/stories.db +0 -0
helpers/__init__.py +31 -10
homeros.py +10 -3
main.py +20 -8
prompts/__init__.py +1 -0
prompts/paraphraser.py +19 -0

README.md CHANGED Viewed

@@ -72,12 +72,14 @@ It puts the user in charge of how the story is going to develop.
 - [x] Set up flow management
 - [x] Add SQLite DB and save stories
 - [x] GPT-4 story generation in a gradio interface
-- [ ] Do the evaluator (if it's time to end)
-- [ ] Interchange text output for play.ht voice generation
 - [ ] Interchange text input for whisper
 - [ ] Dockerfile and deploy (including magic word for access control)
 ## Enhancements
 - [ ] Add option to download the full story as one .mp3
 - [ ] Add meta-moderator role to manage story arc better

 - [x] Set up flow management
 - [x] Add SQLite DB and save stories
 - [x] GPT-4 story generation in a gradio interface
+- [x] Do the evaluator (if it's time to end)
+- [x] Interchange text output for play.ht voice generation
 - [ ] Interchange text input for whisper
+- [ ] Clear input on submit
 - [ ] Dockerfile and deploy (including magic word for access control)
 ## Enhancements
 - [ ] Add option to download the full story as one .mp3
+- [ ] Add option to download full story text
 - [ ] Add meta-moderator role to manage story arc better

__test.py CHANGED Viewed

@@ -5,9 +5,44 @@ from adaptors.db import get_story, get_all_stories
 from pprint import pprint
 import json
 from loguru import logger
 def all_s():
     for s in get_all_stories():
         pprint(s.to_dict())
-all_s()

 from pprint import pprint
 import json
 from loguru import logger
+from adaptors.voice import say_new
 def all_s():
     for s in get_all_stories():
         pprint(s.to_dict())
+def say(text):
+    pprint(text)
+    return say_new(text)
+long_text = '''
+In a distant and rarely trodden corner of Middle Earth, there
+resided an unlikely hero, known to the local forest critters by the '
+rather unusual name, Slippersnail. Unlike the courageous Hobbits or '
+the formidable Elves, Slippersnail was of a forgotten forest folk, '
+a tiny creature, small as a sparrow with an oversized leaf as an '
+umbrella and a snail shell for his home. You could hardly tell if
+he was a gnome, a brownie or something else, for his kind was
+scarcely remembered, even in the oldest songs of the Elves.
+Slippersnail, barely tall enough to poke his head above the
+bracken, lived an unassuming life, busily brewing his famous
+dandelion tea and tending to his miniature garden filled with
+colorful nocturnal glow-flowers. One morning, as Slippersnail was
+pruning his glow-flowers, he found a peculiar golden leaf which
+glittered so brightly it could outshine the glow-flowers by far.
+Soon he discovered that the leaf had a magical property: it could
+create light as bright as a day where the darkness had fallen.
+The news of the magical leaf reached the ears of the Dark Lord in
+the East. Coveting the leaf to manipulate it for his evil motives,
+Sauron dispatched a band of his malevolent minions in search of
+Slippersnail and his leaf.
+Unaware of the danger, Slippersnail saw the shadow creeping over
+his garden now. But, what do you think should our little hero do
+next?
+'''
+say(long_text)

adaptors/llm.py CHANGED Viewed

@@ -4,12 +4,14 @@ an abstraction over GPT-4 for easy substitution later if needed
 import openai
 import os
 openai.api_key = os.getenv('OPENAI_KEY')
-#MODEL = 'gpt-4'
-MODEL = 'gpt-3.5-turbo'
 def answer(system_message, user_and_assistant_messages):
     messages = [{
         "role":"system",
@@ -18,11 +20,16 @@ def answer(system_message, user_and_assistant_messages):
     messages.extend(user_and_assistant_messages)
-    chat_completion = openai.ChatCompletion.create(
-        model=MODEL,
-        messages=messages
-    )
-    output = chat_completion.choices[0].message.content
-    return output

 import openai
 import os
+from tenacity import retry, wait_random_exponential, stop_after_attempt
 openai.api_key = os.getenv('OPENAI_KEY')
+MODEL = 'gpt-4'
+#MODEL = 'gpt-3.5-turbo'
+@retry(wait=wait_random_exponential(multiplier=1, max=40), stop=stop_after_attempt(3))
 def answer(system_message, user_and_assistant_messages):
     messages = [{
         "role":"system",
     messages.extend(user_and_assistant_messages)
+    try:
+        chat_completion = openai.ChatCompletion.create(
+            model=MODEL,
+            messages=messages
+        )
+        output = chat_completion.choices[0].message.content
+        return output
+    except Exception as e:
+        print("Unable to generate ChatCompletion response")
+        print(f"Exception: {e}")
+        return e

adaptors/voice.py CHANGED Viewed

@@ -6,8 +6,10 @@ import requests
 import sseclient
 from loguru import logger
 import os
 from pprint import pprint
 import json
 url = "https://play.ht/api/v2/tts"
 user_id = os.environ["PLAYHT_USERID"]
@@ -20,33 +22,12 @@ headers = {
   "X-USER-ID": user_id
 }
-voices = ["dylan"]
-#TODO pre-generate these with dylan and save locally
-fixed_sayings = {
-    "welcome": [""], #also ask magic word here
-    "wrong_magic_word": [""],
-    "let_me_ask_questions": [""],
-    "ask_world": [""],
-    "ask_hero": [""],
-    "ask_plot": [""],
-    "ask_ending": [""],
-    "ask_style": [""],
-    "its_the_end": [""],
-    "no_more_story": [""]
-}
-'''
-return an old file from a dictionary of pre-generated sayings
-'''
-def say_fixed(fixed_msg, voice):
-    #We need to keep a repository of fixed messages generated in our key voices and for each have a file URL
-    return
 '''
 generate new saying with play.ht
 '''
-def say_new(text, voice):
   payload = {
     "quality": "medium",
     "output_format": "mp3",
@@ -59,13 +40,15 @@ def say_new(text, voice):
   response = requests.post(url, stream=True, headers=headers, json=payload)
   stream_url = response.headers["content-location"]
-  logger.debug(f"stream_url = {stream_url}")
   resp = requests.get(stream_url, stream=True, headers=headers)
   client = sseclient.SSEClient(resp)
   for event in client.events():
-    if event.data:
-      e = json.loads(event.data)
-      if e["stage"] == "complete":
-        return(e["url"])

 import sseclient
 from loguru import logger
 import os
+import helpers
 from pprint import pprint
 import json
+from tenacity import retry, wait_random_exponential, stop_after_attempt
 url = "https://play.ht/api/v2/tts"
 user_id = os.environ["PLAYHT_USERID"]
   "X-USER-ID": user_id
 }
+valid_voices = ["dylan"]
 '''
 generate new saying with play.ht
 '''
+def say_new(text, voice="dylan"):
   payload = {
     "quality": "medium",
     "output_format": "mp3",
   response = requests.post(url, stream=True, headers=headers, json=payload)
   stream_url = response.headers["content-location"]
   resp = requests.get(stream_url, stream=True, headers=headers)
   client = sseclient.SSEClient(resp)
   for event in client.events():
+      if event.data:
+          #pprint(event.data)
+          if helpers.is_valid_json(event.data): # play.ht api is unreliable
+              e = json.loads(event.data)
+              if e["stage"] == "complete":
+                  return(e["url"])

data/stories.db CHANGED Viewed

Binary files a/data/stories.db and b/data/stories.db differ

helpers/__init__.py CHANGED Viewed

@@ -1,9 +1,24 @@
 import uuid
 import os
 import random
 magic_w = os.environ["MAGICWORD"]
 def gen_unique_id():
     return str(uuid.uuid4())
@@ -13,20 +28,26 @@ def check_magic_word(w):
 def get_fixed_msg(msg_type):
     fixed_sayings = {
-        "welcome": ["Welcome! What's the magic word?"], #also ask magic word here
-        "wrong_magic_word": ["Magic word is wrong. Try again."],
-        "ask_world": ["Let me ask you some questions first. What kind of world should your story unfold in?"],
-        "ask_hero": ["Who should the hero be?"],
-        "ask_plot": ["Can you describe the plot in a few words?"],
-        "ask_ending": ["What kind of ending would you like? A happy one? A tragic one? Something else?"],
-        "ask_style": ["What kind of storytelling style do you wnat? Funny? Poetic?"],
-        "its_the_end": ["And this is the end of our story. Thank you for listening."],
-        "no_more_story": ["I'm sorry, this story has ended. Reload the page to do another story."]
     }
     if msg_type in fixed_sayings:
         saying = random.choice(fixed_sayings[msg_type])
-        return saying
     else:
         raise Exception(f"fixed saying with msg_type {msg_type} not found")

 import uuid
 import os
 import random
+import prompts
+import json
+from adaptors.llm import answer
+from adaptors.voice import say_new
 magic_w = os.environ["MAGICWORD"]
+'''
+check if valid JSON
+'''
+def is_valid_json(input_string):
+    try:
+        json_object = json.loads(input_string)
+    except json.JSONDecodeError:
+        return False
+    return True
 def gen_unique_id():
     return str(uuid.uuid4())
 def get_fixed_msg(msg_type):
     fixed_sayings = {
+        "welcome": ["Welcome, welcome my friend! I'd be happy to tell you a story. But one thing first... Do you know the magic word?"],
+        "wrong_magic_word": ["Oh, my dear, I'm very sorry. But it looks like you don't know the magic word. And I'm afraid I can't tell you the story without the magic word. Please ask around for the magic word and try again then. I'll wait here."],
+        "ask_world": ["Wonderful! That is right... Get ready for a great story that you and I can create together. But before we start, let me ask you a few questions first. What kind of world would you like our story to unfold in? Maybe Middle Earth with elves and orcs? Or a distant future world full of space travel? It can be anything. Just tell me."],
+        "ask_hero": ["That sounds great. And who should our hero be?"],
+        "ask_plot": ["Splendid! Now let's think about the plot of our story. Can you describe in just a few words what our story should be all about. Maybe the hero finds the love of their life? Or maybe they travel far and wide to discover their powers and find friends... it can be anything you want. Just say it and we will make it happen."],
+        "ask_ending": ["That is great. And what kind of ending would you like our story to have? A happy one? A tragic one? Something else?"],
+        "ask_style": ["I see. Now lastly, what kind of storytelling style do you like most? Would you like our story to be funny? Or Epic? Or Poetic? You can decide!"],
+        "its_the_end": ["And this is the end of our story. Thank you, my dear, for making it with me."],
+        "no_more_story": ["I'm very sorry, my dear, but this story has ended. But you can come back again later and we will make another great story together."]
     }
     if msg_type in fixed_sayings:
         saying = random.choice(fixed_sayings[msg_type])
+        system_message = prompts.get('paraphraser')
+        paraphrased = answer(system_message, [{
+            "role" : "user",
+            "content" : saying
+        }])
+        audio = say_new(paraphrased)
+        return audio
     else:
         raise Exception(f"fixed saying with msg_type {msg_type} not found")

homeros.py CHANGED Viewed

@@ -6,8 +6,9 @@ from pprint import pprint
 from helpers import gen_unique_id
 import prompts
 from adaptors.llm import answer
-MAX_STORY_LEN = 2 #after how many chunks we force the story to end
 '''
 initiates a new story and saves in DB
@@ -52,6 +53,10 @@ def continue_story(user_input, story_data):
         "content": user_input
     })
     next_chunk_text = create_next_chunk_text(user_input, story)
     next_chunk_audio = create_next_chunk_audio(next_chunk_text)
     messages.append({
         "role":"assistant",
@@ -61,6 +66,8 @@ def continue_story(user_input, story_data):
         "text" : next_chunk_text,
         "audio_url" : next_chunk_audio
     })
     story.chunks = json.dumps(chunks)
     story.messages = json.dumps(messages)
     story.status = "ongoing"
@@ -135,7 +142,7 @@ def evaluate_story(story):
     evaluation = {}
     story_len = len(story["chunks"])
     logger.debug(story_len)
-    evaluation["is_time_to_end"] = story_len > MAX_STORY_LEN
     return evaluation
@@ -144,4 +151,4 @@ def evaluate_story(story):
 turns next story chunk into audio and returns a URL
 '''
 def create_next_chunk_audio(text):
-    return "url.com"

 from helpers import gen_unique_id
 import prompts
 from adaptors.llm import answer
+from adaptors.voice import say_new
+MAX_STORY_LEN = 3 #after how many chunks we force the story to end
 '''
 initiates a new story and saves in DB
         "content": user_input
     })
     next_chunk_text = create_next_chunk_text(user_input, story)
+    if len(chunks) == 0:
+        next_chunk_text = "May our story begin!\n\n"+next_chunk_text
     next_chunk_audio = create_next_chunk_audio(next_chunk_text)
     messages.append({
         "role":"assistant",
         "text" : next_chunk_text,
         "audio_url" : next_chunk_audio
     })
+    pprint(chunks)
+    pprint(messages)
     story.chunks = json.dumps(chunks)
     story.messages = json.dumps(messages)
     story.status = "ongoing"
     evaluation = {}
     story_len = len(story["chunks"])
     logger.debug(story_len)
+    evaluation["is_time_to_end"] = story_len >= MAX_STORY_LEN
     return evaluation
 turns next story chunk into audio and returns a URL
 '''
 def create_next_chunk_audio(text):
+    return say_new(text)

main.py CHANGED Viewed

@@ -8,12 +8,25 @@ import helpers
 from homeros import init_story, start_story, continue_story, finish_story, define_metadata, evaluate_story
 '''
 Here we manage the flow and state of the story
 '''
 def do_homeros(user_input, story):
-    pprint(story)
     # story hasn't started
     if story["status"] == "not_started":
@@ -67,7 +80,7 @@ def do_homeros(user_input, story):
         story = define_metadata(user_input, "style", story)
         story["status"] = "ongoing"
         story = start_story(story)
-        next_message = story["chunks"][-1]["text"]
     # we are in the middle of the story - evaluate if time to end, or continue
     elif story["status"] == "ongoing":
@@ -79,7 +92,7 @@ def do_homeros(user_input, story):
             story = continue_story(user_input, story)
             story["status"] = "ongoing"
-        next_message = story["chunks"][-1]["text"]
     # story has ended, but the user still inputting. tell them it's over
     elif story["status"] == "finished":
@@ -113,14 +126,12 @@ with demo:
         "full_story_text": ""
     })
-    pprint(story.value)
     with gr.Row():
         gr.Markdown('''
 # HOMEROS
 This demo is exploring the future of interactive storytelling.
-It puts the user in charge and makes blurs the boundary between the reader and the author.
 Hit "Tell me!" to get started.
@@ -135,8 +146,9 @@ When Homeros asks you something - hit record, answer with your voice and then hi
         )
     with gr.Row():
-        story_chunk = gr.Textbox(
-            label="storyteller says"
         )
     with gr.Row():

 from homeros import init_story, start_story, continue_story, finish_story, define_metadata, evaluate_story
+DEFAULT_PARAMS = True
 '''
 Here we manage the flow and state of the story
 '''
 def do_homeros(user_input, story):
+    # if default params is true - skip the asking, including magic word and just start the story
+    if DEFAULT_PARAMS and len(story["chunks"]) == 0:
+        story = init_story(story)
+        story = define_metadata("J.R.R. Tolkien's Middle Earth", "world", story)
+        story = define_metadata("I don't know. Please choose something unusual.", "hero", story)
+        story = define_metadata("I don't know. Please choose something unusual.", "plot", story)
+        story = define_metadata("Happy", "ending", story)
+        story = define_metadata("epic", "style", story)
+        story["status"] = "ongoing"
+        story = start_story(story)
+        next_message = story["chunks"][-1]["audio_url"]
+        return next_message, story
     # story hasn't started
     if story["status"] == "not_started":
         story = define_metadata(user_input, "style", story)
         story["status"] = "ongoing"
         story = start_story(story)
+        next_message = story["chunks"][-1]["audio_url"]
     # we are in the middle of the story - evaluate if time to end, or continue
     elif story["status"] == "ongoing":
             story = continue_story(user_input, story)
             story["status"] = "ongoing"
+        next_message = story["chunks"][-1]["audio_url"]
     # story has ended, but the user still inputting. tell them it's over
     elif story["status"] == "finished":
         "full_story_text": ""
     })
     with gr.Row():
         gr.Markdown('''
 # HOMEROS
 This demo is exploring the future of interactive storytelling.
+It puts the user in charge and blurs the boundary between the reader and the author.
 Hit "Tell me!" to get started.
         )
     with gr.Row():
+        story_chunk = gr.Audio(
+            label="storyteller says",
+            autoplay=True
         )
     with gr.Row():

prompts/__init__.py CHANGED Viewed

@@ -1,5 +1,6 @@
 from pprint import pprint
 from . import storyteller_general
 '''
 basic function that substitutes variables in the prompt template and returns a ready prompt

 from pprint import pprint
 from . import storyteller_general
+from . import paraphraser
 '''
 basic function that substitutes variables in the prompt template and returns a ready prompt

prompts/paraphraser.py ADDED Viewed

	@@ -0,0 +1,19 @@

+from string import Template
+'''
+paraphraser prompt
+'''
+template = Template('''
+You are a system that helps paraphrase questions and sayings slightly, without changing style or key message. Your paraphrasing should be minimal. Occasionally you can even return unchanged messages.
+The words and terms that shouldn't be changed under any circumstances and should remain in your paraphrased version unchanged:
+- magic word
+- hero
+- plot
+- world
+The user gives you text and you return back a paraphrased version of the same text. Only return  the paraphrased vesion and nothing else.
+''')