# NOTE: file-viewer residue removed here (the "File size: 8,117 Bytes" banner,
# the per-line commit hashes and the 1-207 line-number gutter); none of it was
# ever part of the program.
# Import necessary libraries
from transformers import MusicgenForConditionalGeneration
from transformers import AutoProcessor
import scipy
import streamlit as st
# Set a random seed for reproducibility
import torch
# Configure the Streamlit app with a custom page title.
# The call head was missing, which left a bare `page_title="Plant Orchestra",`
# statement that merely bound a one-element tuple and configured nothing.
# TODO(review): the original also set a custom icon; its value is not
# recoverable from this file, so restore `page_icon=...` once known.
st.set_page_config(page_title="Plant Orchestra")
# Initialize the model for generating music
@st.cache_resource
def _load_pretrained(checkpoint):
    """Load the processor and model for ``checkpoint`` and cache the pair.

    Kept separate from ``initialise_model`` so that only successful loads are
    cached: an exception raised here propagates without being stored, so a
    later rerun can retry the load.
    """
    processor = AutoProcessor.from_pretrained(checkpoint)
    model = MusicgenForConditionalGeneration.from_pretrained(checkpoint)
    return processor, model


def initialise_model():
    """
    Initialize the model for generating music using Hugging Face Transformers.

    This function loads a pre-trained processor and model from the
    "facebook/musicgen-small" checkpoint. The load is wrapped in a Streamlit
    resource cache, so repeated calls within the application reuse the same
    objects instead of loading them again.

    Returns:
        Tuple[Optional[AutoProcessor], Optional[MusicgenForConditionalGeneration]]:
        A tuple containing the processor and model if initialization is
        successful. If an error occurs during initialization, the error is
        reported with ``st.error`` and the function returns None for both
        elements of the tuple.

    Example:
        processor, model = initialise_model()
        if processor is not None and model is not None:
            # Model is successfully initialized, and you can use it for music generation.
            ...
        else:
            # Handle initialization error.
            ...
    """
    try:
        # Load the processor and model from the pretrained model checkpoint
        return _load_pretrained("facebook/musicgen-small")
    except Exception as e:
        # Handle any errors that may occur during model initialization
        st.error(f"Error initializing the model: {e}")
        return None, None
# Call the 'initialise_model' function to set up the processor and model.
# Both names are None when initialization failed, so the code below checks
# them before generating audio.
processor, model = initialise_model()
# Generate audio with given prompt
def generate_audio(processor, model, prompt):
    """
    Generate audio based on a given prompt using a pre-trained model.

    This function takes a processor and model, which are responsible for
    processing the input and generating audio, and a user-provided prompt to
    create a musical piece.

    Args:
        processor (AutoProcessor): A pre-trained processor for text-to-sequence tasks.
        model (MusicgenForConditionalGeneration): A pre-trained model for generating music.
        prompt (str): The user-provided text prompt to guide music generation.

    Returns:
        Union[None, torch.Tensor]: If the audio generation is successful, it
        returns a tensor containing the generated audio. If the processor or
        model is None, or an error occurs during generation, the function
        returns None (errors are also reported with ``st.error``).

    Example:
        processor, model = initialise_model()
        if processor is not None and model is not None:
            audio_data = generate_audio(processor, model, "Sunflower, temperature: 32.5 C, UV light intensity: 50%, Soil water level: 3cm/h")
            if audio_data is not None:
                # Use the generated audio for further processing or display.
                ...
            else:
                # Handle audio generation error.
                ...
        else:
            # Handle model initialization error.
            ...
    """
    # Nothing can be generated without both halves of the pipeline.
    if processor is None or model is None:
        return None

    try:
        # Prepare the input for the model by tokenizing and converting the text to tensors.
        inputs = processor(
            text=[prompt],
            padding=True,
            return_tensors="pt",
        )

        # Generate audio based on the processed input using the pre-trained model.
        audio_values = model.generate(
            **inputs.to("cpu"),  # Ensure computation on the CPU
            do_sample=True,  # Enable sampling for creative output
            guidance_scale=3,  # Adjust the guidance scale (you can customize)
            max_new_tokens=256,  # Limit the length of generated audio (you can customize)
        )
        return audio_values
    except Exception as e:
        # Handle any exceptions that may occur during audio generation.
        st.error(f"Error generating audio: {e}")
        return None
# Save audio file with scipy
def save_file(model, audio_values, filename):
    """
    Save audio data as a WAV file using the SciPy library.

    Args:
        model: The pre-trained model used for audio generation. Its
            ``config.audio_encoder.sampling_rate`` supplies the WAV sample rate.
        audio_values (torch.Tensor): The tensor containing the generated audio
            data. Only the element at index ``[0, 0]`` is written.
        filename (str): The desired filename for the saved WAV file.

    Returns:
        None

    Example:
        save_file(model, audio_data, "generated_audio.wav")
    """
    # Import the submodule explicitly: a bare `import scipy` is not guaranteed
    # to make `scipy.io.wavfile` available as an attribute.
    from scipy.io import wavfile

    # Get the sampling rate from the model's configuration
    sampling_rate = model.config.audio_encoder.sampling_rate

    # Write the audio data to a WAV file with the specified filename
    wavfile.write(filename, rate=sampling_rate, data=audio_values[0, 0].cpu().numpy())
# Main Code
st.title("Plant Orchestra 🌿")
st.markdown("Generate music based on your own terrarium plants.")

prompt = st.text_area(label='Data collected from terrarium:', placeholder='Enter data here...')

if st.button("Generate Music"):
    if not prompt.strip():
        # Don't spend a slow generation pass on an empty prompt.
        st.warning("Please enter some terrarium data before generating music.")
    elif processor is not None and model is not None:
        with st.spinner("Generating audio..."):
            results = generate_audio(processor, model, prompt)

        if results is not None:
            sampling_rate = model.config.audio_encoder.sampling_rate
            st.write("Listen to the generated music:")
            # Raw sample arrays carry no rate of their own, so it is passed
            # explicitly alongside the waveform at index [0, 0].
            st.audio(
                sample_rate=sampling_rate,
                data=results[0, 0].cpu().numpy(),
                format="audio/wav",
            )
# Sidebar: How-to-use
st.sidebar.header("How to Use:")

# Numbered usage steps, rendered top to bottom in the sidebar.
for instruction in (
    "1. Enter data collected from terrarium in the text input.",
    "2. Click the 'Generate Music' button to create music based on the provided input.",
    "3. You can listen to the generated music and download it.",
):
    st.sidebar.write(instruction)
# Sidebar: Samples
st.sidebar.header('Samples 🎵')

# The sample readings had lost their enclosing call and string quotes and sat
# in the file as bare (invalid) lines. Each trailing "\n" plus the physical
# line break yields a blank line, so every reading renders as its own paragraph.
# NOTE(review): any audio player that accompanied a sample is missing and its
# file path is not recoverable from here -- restore it if one existed.

# Sample 1
st.sidebar.write('''
holland moss, bioelectric levels: 2.1 watts\n
oak leaf fig, bioelectric levels: 3.7 watts\n
baby tears, bioelectric levels: 2.5 watts\n
pilea, bioelectric levels: 1.2 watts\n
temperature: 30C\n
humidity: 90%\n
ultraviolet index: 3
''')

# Sample 2
st.sidebar.write('''
hydrocotyle tripartita, bioelectric levels: 3.5 watts\n
malayan moss, bioelectric levels: 5.3 watts\n
artillery plant, bioelectric levels: 1.7 watts\n
nerve plant, bioelectric levels: 1.8 watts\n
temperature: 32C\n
humidity: 84%\n
ultraviolet index: 2
''')
# Option to hear more audios
show_more_plant_audio = st.sidebar.checkbox('Show more audios of terrarium plants')

if show_more_plant_audio:
    # (label, WAV path) pairs; each label is followed by its audio player.
    # The label and player calls had been fused into one invalid line per plant.
    plant_recordings = (
        ('Holland moss', 'sound/holland_moss.wav'),
        ('Nerve plant', 'sound/nerve_plant.wav'),
        ('Baby tears', 'sound/baby_tears.wav'),
        ('Artillery plant', 'sound/artillery_plant.wav'),
        ('Malayan moss', 'sound/malayan_moss.wav'),
        ('Hydrocotyle tripartita', 'sound/hydrocotyle_tripartita.wav'),
        ('Oak leaf fig', 'sound/oak_leaf_fig.wav'),
    )
    for plant_name, wav_path in plant_recordings:
        st.sidebar.write(plant_name)
        st.sidebar.audio(wav_path)
# Credit the underlying model. The Markdown link had lost its target (it ended
# in "](" with no URL), so it now points at the checkpoint this app loads.
# NOTE(review): confirm this is the intended destination.
st.sidebar.write("This app is built with [MusicGen by Meta](https://huggingface.co/facebook/musicgen-small)")

# Footer
st.markdown("Created with ❤️ by HS2912 W4 Group 2")