Spaces:
Running
on
Zero
Running
on
Zero
import spaces | |
import gradio as gr | |
import os | |
import json | |
import tempfile | |
from pathlib import Path | |
from model import Jamify | |
from utils import json_to_text, text_to_json | |
# Build the model a single time at module load; generate_song() reuses this
# shared instance for every request.
print("Initializing Jamify model...")
jamify_model = Jamify()
print("Jamify model ready.")

# Register the current working directory as a Gradio static path.
gr.set_static_paths(
    paths=[Path.cwd().absolute()],
)
def generate_song(reference_audio, lyrics_text, style_prompt, duration):
    """Generate a song with the shared Jamify model.

    Args:
        reference_audio: Path of the uploaded reference audio; an empty
            string or ``None`` means no reference was provided.
        lyrics_text: Lyrics in the textbox format, converted to JSON with
            ``text_to_json`` before being handed to the model.
        style_prompt: Text style description, forwarded unchanged.
        duration: Requested duration, forwarded as ``duration_sec``.

    Returns:
        The value returned by ``jamify_model.predict`` (wired to the audio
        output component).
    """
    # Collapse "no upload" (empty string / None) to None for the model.
    reference_audio = reference_audio or None

    # Convert text format to JSON before touching the filesystem.
    lyrics_json = text_to_json(lyrics_text)

    lyrics_file = None
    try:
        # delete=False because the model re-opens the file by path; the
        # finally clause below is responsible for removing it.
        with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as f:
            # Record the name before writing so a failed json.dump still
            # gets its half-written file cleaned up.
            lyrics_file = f.name
            json.dump(lyrics_json, f, indent=2)

        return jamify_model.predict(
            reference_audio_path=reference_audio,
            lyrics_json_path=lyrics_file,
            style_prompt=style_prompt,
            duration_sec=duration,
        )
    finally:
        # Clean up temporary file
        if lyrics_file is not None:
            try:
                os.unlink(lyrics_file)
            except FileNotFoundError:
                # Already removed elsewhere; nothing left to clean up.
                pass
# Load and cache examples
def load_examples():
    """Load examples from the examples directory and pre-compute text formats.

    Reads ``examples/input.json`` (relative to the working directory). Each
    entry may provide ``id``, ``audio_path``, ``lrc_path`` and ``duration``;
    missing or null paths are treated as "not available".

    Returns:
        A list of dicts with the keys ``id``, ``audio_path`` (``None`` when
        the file does not exist), ``lyrics_text`` (``""`` when the lyrics
        could not be loaded) and ``duration`` (default 120). The list is
        empty when the index file does not exist.
    """
    examples = []
    examples_file = "examples/input.json"

    if not os.path.exists(examples_file):
        return examples

    print("Loading and caching examples...")
    with open(examples_file, 'r', encoding='utf-8') as index_file:
        examples_data = json.load(index_file)

    for example in examples_data:
        example_id = example.get('id', '')
        # ``or ''`` also covers an explicit JSON null, which would otherwise
        # make os.path.exists() raise TypeError.
        audio_path = example.get('audio_path') or ''
        lrc_path = example.get('lrc_path') or ''
        duration = example.get('duration', 120)

        # Load lyrics and convert to text format (pre-computed/cached)
        lyrics_text = ""
        if os.path.exists(lrc_path):
            try:
                with open(lrc_path, 'r', encoding='utf-8') as lrc_file:
                    lyrics_json = json.load(lrc_file)
                lyrics_text = json_to_text(lyrics_json)
                print(f"Cached example {example_id}: {len(lyrics_text)} chars")
            except Exception as e:
                # Best-effort: a broken lyrics file must not prevent the
                # remaining examples from loading.
                print(f"Error loading lyrics from {lrc_path}: {e}")

        examples.append({
            'id': example_id,
            'audio_path': audio_path if os.path.exists(audio_path) else None,
            'lyrics_text': lyrics_text,
            'duration': duration,
        })

    print(f"Loaded {len(examples)} cached examples")
    return examples
def load_example(example_idx, examples):
    """Return ``(audio_path, lyrics_text, duration)`` for one cached example.

    When ``example_idx`` does not address an entry of ``examples`` the
    fallback triple ``(None, "", 120)`` is returned instead.
    """
    # Guard clause: anything outside the valid index range gets the fallback.
    if not (0 <= example_idx < len(examples)):
        return None, "", 120

    chosen = examples[example_idx]
    return tuple(chosen[key] for key in ('audio_path', 'lyrics_text', 'duration'))
# Read the bundled examples once while the module is loading.
examples = load_examples()

# Seed the UI defaults from the first example; load_example() supplies the
# (None, "", 120) fallback when no examples are available.
default_audio, default_lyrics, default_duration = load_example(0, examples)
# Gradio interface: layout first, event wiring afterwards.
with gr.Blocks() as demo:
    gr.Markdown("# Jamify: Music Generation from Lyrics and Style")
    gr.Markdown("Provide your lyrics, a style reference (either an audio file or a text prompt), and a desired duration to generate a song.")

    # One small button per cached example (only rendered when examples exist).
    if examples:
        gr.Markdown("### Sample Examples")
        with gr.Row():
            example_buttons = [
                gr.Button(f"Example {example['id']}", variant="secondary", size="sm")
                for example in examples
            ]

    with gr.Row():
        # Left column: everything the user provides.
        with gr.Column():
            gr.Markdown("### Inputs")
            lyrics_text = gr.Textbox(
                label="Lyrics",
                lines=10,
                placeholder="Enter lyrics in format: word[start:end] word[start:end]...\nExample: It's[4.96:5.52] a[5.52:5.84] long[5.84:6.16] way[6.16:6.48]...",
                value=default_lyrics,
            )
            # NOTE(review): with minimum=5 and step=30 the step grid is
            # 5, 35, ..., 215, so the default 120 and the maximum 230 are not
            # on it - confirm this is intended.
            duration_slider = gr.Slider(
                minimum=5,
                maximum=230,
                value=default_duration,
                step=30,
                label="Duration (seconds)",
            )

            # The style can come from a reference file or from a text prompt.
            with gr.Tab("Style from Audio"):
                reference_audio = gr.File(
                    label="Reference Audio (.mp3, .wav)",
                    type="filepath",
                    value=default_audio,
                )
            with gr.Tab("Style from Text"):
                style_prompt = gr.Textbox(
                    label="Style Prompt",
                    lines=3,
                    placeholder="e.g., A high-energy electronic dance track with a strong bassline and euphoric synths.",
                )

            generate_button = gr.Button("Generate Song", variant="primary")

        # Right column: the generated result.
        with gr.Column():
            gr.Markdown("### Output")
            output_audio = gr.Audio(label="Generated Song")

    # Run generate_song on click; also exposed under the "generate_song" API name.
    generate_button.click(
        fn=generate_song,
        inputs=[reference_audio, lyrics_text, style_prompt, duration_slider],
        outputs=output_audio,
        api_name="generate_song",
    )

    # Each example button fills the audio, lyrics and duration inputs.
    if examples:
        for position, example_button in enumerate(example_buttons):
            example_button.click(
                # Bind the index as a default so every button keeps its own value.
                fn=lambda idx=position: load_example(idx, examples),
                outputs=[reference_audio, lyrics_text, duration_slider],
            )
# Create necessary temporary directories for Gradio
print("Creating temporary directories...")
try:
    os.makedirs("/tmp/gradio", exist_ok=True)
except OSError as e:
    # Best-effort: a failure here is reported but must not stop the app
    # from launching.
    print(f"Warning: Could not create temporary directories: {e}")
else:
    print("Temporary directories created successfully.")

# Enable the request queue and start serving the interface.
demo.queue().launch()