# JAM / app.py
# renhang · update · a1ddd2f · 5.97 kB
# (page links: raw, history, blame)
import spaces
import gradio as gr
import os
import json
import tempfile
from pathlib import Path
from model import Jamify
from utils import json_to_text, text_to_json
# Initialize the Jamify model once
# The instance is built at import time and stored in a module-level name;
# generate_song() below calls predict() on this same object.
print("Initializing Jamify model...")
jamify_model = Jamify()
print("Jamify model ready.")
# Register the absolute current working directory as a Gradio static path.
gr.set_static_paths(paths=[Path.cwd().absolute()])
@spaces.GPU(duration=100)
def generate_song(reference_audio, lyrics_text, style_prompt, duration):
    """Generate a song and return whatever the model's ``predict`` returns.

    The lyrics text is converted with ``text_to_json`` and written to a
    temporary ``.json`` file, because ``jamify_model.predict`` receives the
    lyrics as a file path. The temporary file is removed before this
    function exits, whether generation succeeds or raises.

    Args:
        reference_audio: Path of the style reference file. An empty string
            or ``None`` means no reference was supplied.
        lyrics_text: Lyrics in the text format accepted by ``text_to_json``.
        style_prompt: Text description of the desired style.
        duration: Requested duration, forwarded as ``duration_sec``.

    Returns:
        The value returned by ``jamify_model.predict`` (wired to the output
        audio component by the caller).
    """
    # Normalise "nothing uploaded" (empty string / None) to None.
    reference_audio = reference_audio or None

    # Convert the text format to the JSON structure the model reads.
    lyrics_json = text_to_json(lyrics_text)

    lyrics_file = None
    try:
        # delete=False: the file has to survive the `with` block so it can be
        # reopened by name; it is removed explicitly in `finally`. Writing
        # happens inside the `try` so a failed dump does not leak the file.
        with tempfile.NamedTemporaryFile(
            mode='w', suffix='.json', delete=False, encoding='utf-8'
        ) as f:
            lyrics_file = f.name
            json.dump(lyrics_json, f, indent=2)

        return jamify_model.predict(
            reference_audio_path=reference_audio,
            lyrics_json_path=lyrics_file,
            style_prompt=style_prompt,
            duration_sec=duration,
        )
    finally:
        # Clean up the temporary file; it may already be gone.
        if lyrics_file is not None:
            try:
                os.unlink(lyrics_file)
            except FileNotFoundError:
                pass
# Load and cache examples
def load_examples():
    """Load the bundled examples and pre-compute their lyrics text.

    Reads ``examples/input.json`` relative to the current working directory.
    Each entry is a mapping that may carry ``id``, ``audio_path``,
    ``lrc_path`` and ``duration``. For every entry whose ``lrc_path`` exists,
    the JSON lyrics file is loaded and converted once with ``json_to_text``.
    A failure while loading one entry's lyrics is printed and that entry
    keeps an empty lyrics text.

    Returns:
        A list of dicts with the keys ``id``, ``audio_path`` (``None`` when
        the file does not exist), ``lyrics_text`` (``""`` when no lyrics
        could be loaded) and ``duration`` (120 when the entry has none).
        The list is empty when the examples file does not exist.
    """
    examples = []
    examples_file = "examples/input.json"
    if not os.path.exists(examples_file):
        return examples

    print("Loading and caching examples...")
    with open(examples_file, 'r', encoding='utf-8') as f:
        examples_data = json.load(f)

    for example in examples_data:
        example_id = example.get('id', '')
        # `or ''` also covers an explicit JSON null, which os.path.exists()
        # would otherwise reject with a TypeError.
        audio_path = example.get('audio_path') or ''
        lrc_path = example.get('lrc_path') or ''
        duration = example.get('duration', 120)

        # Load lyrics and convert to text format (pre-computed/cached)
        lyrics_text = ""
        if os.path.exists(lrc_path):
            try:
                with open(lrc_path, 'r', encoding='utf-8') as lrc_file:
                    lyrics_json = json.load(lrc_file)
                lyrics_text = json_to_text(lyrics_json)
                print(f"Cached example {example_id}: {len(lyrics_text)} chars")
            except Exception as e:
                # Deliberately broad: one unreadable or malformed lyrics file
                # must not prevent the remaining examples from loading.
                print(f"Error loading lyrics from {lrc_path}: {e}")

        examples.append({
            'id': example_id,
            'audio_path': audio_path if os.path.exists(audio_path) else None,
            'lyrics_text': lyrics_text,
            'duration': duration,
        })

    print(f"Loaded {len(examples)} cached examples")
    return examples
def load_example(example_idx, examples):
    """Return ``(audio_path, lyrics_text, duration)`` for one cached example.

    Args:
        example_idx: Zero-based position in ``examples``.
        examples: List of example dicts carrying the keys ``audio_path``,
            ``lyrics_text`` and ``duration``.

    Returns:
        The three fields of the selected example, or ``(None, "", 120)``
        when ``example_idx`` is negative or past the end of the list.
    """
    # Guard clause: anything outside the valid range yields the blank form.
    if not (0 <= example_idx < len(examples)):
        return None, "", 120

    chosen = examples[example_idx]
    return chosen['audio_path'], chosen['lyrics_text'], chosen['duration']
# Load examples at startup
examples = load_examples()
# Get default values from first example
# load_example() returns the first example's (audio_path, lyrics_text,
# duration), or (None, "", 120) when the list is empty, so the initial form
# values and the example buttons share a single fallback rule.
default_audio, default_lyrics, default_duration = load_example(0, examples)
# Gradio interface
with gr.Blocks() as demo:
    gr.Markdown("# Jamify: Music Generation from Lyrics and Style")
    gr.Markdown("Provide your lyrics, a style reference (either an audio file or a text prompt), and a desired duration to generate a song.")

    # Sample buttons section: one small button per cached example, in a row.
    if examples:
        gr.Markdown("### Sample Examples")
        with gr.Row():
            example_buttons = [
                gr.Button(f"Example {sample['id']}", variant="secondary", size="sm")
                for sample in examples
            ]

    with gr.Row():
        # Left column: everything the user provides.
        with gr.Column():
            gr.Markdown("### Inputs")
            lyrics_text = gr.Textbox(
                value=default_lyrics,
                label="Lyrics",
                lines=10,
                placeholder="Enter lyrics in format: word[start:end] word[start:end]...\nExample: It's[4.96:5.52] a[5.52:5.84] long[5.84:6.16] way[6.16:6.48]...",
            )
            # NOTE(review): with minimum=5 and step=30 the step grid is
            # 5, 35, ..., 215, so neither the fallback default of 120 nor the
            # maximum of 230 lies on it — confirm this is intended.
            duration_slider = gr.Slider(
                label="Duration (seconds)",
                minimum=5,
                maximum=230,
                step=30,
                value=default_duration,
            )

            # The style can come from a reference file or from a text prompt.
            with gr.Tab("Style from Audio"):
                reference_audio = gr.File(
                    label="Reference Audio (.mp3, .wav)",
                    type="filepath",
                    value=default_audio,
                )
            with gr.Tab("Style from Text"):
                style_prompt = gr.Textbox(
                    label="Style Prompt",
                    lines=3,
                    placeholder="e.g., A high-energy electronic dance track with a strong bassline and euphoric synths.",
                )

            generate_button = gr.Button("Generate Song", variant="primary")

        # Right column: the generated result.
        with gr.Column():
            gr.Markdown("### Output")
            output_audio = gr.Audio(label="Generated Song")

    # Run generate_song on click; the input order matches its parameter order.
    generate_button.click(
        fn=generate_song,
        inputs=[reference_audio, lyrics_text, style_prompt, duration_slider],
        outputs=output_audio,
        api_name="generate_song",
    )

    # Connect example buttons to load data
    if examples:
        for position, trigger in enumerate(example_buttons):
            # The default argument freezes the index for this button; a plain
            # closure would see only the loop's final value.
            trigger.click(
                fn=lambda idx=position: load_example(idx, examples),
                outputs=[reference_audio, lyrics_text, duration_slider],
            )
# Create necessary temporary directories for Gradio
print("Creating temporary directories...")
try:
    os.makedirs("/tmp/gradio", exist_ok=True)
except OSError as e:
    # Best effort: a directory that cannot be created is reported, and the
    # app still launches. Only filesystem errors are expected here, so
    # nothing broader is caught.
    print(f"Warning: Could not create temporary directories: {e}")
else:
    print("Temporary directories created successfully.")

# Enable request queuing, then start the app.
demo.queue().launch()