Spaces:

declare-lab
/

JAM

Running on Zero

App Files Community

renhang committed 15 days ago

Commit

8e872fa

1 Parent(s): bd37c28

update code without examples

Browse files

Files changed (3) hide show

app.py +68 -7
model.py +15 -1
utils.py +1 -1

app.py CHANGED Viewed

@@ -92,6 +92,27 @@ def load_example(example_idx, examples):
         )
     return None, "", 120
 # Load examples at startup
 examples = load_examples()
@@ -105,14 +126,36 @@ with gr.Blocks() as demo:
     gr.Markdown("# Jamify: Music Generation from Lyrics and Style")
     gr.Markdown("Provide your lyrics, a style reference (either an audio file or a text prompt), and a desired duration to generate a song.")
     # Sample buttons section
     if examples:
         gr.Markdown("### Sample Examples")
         with gr.Row():
             example_buttons = []
             for i, example in enumerate(examples):
-                button = gr.Button(f"Example {example['id']}", variant="secondary", size="sm")
                 example_buttons.append(button)
     with gr.Row():
         with gr.Column():
@@ -120,10 +163,10 @@ with gr.Blocks() as demo:
             lyrics_text = gr.Textbox(
                 label="Lyrics",
                 lines=10,
-                placeholder="Enter lyrics in format: word[start:end] word[start:end]...\nExample: It's[4.96:5.52] a[5.52:5.84] long[5.84:6.16] way[6.16:6.48]...",
                 value=default_lyrics
             )
-            duration_slider = gr.Slider(minimum=5, maximum=230, value=default_duration, step=30, label="Duration (seconds)")
             with gr.Tab("Style from Audio"):
                 reference_audio = gr.File(label="Reference Audio (.mp3, .wav)", type="filepath", value=default_audio)
@@ -143,13 +186,31 @@ with gr.Blocks() as demo:
         api_name="generate_song"
     )
-    # Connect example buttons to load data
     if examples:
         for i, button in enumerate(example_buttons):
             button.click(
-                fn=lambda idx=i: load_example(idx, examples),
-                outputs=[reference_audio, lyrics_text, duration_slider]
             )
 # Create necessary temporary directories for Gradio
 print("Creating temporary directories...")
@@ -159,4 +220,4 @@ try:
 except Exception as e:
     print(f"Warning: Could not create temporary directories: {e}")
-demo.queue().launch()

         )
     return None, "", 120
+def clear_form():
+    """Clear all form inputs to allow user to create their own song"""
+    return None, "", 120  # audio, lyrics, duration
+def update_button_styles(selected_idx, total_examples):
+    """Update button styles to highlight the selected example"""
+    updates = []
+    for i in range(total_examples):
+        if i == selected_idx:
+            updates.append(gr.update(variant="primary"))
+        else:
+            updates.append(gr.update(variant="secondary"))
+    # Update "Make Your Own" button
+    if selected_idx == -1:
+        make_your_own_update = gr.update(variant="primary")
+    else:
+        make_your_own_update = gr.update(variant="secondary")
+    return updates + [make_your_own_update]
 # Load examples at startup
 examples = load_examples()
     gr.Markdown("# Jamify: Music Generation from Lyrics and Style")
     gr.Markdown("Provide your lyrics, a style reference (either an audio file or a text prompt), and a desired duration to generate a song.")
+    # State to track selected example (-1 means "Make Your Own" is selected, 0 is first example)
+    selected_example = gr.State(0 if examples else -1)
     # Sample buttons section
     if examples:
         gr.Markdown("### Sample Examples")
         with gr.Row():
             example_buttons = []
             for i, example in enumerate(examples):
+                # Use consistent button width and truncate long IDs if needed
+                button_text = example['id'][:12] + "..." if len(example['id']) > 15 else example['id']
+                # First button starts as primary (selected), others as secondary
+                initial_variant = "primary" if i == 0 else "secondary"
+                button = gr.Button(
+                    button_text,
+                    variant=initial_variant,
+                    size="sm",
+                    scale=1,  # Equal width for all buttons
+                    min_width=80  # Minimum consistent width
+                )
                 example_buttons.append(button)
+            # Add "Make Your Own" button with same sizing (starts as secondary since first example is selected)
+            make_your_own_button = gr.Button(
+                "🎵 Make Your Own",
+                variant="secondary",
+                size="sm",
+                scale=1,
+                min_width=80
+            )
     with gr.Row():
         with gr.Column():
             lyrics_text = gr.Textbox(
                 label="Lyrics",
                 lines=10,
+                placeholder="Enter lyrics with timestamps: word[start_time:end_time] word[start_time:end_time]...\n\nExample: Hello[0.0:1.2] world[1.5:2.8] this[3.0:3.8] is[4.2:4.6] my[5.0:5.8] song[6.2:7.0]\n\nFormat: Each word followed by [start_seconds:end_seconds] in brackets\nTimestamps should be in seconds with up to 2 decimal places",
                 value=default_lyrics
             )
+            duration_slider = gr.Slider(minimum=120, maximum=230, value=default_duration, step=1, label="Duration (seconds)")
             with gr.Tab("Style from Audio"):
                 reference_audio = gr.File(label="Reference Audio (.mp3, .wav)", type="filepath", value=default_audio)
         api_name="generate_song"
     )
+    # Connect example buttons to load data and update selection
     if examples:
+        def load_example_and_update_selection(idx):
+            """Load example data and update button selection state"""
+            audio, lyrics, duration = load_example(idx, examples)
+            button_updates = update_button_styles(idx, len(examples))
+            return [audio, lyrics, duration, idx] + button_updates
+        def clear_form_and_update_selection():
+            """Clear form and update button selection state"""
+            audio, lyrics, duration = clear_form()
+            button_updates = update_button_styles(-1, len(examples))
+            return [audio, lyrics, duration, -1] + button_updates
         for i, button in enumerate(example_buttons):
             button.click(
+                fn=lambda idx=i: load_example_and_update_selection(idx),
+                outputs=[reference_audio, lyrics_text, duration_slider, selected_example] + example_buttons + [make_your_own_button]
             )
+        # Connect "Make Your Own" button to clear form and update selection
+        make_your_own_button.click(
+            fn=clear_form_and_update_selection,
+            outputs=[reference_audio, lyrics_text, duration_slider, selected_example] + example_buttons + [make_your_own_button]
+        )
 # Create necessary temporary directories for Gradio
 print("Creating temporary directories...")
 except Exception as e:
     print(f"Warning: Could not create temporary directories: {e}")
+demo.queue().launch(share=True)

model.py CHANGED Viewed

@@ -173,7 +173,21 @@ class Jamify:
         if pred_audio.shape[1] > trim_samples:
             pred_audio = pred_audio[:, :trim_samples]
-        output_path = "generated_song.mp3"
         print(f"Saving audio to {output_path}")
         torchaudio.save(output_path, pred_audio, sample_rate, format="mp3")

         if pred_audio.shape[1] > trim_samples:
             pred_audio = pred_audio[:, :trim_samples]
+        import time
+        import glob
+        # Clean up old generated files (keep only last 5 files)
+        old_files = sorted(glob.glob("generated_song_*.mp3"))
+        if len(old_files) >= 5:
+            for old_file in old_files[:-4]:  # Keep last 4, delete older ones
+                try:
+                    os.remove(old_file)
+                    print(f"Cleaned up old file: {old_file}")
+                except OSError:
+                    pass
+        timestamp = int(time.time() * 1000)  # Use milliseconds for uniqueness
+        output_path = f"generated_song_{timestamp}.mp3"
         print(f"Saving audio to {output_path}")
         torchaudio.save(output_path, pred_audio, sample_rate, format="mp3")

utils.py CHANGED Viewed

@@ -121,7 +121,7 @@ def json_to_text(json_data: dict) -> str:
     words = json_data['word']
     # Group words into segments using the existing regroup_words function
-    segments = regroup_words(words, max_len=15.0, gap=0.50)
     # Convert each segment to text format
     segment_lines = []

     words = json_data['word']
     # Group words into segments using the existing regroup_words function
+    segments = regroup_words(words, max_len=5, gap=0.50)
     # Convert each segment to text format
     segment_lines = []