Spaces:

PatienceIzere
/

AudioTranscriber

Running

App Files Community

PatienceIzere committed on 11 days ago

Commit

7bcfa4d

verified ·

1 Parent(s): a6e99c9

Update app.py

Browse files

Files changed (1) hide show

app.py +54 -15

app.py CHANGED Viewed

@@ -25,21 +25,34 @@ def init_recording():
         from hf_transcriber import HFTranscriber
         from recorder import AudioRecorder, list_audio_devices
-        # Update config
-        app_config['RECORDING_ENABLED'] = True
         app_config['AudioRecorder'] = AudioRecorder
         app_config['list_audio_devices'] = list_audio_devices
         # Try to list audio devices to verify everything works
-        app_config['AUDIO_DEVICES'] = list_audio_devices()
         return True
     except ImportError as e:
-        st.warning(f"Some features may be limited: {str(e)}")
         app_config['RECORDING_ENABLED'] = False
         return False
     except Exception as e:
-        st.warning(f"Audio device initialization failed: {str(e)}")
         app_config['RECORDING_ENABLED'] = False
         return False
@@ -75,7 +88,14 @@ def main():
     st.title("🎵 Audio to Sheet Music Transcriber")
     st.markdown("### Convert monophonic audio to sheet music")
-    # Initialize session state for recording
     if app_config['RECORDING_ENABLED']:
         if 'recorder' not in st.session_state:
             try:
@@ -85,24 +105,43 @@ def main():
                 st.error(f"Failed to initialize audio recorder: {str(e)}")
                 app_config['RECORDING_ENABLED'] = False
-    st.sidebar.header("Transcription Settings")
-    use_hf = st.sidebar.checkbox("Use Hugging Face Model", value=True)
     # Initialize model_name with a default value
-    model_name = "microsoft/speecht5_asr"
     if use_hf:
-        model_name = st.sidebar.selectbox(
             "Select Model",
-            ["microsoft/speecht5_asr", "facebook/wav2vec2-base-960h"],
             index=0
         )
     # Audio Input Section
-    st.sidebar.header("Audio Input")
-    # Always show file upload option
-    input_method = st.sidebar.radio("Choose input method:",
-                                  ["Upload Audio File"] + (["Record Live Audio"] if app_config['RECORDING_ENABLED'] else []))
     audio_file = None

         from hf_transcriber import HFTranscriber
         from recorder import AudioRecorder, list_audio_devices
+        # Update config with recording components
         app_config['AudioRecorder'] = AudioRecorder
         app_config['list_audio_devices'] = list_audio_devices
         # Try to list audio devices to verify everything works
+        try:
+            devices = list_audio_devices()
+            app_config['AUDIO_DEVICES'] = devices
+            if not devices or not any(d.get('max_input_channels', 0) > 0 for d in devices):
+                st.warning("⚠️ No input devices with recording capability found. Using fallback mode.")
+                app_config['RECORDING_ENABLED'] = False
+            else:
+                app_config['RECORDING_ENABLED'] = True
+        except Exception as e:
+            st.warning(f"⚠️ Could not detect audio devices: {str(e)}. Using fallback mode.")
+            app_config['RECORDING_ENABLED'] = False
+            app_config['AUDIO_DEVICES'] = []
         return True
     except ImportError as e:
+        st.warning(f"⚠️ Some features may be limited: {str(e)}")
         app_config['RECORDING_ENABLED'] = False
         return False
     except Exception as e:
+        st.warning(f"⚠️ Audio initialization failed: {str(e)}. Using fallback mode.")
         app_config['RECORDING_ENABLED'] = False
         return False
     st.title("🎵 Audio to Sheet Music Transcriber")
     st.markdown("### Convert monophonic audio to sheet music")
+    # Show warning if no audio devices are available
+    if not app_config['RECORDING_ENABLED']:
+        st.warning("""
+        ⚠️ **No audio recording devices detected**
+        You can still use this app by uploading audio files for transcription.
+        """, icon="⚠️")
+    # Initialize session state for recording if enabled
     if app_config['RECORDING_ENABLED']:
         if 'recorder' not in st.session_state:
             try:
                 st.error(f"Failed to initialize audio recorder: {str(e)}")
                 app_config['RECORDING_ENABLED'] = False
+    # Sidebar settings
+    st.sidebar.header("🔧 Transcription Settings")
+    # Model selection
+    use_hf = st.sidebar.checkbox("Use Hugging Face Model", value=True,
+                               help="Use pre-trained models from Hugging Face for better accuracy")
     # Initialize model_name with a default value
+    model_name = "openai/whisper-small"  # Default to whisper for better accuracy
     if use_hf:
+        model_options = {
+            "Whisper Small (Recommended)": "openai/whisper-small",
+            "Whisper Base": "openai/whisper-base",
+            "Wav2Vec2 Base": "facebook/wav2vec2-base-960h",
+            "SpeechT5": "microsoft/speecht5_asr"
+        }
+        model_display = st.sidebar.selectbox(
             "Select Model",
+            options=list(model_options.keys()),
             index=0
         )
+        model_name = model_options[model_display]
     # Audio Input Section
+    st.sidebar.header("🎤 Audio Input")
+    # Input method selection
+    input_methods = ["Upload Audio File"]
+    if app_config['RECORDING_ENABLED']:
+        input_methods.append("Record Live Audio")
+    input_method = st.sidebar.radio(
+        "Choose input method:",
+        input_methods,
+        help="Select how you want to provide the audio for transcription"
+    )
     audio_file = None