Spaces:

invincible-jha
/

vc-copilot

Sleeping

App Files Community

invincible-jha committed on Nov 25, 2024

Commit

9f71913

verified ·

1 Parent(s): 788d26b

Upload 2 files

Browse files

Files changed (1) hide show

app.py +19 -239

app.py CHANGED Viewed

@@ -1,63 +1,19 @@
-import streamlit as st
-import whisper
-import pandas as pd
-from datetime import datetime
-import tempfile
-import os
-import torch
-from transformers import (
-    AutoModelForCausalLM,
-    AutoTokenizer,
-    pipeline,
-    BitsAndBytesConfig
-)
-import gc
-from typing import Optional, Dict, Any, List
-import logging
-import json
-import numpy as np
-from dataclasses import dataclass, asdict
-from queue import Queue
-import threading
-from collections import defaultdict
-# Configure logging
-logging.basicConfig(level=logging.INFO)
-logger = logging.getLogger(__name__)
-# Constants for memory optimization
-CHUNK_SIZE = 30  # seconds
-MAX_AUDIO_LENGTH = 600  # seconds (10 minutes)
-BATCH_SIZE = 8
-# Model configurations with memory optimization
 MODEL_CONFIGS = {
-    "Mistral-7B-Instruct": {
-        "path": "mistralai/Mistral-7B-Instruct-v0.1",
-        "description": "Efficient model for real-time analysis",
-        "memory_required": "16GB"
     }
 }
-@dataclass
-class VCStyle:
-    """Store VC's personal style preferences"""
-    name: str
-    note_format: Dict[str, Any]
-    key_interests: List[str]
-    custom_sections: List[str]
-    insight_preferences: Dict[str, float]
-@dataclass
-class LiveCallContext:
-    """Store context for live calls"""
-    meeting_id: str
-    participants: List[str]
-    topics: List[str]
-    key_points: List[str]
-    questions_asked: List[str]
-    action_items: List[str]
 class ModelManager:
     """Handles model loading and resource management"""
@@ -87,13 +43,11 @@ class ModelManager:
             tokenizer = AutoTokenizer.from_pretrained(
                 config["path"],
-                token=st.secrets.get("HF_TOKEN"),
                 trust_remote_code=True
             )
             model = AutoModelForCausalLM.from_pretrained(
                 config["path"],
-                token=st.secrets.get("HF_TOKEN"),
                 quantization_config=bnb_config,
                 device_map="auto",
                 torch_dtype=torch.float16,
@@ -104,7 +58,7 @@ class ModelManager:
                 "text-generation",
                 model=model,
                 tokenizer=tokenizer,
-                max_new_tokens=512,  # Reduced for memory
                 temperature=0.7,
                 top_p=0.95,
                 repetition_penalty=1.15,
@@ -118,100 +72,6 @@ class ModelManager:
             st.error("Failed to load language model. Please try again.")
             return None
-class AudioProcessor:
-    """Handles audio processing with memory optimization"""
-    def __init__(self, model):
-        self.model = model
-        self.chunk_queue = Queue()
-    def process_audio_chunk(self, audio_chunk) -> Optional[str]:
-        try:
-            # Clear GPU memory before processing
-            if torch.cuda.is_available():
-                torch.cuda.empty_cache()
-            result = self.model.transcribe(
-                audio_chunk,
-                language="en",
-                task="transcribe",
-                fp16=True  # Use half precision
-            )
-            return result["text"]
-        except Exception as e:
-            logger.error(f"Error processing audio chunk: {e}")
-            return None
-        finally:
-            # Cleanup
-            gc.collect()
-            if torch.cuda.is_available():
-                torch.cuda.empty_cache()
-class ContentAnalyzer:
-    """Handles text analysis with optimized prompts"""
-    def __init__(self, generator):
-        self.generator = generator
-    def analyze_text(self, text: str, vc_style: VCStyle) -> Optional[Dict[str, Any]]:
-        try:
-            prompt = self._create_analysis_prompt(text, vc_style)
-            response = self._generate_response(prompt, max_length=512)
-            return self._parse_response(response)
-        except Exception as e:
-            logger.error(f"Analysis error: {e}")
-            return None
-    def _create_analysis_prompt(self, text: str, vc_style: VCStyle) -> str:
-        return f"""Analyze this startup pitch focusing on {', '.join(vc_style.key_interests)}:
-        {text}
-        Provide structured insights for:
-        1. Key Points
-        2. Metrics
-        3. Risks
-        4. Questions"""
-    def _generate_response(self, prompt: str, max_length: int) -> str:
-        try:
-            response = self.generator(
-                prompt,
-                max_new_tokens=max_length,
-                temperature=0.7,
-                top_p=0.95,
-                repetition_penalty=1.15
-            )
-            return response[0]['generated_text']
-        except Exception as e:
-            logger.error(f"Generation error: {e}")
-            return ""
-class UIManager:
-    """Manages Streamlit UI with performance optimization"""
-    @staticmethod
-    def setup_page():
-        st.set_page_config(
-            page_title="VC Call Assistant",
-            page_icon="🎙️",
-            layout="wide",
-            initial_sidebar_state="expanded"
-        )
-    @staticmethod
-    def show_file_uploader() -> Optional[Any]:
-        return st.file_uploader(
-            "Upload Audio (Max 10 minutes)",
-            type=['wav', 'mp3', 'm4a'],
-            help="Supports WAV, MP3, M4A formats. Maximum duration: 10 minutes."
-        )
-    @staticmethod
-    def show_progress(text: str) -> Any:
-        return st.progress(0, text=text)
 def main():
     try:
         # Initialize UI
@@ -220,95 +80,15 @@ def main():
         # Sidebar
         with st.sidebar:
             st.title("VC Assistant Settings")
-            model_name = "Mistral-7B-Instruct"  # Fixed for stability
             st.info(f"""Using {model_name}
             Memory Usage: {MODEL_CONFIGS[model_name]['memory_required']}
             Description: {MODEL_CONFIGS[model_name]['description']}""")
-            # VC Profile
-            vc_name = st.text_input("Your Name")
-            note_style = st.selectbox(
-                "Note Style",
-                ["Bullet Points", "Paragraphs", "Q&A"]
-            )
-            interests = st.multiselect(
-                "Focus Areas",
-                ["Product", "Market", "Team", "Financials", "Technology"],
-                default=["Product", "Market"]
-            )
-        # Main content
-        st.title("🎙️ VC Call Assistant")
-        if not vc_name:
-            st.warning("Please enter your name in the sidebar.")
-            return
-        # Initialize processors
-        with st.spinner("Loading models..."):
-            whisper_model = ModelManager.load_whisper()
-            llm = ModelManager.load_llm(model_name)
-            if not whisper_model or not llm:
-                st.error("Failed to initialize models. Please refresh the page.")
-                return
-            audio_processor = AudioProcessor(whisper_model)
-            analyzer = ContentAnalyzer(llm)
-        # File upload
-        audio_file = UIManager.show_file_uploader()
-        if audio_file:
-            # Process audio
-            with st.spinner("Processing audio..."):
-                transcription = audio_processor.process_audio_chunk(audio_file)
-                if transcription:
-                    # Display results
-                    col1, col2 = st.columns(2)
-                    with col1:
-                        st.subheader("📝 Transcript")
-                        st.write(transcription)
-                    with col2:
-                        st.subheader("🔍 Analysis")
-                        vc_style = VCStyle(
-                            name=vc_name,
-                            note_format={"style": note_style},
-                            key_interests=interests,
-                            custom_sections=[],
-                            insight_preferences={}
-                        )
-                        analysis = analyzer.analyze_text(transcription, vc_style)
-                        if analysis:
-                            st.write(analysis)
-                            # Export option
-                            st.download_button(
-                                "📥 Export Analysis",
-                                data=json.dumps({
-                                    "timestamp": datetime.now().isoformat(),
-                                    "transcription": transcription,
-                                    "analysis": analysis
-                                }, indent=2),
-                                file_name=f"vc_analysis_{datetime.now():%Y%m%d_%H%M%S}.json",
-                                mime="application/json"
-                            )
-    except Exception as e:
-        logger.error(f"Application error: {e}")
-        st.error("An unexpected error occurred. Please refresh the page.")
-    finally:
-        # Cleanup
-        gc.collect()
-        if torch.cuda.is_available():
-            torch.cuda.empty_cache()
-if __name__ == "__main__":
-    main()

+# Only showing the modified sections for brevity
+# Update MODEL_CONFIGS to use open models
 MODEL_CONFIGS = {
+    "FLAN-T5-Large": {
+        "path": "google/flan-t5-large",
+        "description": "Efficient open-source model for analysis",
+        "memory_required": "8GB"
+    },
+    "OpenAssistant": {
+        "path": "OpenAssistant/oasst-sft-4-pythia-12b-epoch-3.5",
+        "description": "Powerful open-source assistant model",
+        "memory_required": "12GB"
     }
 }
 class ModelManager:
     """Handles model loading and resource management"""
             tokenizer = AutoTokenizer.from_pretrained(
                 config["path"],
                 trust_remote_code=True
             )
             model = AutoModelForCausalLM.from_pretrained(
                 config["path"],
                 quantization_config=bnb_config,
                 device_map="auto",
                 torch_dtype=torch.float16,
                 "text-generation",
                 model=model,
                 tokenizer=tokenizer,
+                max_new_tokens=512,
                 temperature=0.7,
                 top_p=0.95,
                 repetition_penalty=1.15,
             st.error("Failed to load language model. Please try again.")
             return None
 def main():
     try:
         # Initialize UI
         # Sidebar
         with st.sidebar:
             st.title("VC Assistant Settings")
+            model_name = st.selectbox(
+                "Select Model",
+                list(MODEL_CONFIGS.keys()),
+                index=0,
+                help="Choose the AI model for analysis"
+            )
             st.info(f"""Using {model_name}
             Memory Usage: {MODEL_CONFIGS[model_name]['memory_required']}
             Description: {MODEL_CONFIGS[model_name]['description']}""")
+            # Rest of the sidebar code remains the same