Spaces:

OrganizedProgrammers
/

kig_test

Sleeping

App Files Files Community

adrienbrdne commited on Apr 14

Commit

f8ac349

verified ·

1 Parent(s): fa98115

Upload 3 files

Browse files

Files changed (3) hide show

app.py +212 -0
config.json +19 -0
requirements.txt +16 -0

app.py ADDED Viewed

	@@ -0,0 +1,212 @@

+import os
+import streamlit as st
+from langchain_community.graphs import Neo4jGraph
+import pandas as pd
+import json
+import time
+from ki_gen.planner import build_planner_graph
+from ki_gen.utils import init_app, memory
+from ki_gen.prompts import get_initial_prompt
+from neo4j import GraphDatabase
+# Set page config
+st.set_page_config(page_title="Key Issue Generator", layout="wide")
+# Neo4j Database Configuration
+NEO4J_URI = "neo4j+s://4985272f.databases.neo4j.io"
+NEO4J_USERNAME = "neo4j"
+NEO4J_PASSWORD = os.getenv("neo4j_password")
+# API Keys for LLM services
+OPENAI_API_KEY = os.getenv("openai_api_key")
+GROQ_API_KEY = os.getenv("groq_api_key")
+LANGSMITH_API_KEY = os.getenv("langsmith_api_key")
+def verify_neo4j_connectivity():
+    """Verify connection to Neo4j database"""
+    try:
+        with GraphDatabase.driver(NEO4J_URI, auth=(NEO4J_USERNAME, NEO4J_PASSWORD)) as driver:
+            return driver.verify_connectivity()
+    except Exception as e:
+        return f"Error: {str(e)}"
+def load_config():
+    """Load configuration with custom parameters"""
+    # Custom configuration based on provided parameters
+    custom_config = {
+        "main_llm": "deepseek-r1-distill-llama-70b",
+        "plan_method": "generation",
+        "use_detailed_query": False,
+        "cypher_gen_method": "guided",
+        "validate_cypher": False,
+        "summarize_model": "deepseek-r1-distill-llama-70b",
+        "eval_method": "binary",
+        "eval_threshold": 0.7,
+        "max_docs": 15,
+        "compression_method": "llm_lingua",
+        "compress_rate": 0.33,
+        "force_tokens": ["."],  # Converting to list format as expected by the application
+        "eval_model": "deepseek-r1-distill-llama-70b",
+        "thread_id": "3"
+    }
+    # Add Neo4j graph object to config
+    try:
+        neo_graph = Neo4jGraph(
+            url=NEO4J_URI,
+            username=NEO4J_USERNAME,
+            password=NEO4J_PASSWORD
+        )
+        custom_config["graph"] = neo_graph
+    except Exception as e:
+        st.error(f"Error connecting to Neo4j: {e}")
+        return None
+    return {"configurable": custom_config}
+def generate_key_issues(user_query):
+    """Main function to generate key issues from Neo4j data"""
+    # Initialize application with API keys
+    init_app(
+        openai_key=OPENAI_API_KEY,
+        groq_key=GROQ_API_KEY,
+        langsmith_key=LANGSMITH_API_KEY
+    )
+    # Load configuration with custom parameters
+    config = load_config()
+    if not config:
+        return None
+    # Create status containers
+    plan_status = st.empty()
+    plan_display = st.empty()
+    retrieval_status = st.empty()
+    processing_status = st.empty()
+    # Build planner graph
+    plan_status.info("Building planner graph...")
+    graph = build_planner_graph(memory, config["configurable"])
+    # Execute initial prompt generation
+    plan_status.info(f"Generating plan for query: {user_query}")
+    messages_content = []
+    for event in graph.stream(get_initial_prompt(config, user_query), config, stream_mode="values"):
+        if "messages" in event:
+            event["messages"][-1].pretty_print()
+            messages_content.append(event["messages"][-1].content)
+    # Get the state with the generated plan
+    state = graph.get_state(config)
+    steps = [i for i in range(1, len(state.values['store_plan'])+1)]
+    plan_df = pd.DataFrame({'Plan steps': steps, 'Description': state.values['store_plan']})
+    # Display the plan
+    plan_status.success("Plan generation complete!")
+    plan_display.dataframe(plan_df, use_container_width=True)
+    # Continue with plan execution for document retrieval
+    retrieval_status.info("Retrieving documents...")
+    for event in graph.stream(None, config, stream_mode="values"):
+        if "messages" in event:
+            event["messages"][-1].pretty_print()
+            messages_content.append(event["messages"][-1].content)
+    # Get updated state after document retrieval
+    snapshot = graph.get_state(config)
+    doc_count = len(snapshot.values.get('valid_docs', []))
+    retrieval_status.success(f"Retrieved {doc_count} documents")
+    # Proceed to document processing
+    processing_status.info("Processing documents...")
+    process_steps = ["summarize"]  # Using summarize as default processing step
+    # Update state to indicate human validation is complete and specify processing steps
+    graph.update_state(config, {'human_validated': True, 'process_steps': process_steps}, as_node="human_validation")
+    # Continue execution with document processing
+    for event in graph.stream(None, config, stream_mode="values"):
+        if "messages" in event:
+            event["messages"][-1].pretty_print()
+            messages_content.append(event["messages"][-1].content)
+    # Get final state after processing
+    final_snapshot = graph.get_state(config)
+    processing_status.success("Document processing complete!")
+    if "messages" in final_snapshot.values:
+        final_result = final_snapshot.values["messages"][-1].content
+        return final_result, final_snapshot.values.get('valid_docs', [])
+    return None, []
+# App header
+st.title("Key Issue Generator")
+st.write("Generate key issues from a Neo4j knowledge graph using advanced language models.")
+# Check database connectivity
+connectivity_status = verify_neo4j_connectivity()
+st.sidebar.header("Database Status")
+if "Error" not in str(connectivity_status):
+    st.sidebar.success("Connected to Neo4j database")
+else:
+    st.sidebar.error(f"Database connection issue: {connectivity_status}")
+# User input section
+st.header("Enter Your Query")
+user_query = st.text_area("What would you like to explore?",
+                         "What are the main challenges in AI adoption for healthcare systems?",
+                         height=100)
+# Process button
+if st.button("Generate Key Issues", type="primary"):
+    if not OPENAI_API_KEY or not GROQ_API_KEY or not LANGSMITH_API_KEY or not NEO4J_PASSWORD:
+        st.error("Required API keys or database credentials are missing. Please check your environment variables.")
+    else:
+        with st.spinner("Processing your query..."):
+            start_time = time.time()
+            final_result, valid_docs = generate_key_issues(user_query)
+            end_time = time.time()
+            if final_result:
+                # Display execution time
+                st.sidebar.info(f"Total execution time: {round(end_time - start_time, 2)} seconds")
+                # Display final result
+                st.header("Generated Key Issues")
+                st.markdown(final_result)
+                # Option to download results
+                st.download_button(
+                    label="Download Results",
+                    data=final_result,
+                    file_name="key_issues_results.txt",
+                    mime="text/plain"
+                )
+                # Display retrieved documents in expandable section
+                if valid_docs:
+                    with st.expander("View Retrieved Documents"):
+                        for i, doc in enumerate(valid_docs):
+                            st.markdown(f"### Document {i+1}")
+                            for key in doc:
+                                st.markdown(f"**{key}**: {doc[key]}")
+                            st.divider()
+            else:
+                st.error("An error occurred during processing. Please check the logs for details.")
+# Help information in sidebar
+with st.sidebar:
+    st.header("About")
+    st.info("""
+    This application uses advanced language models to analyze a Neo4j knowledge graph and generate key issues
+    based on your query. The process involves:
+    1. Creating a plan based on your query
+    2. Retrieving relevant documents from the database
+    3. Processing and summarizing the information
+    4. Generating a comprehensive response
+    """)

config.json ADDED Viewed

	@@ -0,0 +1,19 @@

+{
+"main_llm": "deepseek-r1-distill-llama-70b",
+"plan_method": "generation",
+"use_detailed_query": false,
+"cypher_gen_method": "guided",
+"validate_cypher": false,
+"summarize_model": "deepseek-r1-distill-llama-70b",
+"eval_method": "binary",
+"eval_threshold":0.7,
+"max_docs":15,
+"compression_method":"llm_lingua",
+"compress_rate":0.33,
+"force_tokens":".",
+"eval_model":"deepseek-r1-distill-llama-70b",
+"graph": {"address": "neo4j+s://4985272f.databases.neo4j.io", "username":"neo4j", "password":"***"},
+"openai_api_key": "***",
+"groq_api_key":"***",
+"langsmith_api_key":"***"
+}

requirements.txt ADDED Viewed

	@@ -0,0 +1,16 @@

+langchain-community==0.3.0
+sentence-transformers==3.1.0
+openpyxl==3.1.5
+langchain-groq==0.2.0
+langchain-openai==0.2.0
+langchain-core==0.3.1
+llmlingua==0.2.2
+langgraph>=0.2.4
+langgraph-checkpoint-sqlite==1.0.3
+langsmith==0.1.123
+faiss-cpu==1.8.0.post1
+neo4j==5.24.0
+gradio==4.44.0
+streamlit==1.31.0
+pandas==2.1.3
+pydantic==2.9.2