DeathBlade020 committed on
Commit
d8140c0
·
verified ·
1 Parent(s): 6b2f56f

Upload 4 files

Files changed (4)
  1. src/__init__.py +0 -0
  2. src/constants.py +45 -0
  3. src/get_graph.py +368 -0
  4. src/get_medical_system.py +133 -0
src/__init__.py ADDED
File without changes
src/constants.py ADDED
@@ -0,0 +1,45 @@
+ spinner_messages = [
+     "Searching the universe...",
+     "Consulting the medical oracles...",
+     "Paging Dr. AI...",
+     "Googling responsibly...",
+     "Checking the medical textbooks...",
+     "Assembling a team of virtual doctors...",
+     "Running with scissors (just kidding)...",
+     "Putting on my lab coat...",
+     "Sterilizing the stethoscope...",
+     "Counting imaginary pills...",
+     "Reading the fine print on the prescription...",
+     "Asking the mitochondria (it's the powerhouse)...",
+     "Checking WebMD (not really)...",
+     "Looking for my AI degree...",
+     "Washing my hands for 20 seconds...",
+     "Trying not to diagnose you with everything...",
+ ]
+
+ sidebar_messages = """
+ **Medical Assistant Features:**
+ - 🏥 Medical Q&A database
+ - 🚨 Emergency detection
+ - 🔍 Smart document retrieval
+ - 🧠 Conversation memory
+ - ⚖️ Safety disclaimers
+
+ **💬 Memory Commands:**
+ - "Summarize my previous questions"
+ - "What did we discuss earlier?"
+ - "Can you review our conversation?"
+
+ **⚠️ Important:**
+ - This is for educational purposes only
+ - Always consult healthcare professionals
+ - Call 100 for emergencies
+ """
+
+ st_error_message = "I'm sorry, I'm having technical difficulties. Please try again or consult a healthcare professional."
+ st_title = "🏥 Medical Assistant Chatbot"
+ st_markdown = "Ask me medical questions! **For emergencies, call 100 immediately.**"
+ st_welcome_message = "Namaste! I'm your medical assistant. I can help answer medical questions, but for emergencies, please call 100 immediately. How can I help you today?"
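For context, a short sketch of how these constants are presumably consumed by the Streamlit front end; the app entry point is not included in this commit, so the wiring below is an assumption:

    # hypothetical app wiring -- the entry point is not part of this commit
    import random
    import streamlit as st
    from constants import spinner_messages, st_title, st_markdown, sidebar_messages

    st.title(st_title)
    st.markdown(st_markdown)
    st.sidebar.markdown(sidebar_messages)
    with st.spinner(random.choice(spinner_messages)):
        ...  # run the medical workflow here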
src/get_graph.py ADDED
@@ -0,0 +1,368 @@
+ import random
+ from typing import Literal, TypedDict
+
+ import streamlit as st
+ from pydantic import BaseModel, Field
+ from langchain.chains import ConversationalRetrievalChain
+ from langchain.prompts import PromptTemplate
+ from langchain_community.document_loaders import UnstructuredPDFLoader
+ # from langchain_community.document_loaders import AmazonTextractPDFLoader  # optional Textract-based loader
+ from langchain_core.messages import HumanMessage, SystemMessage
+ from langgraph.graph import StateGraph, END, START
+
+ from get_medical_system import load_medical_system
+
+
+ class Route(BaseModel):
+     step: Literal["RAG", "GENERAL", "EMERGENCY", "MEMORY"] = Field(
+         ..., description="The next step in the routing process"
+     )
+
+
+ class State(TypedDict):
+     question: str
+     answer: str
+     decision: str
+
+
+ def init_document_memory():
+     """Initialize document memory in session state"""
+     if "uploaded_documents" not in st.session_state:
+         st.session_state.uploaded_documents = {}
+
+
+ documents, ensemble_retriever, llm, reranker = load_medical_system()
+ router = llm.with_structured_output(Route, method="function_calling")
+
+
+ def extract_conversation_history():
+     """Extract conversation from session state"""
+     if "messages" not in st.session_state:
+         return []
+
+     conversation = []
+     for msg in st.session_state.messages:
+         if msg["role"] == "user":
+             conversation.append(f"User: {msg['content']}")
+         elif msg["role"] == "assistant" and not msg["content"].startswith("Namaste!"):
+             # Skip the canned welcome message (st_welcome_message in constants.py)
+             conversation.append(f"Assistant: {msg['content']}")
+
+     return conversation
+
+
+ def handle_conversation_query(state: State):
+     """Handle questions about conversation history"""
+     conversation = extract_conversation_history()
+
+     if not conversation:
+         return {"answer": "We haven't had any conversation yet. Feel free to ask me a medical question though!"}
+
+     # Create conversation context from the last 10 exchanges
+     conversation_text = "\n".join(conversation[-10:])
+
+     result = llm.invoke([
+         SystemMessage(content=f"""
+ Based on this conversation history, answer the user's question about our previous discussion:
+
+ Conversation History:
+ {conversation_text}
+
+ Rules:
+ - If they ask for a summary, provide a brief overview
+ - If they ask about specific questions, reference them
+ - If they ask about previous answers, summarize the key points
+ - Always maintain medical disclaimers in your response
+ """),
+         HumanMessage(content=state['question'])
+     ])
+
+     return {"answer": result.content}
+
+
+ def is_conversation_query(question: str) -> bool:
+     """Check if the question is about conversation history"""
+     memory_keywords = [
+         "previous", "last", "earlier", "before", "summarize", "summarise",
+         "what did i ask", "my questions", "conversation", "history",
+         "we talked", "discussed", "mentioned"
+     ]
+
+     question_lower = question.lower()
+     return any(keyword in question_lower for keyword in memory_keywords)
+
+
+ def llm_call_router(state: State):
+     """Router that detects memory and emergency queries before falling back to the LLM"""
+     # Check for conversation/memory queries first
+     if is_conversation_query(state['question']):
+         return {'decision': "MEMORY"}
+
+     # Document routing (currently disabled)
+     # document_keywords = ["document", "report", "lab results", "test results", "my results", "uploaded", "file"]
+     # if any(keyword in state['question'].lower() for keyword in document_keywords):
+     #     if "current_document" in st.session_state and st.session_state.current_document:
+     #         return {'decision': "DOCUMENT"}
+
+     # Emergency check
+     emergency_keywords = ["severe", "chest pain", "can't breathe", "emergency", "urgent",
+                           "heart attack", "stroke", "bleeding", "unconscious"]
+     question_lower = state['question'].lower()
+     if any(keyword in question_lower for keyword in emergency_keywords):
+         return {'decision': "EMERGENCY"}
+
+     # Regular routing
+     decision = router.invoke([
+         SystemMessage(content="Route the input to RAG (medical questions) or GENERAL based on the user's request"),
+         HumanMessage(content=state['question'])
+     ])
+     return {"decision": decision.step}  # type: ignore
+
+
+ def emergency_node(state: State):
+     """Handle emergency queries safely"""
+     return {"answer": "🚨 EMERGENCY: Please seek immediate medical attention or call emergency services (100). This system cannot provide emergency medical care."}
+
+
+ def rag_node(state: State):
+     """Uses RAG to answer the question, with cross-encoder reranking"""
+     custom_prompt = PromptTemplate(
+         input_variables=["context", "question"],
+         template="""You are a medical information assistant. Use the following medical Q&A context to answer questions accurately and safely.
+
+ Context: {context}
+
+ Question: {question}
+
+ Guidelines:
+ - Provide accurate medical information based on the context above
+ - Always recommend consulting healthcare professionals for medical decisions
+ - If uncertain, clearly state limitations
+ - If the question is not suitable for this bot, respond with: "I'm not able to provide medical advice. Please consult a medical professional."
+
+ Answer:"""
+     )
+
+     qa_chain = ConversationalRetrievalChain.from_llm(
+         llm=llm,
+         retriever=ensemble_retriever,
+         return_source_documents=True,
+         combine_docs_chain_kwargs={"prompt": custom_prompt}
+     )
+
+     result = qa_chain.invoke({
+         "question": state['question'],
+         "chat_history": []
+     })
+
+     # Rerank the retrieved documents with the cross-encoder, then answer again from the top 3
+     docs = result.get('source_documents', [])
+     if docs and len(docs) > 1:
+         pairs = [(state['question'], doc.page_content) for doc in docs]
+         scores = reranker.predict(pairs)
+
+         doc_scores = list(zip(docs, scores))
+         doc_scores.sort(key=lambda x: x[1], reverse=True)
+         top_docs = [doc for doc, score in doc_scores[:3]]
+
+         better_context = "\n\n".join([doc.page_content for doc in top_docs])
+         improved_answer = llm.invoke([
+             SystemMessage(content=f"""Use this medical context to answer the question safely:
+
+ Context: {better_context}
+
+ Always recommend consulting healthcare professionals."""),
+             HumanMessage(content=state['question'])
+         ])
+         return {"answer": improved_answer.content}
+
+     return {"answer": result['answer']}
+
+
+ def general_node(state: State):
+     """General node with sarcastic responses for identity questions and greetings"""
+     question_lower = state['question'].lower().strip()
+
+     # Identity/philosophical questions get sarcastic responses
+     identity_keywords = [
+         "what are you", "who are you", "what is your name", "are you human",
+         "are you real", "are you ai", "are you robot", "are you chatbot",
+         "what's your name", "who made you", "are you alive", "do you think",
+         "are you conscious", "do you feel", "what do you do", "your purpose"
+     ]
+
+     if any(keyword in question_lower for keyword in identity_keywords):
+         sarcastic_responses = [
+             "🤖 Oh, just your friendly neighborhood medical AI trying to keep people from WebMD-ing themselves into thinking they have every disease known to humanity. You know, the usual.",
+             "🩺 I'm a sophisticated medical assistant, which is a fancy way of saying I'm here to tell you to 'consult a healthcare professional' in 47 different ways.",
+             "🏥 I'm an AI that reads medical textbooks faster than you can say 'Google symptoms at 3 AM.' My purpose? Giving you actual medical info instead of letting you convince yourself that headache is definitely a brain tumor.",
+             "💊 I'm basically a walking medical disclaimer with a personality. Think of me as that friend who went to med school but actually remembers what they learned.",
+             "🔬 I'm an artificial intelligence trained on medical knowledge, which means I can tell you about symptoms but I still can't fix your tendency to ignore doctor's appointments.",
+             "🧠 I'm a medical AI assistant. I exist to answer your health questions and remind you that, no, that WebMD article probably doesn't apply to you."
+         ]
+         return {"answer": random.choice(sarcastic_responses)}
+
+     # Greetings also get some personality
+     greeting_keywords = ["hello", "hi", "hey", "good morning", "good evening", "greetings"]
+     if any(keyword in question_lower for keyword in greeting_keywords):
+         friendly_responses = [
+             "Hello! 👋 Ready to get some actual medical information instead of falling down a WebMD rabbit hole?",
+             "Hi there! 🏥 I'm here to answer your medical questions. Fair warning: I'll probably tell you to see a real doctor.",
+             "Hey! 👨‍⚕️ What medical mystery can I help solve today? (Spoiler: the answer might be 'drink more water')",
+             "Greetings! 🩺 Ask me anything medical-related. I promise to give you better advice than your cousin's Facebook post."
+         ]
+         return {"answer": random.choice(friendly_responses)}
+
+     # Regular medical or general questions
+     result = llm.invoke([
+         SystemMessage(content="""
+ Answer the user's question helpfully and accurately.
+
+ IMPORTANT SAFETY RULES:
+ - For medical questions: Always end with "Please consult a healthcare professional"
+ - For emergencies: Direct to call emergency services immediately
+ - If unsure: Say "I don't know" rather than guess
+
+ Be helpful but prioritize user safety. You can be slightly witty or conversational, but always maintain professionalism for serious medical topics.
+ """),
+         HumanMessage(content=state['question'])
+     ])
+
+     return {"answer": result.content}
+
+
+ def document_node(state: State):
+     """Answer questions about an uploaded medical document"""
+     # Check if there's an uploaded document in session state
+     if "current_document" not in st.session_state or not st.session_state.current_document:
+         return {"answer": "Please upload a medical document first using the file uploader in the sidebar."}
+
+     file_path = st.session_state.current_document
+     question = state['question']
+
+     try:
+         # Extract and cache document content on first use
+         if file_path not in st.session_state.uploaded_documents:
+             # loader = AmazonTextractPDFLoader(file_path, region_name="us-east-1")
+             loader = UnstructuredPDFLoader(file_path)
+             documents = loader.load()
+
+             content = "\n".join([doc.page_content for doc in documents])
+             st.session_state.uploaded_documents[file_path] = {
+                 "content": content,
+                 "conversation": []
+             }
+
+         # Get stored document
+         doc_data = st.session_state.uploaded_documents[file_path]
+
+         # Build context with previous questions about this document
+         context_parts = [f"Document Content:\n{doc_data['content']}"]
+
+         if doc_data['conversation']:
+             context_parts.append("\nPrevious questions about this document:")
+             for qa in doc_data['conversation'][-3:]:  # Last 3 Q&As
+                 context_parts.append(f"Q: {qa['question']}\nA: {qa['answer'][:200]}...")
+
+         full_context = "\n".join(context_parts)
+
+         result = llm.invoke([
+             SystemMessage(content=f"""
+ You are analyzing a medical document. Use the document content and any previous conversation to answer the user's question.
+
+ Guidelines:
+ - Base your answer on the document content provided
+ - Reference specific values or sections when possible
+ - If information isn't in the document, clearly state this
+ - Always include medical disclaimers
+ - Maintain conversation continuity with previous questions
+
+ {full_context}
+ """),
+             HumanMessage(content=f"Question about the document: {question}")
+         ])
+
+         # Store this Q&A in the document's conversation history
+         doc_data['conversation'].append({
+             "question": question,
+             "answer": result.content
+         })
+
+         return {"answer": f"📄 **Document Analysis:**\n\n{result.content}"}
+
+     except Exception as e:
+         return {"answer": f"Error processing document: {str(e)}. Please ensure the file is accessible and try again."}
+
+
+ def route_decision(state: State):
+     """Map the router's decision to the node to run next"""
+     if state["decision"] == "MEMORY":
+         return "memory_node"
+     elif state["decision"] == "DOCUMENT":
+         return "document_node"
+     elif state["decision"] == "RAG":
+         return "rag_node"
+     elif state["decision"] == "EMERGENCY":
+         return "emergency_node"
+     else:
+         return "general_node"
+
+
+ # ==================== CREATE WORKFLOW ====================
+
+ @st.cache_resource
+ def create_workflow():
+     """Create the workflow graph with conversation memory"""
+     init_document_memory()
+
+     router_builder = StateGraph(State)
+
+     # Add all nodes (including the memory node)
+     router_builder.add_node("rag_node", rag_node)
+     router_builder.add_node("general_node", general_node)
+     router_builder.add_node("llm_call_router", llm_call_router)
+     router_builder.add_node("emergency_node", emergency_node)
+     router_builder.add_node("memory_node", handle_conversation_query)
+     # router_builder.add_node("document_node", document_node)
+
+     router_builder.add_edge(START, "llm_call_router")
+     router_builder.add_conditional_edges(
+         "llm_call_router",
+         route_decision,
+         {
+             "rag_node": "rag_node",
+             "general_node": "general_node",
+             "emergency_node": "emergency_node",
+             "memory_node": "memory_node",
+             # "document_node": "document_node",
+         },
+     )
+
+     # Add edges to END
+     router_builder.add_edge("rag_node", END)
+     router_builder.add_edge("general_node", END)
+     router_builder.add_edge("emergency_node", END)
+     router_builder.add_edge("memory_node", END)
+     # router_builder.add_edge("document_node", END)
+
+     return router_builder.compile()
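For reference, a minimal sketch of how the compiled graph might be driven from the Streamlit app; the entry point is not part of this commit, so the invocation below is an assumption based on the State schema (only "question" needs to be supplied, the nodes fill in "answer" and "decision"):

    # hypothetical caller -- not part of this commit
    import streamlit as st
    from get_graph import create_workflow

    workflow = create_workflow()
    result = workflow.invoke({"question": "What are the early symptoms of diabetes?"})
    st.write(result["answer"])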
src/get_medical_system.py ADDED
@@ -0,0 +1,133 @@
+ import os
+ import pickle
+ import time
+
+ import faiss
+ import numpy as np
+ import streamlit as st
+ from datasets import load_dataset
+ from dotenv import load_dotenv
+ from langchain.retrievers import EnsembleRetriever
+ from langchain.schema import Document
+ from langchain_community.docstore.in_memory import InMemoryDocstore
+ from langchain_community.retrievers import BM25Retriever
+ from langchain_community.vectorstores import FAISS
+ from langchain_huggingface import HuggingFaceEmbeddings
+ from langchain_openai import ChatOpenAI
+ from sentence_transformers import CrossEncoder
+
+ load_dotenv()
+
+
+ def get_vector_store():
+     """Load a FAISS vectorstore from pre-computed embeddings"""
+     try:
+         # Load pre-computed data
+         print("📥 Loading pre-computed embeddings...")
+         embeddings_array = np.load('medical_embeddings.npy')
+
+         with open('medical_texts.pkl', 'rb') as f:
+             texts = pickle.load(f)
+
+         print(f"✅ Loaded {len(embeddings_array)} pre-computed embeddings")
+
+         # Create a FAISS index from the pre-computed embeddings
+         dimension = embeddings_array.shape[1]
+         index = faiss.IndexFlatL2(dimension)
+         index.add(embeddings_array.astype('float32'))  # type: ignore
+
+         # Embedding function for new queries (must match the model used for pre-computation)
+         embeddings_function = HuggingFaceEmbeddings(
+             model_name="microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract"
+         )
+
+         # Create Document objects and an in-memory docstore
+         documents_dict = {}
+         for i, text in enumerate(texts):
+             doc = Document(
+                 page_content=text,
+                 metadata={"doc_id": i, "type": "medical_qa"}
+             )
+             documents_dict[str(i)] = doc
+
+         docstore = InMemoryDocstore(documents_dict)
+
+         # Map FAISS index positions to docstore ids
+         index_to_docstore_id = {i: str(i) for i in range(len(texts))}
+
+         # Assemble the FAISS vectorstore
+         vectorstore = FAISS(
+             embedding_function=embeddings_function,
+             index=index,
+             docstore=docstore,
+             index_to_docstore_id=index_to_docstore_id
+         )
+
+         return vectorstore
+
+     except FileNotFoundError as e:
+         print(f"❌ Pre-computed files not found: {e}")
+         return None
+
+     except Exception as e:
+         print(f"❌ Error loading pre-computed embeddings: {e}")
+         return None
+
+
+ @st.cache_resource
+ def load_medical_system():
+     """Load the medical RAG system (cached for performance)"""
+     with st.spinner("🔄 Loading medical knowledge base..."):
+         # Load dataset
+         ds = load_dataset("keivalya/MedQuad-MedicalQnADataset")
+
+         # Create documents
+         documents = []
+         for i, item in enumerate(ds['train']):  # type: ignore
+             content = f"Question: {item['Question']}\nAnswer: {item['Answer']}"  # type: ignore
+             metadata = {
+                 "doc_id": i,
+                 "question": item['Question'],  # type: ignore
+                 "answer": item['Answer'],  # type: ignore
+                 "question_type": item['qtype'],  # type: ignore
+                 "type": "qa_pair"
+             }
+             documents.append(Document(page_content=content, metadata=metadata))
+
+         # Load the pre-built vectorstore and time it
+         start = time.time()
+         vectorstore = get_vector_store()
+         end = time.time()
+
+         if vectorstore is None:
+             st.error("❌ Could not load the vectorstore. Please ensure the embeddings and text files exist.")
+             st.stop()
+
+         total_time = end - start
+         st.success(f"✅ Loaded existing vectorstore in {total_time:.2f} seconds")
+
+         # Create retrievers: lexical (BM25) + dense (FAISS), combined in an ensemble
+         bm25_retriever = BM25Retriever.from_documents(documents)
+         vector_retriever = vectorstore.as_retriever(search_kwargs={"k": 2})
+
+         ensemble_retriever = EnsembleRetriever(
+             retrievers=[bm25_retriever, vector_retriever],
+             weights=[0.3, 0.7]
+         )
+
+         # Create the LLM
+         openai_key = os.getenv("OPENAI_API_KEY")
+         if not openai_key:
+             st.error("❌ OpenAI API key not found! Please set it in your environment variables or .streamlit/secrets.toml")
+             st.stop()
+         llm = ChatOpenAI(temperature=0, api_key=openai_key)  # type: ignore
+
+         # Create the cross-encoder reranker
+         reranker = CrossEncoder('cross-encoder/ms-marco-MiniLM-L-6-v2')
+
+         return documents, ensemble_retriever, llm, reranker
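get_vector_store expects medical_embeddings.npy and medical_texts.pkl to already exist, but the script that produces them is not part of this commit. A minimal sketch of what that pre-computation step presumably looks like, using the same dataset and embedding model referenced above (the script name and text format are assumptions):

    # precompute_embeddings.py -- hypothetical one-off script, not in this commit
    import pickle
    import numpy as np
    from datasets import load_dataset
    from langchain_huggingface import HuggingFaceEmbeddings

    ds = load_dataset("keivalya/MedQuad-MedicalQnADataset")
    # Mirror the "Question: ...\nAnswer: ..." format used in load_medical_system
    texts = [f"Question: {row['Question']}\nAnswer: {row['Answer']}" for row in ds["train"]]

    embedder = HuggingFaceEmbeddings(
        model_name="microsoft/BiomedNLP-PubMedBERT-base-uncased-abstract"
    )
    vectors = np.array(embedder.embed_documents(texts), dtype="float32")

    np.save("medical_embeddings.npy", vectors)
    with open("medical_texts.pkl", "wb") as f:
        pickle.dump(texts, f)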