Spaces:

Ab-Romia
/

Context-Aware-AI

Running

App Files Community

Ab-Romia committed on Aug 4, 2025

Commit

47dc68d

verified ·

1 Parent(s): c2cb0c4

Update app/services.py

Browse files

Files changed (1) hide show

app/services.py +35 -8

app/services.py CHANGED Viewed

@@ -402,7 +402,7 @@ async def get_rag_response(request_data: ChatRequest, api_key: Optional[str] = N
         if doc_count == 0:
             logger.warning("⚠️  Vector DB is empty. Cannot answer query.")
-            return "The knowledge base is empty. Please provide some context in the left panel and click 'Index Context' before asking questions."
         # Step 3: Retrieve relevant chunks from ChromaDB
         logger.info("🔎 Retrieving relevant chunks from vector DB...")
@@ -413,7 +413,7 @@ async def get_rag_response(request_data: ChatRequest, api_key: Optional[str] = N
         if not retrieved_chunks or not retrieved_chunks.get('documents') or not retrieved_chunks['documents'][0]:
             logger.warning("❌ No relevant chunks found in the vector DB for this query.")
-            return "I could not find any relevant information in the provided context to answer your question."
         # Log retrieved chunks
         chunks = retrieved_chunks['documents'][0]
@@ -427,14 +427,26 @@ async def get_rag_response(request_data: ChatRequest, api_key: Optional[str] = N
             logger.warning(f"⚠️  Context too long, truncating to {max_context_length}")
             context_for_prompt = context_for_prompt[:max_context_length] + "\n\n[... content truncated ...]"
-        # Step 4: Construct prompt for the LLM
         full_prompt = (
-            "Based on the context below, answer the user's question concisely and accurately. "
-            "If the answer isn't in the context, say so clearly and answer the question yourself based on your knowledge.\n\n"
-            "Context:\n"
             f"{context_for_prompt}\n\n"
-            f"Question: {request_data.prompt}\n\n"
-            "Answer:"
         )
         # Step 5: Generate the response using the LLM
@@ -459,6 +471,21 @@ async def get_rag_response(request_data: ChatRequest, api_key: Optional[str] = N
         logger.error(f"❌ An unexpected error occurred: {e}", exc_info=True)
         return f"An unexpected error occurred: {e}"
 async def execute_task(request_data: TaskRequest, api_key: Optional[str] = None) -> str:
     """
     Executes a specific task on the given context.

         if doc_count == 0:
             logger.warning("⚠️  Vector DB is empty. Cannot answer query.")
+            return "I don't have any specific context loaded right now. Please provide some context in the Knowledge Base and click 'Index Context' before asking questions. However, I'd be happy to help with general questions using my built-in knowledge!"
         # Step 3: Retrieve relevant chunks from ChromaDB
         logger.info("🔎 Retrieving relevant chunks from vector DB...")
         if not retrieved_chunks or not retrieved_chunks.get('documents') or not retrieved_chunks['documents'][0]:
             logger.warning("❌ No relevant chunks found in the vector DB for this query.")
+            return "I couldn't find specific information about that in the provided context. Let me help you with what I know from my general knowledge:\n\n" + await _generate_fallback_response(request_data.prompt, api_key)
         # Log retrieved chunks
         chunks = retrieved_chunks['documents'][0]
             logger.warning(f"⚠️  Context too long, truncating to {max_context_length}")
             context_for_prompt = context_for_prompt[:max_context_length] + "\n\n[... content truncated ...]"
+        # Step 4: Construct improved prompt for the LLM
         full_prompt = (
+            "You are an intelligent assistant with access to specific context information. "
+            "Your goal is to provide comprehensive, helpful answers that combine the provided context with your expertise.\n\n"
+            "INSTRUCTIONS:\n"
+            "• Use the provided context as your PRIMARY source when it's relevant\n"
+            "• If the context fully answers the question, focus on that information and enhance it with practical insights\n"
+            "• If the context only partially addresses the question, build upon it with your knowledge\n"
+            "• If the context isn't relevant to the question, briefly mention this and provide a helpful answer based on your expertise\n"
+            "• Be natural and conversational - avoid robotic phrases like 'based solely on the context'\n"
+            "• Provide actionable, practical advice when appropriate\n"
+            "• Structure your response clearly with headings or bullet points when helpful\n\n"
+            "CONTEXT INFORMATION:\n"
             f"{context_for_prompt}\n\n"
+            f"USER QUESTION: {request_data.prompt}\n\n"
+            "Please provide a comprehensive, helpful response:"
         )
         # Step 5: Generate the response using the LLM
         logger.error(f"❌ An unexpected error occurred: {e}", exc_info=True)
         return f"An unexpected error occurred: {e}"
+async def _generate_fallback_response(prompt: str, api_key: Optional[str] = None) -> str:
+    """Answer a question from the model's own knowledge, without retrieved context.
+
+    Wraps ``prompt`` in a short question/answer template and passes the result
+    to ``_generate_response_async``.
+
+    Args:
+        prompt: The user's question, inserted verbatim into the template.
+        api_key: Optional key forwarded unchanged to ``_generate_response_async``.
+
+    Returns:
+        Whatever ``_generate_response_async`` returns, or a fixed apology
+        message if that call raises.
+    """
+    fallback_prompt = (
+        "Please provide a helpful, comprehensive answer to this question using your knowledge:\n\n"
+        f"Question: {prompt}\n\n"
+        "Answer:"
+    )
+    try:
+        return await _generate_response_async(fallback_prompt, api_key)
+    except Exception as e:
+        # Best-effort path: never propagate to the caller, but keep the
+        # traceback in the log so the failure can be diagnosed.
+        logger.error(f"❌ Fallback response generation failed: {e}", exc_info=True)
+        return "I'm having trouble generating a response right now. Please try again or rephrase your question."
 async def execute_task(request_data: TaskRequest, api_key: Optional[str] = None) -> str:
     """
     Executes a specific task on the given context.