Spaces:

EmTpro01
/

CCET_Chat_Assistance

Running

App Files Community

EmTpro01 committed on Jun 19

Commit

0b80b63

verified ·

1 Parent(s): c5a3183

Update app.py

Browse files

Files changed (1) hide show

app.py +37 -109

app.py CHANGED Viewed

@@ -1,8 +1,9 @@
 import os
 from flask import Flask, request, jsonify, render_template
 import google.generativeai as genai
 from langchain_google_genai import GoogleGenerativeAIEmbeddings, ChatGoogleGenerativeAI
-from langchain.vectorstores import FAISS
 from langchain.chains import ConversationalRetrievalChain
 from langchain.memory import ConversationBufferMemory
 from dotenv import load_dotenv
@@ -75,7 +76,7 @@ def initialize_chatbot():
     # Initialize the language model
     try:
         llm = ChatGoogleGenerativeAI(
-            model="gemini-2.0-flash",
             temperature=0.2,
             top_p=0.85,
             google_api_key=GOOGLE_API_KEY
@@ -94,7 +95,7 @@ def initialize_chatbot():
             retriever=retriever,
             memory=memory,
             verbose=True,
-            return_source_documents=False,  # Set to False to hide source documents
             combine_docs_chain_kwargs={"prompt": get_custom_prompt()},
         )
         logger.info("QA chain created successfully")
@@ -108,67 +109,50 @@ def initialize_chatbot():
 def format_links_as_html(text):
     # Detect markdown style links [text](url)
     markdown_pattern = r'\[(.*?)\]\((https?://[^\s\)]+)\)'
-    if re.search(markdown_pattern, text):
-        text = re.sub(markdown_pattern, r'<a href="\2" target="_blank">\1</a>', text)
-        return text
     # Handle URLs in square brackets [url]
     bracket_pattern = r'\[(https?://[^\s\]]+)\]'
-    if re.search(bracket_pattern, text):
-        text = re.sub(bracket_pattern, r'<a href="\1" target="_blank">\1</a>', text)
-        return text
-    # Regular URL pattern
-    url_pattern = r'(https?://[^\s\])+)'
-    # Find all URLs in the text
-    urls = re.findall(url_pattern, text)
-    # If there are multiple URLs, keep only the first one
-    if len(urls) > 1:
-        for url in urls[1:]:
-            text = text.replace(url, "")
-    # Replace the remaining URL with an HTML anchor tag
-    if urls:
-        text = re.sub(url_pattern, r'<a href="\1" target="_blank">\1</a>', text, count=1)
     return text
 # Function to properly escape asterisks for markdown rendering
 def escape_markdown(text):
-    # Replace single asterisks not intended for markdown with escaped versions
-    # This regex looks for asterisks that aren't part of markdown patterns
-    return re.sub(r'(?<!\*)\*(?!\*)', r'\*', text)
 # Function to format markdown and handle asterisks with proper line breaks
 def format_markdown_with_breaks(text):
-    # First remove escaped asterisks (\*) and replace with just asterisks (*)
     text = text.replace('\\*', '*')
-    # Handle bold text (convert **text** to <strong>text</strong>)
     text = re.sub(r'\*\*(.*?)\*\*', r'<strong>\1</strong>', text)
-    # Now split text by lines for processing asterisk line breaks
     lines = text.split('\n')
     formatted_lines = []
     for i, line in enumerate(lines):
-        # If line starts with asterisk (possibly after whitespace), add a line break before it
-        # except for the first line
-        if line.strip().startswith('*'):
-            # Extract content after the asterisk
-            content = line.strip()[1:].strip()
-            # Add line break (except for the first line)
-            if i == 0 or len(formatted_lines) == 0:
-                formatted_lines.append(f"• {content}")
-            else:
-                formatted_lines.append(f"<br>• {content}")
         else:
             formatted_lines.append(line)
-    return '\n'.join(formatted_lines)
 @app.route('/')
 def home():
@@ -180,86 +164,34 @@ def health():
     try:
         current_time = time.time()
         uptime_seconds = current_time - app_start_time
-        uptime_hours = uptime_seconds / 3600
-        # Check if critical components are available
         health_status = {
             "status": "healthy",
             "timestamp": time.strftime("%Y-%m-%d %H:%M:%S UTC", time.gmtime()),
             "uptime_seconds": round(uptime_seconds, 2),
-            "uptime_hours": round(uptime_hours, 2),
-            "api_key_configured": bool(GOOGLE_API_KEY and GOOGLE_API_KEY != "your_api_key_here"),
             "chatbot_initialized": qa_chain is not None
         }
-        # Return 200 status for healthy
         return jsonify(health_status), 200
     except Exception as e:
         logger.error(f"Health check failed: {str(e)}")
         return jsonify({
-            "status": "unhealthy",
-            "error": str(e),
             "timestamp": time.strftime("%Y-%m-%d %H:%M:%S UTC", time.gmtime())
         }), 500
-@app.route('/_health')
-def health_check():
-    """Legacy health check endpoint for Docker (keeping for compatibility)"""
-    return jsonify({"status": "healthy"}), 200
 @app.route('/ping')
 def ping():
     """Simple ping endpoint for basic uptime checks"""
     return "pong", 200
-@app.route('/status')
-def status():
-    """Detailed status endpoint"""
-    try:
-        current_time = time.time()
-        uptime_seconds = current_time - app_start_time
-        status_info = {
-            "application": "Flask Chatbot",
-            "status": "running",
-            "timestamp": time.strftime("%Y-%m-%d %H:%M:%S UTC", time.gmtime()),
-            "uptime": {
-                "seconds": round(uptime_seconds, 2),
-                "minutes": round(uptime_seconds / 60, 2),
-                "hours": round(uptime_seconds / 3600, 2),
-                "days": round(uptime_seconds / 86400, 2)
-            },
-            "environment": {
-                "python_version": os.sys.version,
-                "port": os.environ.get('PORT', 7860)
-            },
-            "services": {
-                "api_key_configured": bool(GOOGLE_API_KEY and GOOGLE_API_KEY != "your_api_key_here"),
-                "chatbot_initialized": qa_chain is not None,
-                "memory_initialized": memory is not None
-            }
-        }
-        return jsonify(status_info), 200
-    except Exception as e:
-        logger.error(f"Status check failed: {str(e)}")
-        return jsonify({
-            "status": "error",
-            "error": str(e),
-            "timestamp": time.strftime("%Y-%m-%d %H:%M:%S UTC", time.gmtime())
-        }), 500
 @app.route('/api/chat', methods=['POST'])
 def chat():
     global qa_chain
-    # Initialize on first request if not already done
     if qa_chain is None:
-        success = initialize_chatbot()
-        if not success:
-            return jsonify({"error": "Failed to initialize chatbot. Check server logs for details."}), 500
     data = request.json
     user_message = data.get('message', '')
@@ -270,29 +202,25 @@ def chat():
     try:
         logger.info(f"Processing user query: {user_message}")
-        # Process the query through the QA chain
-        result = qa_chain({"question": user_message})
-        # Extract the answer
         answer = result.get("answer", "I'm sorry, I couldn't generate a response.")
-        # Format the answer (escape markdown, format links, and handle numbered lists)
         answer = escape_markdown(answer)
         answer = format_links_as_html(answer)
         answer = format_markdown_with_breaks(answer)
         logger.info("Query processed successfully")
-        return jsonify({
-            "answer": answer,
-            # No sources included in the response
-        })
     except Exception as e:
-        logger.error(f"Error processing request: {str(e)}")
-        return jsonify({"error": f"Error processing request: {str(e)}"}), 500
 if __name__ == '__main__':
-    # For Docker deployment, bind to all interfaces and use port 7860
     port = int(os.environ.get('PORT', 7860))
     app.run(host='0.0.0.0', port=port, debug=False)

 import os
 from flask import Flask, request, jsonify, render_template
 import google.generativeai as genai
+# LangChain Community has the updated vector stores
+from langchain_community.vectorstores import FAISS
 from langchain_google_genai import GoogleGenerativeAIEmbeddings, ChatGoogleGenerativeAI
 from langchain.chains import ConversationalRetrievalChain
 from langchain.memory import ConversationBufferMemory
 from dotenv import load_dotenv
     # Initialize the language model
     try:
         llm = ChatGoogleGenerativeAI(
+            model="gemini-2.0-flash", # Updated to a newer recommended model
             temperature=0.2,
             top_p=0.85,
             google_api_key=GOOGLE_API_KEY
             retriever=retriever,
             memory=memory,
             verbose=True,
+            return_source_documents=False,
             combine_docs_chain_kwargs={"prompt": get_custom_prompt()},
         )
         logger.info("QA chain created successfully")
 def format_links_as_html(text):
     # Detect markdown style links [text](url)
     markdown_pattern = r'\[(.*?)\]\((https?://[^\s\)]+)\)'
+    text = re.sub(markdown_pattern, r'<a href="\2" target="_blank">\1</a>', text)
     # Handle URLs in square brackets [url]
     bracket_pattern = r'\[(https?://[^\s\]]+)\]'
+    text = re.sub(bracket_pattern, r'<a href="\1" target="_blank">\1</a>', text)
+    # Regular URL pattern - THIS IS THE FIX
+    # The previous pattern r'(https?://[^\s\])+)' was invalid.
+    url_pattern = r'(?<!href=")(https?://[^\s<]+)'
+    # Replace URLs with HTML anchor tags
+    text = re.sub(url_pattern, r'<a href="\1" target="_blank">\1</a>', text)
     return text
 # Function to properly escape asterisks for markdown rendering
 def escape_markdown(text):
+    return re.sub(r'(?<!\*)\*(?!\*)', r'\\*', text)
 # Function to format markdown and handle asterisks with proper line breaks
 def format_markdown_with_breaks(text):
     text = text.replace('\\*', '*')
     text = re.sub(r'\*\*(.*?)\*\*', r'<strong>\1</strong>', text)
     lines = text.split('\n')
     formatted_lines = []
     for i, line in enumerate(lines):
+        stripped_line = line.strip()
+        if stripped_line.startswith('* '):
+            content = stripped_line[2:].strip()
+            # Use a bullet point character for lists
+            formatted_lines.append(f"<br>• {content}")
+        elif stripped_line.startswith('*'):
+            content = stripped_line[1:].strip()
+            formatted_lines.append(f"<br>• {content}")
         else:
             formatted_lines.append(line)
+    # Join the lines, but remove the initial <br> if it exists
+    result = '\n'.join(formatted_lines)
+    if result.startswith('<br>'):
+        result = result[4:]
+    return result
 @app.route('/')
 def home():
     try:
         current_time = time.time()
         uptime_seconds = current_time - app_start_time
         health_status = {
             "status": "healthy",
             "timestamp": time.strftime("%Y-%m-%d %H:%M:%S UTC", time.gmtime()),
             "uptime_seconds": round(uptime_seconds, 2),
             "chatbot_initialized": qa_chain is not None
         }
         return jsonify(health_status), 200
     except Exception as e:
         logger.error(f"Health check failed: {str(e)}")
         return jsonify({
+            "status": "unhealthy", "error": str(e),
             "timestamp": time.strftime("%Y-%m-%d %H:%M:%S UTC", time.gmtime())
         }), 500
 @app.route('/ping')
 def ping():
     """Simple ping endpoint for basic uptime checks"""
     return "pong", 200
 @app.route('/api/chat', methods=['POST'])
 def chat():
     global qa_chain
     if qa_chain is None:
+        if not initialize_chatbot():
+            return jsonify({"error": "Failed to initialize chatbot. Check server logs."}), 500
     data = request.json
     user_message = data.get('message', '')
     try:
         logger.info(f"Processing user query: {user_message}")
+        # Use .invoke() instead of the deprecated __call__ method
+        result = qa_chain.invoke({"question": user_message})
         answer = result.get("answer", "I'm sorry, I couldn't generate a response.")
+        # Format the answer
         answer = escape_markdown(answer)
         answer = format_links_as_html(answer)
         answer = format_markdown_with_breaks(answer)
         logger.info("Query processed successfully")
+        return jsonify({"answer": answer})
     except Exception as e:
+        # Log the full traceback for better debugging
+        logger.exception(f"Error processing request: {str(e)}")
+        return jsonify({"error": f"An internal error occurred: {str(e)}"}), 500
 if __name__ == '__main__':
     port = int(os.environ.get('PORT', 7860))
     app.run(host='0.0.0.0', port=port, debug=False)