mbudisic committed on
Commit
119237b
·
1 Parent(s): 6abc2ec

feat: Refactor ApplicationState and initialize datastore

Browse files

- Refactored the ApplicationState class to streamline initialization and state management.
- Introduced a new datastore management system using DatastoreManager and MemorySaver.
- Updated the on_chat_start function to handle datastore initialization and graph compilation.
- Added a new chainlit.md file for developer onboarding and documentation.

Files changed (2) hide show
  1. app.py +135 -165
  2. chainlit.md +14 -0
app.py CHANGED
@@ -1,7 +1,4 @@
1
  from pstuts_rag.configuration import Configuration
2
- from pstuts_rag.datastore import fill_the_db
3
- from pstuts_rag.graph import build_the_graph
4
- from pstuts_rag.state import PsTutsTeamState
5
  import requests
6
  import asyncio
7
  import json
@@ -12,21 +9,21 @@ import re
12
 
13
  import chainlit as cl
14
  from dotenv import load_dotenv
 
15
  from langchain_core.documents import Document
16
  from langchain_core.language_models import BaseChatModel
17
  from langchain_core.runnables import Runnable
18
- from langchain_openai import ChatOpenAI
19
  from langchain_core.embeddings import Embeddings
20
- from langchain_huggingface import HuggingFaceEmbeddings
21
 
22
 
23
  from langchain_core.messages import HumanMessage, BaseMessage
24
- import langgraph.graph
25
-
26
 
27
- import pstuts_rag.datastore
28
- import pstuts_rag.rag
29
 
 
 
 
 
30
 
31
  import nest_asyncio
32
  from uuid import uuid4
@@ -80,22 +77,10 @@ class ApplicationState:
80
  pointsLoaded: Number of data points loaded into the database
81
  """
82
 
83
- embeddings: Embeddings = None
84
- docs: List[Document] = []
85
- qdrant_client = None
86
- vector_store = None
87
- datastore_manager = None
88
- rag = None
89
- llm: BaseChatModel = None
90
- rag_chain: Runnable = None
91
-
92
- ai_graph: Runnable = None
93
- ai_graph_sketch = None
94
-
95
- tasks: List[asyncio.Task] = []
96
-
97
- hasLoaded: asyncio.Event = asyncio.Event()
98
- pointsLoaded: int = 0
99
 
100
  def __init__(self) -> None:
101
  """
@@ -104,7 +89,7 @@ class ApplicationState:
104
  load_dotenv()
105
  set_api_key_if_not_present("OPENAI_API_KEY")
106
  set_api_key_if_not_present("TAVILY_API_KEY")
107
- os.environ["LANGCHAIN_TRACING_V2"] = "true"
108
  os.environ["LANGCHAIN_PROJECT"] = (
109
  f"AIE - MBUDISIC - HF - CERT - {unique_id}"
110
  )
@@ -112,40 +97,7 @@ class ApplicationState:
112
 
113
 
114
  # Initialize global application state
115
- app_state = ApplicationState()
116
- params = Configuration()
117
- ai_state = PsTutsTeamState(
118
- messages=[],
119
- team_members=[VIDEOARCHIVE, ADOBEHELP],
120
- next="START",
121
- )
122
-
123
-
124
- async def initialize():
125
-
126
- await fill_the_db(app_state)
127
- app_state.ai_graph, app_state.ai_graph_sketch = await build_the_graph(
128
- app_state
129
- )
130
-
131
-
132
- def enter_chain(message: str):
133
- """
134
- Entry point for the agent graph chain.
135
-
136
- Transforms a user message into the state format expected by the agent graph.
137
-
138
- Args:
139
- message: User's input message
140
-
141
- Returns:
142
- Dictionary with the message and team members information
143
- """
144
- results = {
145
- "messages": [HumanMessage(content=message)],
146
- "team_members": [VIDEOARCHIVE, ADOBEHELP],
147
- }
148
- return results
149
 
150
 
151
  @cl.on_chat_start
@@ -156,105 +108,123 @@ async def on_chat_start():
156
  Sets up the language model, vector database components, and spawns tasks
157
  for database population and graph building.
158
  """
159
- app_state.llm = ChatOpenAI(model=params.tool_calling_model, temperature=0)
160
- # Use LangChain's built-in HuggingFaceEmbeddings wrapper
161
- app_state.embeddings = HuggingFaceEmbeddings(
162
- model_name=params.embedding_model
163
- )
164
 
165
- app_state.rag = pstuts_rag.rag.RAGChainInstance(
166
- name="deployed",
167
- qdrant_client=app_state.qdrant_client,
168
- llm=app_state.llm,
169
- embeddings=app_state.embeddings,
170
  )
171
-
172
- app_state.tasks.append(asyncio.create_task(initialize()))
173
-
174
-
175
- def process_response(
176
- response_message: BaseMessage,
177
- ) -> Tuple[str, List[cl.Message]]:
178
- """
179
- Processes a response from the AI agents.
180
-
181
- Extracts the main text and video references from the response,
182
- and creates message elements for displaying video content.
183
-
184
- Args:
185
- response: Response object from the AI agent
186
-
187
- Returns:
188
- Tuple containing the text response and a list of message elements with video references
189
- """
190
- streamed_text = f"[_from: {response_message.name}_]\n"
191
- msg_references = []
192
-
193
- if response_message.name == VIDEOARCHIVE:
194
- text, references = pstuts_rag.rag.RAGChainFactory.unpack_references(
195
- str(response_message.content)
196
- )
197
- streamed_text += text
198
-
199
- if len(references) > 0:
200
- references = json.loads(references)
201
- print(references)
202
-
203
- for ref in references:
204
- msg_references.append(
205
- cl.Message(
206
- content=(
207
- f"Watch {ref['title']} from timestamp "
208
- f"{round(ref['start'] // 60)}m:{round(ref['start'] % 60)}s"
209
- ),
210
- elements=[
211
- cl.Video(
212
- name=ref["title"],
213
- url=f"{ref['source']}#t={ref['start']}",
214
- display="side",
215
- )
216
- ],
217
- )
218
  )
219
- else:
220
- streamed_text += str(response_message.content)
221
 
222
- # Find all URLs in the content
223
- urls = re.findall(
224
- r"https?://(?:[-\w.]|(?:%[\da-fA-F]{2}))+[/\w\.-]*(?:\?[/\w\.-=&%]*)?",
225
- str(response_message.content),
 
226
  )
227
- print(urls)
228
- links = []
229
- # Create a list of unique URLs
230
- for idx, u in enumerate(list(set(urls))):
231
-
232
- url = "https://api.microlink.io"
233
- params = {
234
- "url": u,
235
- "screenshot": True,
236
- }
237
-
238
- payload = requests.get(url, params)
239
-
240
- if payload:
241
- print(f"Successful screenshot\n{payload.json()}")
242
- links.append(
243
- cl.Image(
244
- name=f"Website {idx} Preview: {u}",
245
- display="side", # Show in the sidebar
246
- url=payload.json()["data"]["screenshot"]["url"],
247
- )
248
- )
249
 
250
- print(links)
251
- msg_references.append(
252
- cl.Message(
253
- content="\n".join([l.url for l in links]), elements=links
 
254
  )
255
  )
256
 
257
- return streamed_text, msg_references
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
258
 
259
 
260
  @cl.on_message
@@ -268,21 +238,21 @@ async def main(user_cl_message: cl.Message):
268
  Args:
269
  message: User's input message
270
  """
271
- for s in app_state.ai_graph.stream(
272
- user_cl_message.content, {"recursion_limit": 20}
273
- ):
274
- if "__end__" not in s and "supervisor" not in s.keys():
275
- for [node_type, node_response] in s.items():
276
- print(f"Processing {node_type} messages")
277
- for node_message in node_response["messages"]:
278
- print(f"Message {node_message}")
279
- msg = cl.Message(content="")
280
- text, references = process_response(node_message)
281
- for token in [char for char in text]:
282
- await msg.stream_token(token)
283
- await msg.send()
284
- for m in references:
285
- await m.send()
286
 
287
 
288
  if __name__ == "__main__":
 
1
  from pstuts_rag.configuration import Configuration
 
 
 
2
  import requests
3
  import asyncio
4
  import json
 
9
 
10
  import chainlit as cl
11
  from dotenv import load_dotenv
12
+
13
  from langchain_core.documents import Document
14
  from langchain_core.language_models import BaseChatModel
15
  from langchain_core.runnables import Runnable
 
16
  from langchain_core.embeddings import Embeddings
17
+ from langgraph.checkpoint.memory import MemorySaver
18
 
19
 
20
  from langchain_core.messages import HumanMessage, BaseMessage
 
 
21
 
 
 
22
 
23
+ from pstuts_rag.configuration import Configuration
24
+ from pstuts_rag.datastore import DatastoreManager
25
+ from pstuts_rag.rag_for_transcripts import create_transcript_rag_chain
26
+ from pstuts_rag.nodes import initialize
27
 
28
  import nest_asyncio
29
  from uuid import uuid4
 
77
  pointsLoaded: Number of data points loaded into the database
78
  """
79
 
80
+ config: Configuration = Configuration()
81
+ compiled_graph = None
82
+ datastore: DatastoreManager = None
83
+ checkpointer = MemorySaver()
 
 
 
 
 
 
 
 
 
 
 
 
84
 
85
  def __init__(self) -> None:
86
  """
 
89
  load_dotenv()
90
  set_api_key_if_not_present("OPENAI_API_KEY")
91
  set_api_key_if_not_present("TAVILY_API_KEY")
92
+ # os.environ["LANGCHAIN_TRACING_V2"] = "true"
93
  os.environ["LANGCHAIN_PROJECT"] = (
94
  f"AIE - MBUDISIC - HF - CERT - {unique_id}"
95
  )
 
97
 
98
 
99
  # Initialize global application state
100
+ _app_state = ApplicationState()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
101
 
102
 
103
  @cl.on_chat_start
 
108
  Sets up the language model, vector database components, and spawns tasks
109
  for database population and graph building.
110
  """
111
+ global _app_state
 
 
 
 
112
 
113
+ # Initialize datastore using asyncio.to_thread to avoid blocking
114
+ initialize_datastore: bool = _app_state.datastore is None or (
115
+ isinstance(_app_state.datastore, DatastoreManager)
116
+ and _app_state.datastore.count_docs() == 0
 
117
  )
118
+ if initialize_datastore:
119
+ _app_state.datastore = await asyncio.to_thread(
120
+ lambda: DatastoreManager(
121
+ config=_app_state.config
122
+ ).add_completion_callback(
123
+ lambda: cl.run_sync(
124
+ cl.Message(content="Datastore loading completed.").send()
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
125
  )
126
+ )
127
+ )
128
 
129
+ # Initialize and compile graph synchronously (blocking as intended)
130
+ if _app_state.compiled_graph is None:
131
+ _app_state.datastore, graph_builder = initialize(_app_state.datastore)
132
+ _app_state.compiled_graph = graph_builder.compile(
133
+ checkpointer=_app_state.checkpointer
134
  )
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
135
 
136
+ # Start datastore population as background task (non-blocking)
137
+ if initialize_datastore:
138
+ asyncio.create_task(
139
+ _app_state.datastore.from_json_globs(
140
+ _app_state.config.transcript_glob
141
  )
142
  )
143
 
144
+
145
+ # def process_response(
146
+ # response_message: BaseMessage,
147
+ # ) -> Tuple[str, List[cl.Message]]:
148
+ # """
149
+ # Processes a response from the AI agents.
150
+
151
+ # Extracts the main text and video references from the response,
152
+ # and creates message elements for displaying video content.
153
+
154
+ # Args:
155
+ # response: Response object from the AI agent
156
+
157
+ # Returns:
158
+ # Tuple containing the text response and a list of message elements with video references
159
+ # """
160
+ # streamed_text = f"[_from: {response_message.name}_]\n"
161
+ # msg_references = []
162
+
163
+ # if response_message.name == VIDEOARCHIVE:
164
+ # text, references = pstuts_rag.rag.RAGChainFactory.unpack_references(
165
+ # str(response_message.content)
166
+ # )
167
+ # streamed_text += text
168
+
169
+ # if len(references) > 0:
170
+ # references = json.loads(references)
171
+ # print(references)
172
+
173
+ # for ref in references:
174
+ # msg_references.append(
175
+ # cl.Message(
176
+ # content=(
177
+ # f"Watch {ref['title']} from timestamp "
178
+ # f"{round(ref['start'] // 60)}m:{round(ref['start'] % 60)}s"
179
+ # ),
180
+ # elements=[
181
+ # cl.Video(
182
+ # name=ref["title"],
183
+ # url=f"{ref['source']}#t={ref['start']}",
184
+ # display="side",
185
+ # )
186
+ # ],
187
+ # )
188
+ # )
189
+ # else:
190
+ # streamed_text += str(response_message.content)
191
+
192
+ # # Find all URLs in the content
193
+ # urls = re.findall(
194
+ # r"https?://(?:[-\w.]|(?:%[\da-fA-F]{2}))+[/\w\.-]*(?:\?[/\w\.-=&%]*)?",
195
+ # str(response_message.content),
196
+ # )
197
+ # print(urls)
198
+ # links = []
199
+ # # Create a list of unique URLs
200
+ # for idx, u in enumerate(list(set(urls))):
201
+
202
+ # url = "https://api.microlink.io"
203
+ # params = {
204
+ # "url": u,
205
+ # "screenshot": True,
206
+ # }
207
+
208
+ # payload = requests.get(url, params)
209
+
210
+ # if payload:
211
+ # print(f"Successful screenshot\n{payload.json()}")
212
+ # links.append(
213
+ # cl.Image(
214
+ # name=f"Website {idx} Preview: {u}",
215
+ # display="side", # Show in the sidebar
216
+ # url=payload.json()["data"]["screenshot"]["url"],
217
+ # )
218
+ # )
219
+
220
+ # print(links)
221
+ # msg_references.append(
222
+ # cl.Message(
223
+ # content="\n".join([l.url for l in links]), elements=links
224
+ # )
225
+ # )
226
+
227
+ # return streamed_text, msg_references
228
 
229
 
230
  @cl.on_message
 
238
  Args:
239
  message: User's input message
240
  """
241
+ # for s in app_state.ai_graph.stream(
242
+ # user_cl_message.content, {"recursion_limit": 20}
243
+ # ):
244
+ # if "__end__" not in s and "supervisor" not in s.keys():
245
+ # for [node_type, node_response] in s.items():
246
+ # print(f"Processing {node_type} messages")
247
+ # for node_message in node_response["messages"]:
248
+ # print(f"Message {node_message}")
249
+ # msg = cl.Message(content="")
250
+ # text, references = process_response(node_message)
251
+ # for token in [char for char in text]:
252
+ # await msg.stream_token(token)
253
+ # await msg.send()
254
+ # for m in references:
255
+ # await m.send()
256
 
257
 
258
  if __name__ == "__main__":
chainlit.md ADDED
@@ -0,0 +1,14 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ # Welcome to Chainlit! πŸš€πŸ€–
2
+
3
+ Hi there, Developer! πŸ‘‹ We're excited to have you on board. Chainlit is a powerful tool designed to help you prototype, debug and share applications built on top of LLMs.
4
+
5
+ ## Useful Links πŸ”—
6
+
7
+ - **Documentation:** Get started with our comprehensive [Chainlit Documentation](https://docs.chainlit.io) πŸ“š
8
+ - **Discord Community:** Join our friendly [Chainlit Discord](https://discord.gg/k73SQ3FyUh) to ask questions, share your projects, and connect with other developers! πŸ’¬
9
+
10
+ We can't wait to see what you create with Chainlit! Happy coding! πŸ’»πŸ˜Š
11
+
12
+ ## Welcome screen
13
+
14
+ To modify the welcome screen, edit the `chainlit.md` file at the root of your project. If you do not want a welcome screen, just leave this file empty.