Tuned the prompt in app.py
AIWithShrey committed Jul 16, 2024
1 parent 9885c03 commit f0865b3
Showing 3 changed files with 399 additions and 2 deletions.
8 changes: 6 additions & 2 deletions README.md
@@ -9,6 +9,10 @@ The AI assistant for tech communities.
- [✔️] **Search Stack Overflow**: InSightful can search Stack Overflow for relevant questions and answers.
- [✔️] **Browse The Web**: InSightful can browse the web for relevant information on community topics.

## Overview of workflow

![RAG-FC](https://github.com/user-attachments/assets/dd56f9e6-f641-4500-8785-15bc1fe37b4b)

## Prerequisites

- Python 3.10.13
@@ -56,5 +60,5 @@ These flags ensure there are no conflicting ports between the services and allow
Finally, run the application.

```bash
- streamlit run InSightful.py
+ streamlit run app.py
```
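
The app reads its service endpoints from environment variables (see app.py below). A minimal sketch of a local invocation, assuming the default ports and that the Tavily search tool reads its key from `TAVILY_API_KEY` (the usual LangChain convention):

```bash
# Hypothetical local setup; adjust hosts and ports to your deployment.
export VECTORDB_HOST=localhost VECTORDB_PORT=8000  # Chroma server
export TEI_HOST=localhost TEI_PORT=8081            # embeddings (TEI) server
export TGI_HOST=localhost TGI_PORT=8080            # text-generation (TGI) server
export STOP_TOKEN="<|im_end|>"                     # model-specific stop sequence
export TAVILY_API_KEY=your-key-here                # assumed: required by the web search tool
streamlit run app.py
```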
258 changes: 258 additions & 0 deletions app.py
@@ -0,0 +1,258 @@
import os
import uuid
import streamlit as st
import datasets
from langchain import hub
from langchain_huggingface import HuggingFaceEndpointEmbeddings, HuggingFaceEndpoint
from langchain_core.output_parsers import StrOutputParser
from langchain_core.runnables import RunnablePassthrough
from langchain.agents import create_react_agent, AgentExecutor
from langchain.tools.retriever import create_retriever_tool
from langchain_community.tools.tavily_search import TavilySearchResults
from langchain_community.utilities import StackExchangeAPIWrapper
from langchain_community.tools.stackexchange.tool import StackExchangeTool
from langchain_core.messages import SystemMessage
from langchain_text_splitters import RecursiveCharacterTextSplitter
from langchain_core.documents import Document
from langchain_chroma import Chroma
import chromadb
from chromadb.config import Settings
from chromadb.utils.embedding_functions import HuggingFaceEmbeddingServer
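
# Note: the app assumes three backing services, addressed via the environment
# variables used below: a Chroma vector DB (VECTORDB_HOST/VECTORDB_PORT), a TEI
# embedding server (TEI_HOST/TEI_PORT), and a TGI generation endpoint
# (TGI_HOST/TGI_PORT).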

st.set_page_config(layout="wide", page_title="InSightful")

# Set up Chroma DB client
def setup_chroma_client():
    client = chromadb.HttpClient(
        host="http://{host}:{port}".format(
            host=os.getenv("VECTORDB_HOST", "localhost"),
            port=os.getenv("VECTORDB_PORT", "8000"),
        ),
        settings=Settings(allow_reset=True),
    )
    return client

# Set up Chroma embedding function
def setup_chroma_embedding_function():
    chroma_embedding_function = HuggingFaceEmbeddingServer(
        url="http://{host}:{port}/embed".format(
            host=os.getenv("TEI_HOST", "localhost"), port=os.getenv("TEI_PORT", "8081")
        )
    )
    return chroma_embedding_function

# Set up HuggingFaceEndpoint model
def setup_huggingface_endpoint():
    model = HuggingFaceEndpoint(
        endpoint_url="http://{host}:{port}".format(
            host=os.getenv("TGI_HOST", "localhost"), port=os.getenv("TGI_PORT", "8080")
        ),
        temperature=0.3,
        task="conversational",
        stop_sequences=[
            "<|im_end|>",
            # NOTE: falls back to "localhost" when STOP_TOKEN is unset; set
            # STOP_TOKEN to your model's stop sequence.
            "{your_token}".format(your_token=os.getenv("STOP_TOKEN", "localhost")),
        ],
    )
    return model

# Set up HuggingFaceEndpointEmbeddings embedder
def setup_huggingface_embeddings():
    embedder = HuggingFaceEndpointEmbeddings(
        model="http://{host}:{port}".format(
            host=os.getenv("TEI_HOST", "localhost"), port=os.getenv("TEI_PORT", "8081")
        ),
        task="feature-extraction",
    )
    return embedder

def load_prompt_and_system_ins():
    prompt = hub.pull("hwchase17/react-chat")
    # Set up the system prompt template (used verbatim as message content; the
    # braces below are literal ReAct scaffolding, not format placeholders)
    template = """
You are InSightful, a virtual assistant designed to help users with a wide range of tasks, from answering simple questions to providing in-depth explanations and discussions on a broad array of topics. As a language model,
you are able to generate human-like text based on the input you receive, allowing you to engage in
natural-sounding conversations and provide responses that are coherent and relevant to the topic at hand.
Always provide accurate and informative responses to a wide range of questions.
You can assess the health of a conversation on Slack from its engagement, and you can gauge the sentiment of those conversations.
You can assess whether people are generally interested or disinterested in the conversation, and you can also determine whether the conversation is positive or negative.
You do not answer questions about personal information, such as social security numbers,
credit card numbers, or other sensitive information. You also do not provide medical, legal, or financial advice.
You will not respond to any questions that are inappropriate or offensive. You are friendly, helpful,
and you are here to assist users with any questions they may have.
Keep your answers clear and concise, and provide as much information as possible to help users understand the topic.
Use your best judgement, and only use a tool if you absolutely need to.
Tools provide you with more context and up-to-date information. Use them to your advantage.
Use the tools for any current information, and use them to verify your answers as well.
Thought: {thought}
Action: {action}
Action Input: {action_input}
Observation: {observation}
If you are ready with an answer, use the format:
Thought: Do I have to use a tool? No
Final Answer: {observation}
"""

    system_instructions = SystemMessage(
        content=template,
        metadata={"role": "system"},
    )

    return prompt, system_instructions

class RAG:
    def __init__(self, llm, embeddings, collection_name, db_client):
        self.llm = llm
        self.embeddings = embeddings
        self.collection_name = collection_name
        self.db_client = db_client

    def load_documents(self, doc):
        # Load the first 500 rows of the dataset as LangChain Documents
        documents = []
        for data in datasets.load_dataset(doc, split="train[:500]").to_list():
            documents.append(
                Document(
                    page_content=data["text"],
                    metadata=dict(user=data["user"], workspace=data["workspace"]),
                )
            )
        print("Documents loaded")
        return documents

    def chunk_doc(self, pages, chunk_size=512, chunk_overlap=30):
        text_splitter = RecursiveCharacterTextSplitter(
            chunk_size=chunk_size, chunk_overlap=chunk_overlap
        )
        chunks = text_splitter.split_documents(pages)
        print("Document chunked")
        return chunks

    def insert_embeddings(self, chunks, chroma_embedding_function, embedder):
        collection = self.db_client.get_or_create_collection(
            self.collection_name, embedding_function=chroma_embedding_function
        )
        for chunk in chunks:
            collection.add(
                ids=[str(uuid.uuid1())],
                metadatas=chunk.metadata,
                documents=chunk.page_content,
            )
        db = Chroma(
            embedding_function=embedder,
            collection_name=self.collection_name,
            client=self.db_client,
        )
        print("Embeddings inserted\n")
        return db

    def query_docs(self, model, question, vector_store, prompt):
        retriever = vector_store.as_retriever(
            search_type="similarity", search_kwargs={"k": 4}
        )
        rag_chain = (
            {"context": retriever | format_docs, "question": RunnablePassthrough()}
            | prompt
            | model
            | StrOutputParser()
        )
        answer = rag_chain.invoke(question)
        return answer

def format_docs(docs):
    return "\n\n".join(doc.page_content for doc in docs)

def create_retriever(name, model, description, client, chroma_embedding_function, embedder):
    rag = RAG(llm=model, embeddings=embedder, collection_name="Slack", db_client=client)
    pages = rag.load_documents("spencer/software_slacks")
    chunks = rag.chunk_doc(pages)
    vector_store = rag.insert_embeddings(chunks, chroma_embedding_function, embedder)
    retriever = vector_store.as_retriever(
        search_type="similarity", search_kwargs={"k": 10}
    )
    info_retriever = create_retriever_tool(retriever, name, description)
    return info_retriever

@st.cache_resource
def setup_tools(_model, _client, _chroma_embedding_function, _embedder):
    stackexchange_wrapper = StackExchangeAPIWrapper(max_results=3)
    stackexchange_tool = StackExchangeTool(api_wrapper=stackexchange_wrapper)

    web_search_tool = TavilySearchResults(
        max_results=5, search_depth="advanced", include_answer=True
    )

    retriever = create_retriever(
        name="Slack conversations retriever",
        model=_model,
        description="Retrieves conversations from Slack for context.",
        client=_client,
        chroma_embedding_function=_chroma_embedding_function,
        embedder=_embedder,
    )
    return [web_search_tool, stackexchange_tool, retriever]

def setup_agent(model, prompt, client, chroma_embedding_function, embedder):
    tools = setup_tools(model, client, chroma_embedding_function, embedder)
    agent = create_react_agent(llm=model, prompt=prompt, tools=tools)
    agent_executor = AgentExecutor(
        agent=agent, verbose=True, tools=tools, handle_parsing_errors=True
    )
    return agent_executor

def main():
    client = setup_chroma_client()
    chroma_embedding_function = setup_chroma_embedding_function()
    prompt, system_instructions = load_prompt_and_system_ins()
    model = setup_huggingface_endpoint()
    embedder = setup_huggingface_embeddings()

    agent_executor = setup_agent(
        model, prompt, client, chroma_embedding_function, embedder
    )

    st.title("InSightful: Your AI Assistant for community questions")
    st.markdown(
        """
        InSightful is an AI assistant that helps you with your questions.
        - It can browse past conversations with your colleagues/teammates and can search StackOverflow for technical questions.
        - With access to the web, InSightful can also conduct its own research for you."""
    )

    chat_history = st.session_state.get(
        "chat_history", [{"role": "system", "content": system_instructions.content}]
    )

    # Replay prior turns, skipping the system message
    for message in chat_history[1:]:
        with st.chat_message(message["role"]):
            st.markdown(message["content"])

    if question := st.chat_input("Enter your question here"):
        st.chat_message("user").markdown(question)
        chat_history.append({"role": "user", "content": question})
        with st.spinner():
            response = agent_executor.invoke(
                {
                    "input": question,
                    "chat_history": chat_history,
                }
            )["output"]
        st.chat_message("assistant").markdown(response)
        chat_history.append({"role": "assistant", "content": response})

    st.session_state["chat_history"] = chat_history

if __name__ == "__main__":
    main()