confluence_bot.py

# @see https://github.com/devsentient/examples

import os
from atlassian import Confluence 
from langchain.callbacks.base import BaseCallbackHandler
import streamlit as st
from streamlit_extras.stylable_container import stylable_container
from streamlit_mic_recorder import speech_to_text
from dotenv import load_dotenv

# Import the ConfluenceQA class
from confluence_qa import ConfluenceQA

load_dotenv()

base_config = dict(
    db_url = os.getenv("NEO4J_URI"),
    db_username = os.getenv("NEO4J_USERNAME"),
    db_password = os.getenv("NEO4J_PASSWORD"),
    llm_name = os.getenv("LLM"),
    ollama_base_url = os.getenv("OLLAMA_BASE_URL"),
    embedding_model_name = os.getenv("EMBEDDING_MODEL")
)

class StreamHandler(BaseCallbackHandler):
    def __init__(self, container, initial_text=""):
        self.container = container
        self.text = initial_text

    def on_llm_new_token(self, token: str, **kwargs) -> None:
        self.text += token
        self.container.markdown(self.text)

st.set_page_config(
    page_title='Q&A Bot for Confluence Page',
    page_icon='⚡',
    layout='wide',
    initial_sidebar_state='auto',
)


@st.cache_resource
def load_confluence(config, force_reload:bool=False):
    # st.write("loading the confluence page")
    confluence_qa = ConfluenceQA(config=config)
    confluence_qa.init_embeddings()
    confluence_qa.init_models()
    confluence_qa.vector_store_confluence_docs(force_reload=force_reload)
    confluence_qa.retreival_qa_chain()
    return confluence_qa

def display_chat():
    # Session state
    if "config" not in st.session_state:
        st.session_state["config"] = {}
        st.session_state["config"].update(base_config)

    if "confluence_qa" not in st.session_state:
        st.session_state["confluence_qa"] = None

    if "generated" not in st.session_state:
        st.session_state["generated"] = []

    if "user_input" not in st.session_state:
        st.session_state["user_input"] = []

    if st.session_state["generated"]:
        size = len(st.session_state["generated"])
        # Display only the last three exchanges
        for i in range(max(size - 3, 0), size):
            with st.chat_message("user"):
                st.write(st.session_state["user_input"][i])

            with st.chat_message("assistant"):
                st.write(st.session_state["generated"][i])
        with st.container():
            st.write("&nbsp;")

def chat_input():
    with stylable_container(
        key="bottom_content",
        css_styles="""
            {
                position: fixed;
                bottom: 120px;
            }
            """,
    ):
        speech_text = speech_to_text(language='en', start_prompt="🎙️ Talk", stop_prompt="🎙️ Done", just_once=True, key='STT')
    chat_input_text = st.chat_input("What question can I help you resolve today?")
    user_input = chat_input_text if chat_input_text else speech_text
    if user_input:
        with st.chat_message("user"):
            st.write(user_input)
        with st.chat_message("assistant"):
            stream_handler = StreamHandler(st.empty())
            confluence_qa = st.session_state.get("confluence_qa")
            if confluence_qa is None:
                st.warning("Answer questions based on the pre-ingested confluence page, You can refresh the knowledge graph by clicking [Ingest] in the config panel", icon="🚨")
                confluence_qa = load_confluence(st.session_state["config"])
                st.session_state["confluence_qa"] = confluence_qa
            qa_chain = confluence_qa.retreival_qa_chain()
            result = qa_chain(
                {"question": user_input, "chat_history": []}, callbacks=[stream_handler]
            )["answer"]
            output = result
            st.session_state[f"user_input"].append(user_input)
            st.session_state[f"generated"].append(output)

def list_space(url:str, username:str, password:str) ->[]:
    confluence = Confluence(
        url=url,
        username=username,
        password=password,
        cloud=True)
    result = confluence.get_all_spaces(start=0, limit=500, expand=None)
    spaces = result["results"]
    return list(map(lambda s: f"{s['name']} | ({s['key']})", spaces))

with st.sidebar.form(key ='ConfigForm'):
        st.markdown('## Confluence Config')
        confluence_url = st.text_input("paste the confluence URL", "https://toronto.atlassian.net/wiki")
        username = st.text_input(label="confluence username",
                                help="leave blank if confluence page is public",
                                type="password")
        api_key = st.text_input(label="confluence api key",
                                help="leave blank if confluence page is public",
                                type="password")
        space_key = None
        try:
            spaces = list_space(url=confluence_url, username=username, password=api_key)
            if spaces:
                space = st.selectbox('Which space do you want to import', spaces, index=None)
                if space:
                    space_key = space.split("|")[1].strip().strip("()")
        except BaseException as e:
            st.error(f"{e}", icon="🚨")

        wipeout = st.checkbox(label='Wipeout',
                              help="Wipeout the whole database and clear out all previously loaded data!")

        btSubmitted = st.form_submit_button(label='Ingest')

        if btSubmitted and confluence_url and space_key:
            st.session_state["config"].update({
                "confluence_url": confluence_url,
                "username": username if username != "" else None,
                "api_key": api_key if api_key != "" else None,
                "space_key": space_key,
                "overwrite":wipeout
            })
            with st.spinner(text=f"Ingesting [{space_key}]..."):
                try:
                    confluence_qa = load_confluence(st.session_state["config"], force_reload=True)
                    st.session_state["confluence_qa"] = confluence_qa
                    st.success("Confluence Space Ingested", icon="✅")
                except BaseException as be:
                    if "exist" in be.message:
                        st.error(f"This Space [{space_key}] has already been ingested, You can check the [wipeout] option to delete the whole database and rebuild it again. !!! This could wipe out all the other ingested Spaces too!!!", icon="🚨")
                    else:
                        st.error(f"{be.message}", icon="🚨")
                    pass

st.title("Confluence Q&A Demo")

display_chat()
chat_input()