Spaces:

RAHMAN00700
/

Chat-with-Multiple-Documents-Using-Streamlit-and-Watsonx

Running

App Files Files Community

RAHMAN00700 committed on Nov 10, 2024

Commit

a455ea8

unverified ·

1 Parent(s): c73f78c

Create app.py

Browse files

Files changed (1) hide show

app.py +199 -0

app.py ADDED Viewed

	@@ -0,0 +1,199 @@

+import hashlib
+import os
+import tempfile
+import streamlit as st
+from pptx import Presentation
+from docx import Document
+from langchain.document_loaders import PyPDFLoader, TextLoader
+from langchain.indexes import VectorstoreIndexCreator
+from langchain.chains import RetrievalQA
+from langchain.text_splitter import RecursiveCharacterTextSplitter
+from langchain.embeddings import HuggingFaceEmbeddings
+from langchain.chains import LLMChain
+from langchain.prompts import PromptTemplate
+from ibm_watson_machine_learning.foundation_models import Model
+from ibm_watson_machine_learning.foundation_models.extensions.langchain import WatsonxLLM
+from ibm_watson_machine_learning.metanames import GenTextParamsMetaNames as GenParams
+from ibm_watson_machine_learning.foundation_models.utils.enums import DecodingMethods
+# Module-level defaults for the script. Both names are reassigned further down:
+# `index` when a file is uploaded in the sidebar, `rag_chain` once an index exists.
+index = None
+rag_chain = None  # Stays None when no document is uploaded; the chat loop then uses the plain chain
+# Custom loader for DOCX files
+class DocxLoader:
+    def __init__(self, file_path):
+        self.file_path = file_path
+    def load(self):
+        document = Document(self.file_path)
+        text_content = []
+        for para in document.paragraphs:
+            text_content.append(para.text)
+        return " ".join(text_content)
+# Custom loader for PPTX files
+class PptxLoader:
+    def __init__(self, file_path):
+        self.file_path = file_path
+    def load(self):
+        presentation = Presentation(self.file_path)
+        text_content = []
+        for slide in presentation.slides:
+            for shape in slide.shapes:
+                if hasattr(shape, "text"):
+                    text_content.append(shape.text)
+        return " ".join(text_content)
+# Caching function to load various file types
+@st.cache_resource
+def load_file(file_name, file_type):
+    loaders = []
+    if file_type == "pdf":
+        loaders = [PyPDFLoader(file_name)]
+    elif file_type == "docx":
+        loader = DocxLoader(file_name)
+        text = loader.load()
+        with tempfile.NamedTemporaryFile(delete=False, suffix=".txt") as temp_file:
+            temp_file.write(text.encode("utf-8"))
+            temp_file_path = temp_file.name
+        loaders = [TextLoader(temp_file_path)]
+    elif file_type == "txt":
+        loaders = [TextLoader(file_name)]
+    elif file_type == "pptx":
+        loader = PptxLoader(file_name)
+        text = loader.load()
+        with tempfile.NamedTemporaryFile(delete=False, suffix=".txt") as temp_file:
+            temp_file.write(text.encode("utf-8"))
+            temp_file_path = temp_file.name
+        loaders = [TextLoader(temp_file_path)]
+    else:
+        st.error("Unsupported file type.")
+        return None
+    index = VectorstoreIndexCreator(
+        embedding=HuggingFaceEmbeddings(model_name="all-MiniLM-L12-v2"),
+        text_splitter=RecursiveCharacterTextSplitter(chunk_size=450, chunk_overlap=50)
+    ).from_loaders(loaders)
+    return index
+def format_history():
+    """Return the text placed in the prompt's ``{context}`` slot when no document is loaded.
+
+    Currently a stub: it always returns an empty string, so earlier chat turns
+    are not passed to the model.
+    """
+    return ""
+# Watsonx API setup using environment variables
+watsonx_api_key = os.getenv("WATSONX_API_KEY")
+watsonx_project_id = os.getenv("WATSONX_PROJECT_ID")
+if not watsonx_api_key or not watsonx_project_id:
+    st.error("API Key or Project ID is not set. Please set them as environment variables.")
+prompt_template_br = PromptTemplate(
+    input_variables=["context", "question"],
+    template="""<|begin_of_text|><|start_header_id|>system<|end_header_id|>
+I am a helpful assistant.
+<|eot_id|>
+{context}
+<|start_header_id|>user<|end_header_id|>
+{question}<|eot_id|>
+"""
+)
+with st.sidebar:
+    st.title("Watsonx RAG with Multiple docs")
+    watsonx_model = st.selectbox("Model", ["meta-llama/llama-3-405b-instruct", "codellama/codellama-34b-instruct-hf", "ibm/granite-20b-multilingual"])
+    max_new_tokens = st.slider("Max output tokens", min_value=100, max_value=4000, value=600, step=100)
+    decoding_method = st.radio("Decoding", (DecodingMethods.GREEDY.value, DecodingMethods.SAMPLE.value))
+    parameters = {
+        GenParams.DECODING_METHOD: decoding_method,
+        GenParams.MAX_NEW_TOKENS: max_new_tokens,
+        GenParams.MIN_NEW_TOKENS: 1,
+        GenParams.TEMPERATURE: 0,
+        GenParams.TOP_K: 50,
+        GenParams.TOP_P: 1,
+        GenParams.STOP_SEQUENCES: [],
+        GenParams.REPETITION_PENALTY: 1
+    }
+    st.info("Upload a PDF, DOCX, TXT, or PPTX file to use RAG")
+    uploaded_file = st.file_uploader("Upload file", accept_multiple_files=False, type=["pdf", "docx", "txt", "pptx"])
+    if uploaded_file is not None:
+        bytes_data = uploaded_file.read()
+        st.write("Filename:", uploaded_file.name)
+        with open(uploaded_file.name, 'wb') as f:
+            f.write(bytes_data)
+        file_type = uploaded_file.name.split('.')[-1].lower()
+        index = load_file(uploaded_file.name, file_type)
+    model_name = watsonx_model
+    def clear_messages():
+        st.session_state.messages = []
+    st.button('Clear messages', on_click=clear_messages)
+st.info("Setting up Watsonx...")
+my_credentials = {
+    "url": "https://us-south.ml.cloud.ibm.com",
+    "apikey": watsonx_api_key
+}
+params = parameters
+project_id = watsonx_project_id
+space_id = None
+verify = False
+model = WatsonxLLM(model=Model(model_name, my_credentials, params, project_id, space_id, verify))
+if model:
+    st.info(f"Model {model_name} ready.")
+    chain = LLMChain(llm=model, prompt=prompt_template_br, verbose=True)
+if chain:
+    st.info("Chat ready.")
+    # Only create rag_chain if index is successfully created
+    if index is not None:
+        rag_chain = RetrievalQA.from_chain_type(
+            llm=model,
+            chain_type="stuff",
+            retriever=index.vectorstore.as_retriever(),
+            chain_type_kwargs={"prompt": prompt_template_br},
+            return_source_documents=False,
+            verbose=True
+        )
+        st.info("Document-based retrieval is ready.")
+    else:
+        st.warning("No document uploaded. Answering common queries without retrieval.")
+# Chat loop for handling queries
+if "messages" not in st.session_state:
+    st.session_state.messages = []
+for message in st.session_state.messages:
+    st.chat_message(message["role"]).markdown(message["content"])
+prompt = st.chat_input("Ask your question here", disabled=False if chain else True)
+if prompt:
+    st.chat_message("user").markdown(prompt)
+    # Answer based on availability of rag_chain or chain
+    if rag_chain:
+        response_text = rag_chain.run(prompt).strip()
+    else:
+        # Use general model-based response if rag_chain is not available
+        response_text = chain.run(question=prompt, context=format_history()).strip("<|start_header_id|>assistant<|end_header_id|>").strip("<|eot_id|>")
+    # Store and display conversation
+    st.session_state.messages.append({'role': 'User', 'content': prompt})
+    st.chat_message("assistant").markdown(response_text)
+    st.session_state.messages.append({'role': 'Assistant', 'content': response_text})