Spaces:

HEHEBOIOG
/

NewsInferno

Sleeping

App Files Files Community

HEHEBOIOG committed on Dec 9, 2024

Commit

187e418

verified ·

1 Parent(s): d047c3e

Update app.py

Browse files

Files changed (1) hide show

app.py +93 -33

app.py CHANGED Viewed

@@ -20,6 +20,7 @@ class AdvancedRAGChatbot:
                  llm_model: str = "llama-3.3-70b-versatile",
                  temperature: float = 0.7,
                  retrieval_k: int = 5):
         self.embeddings = self._configure_embeddings(embedding_model)
         self.semantic_model = SentenceTransformer('all-MiniLM-L6-v2')
         self.sentiment_analyzer = pipeline("sentiment-analysis")
@@ -31,10 +32,12 @@ class AdvancedRAGChatbot:
         self.qa_chain = self._create_conversational_retrieval_chain()
     def _configure_embeddings(self, model_name: str):
         encode_kwargs = {'normalize_embeddings': True, 'show_progress_bar': True}
         return HuggingFaceBgeEmbeddings(model_name=model_name, encode_kwargs=encode_kwargs)
     def _configure_llm(self, model_name: str, temperature: float):
         return ChatGroq(
             model_name=model_name,
             temperature=temperature,
@@ -43,14 +46,24 @@ class AdvancedRAGChatbot:
         )
     def _initialize_vector_database(self, persist_directory: str = 'vector_db'):
         return Chroma(persist_directory=persist_directory, embedding_function=self.embeddings)
     def _configure_retriever(self, retrieval_k: int):
-        return self.vector_db.as_retriever(k=retrieval_k, search_type="mmr", fetch_k=20)
     def _create_conversational_retrieval_chain(self):
         template = """
-        You are a helpful AI assistant. Use the following context and chat history to provide a precise answer.
         Context: {context}
         Chat History: {chat_history}
@@ -68,64 +81,111 @@ class AdvancedRAGChatbot:
         )
     def process_query(self, query: str) -> Dict[str, Any]:
         semantic_score = self.semantic_model.encode([query])[0]
         sentiment_result = self.sentiment_analyzer(query)[0]
         entities = self.ner_pipeline(query)
         result = self.qa_chain({"question": query})
-        response_data = {
             "response": result['answer'],
             "source_documents": result.get('source_documents', []),
             "semantic_similarity": semantic_score.tolist(),
             "sentiment": sentiment_result,
-            "named_entities": entities,
-            "contextual_information": result.get("source_documents", [])
         }
-        return response_data
 def main():
-    st.set_page_config(page_title="Advanced NLP RAG Chatbot", layout="wide", initial_sidebar_state="expanded")
-    st.title("🧠 Advanced NLP RAG Chatbot")
     with st.sidebar:
-        st.header("Configuration")
         embedding_model = st.selectbox(
             "Embedding Model",
             ["BAAI/bge-large-en-v1.5", "sentence-transformers/all-MiniLM-L6-v2"]
         )
-        temperature = st.slider("Model Temperature", 0.0, 1.0, 0.7)
-        retrieval_k = st.slider("Documents to Retrieve (k)", 1, 10, 5)
     chatbot = AdvancedRAGChatbot(
         embedding_model=embedding_model,
         temperature=temperature,
         retrieval_k=retrieval_k
     )
-    st.markdown("### Chat with the AI Assistant")
-    query_col, response_col = st.columns(2)
-    with query_col:
-        user_input = st.text_area("Ask your question:", placeholder="Type your question here...", height=150)
-    if user_input:
-        with st.spinner("Processing your query..."):
-            response = chatbot.process_query(user_input)
-        with response_col:
-            st.markdown("### Bot Response")
-            st.write(response['response'])
-            st.markdown("### Sentiment Analysis")
-            st.write(f"Sentiment: {response['sentiment']['label']} ({response['sentiment']['score']:.2%})")
-            st.markdown("### Named Entities")
-            for entity in response['named_entities']:
-                st.write(f"- {entity['word']} ({entity['entity']})")
-            st.markdown("### Source Documents")
-            for doc in response['source_documents']:
-                st.text_area("Source Document", doc.page_content, height=100)
 if __name__ == "__main__":
-    main()

                  llm_model: str = "llama-3.3-70b-versatile",
                  temperature: float = 0.7,
                  retrieval_k: int = 5):
+        """Initialize the Advanced RAG Chatbot with configurable parameters"""
         self.embeddings = self._configure_embeddings(embedding_model)
         self.semantic_model = SentenceTransformer('all-MiniLM-L6-v2')
         self.sentiment_analyzer = pipeline("sentiment-analysis")
         self.qa_chain = self._create_conversational_retrieval_chain()
     def _configure_embeddings(self, model_name: str):
         """Build the embedding backend for the given model.

         Args:
             model_name: Model identifier forwarded to the embeddings class.

         Returns:
             A ``HuggingFaceBgeEmbeddings`` instance configured to normalize
             its embeddings and show a progress bar while encoding.
         """
         # NOTE(review): the BGE wrapper is used for whatever model name is
         # passed in, including non-BGE models -- confirm this is intended.
         return HuggingFaceBgeEmbeddings(
             model_name=model_name,
             encode_kwargs={
                 'normalize_embeddings': True,
                 'show_progress_bar': True,
             },
         )
     def _configure_llm(self, model_name: str, temperature: float):
+        """Configure the Language Model with Groq"""
         return ChatGroq(
             model_name=model_name,
             temperature=temperature,
         )
     def _initialize_vector_database(self, persist_directory: str = 'vector_db'):
         """Open the Chroma vector store used for retrieval.

         Args:
             persist_directory: Directory handed to Chroma as its persistence
                 location.

         Returns:
             A ``Chroma`` store that embeds with ``self.embeddings``.
         """
         store = Chroma(
             embedding_function=self.embeddings,
             persist_directory=persist_directory,
         )
         return store
     def _configure_retriever(self, retrieval_k: int):
+        """Configure the document retriever"""
+        return self.vector_db.as_retriever(
+            search_kwargs={
+                "k": retrieval_k,
+                "search_type": "mmr",
+                "fetch_k": 20
+            }
+        )
     def _create_conversational_retrieval_chain(self):
+        """Create the conversational retrieval chain"""
         template = """
+        You are a helpful AI assistant. Provide a precise and comprehensive answer
+        based on the context and chat history.
         Context: {context}
         Chat History: {chat_history}
         )
     def process_query(self, query: str) -> Dict[str, Any]:
         """Answer a query and attach NLP diagnostics about it.

         Args:
             query: The user's question.

         Returns:
             A dict with the keys:
               - "response": the ``answer`` field of the QA chain result.
               - "source_documents": the chain's ``source_documents``, or an
                 empty list when the chain returns none.
               - "semantic_similarity": the query's embedding converted with
                 ``tolist()``. Despite the key name this is the encoded
                 vector itself, not a similarity score.
               - "sentiment": first result of the sentiment analyzer.
               - "named_entities": output of the NER pipeline.
         """
         # Advanced NLP Analysis
         query_embedding = self.semantic_model.encode([query])[0]
         sentiment_result = self.sentiment_analyzer(query)[0]
         entities = self.ner_pipeline(query)
         # RAG Query Processing: calling the chain object directly is
         # deprecated in LangChain; invoke() is the supported entry point.
         result = self.qa_chain.invoke({"question": query})
         return {
             "response": result['answer'],
             "source_documents": result.get('source_documents', []),
             "semantic_similarity": query_embedding.tolist(),
             "sentiment": sentiment_result,
             "named_entities": entities
         }
 def main():
     """Render the Streamlit UI and answer submitted queries.

     Streamlit re-executes this function on every widget interaction, so the
     chatbot is kept in ``st.session_state`` instead of being rebuilt on each
     run. It is recreated only when the sidebar settings change or when the
     "Reset Conversation" button is pressed.
     """
     # Page Configuration
     st.set_page_config(
         page_title="Advanced RAG Chatbot",
         page_icon="🧠",
         layout="wide",
         initial_sidebar_state="expanded"
     )
     # Sidebar Configuration
     with st.sidebar:
         st.header("🔧 Chatbot Settings")
         st.markdown("Customize your AI assistant's behavior")
         # Model Configuration
         embedding_model = st.selectbox(
             "Embedding Model",
             ["BAAI/bge-large-en-v1.5", "sentence-transformers/all-MiniLM-L6-v2"]
         )
         temperature = st.slider("Creativity Level", 0.0, 1.0, 0.7, help="Higher values make responses more creative")
         retrieval_k = st.slider("Context Depth", 1, 10, 5, help="Number of reference documents to retrieve")
         # Additional Controls
         st.divider()
         reset_chat = st.button("🔄 Reset Conversation")
     # Initialize Chatbot: reuse the instance across reruns; build a fresh one
     # on first run, on reset, or when any setting it was built with changes.
     # NOTE(review): presumably the chain keeps its chat history on the
     # chatbot instance, so replacing the instance is what clears it -- confirm.
     settings = (embedding_model, temperature, retrieval_k)
     needs_new_chatbot = (
         reset_chat
         or "chatbot" not in st.session_state
         or st.session_state["chatbot_settings"] != settings
     )
     if needs_new_chatbot:
         st.session_state["chatbot"] = AdvancedRAGChatbot(
             embedding_model=embedding_model,
             temperature=temperature,
             retrieval_k=retrieval_k
         )
         st.session_state["chatbot_settings"] = settings
     chatbot = st.session_state["chatbot"]
     # Main Chat Interface
     st.title("🤖 Advanced RAG Chatbot")
     # Two-column layout
     col1, col2 = st.columns(2)
     with col1:
         st.header("Input")
         # Chat input with placeholder
         user_input = st.text_area(
             "Ask your question",
             placeholder="Enter your query here...",
             height=250
         )
         # Submit button
         submit_button = st.button("Send Query", type="primary")
     with col2:
         st.header("Response")
         # Only run the pipeline for a submitted, non-blank query.
         if submit_button and user_input and user_input.strip():
             with st.spinner("Processing your query..."):
                 # Rendering stays inside the try so a malformed result is
                 # reported in the UI rather than as a raw traceback.
                 try:
                     response = chatbot.process_query(user_input)
                     # Bot Response
                     st.markdown("#### Bot's Answer")
                     st.write(response['response'])
                     # Sentiment Analysis
                     st.markdown("#### Sentiment Analysis")
                     sentiment = response['sentiment']
                     st.metric(
                         label="Sentiment",
                         value=sentiment['label'],
                         delta=f"{sentiment['score']:.2%}"
                     )
                     # Named Entities
                     st.markdown("#### Detected Entities")
                     for entity in response['named_entities']:
                         st.text(f"{entity['word']} ({entity['entity']})")
                     # Source Documents
                     if response['source_documents']:
                         st.markdown("#### Reference Documents")
                         for i, doc in enumerate(response['source_documents'], 1):
                             with st.expander(f"Document {i}"):
                                 st.write(doc.page_content)
                 except Exception as e:
                     st.error(f"An error occurred: {e}")
         else:
             st.info("Submit a query to see the AI's response")
 if __name__ == "__main__":
     main()