Update app.py
Browse files
app.py
CHANGED
@@ -2,21 +2,25 @@ from fastapi import APIRouter, HTTPException
|
|
2 |
from pydantic import BaseModel
|
3 |
from pathlib import Path
|
4 |
import os
|
|
|
5 |
from langchain_community.vectorstores import FAISS
|
6 |
from langchain_community.embeddings import HuggingFaceEmbeddings
|
7 |
from langchain.prompts import PromptTemplate
|
8 |
from langchain_together import Together
|
9 |
from langchain.memory import ConversationBufferWindowMemory
|
10 |
from langchain.chains import ConversationalRetrievalChain
|
|
|
|
|
11 |
|
12 |
# Set the API key for Together.ai
|
13 |
-
|
14 |
|
15 |
# Ensure proper cache directory is available for models
|
16 |
os.environ['TRANSFORMERS_CACHE'] = '/tmp/cache'
|
17 |
|
18 |
# Initialize FastAPI Router
|
19 |
-
|
|
|
20 |
|
21 |
# Lazy loading of large models (only load embeddings and index when required)
|
22 |
embeddings = HuggingFaceEmbeddings(
|
@@ -26,7 +30,7 @@ embeddings = HuggingFaceEmbeddings(
|
|
26 |
|
27 |
index_path = Path("models/index.faiss")
|
28 |
if not index_path.exists():
|
29 |
-
raise FileNotFoundError("FAISS index not found. Please generate it and place it in '
|
30 |
|
31 |
# Load the FAISS index
|
32 |
db = FAISS.load_local("models", embeddings, allow_dangerous_deserialization=True)
|
@@ -46,7 +50,7 @@ llm = Together(
|
|
46 |
model="mistralai/Mistral-7B-Instruct-v0.2",
|
47 |
temperature=0.5,
|
48 |
max_tokens=1024,
|
49 |
-
together_api_key=TOGETHER_AI_API,
|
50 |
)
|
51 |
|
52 |
# Set up memory for conversational context
|
@@ -60,25 +64,85 @@ qa_chain = ConversationalRetrievalChain.from_llm(
|
|
60 |
combine_docs_chain_kwargs={"prompt": prompt},
|
61 |
)
|
62 |
|
|
|
|
|
|
|
63 |
# Input schema for chat requests
|
64 |
class ChatRequest(BaseModel):
|
65 |
question: str
|
66 |
chat_history: str
|
67 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
68 |
# POST endpoint to handle chat requests
|
69 |
-
@
|
70 |
async def chat(request: ChatRequest):
|
71 |
try:
|
72 |
-
#
|
73 |
-
|
74 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
75 |
result = qa_chain(inputs)
|
76 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
77 |
except Exception as e:
|
78 |
-
# Return an error if something goes wrong
|
79 |
raise HTTPException(status_code=500, detail=f"Error processing request: {str(e)}")
|
80 |
|
81 |
# GET endpoint to check if the API is running
|
82 |
-
@
|
83 |
async def root():
|
84 |
-
return {"message": "LawGPT API is running."}
|
|
|
2 |
from pydantic import BaseModel
|
3 |
from pathlib import Path
|
4 |
import os
|
5 |
+
import re
|
6 |
from langchain_community.vectorstores import FAISS
|
7 |
from langchain_community.embeddings import HuggingFaceEmbeddings
|
8 |
from langchain.prompts import PromptTemplate
|
9 |
from langchain_together import Together
|
10 |
from langchain.memory import ConversationBufferWindowMemory
|
11 |
from langchain.chains import ConversationalRetrievalChain
|
12 |
+
from langdetect import detect
|
13 |
+
from googletrans import Translator, LANGUAGES
|
14 |
|
15 |
# Set the API key for Together.ai
|
16 |
+
os.environ["TOGETHER_AI_API"] = "1c27fe0df51a29edee1bec6b4b648b436cc80cf4ccc36f56de17272d9e663cbd"
|
17 |
|
18 |
# Ensure proper cache directory is available for models
|
19 |
os.environ['TRANSFORMERS_CACHE'] = '/tmp/cache'
|
20 |
|
21 |
# Initialize FastAPI Router
|
22 |
+
router = APIRouter()
|
23 |
+
bot_name = "LawGPT"
|
24 |
|
25 |
# Lazy loading of large models (only load embeddings and index when required)
|
26 |
embeddings = HuggingFaceEmbeddings(
|
|
|
30 |
|
31 |
# Fail fast if the FAISS index has not been generated yet.
index_path = Path("models") / "index.faiss"
if not index_path.exists():
    raise FileNotFoundError("FAISS index not found. Please generate it and place it in 'models'.")

# Load the FAISS index from the "models" directory.
# NOTE(review): allow_dangerous_deserialization=True trusts the pickled index
# on disk — only safe while the index file is produced by this project itself.
db = FAISS.load_local("models", embeddings, allow_dangerous_deserialization=True)
|
|
|
50 |
model="mistralai/Mistral-7B-Instruct-v0.2",
|
51 |
temperature=0.5,
|
52 |
max_tokens=1024,
|
53 |
+
together_api_key=os.getenv("TOGETHER_AI_API"),
|
54 |
)
|
55 |
|
56 |
# Set up memory for conversational context
|
|
|
64 |
combine_docs_chain_kwargs={"prompt": prompt},
|
65 |
)
|
66 |
|
67 |
+
# Shared Google Translate client used by the chat endpoints.
# NOTE(review): the chat endpoint awaits this client's methods, so this must
# be the async-capable googletrans Translator (4.x) — confirm the installed
# version; awaiting the legacy sync Translator would fail at runtime.
translator = Translator()
|
69 |
+
|
70 |
# Input schema for chat requests
class ChatRequest(BaseModel):
    """Request body for the /chat/ endpoint."""

    # The user's question; the endpoint translates it to English itself.
    question: str
    # Prior conversation turns, passed through verbatim to the chain.
    chat_history: str
|
74 |
|
75 |
+
# Function to validate the input question.
# Patterns are compiled once at import time rather than on every call.
_DIGITS_ONLY_RE = re.compile(r'^\d+$')
_SYMBOLS_ONLY_RE = re.compile(r'^[^a-zA-Z0-9\s]+$')

# Keywords related to Indian law and crime used to screen incoming questions.
_LEGAL_KEYWORDS = [
    "IPC", "CrPC", "section", "law", "crime", "penalty", "punishment",
    "legal", "court", "justice", "offense", "fraud", "murder", "theft",
    "bail", "arrest", "FIR", "judgment", "act", "contract", "constitutional",
    "habeas corpus", "petition", "rights", "lawyer", "advocate", "accused",
    "penal", "conviction", "sentence", "appeal", "trial", "witness",
]

# Whole-word, case-insensitive match so e.g. "law" does not fire on
# "flawless" and "act" does not fire on "react" (the previous substring
# check accepted such questions).
_LEGAL_KEYWORD_RE = re.compile(
    r'\b(?:' + '|'.join(re.escape(keyword) for keyword in _LEGAL_KEYWORDS) + r')\b',
    re.IGNORECASE,
)


def is_valid_question(question: str) -> bool:
    """
    Validate the input question to ensure it is meaningful and related to
    Indian law or crime.

    Returns True only when the stripped question is at least 3 characters
    long, is not composed solely of digits or solely of symbols, and
    contains at least one legal keyword as a whole word (case-insensitive).
    """
    question = question.strip()

    # Reject if the question is too short to be meaningful.
    if len(question) < 3:
        return False

    # Reject if the question contains only numbers or only symbols.
    if _DIGITS_ONLY_RE.match(question) or _SYMBOLS_ONLY_RE.match(question):
        return False

    # Require at least one whole-word legal keyword.
    return bool(_LEGAL_KEYWORD_RE.search(question))
|
104 |
+
|
105 |
# POST endpoint to handle chat requests
@router.post("/chat/")
async def chat(request: ChatRequest):
    """
    Answer a legal question in the language it was asked in.

    Flow: detect the question's language, translate it to English, screen it
    with is_valid_question, run the retrieval chain, then translate the
    answer back to the detected language.

    Raises:
        HTTPException: status 500 if any step of the pipeline fails.
    """
    try:
        # Detect the language of the incoming question.
        # NOTE(review): these translator calls are awaited, which matches
        # googletrans' async API (4.x); confirm the installed version —
        # awaiting the legacy sync Translator would fail at runtime.
        detected_lang = await translator.detect(request.question)
        detected_language = detected_lang.lang

        # Translate question to English for validation and retrieval.
        question_translation = await translator.translate(request.question, src=detected_language, dest="en")
        question_in_english = question_translation.text

        # Validate the translated question before spending an LLM call on it.
        if not is_valid_question(question_in_english):
            return {
                "answer": "Please provide a valid legal question related to Indian laws.",
                "language": LANGUAGES.get(detected_language, "unknown")
            }

        # Prepare input for LLM
        inputs = {"question": question_in_english, "chat_history": request.chat_history}

        # Run LLM retrieval chain.
        # NOTE(review): qa_chain(inputs) is a synchronous call inside an async
        # endpoint — it blocks the event loop for the duration of the LLM
        # request; consider run_in_executor or an async chain API.
        result = qa_chain(inputs)

        # Ensure response contains an answer
        if 'answer' not in result:
            raise ValueError("Missing 'answer' key in the result from qa_chain")

        # Translate response back to the original language.
        answer_translation = await translator.translate(result["answer"], src="en", dest=detected_language)
        answer_in_original_language = answer_translation.text

        return {
            "answer": answer_in_original_language,
            "language": LANGUAGES.get(detected_language, "unknown")
        }
    except Exception as e:
        # Surface any failure as a 500; chain the cause so the original
        # traceback is preserved for server-side debugging.
        raise HTTPException(status_code=500, detail=f"Error processing request: {str(e)}") from e
|
144 |
|
145 |
# GET endpoint to check if the API is running
@router.get("/")
async def root():
    """Health check: confirm the LawGPT API is up."""
    return {"message": "LawGPT API is running."}
|