|
import os
import zipfile
from typing import Optional, List

import gdown
import streamlit as st
from dotenv import load_dotenv

from agent_workflow import SearchAgent
from tantivy_search_agent import TantivySearchAgent
|
|
|
|
|
# Load variables from a local .env file into the process environment at import
# time, so the os.getenv("GDRIVE_INDEX_ID", ...) lookup in SearchAgentUI sees them.
load_dotenv()
|
|
|
class SearchAgentUI:
    """Streamlit front end for the multi-step search agent.

    The class wires together a ``TantivySearchAgent`` (index access) and a
    ``SearchAgent`` (LLM-driven workflow), collects API keys and search
    settings in the sidebar, and renders every step reported by the agent
    together with the final answer and its sources.
    """

    # One entry per API-key field shown in the sidebar:
    # (provider id, input label, tooltip text, HTML link to obtain a key).
    # The Streamlit widget key for each field is "<provider id>_key".
    _API_KEY_FIELDS = (
        (
            'google',
            "Google API Key",
            "הזן את מפתח ה-API של Google Gemini ",
            '<small> ניתן להשיג מפתח <a href="https://aistudio.google.com/app/apikey">כאן</a> </small>',
        ),
        (
            'openai',
            "OpenAI API Key",
            "הזן את מפתח ה-API של OpenAI",
            '<small> ניתן להשיג מפתח <a href="https://platform.openai.com/account/api-keys">כאן</a> </small> ',
        ),
        (
            'anthropic',
            "Anthropic API Key",
            "הזן את מפתח ה-API של Anthropic Claude",
            '<small> ניתן להשיג מפתח <a href="https://console.anthropic.com/">כאן</a> </small>',
        ),
    )

    def __init__(self):
        """Create an uninitialised UI; the agents are built by initialize_system()."""
        self.tantivy_agent: Optional[TantivySearchAgent] = None
        self.agent: Optional[SearchAgent] = None
        self.index_path = "./index"

        # Google Drive file id of the zipped index; can be overridden through
        # the GDRIVE_INDEX_ID environment variable.
        self.gdrive_index_id = os.getenv("GDRIVE_INDEX_ID", "1lpbBCPimwcNfC0VZOlQueA4SHNGIp5_t")

    def download_index_from_gdrive(self) -> bool:
        """Download the zipped index from Google Drive and unpack it into the working directory.

        Returns:
            True when the archive was downloaded and extracted and
            ``self.index_path`` exists afterwards. False otherwise; the
            reason is shown to the user with ``st.error``.
        """
        zip_path = "index.zip"
        url = f"https://drive.google.com/uc?id={self.gdrive_index_id}"

        try:
            # gdown may signal a failed download by returning None rather than
            # raising, so the return value is checked as well.
            if not gdown.download(url, zip_path, quiet=False):
                st.error("Failed to download index: no file was retrieved from Google Drive")
                return False

            with zipfile.ZipFile(zip_path, 'r') as zip_ref:
                zip_ref.extractall(".")
        except Exception as e:
            st.error(f"Failed to download index: {str(e)}")
            return False

        # The caller opens self.index_path right after this call, so report a
        # clear error here if the archive did not produce it.
        if not os.path.exists(self.index_path):
            st.error(f"Failed to download index: {self.index_path} is missing after extraction")
            return False

        # Explicit success value: the caller treats any falsy result as failure.
        return True

    def get_available_providers(self, api_keys: dict) -> List[str]:
        """Return the providers that SearchAgent reports as available for *api_keys*.

        A throwaway ``TantivySearchAgent``/``SearchAgent`` pair is built only
        to query the provider list; ``self.tantivy_agent`` and ``self.agent``
        are not touched.
        """
        probe_agent = SearchAgent(TantivySearchAgent(self.index_path), api_keys=api_keys)
        return probe_agent.get_available_providers()

    def initialize_system(self, api_keys: dict):
        """Prepare the index and the search agent for the given API keys.

        Downloads the index when ``self.index_path`` does not exist, validates
        it, determines the available providers and builds ``self.agent``.

        Returns:
            A ``(success, status_message, available_providers)`` tuple. On any
            failure ``success`` is False and the provider list is empty; this
            method reports errors through the tuple instead of raising.
        """
        try:
            if not os.path.exists(self.index_path):
                st.warning("Index folder not found. Attempting to download from Google Drive...")
                if not self.download_index_from_gdrive():
                    return False, "שגיאה: לא ניתן להוריד את האינדקס", []
                st.success("Index downloaded successfully!")

            self.tantivy_agent = TantivySearchAgent(self.index_path)
            if not self.tantivy_agent.validate_index():
                return False, "שגיאה: אינדקס לא תקין", []

            available_providers = self.get_available_providers(api_keys)
            if not available_providers:
                return False, "שגיאה: לא נמצאו ספקי AI זמינים. אנא הזן מפתח API אחד לפחות.", []

            # A provider remembered from an earlier run may no longer be
            # available (e.g. its API key was cleared); fall back to the first
            # available one instead of handing SearchAgent an unusable name.
            provider_name = st.session_state.get('provider')
            if provider_name not in available_providers:
                provider_name = available_providers[0]

            self.agent = SearchAgent(
                self.tantivy_agent,
                provider_name=provider_name,
                api_keys=api_keys,
            )
            return True, "המערכת מוכנה לחיפוש", available_providers
        except Exception as ex:
            return False, f"שגיאה באתחול המערכת: {str(ex)}", []

    def main(self):
        """Render the whole page and run a search when a query is present."""
        st.set_page_config(
            page_title="איתוריא",
            layout="wide",
            initial_sidebar_state="expanded",
        )
        self._apply_page_style()
        self._render_api_key_inputs()

        success, status_msg, available_providers = self.initialize_system(st.session_state.api_keys)

        max_iterations, results_per_search = self._render_search_settings(available_providers)

        st.title("איתוריא")
        st.markdown("""
        איתוריא היא מערכת חיפוש תורנית רב שלבית מבוססת בינה מלאכותית. היא משתמשת במודל שפה כדי ליצור שאילתת חיפוש, לדרג את התוצאות, ולסכם את התשובה הסופית. החיפוש מתבצע על המאגר של [אוצריא](https://www.otzaria.org/).
        """)

        if success:
            st.success(status_msg)
        else:
            st.error(status_msg)

        query = st.text_input(
            "הכנס שאילתת חיפוש",
            disabled=not success,
            placeholder="הקלד את שאילתת החיפוש שלך כאן...",
            key='search_query',
        )

        # The button is always rendered; its return value is not needed because
        # the search runs on every script run in which the query is non-empty
        # (pressing the button or Enter both cause such a run).
        st.button('חפש', disabled=not success)

        if query and self.agent:
            self._run_search(query, results_per_search, max_iterations)

    def _apply_page_style(self):
        """Inject the right-to-left layout rules and the result-card CSS classes."""
        st.markdown("""
        <style>
        .stApp {
            direction: rtl;
        }
        .stTextInput > div > div > input {
            direction: rtl;
        }
        .stSelectbox > div > div > div {
            direction: rtl;
        }
        .stNumberInput > div > div > input {
            direction: rtl;
        }
        .search-step {
            border: 1px solid #e0e0e0;
            border-radius: 5px;
            padding: 10px;
            margin: 5px 0;
            background-color: #f8f9fa;
        }
        .document-group {
            border: 1px solid #e3f2fd;
            border-radius: 5px;
            padding: 10px;
            margin: 5px 0;
            background-color: #f5f9ff;
        }
        .document-item {
            border: 1px solid #e0e0e0;
            border-radius: 5px;
            padding: 10px;
            margin: 5px 0;
            background-color: white;
        }
        [data-testid="stSidebar"] {
            direction: rtl;
        }
        </style>
        """, unsafe_allow_html=True)

    def _render_api_key_inputs(self):
        """Draw the API-key fields in the sidebar and store their values in st.session_state.api_keys."""
        # The dict is rebuilt on every run and refilled from the widgets below.
        st.session_state.api_keys = {provider_id: "" for provider_id, *_ in self._API_KEY_FIELDS}

        with st.sidebar:
            st.title("הגדרות")
            st.subheader("הגדרת מפתחות API")

            for provider_id, label, help_text, link_html in self._API_KEY_FIELDS:
                st.session_state.api_keys[provider_id] = st.text_input(
                    label,
                    value=st.session_state.api_keys[provider_id],
                    type="password",
                    key=f"{provider_id}_key",
                    help=help_text,
                )
                st.html(link_html)

            st.markdown("---")

    def _render_search_settings(self, available_providers):
        """Draw the provider selector and numeric settings in the sidebar.

        Returns:
            ``(max_iterations, results_per_search)`` as entered by the user.
        """
        with st.sidebar:
            if available_providers:
                # Reset the remembered provider before the selectbox is created
                # when it is missing or no longer one of the offered options.
                if 'provider' not in st.session_state or st.session_state.provider not in available_providers:
                    st.session_state.provider = available_providers[0]

                provider = st.selectbox(
                    "ספק בינה מלאכותית",
                    options=available_providers,
                    key='provider',
                    help="בחר את מודל הAI לשימוש (רק מודלים עם מפתח API זמין יוצגו)",
                )
                if self.agent:
                    self.agent.set_provider(provider)

            max_iterations = st.number_input(
                "מספר נסיונות מקסימלי",
                min_value=1,
                value=6,
                key='max_iterations',
            )

            results_per_search = st.number_input(
                "תוצאות לכל חיפוש",
                min_value=1,
                value=20,
                key='results_per_search',
            )

        return max_iterations, results_per_search

    def _run_search(self, query, results_per_search, max_iterations):
        """Run the agent for *query* and render its progress; errors are shown with st.error."""
        try:
            # Containers are created up front so steps, answer and sources keep
            # this vertical order regardless of when each one is filled.
            steps_container = st.container()
            answer_container = st.container()
            sources_container = st.container()

            with steps_container:
                st.subheader("צעדי תהליך החיפוש")

            def handle_step_update(step):
                if 'final_result' in step:
                    self._render_final_result(step['final_result'], answer_container, sources_container)
                else:
                    self._render_step(step, steps_container)

            # Step numbering restarts for every search.
            st.session_state.steps = []

            self.agent.search_and_answer(
                query=query,
                num_results=results_per_search,
                max_iterations=max_iterations,
                on_step=handle_step_update,
            )
        except Exception as ex:
            st.error(f"שגיאת חיפוש: {str(ex)}")

    def _render_final_result(self, final_result, answer_container, sources_container):
        """Show the final answer and, when present, one expander per source document."""
        with answer_container:
            st.subheader("תשובה סופית")
            st.info(final_result['answer'])

        sources = final_result['sources']
        if not sources:
            return

        with sources_container:
            st.subheader("מסמכי מקור")
            st.markdown(f"נמצאו {len(sources)} תוצאות")

            for position, source in enumerate(sources, start=1):
                with st.expander(f"תוצאה {position}: {source['reference']} (ציון: {source['score']:.2f})"):
                    st.write(source['text'])

    def _render_step(self, step, steps_container):
        """Render one intermediate step and record it in st.session_state.steps."""
        with steps_container:
            step_number = len(st.session_state.steps) + 1
            st.markdown(f"""
            <div class='search-step'>
                <strong>צעד {step_number}. {step['action']}</strong>
            </div>
            """, unsafe_allow_html=True)
            st.markdown(f"**{step['description']}**")

            if 'results' in step:
                documents = []

                for result in step['results']:
                    result_type = result['type']

                    if result_type == 'query':
                        st.markdown("**שאילתת חיפוש:**")
                        st.code(result['content'])

                    elif result_type == 'document':
                        # Documents are collected and listed after the other items.
                        documents.append(result['content'])

                    elif result_type == 'evaluation':
                        content = result['content']
                        accepted = content['status'] == 'accepted'
                        status = "✓" if accepted else "↻"
                        confidence = f"ביטחון: {content['confidence']}"
                        if accepted:
                            st.success(f"{status} {confidence}")
                        else:
                            st.warning(f"{status} {confidence}")
                        if content['explanation']:
                            st.info(content['explanation'])

                    elif result_type == 'new_query':
                        st.markdown("**ניסיון הבא:**")
                        st.code(result['content'])

                for doc in documents:
                    with st.expander(f"{doc['reference']} (ציון: {doc['score']:.2f})"):
                        # A document without highlights gets an empty expander
                        # instead of an IndexError that would abort the search.
                        if doc['highlights']:
                            st.write(doc['highlights'][0])

            st.markdown("---")
            st.session_state.steps.append(step)
|
|
|
if __name__ == "__main__":
    # Build the UI object and render the page when this file is run as a script.
    app = SearchAgentUI()
    app.main()
|
|