PierreBrunelle committed on
Commit
66368d3
1 Parent(s): f09e956

Update app.py

Browse files
Files changed (1) hide show
  1. app.py +19 -15
app.py CHANGED
@@ -49,11 +49,10 @@ def create_prompt(top_k_list: list[dict], question: str) -> str:
49
  {question}'''
50
 
51
  """Gradio Application"""
52
-
53
  def process_files(ground_truth_file, pdf_files, chunk_limit, chunk_separator, show_question, show_correct_answer, show_gpt4omini, show_llamav3p23b, show_mistralsmall, progress=gr.Progress()):
54
  # Ensure a clean slate for the demo by removing and recreating the 'rag_demo' directory
55
  progress(0, desc="Initializing...")
56
-
57
  pxt.drop_dir('rag_demo', force=True)
58
  pxt.create_dir('rag_demo')
59
 
@@ -65,13 +64,13 @@ def process_files(ground_truth_file, pdf_files, chunk_limit, chunk_separator, sh
65
  queries_t = pxt.io.import_excel('rag_demo.queries', ground_truth_file.name)
66
 
67
  progress(0.2, desc="Processing documents...")
68
-
69
  # Create a table to store the uploaded PDF documents
70
  documents_t = pxt.create_table(
71
  'rag_demo.documents',
72
  {'document': pxt.DocumentType()}
73
  )
74
-
75
  # Insert the PDF files into the documents table
76
  documents_t.insert({'document': file.name} for file in pdf_files if file.name.endswith('.pdf'))
77
 
@@ -206,19 +205,17 @@ with gr.Blocks(theme=Monochrome) as demo:
206
  )
207
 
208
  # Add the disclaimer
209
- gr.Markdown(
210
  """
211
  <div style="background-color: #E5DDD4; border: 1px solid #e9ecef; border-radius: 8px; padding: 15px; margin-bottom: 20px;">
212
- <strong>Disclaimer:</strong> This Gradio app is running on OpenAI, Mistral, and Fireworks accounts with the developer's personal API keys.
213
- If you wish to use it with your own hardware or API keys, you can
214
- <a href="https://huggingface.co/spaces/Pixeltable/Multi-LLM-RAG-with-Groundtruth-Comparison?duplicate=true" target="_blank" style="color: #F25022; text-decoration: none; font-weight: bold;">duplicate this Hugging Face Space</a>
215
- or run it locally or in Google Colab.
216
  </div>
217
  """
218
  )
219
-
220
  with gr.Row():
221
- with gr.Column():
222
  with gr.Accordion("What This Demo Does", open = True):
223
  gr.Markdown("""
224
  1. **Ingests Documents**: Uploads your PDF documents and a ground truth file (CSV or XLSX).
@@ -226,7 +223,7 @@ with gr.Blocks(theme=Monochrome) as demo:
226
  4. **Generates Answers**: Leverages OpenAI to produce accurate answers based on the retrieved context.
227
  5. **Compares Results**: Displays the generated answers alongside the ground truth for easy evaluation.
228
  """)
229
- with gr.Column():
230
  with gr.Accordion("How to Use", open = True):
231
  gr.Markdown("""
232
  1. Upload your ground truth file (CSV or XLSX) with the following two columns: **question** and **correct_answer**.
@@ -234,7 +231,7 @@ with gr.Blocks(theme=Monochrome) as demo:
234
  3. Click "Process Files and Generate Output" to start the RAG process.
235
  4. View the results in the table below, comparing AI-generated answers to the ground truth.
236
  """)
237
-
238
  # File upload components for ground truth and PDF documents
239
  with gr.Row():
240
  ground_truth_file = gr.File(label="Upload Ground Truth (CSV or XLSX) - Format to respect:question | correct_answer", file_count="single")
@@ -267,6 +264,13 @@ with gr.Blocks(theme=Monochrome) as demo:
267
  with gr.Row():
268
  with gr.Column(scale=1):
269
  download_button = gr.Button("Download Results as CSV")
 
 
 
 
 
 
 
270
  with gr.Column(scale=2):
271
  csv_output = gr.File(label="CSV Download")
272
 
@@ -285,7 +289,7 @@ with gr.Blocks(theme=Monochrome) as demo:
285
  show_llamav3p23b,
286
  show_mistralsmall],
287
  outputs=df_output)
288
-
289
  download_button.click(
290
  trigger_download,
291
  inputs=[df_output],
@@ -293,4 +297,4 @@ with gr.Blocks(theme=Monochrome) as demo:
293
  )
294
 
295
  if __name__ == "__main__":
296
- demo.launch(debug=True)
 
49
  {question}'''
50
 
51
  """Gradio Application"""
 
52
  def process_files(ground_truth_file, pdf_files, chunk_limit, chunk_separator, show_question, show_correct_answer, show_gpt4omini, show_llamav3p23b, show_mistralsmall, progress=gr.Progress()):
53
  # Ensure a clean slate for the demo by removing and recreating the 'rag_demo' directory
54
  progress(0, desc="Initializing...")
55
+
56
  pxt.drop_dir('rag_demo', force=True)
57
  pxt.create_dir('rag_demo')
58
 
 
64
  queries_t = pxt.io.import_excel('rag_demo.queries', ground_truth_file.name)
65
 
66
  progress(0.2, desc="Processing documents...")
67
+
68
  # Create a table to store the uploaded PDF documents
69
  documents_t = pxt.create_table(
70
  'rag_demo.documents',
71
  {'document': pxt.DocumentType()}
72
  )
73
+
74
  # Insert the PDF files into the documents table
75
  documents_t.insert({'document': file.name} for file in pdf_files if file.name.endswith('.pdf'))
76
 
 
205
  )
206
 
207
  # Add the disclaimer
208
+ gr.HTML(
209
  """
210
  <div style="background-color: #E5DDD4; border: 1px solid #e9ecef; border-radius: 8px; padding: 15px; margin-bottom: 20px;">
211
+ <strong>Disclaimer:</strong> This app is running on OpenAI, Mistral, and Fireworks accounts with my own API keys 😞. This Hugging Face Space uses the free tier (2vCPU, 16GB RAM), which may result in slower processing times, especially for embedding generation and large document processing. Embeddings are generated using the sentence-transformer library with the 'intfloat/e5-large-v2' model. If you wish to use this app with your own hardware or API keys for improved performance, you can:
212
+ <a href="https://huggingface.co/spaces/Pixeltable/Multi-LLM-RAG-with-Groundtruth-Comparison/duplicate" target="_blank" style="color: #F25022; text-decoration: none; font-weight: bold;">duplicate this Hugging Face Space</a>, run it locally, or use <b>Google Colab with the Free limited GPU support</b>.</p>
 
 
213
  </div>
214
  """
215
  )
216
+
217
  with gr.Row():
218
+ with gr.Column():
219
  with gr.Accordion("What This Demo Does", open = True):
220
  gr.Markdown("""
221
  1. **Ingests Documents**: Uploads your PDF documents and a ground truth file (CSV or XLSX).
 
223
  4. **Generates Answers**: Leverages OpenAI to produce accurate answers based on the retrieved context.
224
  5. **Compares Results**: Displays the generated answers alongside the ground truth for easy evaluation.
225
  """)
226
+ with gr.Column():
227
  with gr.Accordion("How to Use", open = True):
228
  gr.Markdown("""
229
  1. Upload your ground truth file (CSV or XLSX) with the following two columns: **question** and **correct_answer**.
 
231
  3. Click "Process Files and Generate Output" to start the RAG process.
232
  4. View the results in the table below, comparing AI-generated answers to the ground truth.
233
  """)
234
+
235
  # File upload components for ground truth and PDF documents
236
  with gr.Row():
237
  ground_truth_file = gr.File(label="Upload Ground Truth (CSV or XLSX) - Format to respect:question | correct_answer", file_count="single")
 
264
  with gr.Row():
265
  with gr.Column(scale=1):
266
  download_button = gr.Button("Download Results as CSV")
267
+
268
+ gr.Examples(
269
+ examples=['Zacks-Nvidia-Report.pdf'],
270
+ inputs=[pdf_files])
271
+ gr.Examples(
272
+ examples=['Q-A-Rag.xlsx'],
273
+ inputs=[ground_truth_files])
274
  with gr.Column(scale=2):
275
  csv_output = gr.File(label="CSV Download")
276
 
 
289
  show_llamav3p23b,
290
  show_mistralsmall],
291
  outputs=df_output)
292
+
293
  download_button.click(
294
  trigger_download,
295
  inputs=[df_output],
 
297
  )
298
 
299
  if __name__ == "__main__":
300
+ demo.launch(show_api=False)