data_only_hallucination_leaderboard

Runtime error

pminervini committed on Nov 29, 2023

Commit

9af5ebf

•

1 Parent(s): 241e347

update

Files changed (1) hide show

app.py CHANGED Viewed

@@ -60,7 +60,7 @@ raw_data, original_df = get_leaderboard_df(EVAL_RESULTS_PATH, EVAL_REQUESTS_PATH
 # update_collections(original_df.copy())
 leaderboard_df = original_df.copy()
-plot_df = create_plot_df(create_scores_df(raw_data))
 (
     finished_eval_queue_df,
@@ -251,22 +251,23 @@ with demo:
                     queue=True,
                 )
-        with gr.TabItem("📈 Metrics through time", elem_id="llm-benchmark-tab-table", id=4):
-            with gr.Row():
-                with gr.Column():
-                    chart = create_metric_plot_obj(
-                        plot_df,
-                        [AutoEvalColumn.average.name],
-                        title="Average of Top Scores and Human Baseline Over Time (from last update)",
-                    )
-                    gr.Plot(value=chart, min_width=500)
-                with gr.Column():
-                    chart = create_metric_plot_obj(
-                        plot_df,
-                        BENCHMARK_COLS,
-                        title="Top Scores and Human Baseline Over Time (from last update)",
-                    )
-                    gr.Plot(value=chart, min_width=500)
         with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=2):
             gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")

 # update_collections(original_df.copy())
 leaderboard_df = original_df.copy()
+# plot_df = create_plot_df(create_scores_df(raw_data))
 (
     finished_eval_queue_df,
                     queue=True,
                 )
+        # with gr.TabItem("📈 Metrics through time", elem_id="llm-benchmark-tab-table", id=4):
+        #     with gr.Row():
+        #         with gr.Column():
+        #             chart = create_metric_plot_obj(
+        #                 plot_df,
+        #                 [AutoEvalColumn.average.name],
+        #                 title="Average of Top Scores and Human Baseline Over Time (from last update)",
+        #             )
+        #             gr.Plot(value=chart, min_width=500)
+        #         with gr.Column():
+        #             chart = create_metric_plot_obj(
+        #                 plot_df,
+        #                 BENCHMARK_COLS,
+        #                 title="Top Scores and Human Baseline Over Time (from last update)",
+        #             )
+        #             gr.Plot(value=chart, min_width=500)
         with gr.TabItem("📝 About", elem_id="llm-benchmark-tab-table", id=2):
             gr.Markdown(LLM_BENCHMARKS_TEXT, elem_classes="markdown-text")