Spaces:

MERaLiON
/

SeaEval_Leaderboard

Running

App Files Files Community

zhuohan-7 committed on Jul 30, 2024

Commit

2115ef1

verified ·

1 Parent(s): 4b7a759

Upload folder using huggingface_hub

Browse files

Files changed (3) hide show

app/__pycache__/draw_diagram.cpython-312.pyc +0 -0
app/__pycache__/pages.cpython-312.pyc +0 -0
app/pages.py +64 -8

app/__pycache__/draw_diagram.cpython-312.pyc CHANGED Viewed

Binary files a/app/__pycache__/draw_diagram.cpython-312.pyc and b/app/__pycache__/draw_diagram.cpython-312.pyc differ

app/__pycache__/pages.cpython-312.pyc CHANGED Viewed

Binary files a/app/__pycache__/pages.cpython-312.pyc and b/app/__pycache__/pages.cpython-312.pyc differ

app/pages.py CHANGED Viewed

@@ -2,16 +2,72 @@ import streamlit as st
 from app.draw_diagram import *
 def dashboard():
-    st.title("SeaEval")
-    """
-    [gh]: https://github.com/SeaEval/SeaEval
-    [![GitHub Repo stars](https://img.shields.io/github/stars/SeaEval/SeaEval?style=social)][gh]
-    """
     seaeval_url = "https://seaeval.github.io/"
-    st.markdown("[SeaEval](%s) is the new benchmark for multilingual foundation models consisting of 28 dataset." % seaeval_url)
-    st.markdown(".... haven't finished yet ...")
 def cross_lingual_consistency():
     st.title("Cross-Lingual Consistency")

 from app.draw_diagram import *
 def dashboard():
+    with st.container():
+        st.title("SeaEval")
+        st.markdown("""
+            [gh]: https://github.com/SeaEval/SeaEval
+            [![GitHub watchers](https://img.shields.io/github/watchers/SeaEval/SeaEval?style=social)][gh]
+            [![GitHub Repo stars](https://img.shields.io/github/stars/SeaEval/SeaEval?style=social)][gh]
+            """)
     seaeval_url = "https://seaeval.github.io/"
+    st.divider()
+    st.markdown("#### What is [SeaEval](%s)" % seaeval_url)
+    with st.container():
+        left_co, cent_co,last_co = st.columns(3)
+        with cent_co:
+            st.image("./style/seaeval_overall.png",
+                    #  caption="SeaEval data range",
+                    width=500)
+        st.markdown('''
+                    ''')
+        st.markdown("##### A new benchmark for multilingual foundation models consisting of 28 datasets.")
+        st.markdown(''':star: How models understand and reason with natural language?
+                    :balloon: Languages: English, Chinese, Malay, Spanish, Indonesian, Vietnamese, Filipino.
+                    ''')
+        st.markdown(''':star: How models comprehend cultural practices, nuances and values?
+                    :balloon: 4 new datasets on Cultural Understanding.
+                    ''')
+        st.markdown(''':star: How models perform across languages in terms of consistency?
+                    :balloon: 2 new datasets with curated metrics for Cross-Lingual Consistency.
+                    ''')
+    with st.container():
+        left_co, cent_co,last_co = st.columns(3)
+        with cent_co:
+            st.image("./style/consistency.png",
+                    #  caption="SeaEval data range",
+                    width=500)
+        st.markdown("##### Evaluation with enhanced cross-lingual capabilities.")
+        st.markdown(''':star: How models perform according to different (paraphrased) instructions?
+                    :balloon: Each dataset is equipped with 5 different prompts to avoid randomness introduced by instructions,
+                    which is non-negligible.
+                    ''')
+        st.markdown(''':star: Multilingual accuracy and performance consistency across languages.
+                    :balloon: If you can answer the question in your native language, can you answer the same question
+                    correctly in your second/third language?
+                    ''')
+    st.divider()
+    with st.container():
+        st.markdown("##### Citations")
+        st.markdown('''
+                    :round_pushpin: SeaEval Paper \n
+                        @article{SeaEval2023,
+                            title={SeaEval for Multilingual Foundation Models: From Cross-Lingual Alignment to Cultural Reasoning},
+                            author={Wang, Bin and Liu, Zhengyuan and Huang, Xin and Jiao, Fangkai and Ding, Yang and Aw, Ai Ti and Chen, Nancy F},
+                            journal={arXiv preprint arXiv:2309.04766},
+                            year={2023}
+                            }
+                    ''')
 def cross_lingual_consistency():
     st.title("Cross-Lingual Consistency")