zhuohan-7 committed on
Commit
2115ef1
·
verified ·
1 Parent(s): 4b7a759

Upload folder using huggingface_hub

Browse files
app/__pycache__/draw_diagram.cpython-312.pyc CHANGED
Binary files a/app/__pycache__/draw_diagram.cpython-312.pyc and b/app/__pycache__/draw_diagram.cpython-312.pyc differ
 
app/__pycache__/pages.cpython-312.pyc CHANGED
Binary files a/app/__pycache__/pages.cpython-312.pyc and b/app/__pycache__/pages.cpython-312.pyc differ
 
app/pages.py CHANGED
@@ -2,16 +2,72 @@ import streamlit as st
2
  from app.draw_diagram import *
3
 
4
  def dashboard():
5
- st.title("SeaEval")
6
-
7
- """
8
- [gh]: https://github.com/SeaEval/SeaEval
9
- [![GitHub Repo stars](https://img.shields.io/github/stars/SeaEval/SeaEval?style=social)][gh]
10
- """
 
 
 
11
 
12
  seaeval_url = "https://seaeval.github.io/"
13
- st.markdown("[SeaEval](%s) is the new benchmark for multilingual foundation models consisting of 28 dataset." % seaeval_url)
14
- st.markdown(".... haven't finished yet ...")
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
15
 
16
  def cross_lingual_consistency():
17
  st.title("Cross-Lingual Consistency")
 
2
  from app.draw_diagram import *
3
 
4
  def dashboard():
5
+
6
+ with st.container():
7
+ st.title("SeaEval")
8
+
9
+ st.markdown("""
10
+ [gh]: https://github.com/SeaEval/SeaEval
11
+ [![GitHub watchers](https://img.shields.io/github/watchers/SeaEval/SeaEval?style=social)][gh]
12
+ [![GitHub Repo stars](https://img.shields.io/github/stars/SeaEval/SeaEval?style=social)][gh]
13
+ """)
14
 
15
  seaeval_url = "https://seaeval.github.io/"
16
+
17
+ st.divider()
18
+ st.markdown("#### What is [SeaEval](%s)" % seaeval_url)
19
+
20
+ with st.container():
21
+ left_co, cent_co,last_co = st.columns(3)
22
+ with cent_co:
23
+ st.image("./style/seaeval_overall.png",
24
+ # caption="SeaEval data range",
25
+ width=500)
26
+ st.markdown('''
27
+
28
+ ''')
29
+ st.markdown("##### A new benchmark for multilingual foundation models consisting of 28 datasets.")
30
+ st.markdown(''':star: How models understand and reason with natural language?
31
+ :balloon: Languages: English, Chinese, Malay, Spanish, Indonesian, Vietnamese, Filipino.
32
+ ''')
33
+
34
+ st.markdown(''':star: How models comprehend cultural practices, nuances and values?
35
+ :balloon: 4 new datasets on Cultural Understanding.
36
+ ''')
37
+
38
+ st.markdown(''':star: How models perform across languages in terms of consistency?
39
+ :balloon: 2 new datasets with curated metrics for Cross-Lingual Consistency.
40
+ ''')
41
+ with st.container():
42
+ left_co, cent_co,last_co = st.columns(3)
43
+ with cent_co:
44
+ st.image("./style/consistency.png",
45
+ # caption="SeaEval data range",
46
+ width=500)
47
+ st.markdown("##### Evaluation with enhanced cross-lingual capabilities.")
48
+ st.markdown(''':star: How models perform according to different (paraphrased) instructions?
49
+ :balloon: Each dataset is equipped with 5 different prompts to avoid randomness introduced by instructions,
50
+ which is non-negligible.
51
+ ''')
52
+
53
+ st.markdown(''':star: Multilingual accuracy and performance consistency across languages.
54
+ :balloon: If you can answer the question in your native language, can you answer the same question
55
+ correctly in your second/third language?
56
+ ''')
57
+
58
+ st.divider()
59
+ with st.container():
60
+ st.markdown("##### Citations")
61
+
62
+ st.markdown('''
63
+ :round_pushpin: SeaEval Paper \n
64
+ @article{SeaEval2023,
65
+ title={SeaEval for Multilingual Foundation Models: From Cross-Lingual Alignment to Cultural Reasoning},
66
+ author={Wang, Bin and Liu, Zhengyuan and Huang, Xin and Jiao, Fangkai and Ding, Yang and Aw, Ai Ti and Chen, Nancy F},
67
+ journal={arXiv preprint arXiv:2309.04766},
68
+ year={2023}
69
+ }
70
+ ''')
71
 
72
  def cross_lingual_consistency():
73
  st.title("Cross-Lingual Consistency")