kargaranamir committed on
Commit
28f58e9
•
1 Parent(s): 99cad18

Add div (Dhivehi) and Glot500 to the datasets being compared against.

Browse files
app.py CHANGED
@@ -1,6 +1,6 @@
1
  import pandas as pd
2
  import streamlit as st
3
- from utils import df_to_html, render_svg, combine_json_files, render_metadata
4
 
5
  data = combine_json_files('./languages')
6
 
@@ -24,10 +24,10 @@ def render_home_table():
24
  df_data['ISO Code'] = df_data['ISO Code'].astype(str) # Convert to string
25
  df_data['Number of Sites'] = df_data.apply(lambda row: '<a href="/?isocode={}&site=True" target="_self">{}</a>'.format(row['ISO Code'], row['Number of Sites']), axis=1)
26
  df_data['Number of Links'] = df_data.apply(lambda row: '<a href="/?isocode={}&links=True" target="_self">{}</a>'.format(row['ISO Code'], row['Number of Links']), axis=1)
27
-
28
 
29
  # Display the table
30
- df_data = df_data[['ISO Code', 'Language Name', 'Family', 'Subgrouping', 'Number of Sites', 'Number of Links', 'Number of Speakers', 'Supported by allenai/MADLAD-400 or facebook/flores']]
31
  st.write(df_to_html(df_data), unsafe_allow_html=True)
32
 
33
 
 
1
  import pandas as pd
2
  import streamlit as st
3
+ from utils import df_to_html, render_svg, combine_json_files, render_metadata, color_mapping
4
 
5
  data = combine_json_files('./languages')
6
 
 
24
  df_data['ISO Code'] = df_data['ISO Code'].astype(str) # Convert to string
25
  df_data['Number of Sites'] = df_data.apply(lambda row: '<a href="/?isocode={}&site=True" target="_self">{}</a>'.format(row['ISO Code'], row['Number of Sites']), axis=1)
26
  df_data['Number of Links'] = df_data.apply(lambda row: '<a href="/?isocode={}&links=True" target="_self">{}</a>'.format(row['ISO Code'], row['Number of Links']), axis=1)
27
+ df_data["Supported by MADLAD-400, flores, and Glot500"] = df_data.apply(lambda row: color_mapping([row["Supported by allenai/MADLAD-400"] + row["Supported by facebook/flores"] + row["Supported by cis-lmu/Glot500"]]), axis =1)
28
 
29
  # Display the table
30
+ df_data = df_data[['ISO Code', 'Language Name', 'Family', 'Subgrouping', 'Number of Sites', 'Number of Links', 'Number of Speakers', 'Supported by MADLAD-400, flores, and Glot500']]
31
  st.write(df_to_html(df_data), unsafe_allow_html=True)
32
 
33
 
languages/abk_Cyrl.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Abkhaz-Adyge",
4
  "Subgrouping": "Abkhaz-Abaza",
5
  "Number of Speakers": "190_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "jinepsgazetesi.com",
 
3
  "Family": "Abkhaz-Adyge",
4
  "Subgrouping": "Abkhaz-Abaza",
5
  "Number of Speakers": "190_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "jinepsgazetesi.com",
languages/ady_Cyrl.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Abkhaz-Adyge",
4
  "Subgrouping": "Circassian",
5
  "Number of Speakers": "610_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟨",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "jinepsgazetesi.com",
 
3
  "Family": "Abkhaz-Adyge",
4
  "Subgrouping": "Circassian",
5
  "Number of Speakers": "610_000",
6
+ "Supported by allenai/MADLAD-400": 1,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "jinepsgazetesi.com",
languages/ahk_Latn.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Sino-Tibetan",
4
  "Subgrouping": "Lolo-Burmese",
5
  "Number of Speakers": "620_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "akhaliterature.com",
 
3
  "Family": "Sino-Tibetan",
4
  "Subgrouping": "Lolo-Burmese",
5
  "Number of Speakers": "620_000",
6
+ "Supported by allenai/MADLAD-400": 1,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "akhaliterature.com",
languages/anm_Latn.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Sino-Tibetan",
4
  "Subgrouping": "Kuki-Chin",
5
  "Number of Speakers": "14_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "apakan.org",
 
3
  "Family": "Sino-Tibetan",
4
  "Subgrouping": "Kuki-Chin",
5
  "Number of Speakers": "14_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "apakan.org",
languages/ava_Cyrl.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Nakh-Daghestanian",
4
  "Subgrouping": "Avar–Andic",
5
  "Number of Speakers": "800_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟨",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "radioerkenli.com",
 
3
  "Family": "Nakh-Daghestanian",
4
  "Subgrouping": "Avar–Andic",
5
  "Number of Speakers": "800_000",
6
+ "Supported by allenai/MADLAD-400": 1,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "radioerkenli.com",
languages/bal_Arab.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "8_000_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "sunnionline.us",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "8_000_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "sunnionline.us",
languages/bar_Latn.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Germanic",
5
  "Number of Speakers": "14_000_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "bar.wikipedia.org",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Germanic",
5
  "Number of Speakers": "14_000_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "bar.wikipedia.org",
languages/bqi_Arab.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "1_200_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "lurishacademy.org",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "1_200_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "lurishacademy.org",
languages/brh_Arab.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Dravidian",
4
  "Subgrouping": "",
5
  "Number of Speakers": "2_800_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "talarbrahui",
 
3
  "Family": "Dravidian",
4
  "Subgrouping": "",
5
  "Number of Speakers": "2_800_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "talarbrahui",
languages/che_Cyrl.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Nakh-Daghestanian",
4
  "Subgrouping": "Nakh",
5
  "Number of Speakers": "1_800_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟨",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "jinepsgazetesi.com",
 
3
  "Family": "Nakh-Daghestanian",
4
  "Subgrouping": "Nakh",
5
  "Number of Speakers": "1_800_000",
6
+ "Supported by allenai/MADLAD-400": 1,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "jinepsgazetesi.com",
languages/crl_Cans.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Algic",
4
  "Subgrouping": "Cree-Montagnais-Naskapi",
5
  "Number of Speakers": "400",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "nunavikprotectedareas.com",
 
3
  "Family": "Algic",
4
  "Subgrouping": "Cree-Montagnais-Naskapi",
5
  "Number of Speakers": "400",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "nunavikprotectedareas.com",
languages/div_Thaa.json ADDED
@@ -0,0 +1,57 @@
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
+ {
2
+ "Language Name": "Dhivehi",
3
+ "Family": "Indo-European",
4
+ "Subgrouping": "Insular Indo-Aryan",
5
+ "Number of Speakers": "500_000",
6
+ "Supported by allenai/MADLAD-400": 1,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
+ "Sites": [
10
+ {
11
+ "Site Name": "hassanhameed.com",
12
+ "Site URL": "https://www.hassanhameed.com/dhivehi-language",
13
+ "Category": "linguistics",
14
+ "Confidence": "🟩",
15
+ "Info": "confirmed by glotlid",
16
+ "Possible Parallel Languages": "",
17
+ "Links": []
18
+ },
19
+ {
20
+ "Site Name": "asim-ahmedasim.blogspot.com",
21
+ "Site URL": "https://asim-ahmedasim.blogspot.com/",
22
+ "Category": "blog",
23
+ "Confidence": "🟩",
24
+ "Info": "confirmed by glotlid",
25
+ "Possible Parallel Languages": "",
26
+ "Links": []
27
+ },
28
+ {
29
+ "Site Name": "thaareekh.blogspot.com",
30
+ "Site URL": "https://thaareekh.blogspot.com/",
31
+ "Category": "",
32
+ "Confidence": "🟩",
33
+ "Info": "confirmed by glotlid",
34
+ "Possible Parallel Languages": "",
35
+ "Links": []
36
+ },
37
+ {
38
+ "Site Name": "ilyashussainibrahim.com",
39
+ "Site URL": "https://www.ilyashussainibrahim.com/",
40
+ "Category": "",
41
+ "Confidence": "🟩",
42
+ "Info": "confirmed by glotlid",
43
+ "Possible Parallel Languages": "",
44
+ "Links": []
45
+ },
46
+ {
47
+ "Site Name": "halinews.com",
48
+ "Site URL": "https://halinews.com/",
49
+ "Category": "news",
50
+ "Confidence": "🟩",
51
+ "Info": "confirmed by glotlid",
52
+ "Possible Parallel Languages": "",
53
+ "Links": []
54
+ }
55
+ ]
56
+ }
57
+
languages/enm_Latn.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Germanic",
5
  "Number of Speakers": "0",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "quod.lib.umich.edu/c/cme/AHA2727/",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Germanic",
5
  "Number of Speakers": "0",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "quod.lib.umich.edu/c/cme/AHA2727/",
languages/glk_Arab.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "3_000_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "t.me/gilaki_twitter",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "3_000_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "t.me/gilaki_twitter",
languages/hac_Arab.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "300_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "anfsorani.com/هۆرامی",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "300_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "anfsorani.com/هۆرامی",
languages/ike_Cans.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Eskimo-Aleut",
4
  "Subgrouping": "Inuit",
5
  "Number of Speakers": "42_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟨",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "nunavikprotectedareas.com",
 
3
  "Family": "Eskimo-Aleut",
4
  "Subgrouping": "Inuit",
5
  "Number of Speakers": "42_000",
6
+ "Supported by allenai/MADLAD-400": 1,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "nunavikprotectedareas.com",
languages/khb_Talu.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Tai-Kadai",
4
  "Subgrouping": "Daic",
5
  "Number of Speakers": "550_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "dw12.com",
 
3
  "Family": "Tai-Kadai",
4
  "Subgrouping": "Daic",
5
  "Number of Speakers": "550_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "dw12.com",
languages/lki_Arab.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "600_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "lurishacademy.org",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "600_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "lurishacademy.org",
languages/lrc_Arab.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "4_000_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟨",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "lurishacademy.org",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "4_000_000",
6
+ "Supported by allenai/MADLAD-400": 1,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "lurishacademy.org",
languages/mns_Cyrl.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Uralic",
4
  "Subgrouping": "Mansic",
5
  "Number of Speakers": "2_200",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "khanty-yasang.ru/luima-seripos",
 
3
  "Family": "Uralic",
4
  "Subgrouping": "Mansic",
5
  "Number of Speakers": "2_200",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "khanty-yasang.ru/luima-seripos",
languages/mon_Mong.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Mongolic",
4
  "Subgrouping": "",
5
  "Number of Speakers": "6_000_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "wikibilig.mn",
 
3
  "Family": "Mongolic",
4
  "Subgrouping": "",
5
  "Number of Speakers": "6_000_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "wikibilig.mn",
languages/nsk_Cans.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Algic",
4
  "Subgrouping": "Cree-Montagnais-Naskapi",
5
  "Number of Speakers": "1_200",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "clscnaskapi.org",
 
3
  "Family": "Algic",
4
  "Subgrouping": "Cree-Montagnais-Naskapi",
5
  "Number of Speakers": "1_200",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "clscnaskapi.org",
languages/oss_Cyrl.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "490_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟨",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "jinepsgazetesi.com",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "490_000",
6
+ "Supported by allenai/MADLAD-400": 1,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "jinepsgazetesi.com",
languages/sdh_Arab.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "1_500_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "shafaq.com/ku",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Iranian",
5
  "Number of Speakers": "1_500_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "shafaq.com/ku",
languages/snk_Latn.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Mande",
4
  "Subgrouping": "Soninke-Bozo",
5
  "Number of Speakers": "2_300_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "soninkara.com/snk/",
 
3
  "Family": "Mande",
4
  "Subgrouping": "Soninke-Bozo",
5
  "Number of Speakers": "2_300_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "soninkara.com/snk/",
languages/srp_Latn.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Slavic",
5
  "Number of Speakers": "12_000_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "turizamiputovanja.com",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Slavic",
5
  "Number of Speakers": "12_000_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "turizamiputovanja.com",
languages/syl_Sylo.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Indo-European",
4
  "Subgrouping": "Eastern Indo-Aryan",
5
  "Number of Speakers": "10_000_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "surmafarorkhobor.com",
 
3
  "Family": "Indo-European",
4
  "Subgrouping": "Eastern Indo-Aryan",
5
  "Number of Speakers": "10_000_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "surmafarorkhobor.com",
languages/uzs_Arab.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Turkic",
4
  "Subgrouping": "Turkestan",
5
  "Number of Speakers": "4_600_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "trt.net.tr/afghaniuzbek",
 
3
  "Family": "Turkic",
4
  "Subgrouping": "Turkestan",
5
  "Number of Speakers": "4_600_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 0,
9
  "Sites": [
10
  {
11
  "Site Name": "trt.net.tr/afghaniuzbek",
languages/xmf_Geor.json CHANGED
@@ -3,7 +3,9 @@
3
  "Family": "Kartvelian",
4
  "Subgrouping": "Zan",
5
  "Number of Speakers": "345_000",
6
- "Supported by allenai/MADLAD-400 or facebook/flores": "🟥",
 
 
7
  "Sites": [
8
  {
9
  "Site Name": "titus.uni-frankfurt.de",
 
3
  "Family": "Kartvelian",
4
  "Subgrouping": "Zan",
5
  "Number of Speakers": "345_000",
6
+ "Supported by allenai/MADLAD-400": 0,
7
+ "Supported by facebook/flores": 0,
8
+ "Supported by cis-lmu/Glot500": 1,
9
  "Sites": [
10
  {
11
  "Site Name": "titus.uni-frankfurt.de",
utils.py CHANGED
@@ -81,4 +81,23 @@ def render_metadata():
81
  <a href="https://arxiv.org/abs/xxxx.xxxxx"><img alt="arXiv" src="https://img.shields.io/badge/arXiv-xxxx.xxxxx-b31b1b.svg"></a>
82
  </p>"""
83
  c = st.container()
84
- c.write(html, unsafe_allow_html=True)
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
81
  <a href="https://arxiv.org/abs/xxxx.xxxxx"><img alt="arXiv" src="https://img.shields.io/badge/arXiv-xxxx.xxxxx-b31b1b.svg"></a>
82
  </p>"""
83
  c = st.container()
84
+ c.write(html, unsafe_allow_html=True)
85
+
86
+
87
+
88
+
89
# Define the function for conditional coloring
def color_mapping(listx):
    """Map a list of numeric support flags to a colored-square emoji.

    The color is chosen from the mean of ``listx`` relative to its length
    ``bins``:

    * mean == 0              -> red square
    * mean < 1/bins + 0.01   -> orange square
    * mean < 2/bins + 0.01   -> yellow square
    * anything higher        -> green square

    With a single-element list holding a count, 0 / 1 / 2 / 3-or-more map
    to red / orange / yellow / green; with a list of three 0/1 flags the
    same colors result from the number of flags set.

    Args:
        listx: A list of numbers (typically 0/1 flags, or one summed count).

    Returns:
        A one-character string containing the colored-square emoji.
        An empty list yields the red square rather than raising
        ``ZeroDivisionError``.
    """
    bins = len(listx)
    if bins == 0:
        # Nothing to average: report "no support" instead of dividing by zero.
        return "🟥"

    mean = sum(listx) / (1.0 * bins)

    # The comparisons are strict, so the 0.01 slack keeps a mean that sits
    # exactly on 1/bins (or 2/bins) inside the corresponding bucket.
    if mean == 0:
        return "🟥"
    elif mean < 1.0 / bins + 0.01:
        return "🟧"
    elif mean < 2.0 / bins + 0.01:
        return "🟨"
    else:
        return "🟩"
103
+