avr23-cds-translation2

Running

App Files Files Community

Demosthene-OR committed on Mar 17

Commit

9910446

•

1 Parent(s): bb0fb0e

./...

Browse files

Files changed (3) hide show

tabs/id_lang_tab.py +7 -5
tabs/modelisation_seq2seq_tab.py +8 -36
tabs/read_api_url.py +17 -0

tabs/id_lang_tab.py CHANGED Viewed

@@ -13,6 +13,7 @@ import seaborn as sns
 from sklearn import naive_bayes
 from translate_app import tr
 import requests
 title = "Identification de langue"
 sidebar_name = "Identification de langue"
@@ -280,11 +281,11 @@ def display_shapley(lang_sel):
 def run():
     global tokenizer, vectorizer, dict_token, dict_ids, nb_token, lan_to_language, clf_nb
     global toggle_val, custom_sentence, lan_identified
-    global lang_exemples, exemples
     tokenizer, dict_token, dict_ids, nb_token, lan_to_language, clf_nb, vectorizer = init_nb_identifier()
-    lan_identified = requests.get( "https://demosthene-or-api-avr23-cds-translation.hf.space/lan_identified").json()
     lang_id_model_ext, dict_xlmr, sentence_test, lang_exemples, exemples= init_lang_id_external()
     st.write("")
@@ -329,7 +330,7 @@ def run():
         if custom_sentence!='':
-            url = "https://demosthene-or-api-avr23-cds-translation.hf.space/lang_id_dl"
             params = {"sentence": custom_sentence}
             response = requests.get(url, params=params)
@@ -409,7 +410,8 @@ def run():
             st.write("<center><h5>"+tr("Architecture du modèle utilisé")+":</h5></center>", unsafe_allow_html=True)
             col1, col2, col3 = st.columns([0.15,0.7,0.15])
             with col2:
-                st.image("https://demosthene-or-api-avr23-cds-translation.hf.space/small_vocab/plot_model?&model_type=lang_id",use_column_width="auto")
     elif (chosen_id == "tab3"):
         st.write("### **"+tr("Interpretabilité du classifieur Naïve Bayes sur 5 langues")+"**")
         st.write("##### "+tr("..et un Training set réduit (15000 phrases et 94 tokens)"))

 from sklearn import naive_bayes
 from translate_app import tr
 import requests
+import read_api_url
 title = "Identification de langue"
 sidebar_name = "Identification de langue"
 def run():
     global tokenizer, vectorizer, dict_token, dict_ids, nb_token, lan_to_language, clf_nb
     global toggle_val, custom_sentence, lan_identified
+    global lang_exemples, exemples, url_base
+    url_base = read_api_url()
     tokenizer, dict_token, dict_ids, nb_token, lan_to_language, clf_nb, vectorizer = init_nb_identifier()
+    lan_identified = requests.get( url_base[0]+"/lan_identified").json()
     lang_id_model_ext, dict_xlmr, sentence_test, lang_exemples, exemples= init_lang_id_external()
     st.write("")
         if custom_sentence!='':
+            url = url_base[0]+"/lang_id_dl"
             params = {"sentence": custom_sentence}
             response = requests.get(url, params=params)
             st.write("<center><h5>"+tr("Architecture du modèle utilisé")+":</h5></center>", unsafe_allow_html=True)
             col1, col2, col3 = st.columns([0.15,0.7,0.15])
             with col2:
+                st.image(url_base[0]+"e/small_vocab/plot_model?&model_type=lang_id",use_column_width="auto")
     elif (chosen_id == "tab3"):
         st.write("### **"+tr("Interpretabilité du classifieur Naïve Bayes sur 5 langues")+"**")
         st.write("##### "+tr("..et un Training set réduit (15000 phrases et 94 tokens)"))

tabs/modelisation_seq2seq_tab.py CHANGED Viewed

@@ -13,33 +13,17 @@ import wavio
 from gtts import gTTS
 from extra_streamlit_components import tab_bar, TabBarItemData
 from translate_app import tr
-import csv
 import requests
 # from multiprocessing import Pool
 import concurrent.futures
-import time
 title = "Traduction Sequence à Sequence"
 sidebar_name = "Traduction Seq2Seq"
 dataPath = st.session_state.DataPath
-@st.cache_data
-def read_api_url():
-    api_url = []
-    # Ouvrir le fichier CSV en mode lecture
-    with open("api-url.txt", newline='') as fichier_csv:
-        lecteur_csv = csv.reader(fichier_csv)
-        # Lire et afficher les trois premières lignes
-        for i in range(3):
-            ligne = next(lecteur_csv, None)  # Lire la ligne suivante
-            if ligne is not None:
-                api_url.append(ligne[0])
-            else: return None
-        return api_url
 @st.cache_data
 def load_corpus(path):
     input_file = os.path.join(path)
@@ -66,10 +50,10 @@ n1 = 0
 df_data_en, df_data_fr, translation_en_fr, translation_fr_en, lang_classifier, model_speech, finetuned_translation_en_fr = load_all_data()
-def fetch_translation2(url):
     return requests.get(url)
-def display_translation2(n1, Lang, model_type):
     global df_data_src, df_data_tgt, placeholder, url_base
     n = 3
@@ -215,23 +199,11 @@ def run():
             mode = 2  # Transformer
         # Exécuter la fonction asynchrone
-        '''
-        t0 = time.time()
-        asyncio.run(display_translation1(n1, Lang, mode))
-        t1 = time.time()
-        st.write("Durée 1: "+str(t1-t0))
-        '''
         # t0 = time.time()
-        display_translation2(n1, Lang,mode)
         # t1 = time.time()
-        # st.write("Durée 2: "+str(t1-t0))
-        '''
-        t0 = time.time()
-        display_translation3(n1, Lang,mode)
-        t1 = time.time()
-        st.write("Durée 3: "+str(t1-t0))
-        '''
         st.write("## **"+tr("Details sur la méthode")+" :**\n")
         if (chosen_id == "tab1"):
             st.markdown(tr(

 from gtts import gTTS
 from extra_streamlit_components import tab_bar, TabBarItemData
 from translate_app import tr
+# import csv
 import requests
 # from multiprocessing import Pool
 import concurrent.futures
+# import time
+import read_api_url
 title = "Traduction Sequence à Sequence"
 sidebar_name = "Traduction Seq2Seq"
 dataPath = st.session_state.DataPath
 @st.cache_data
 def load_corpus(path):
     input_file = os.path.join(path)
 df_data_en, df_data_fr, translation_en_fr, translation_fr_en, lang_classifier, model_speech, finetuned_translation_en_fr = load_all_data()
+def fetch_translation(url):
     return requests.get(url)
+def display_translation(n1, Lang, model_type):
     global df_data_src, df_data_tgt, placeholder, url_base
     n = 3
             mode = 2  # Transformer
         # Exécuter la fonction asynchrone
         # t0 = time.time()
+        display_translation(n1, Lang,mode)
         # t1 = time.time()
+        # st.write("Durée : "+str(t1-t0))
         st.write("## **"+tr("Details sur la méthode")+" :**\n")
         if (chosen_id == "tab1"):
             st.markdown(tr(

tabs/read_api_url.py ADDED Viewed

	@@ -0,0 +1,17 @@

+import csv
+
+import streamlit as st
+
+
+@st.cache_data
+def read_api_url():
+    """Return the API base URLs listed in ``api-url.txt``.
+
+    The file is opened relative to the current working directory and
+    parsed as CSV. The first field of every non-empty row is collected,
+    in file order.
+
+    NOTE: callers must import the function itself
+    (``from read_api_url import read_api_url``); a bare
+    ``import read_api_url`` binds the module, which is not callable.
+
+    Returns:
+        list[str]: one entry per non-empty row; empty if the file has
+        no rows.
+
+    Raises:
+        FileNotFoundError: if ``api-url.txt`` does not exist.
+    """
+    # An explicit encoding keeps parsing independent of the host locale.
+    with open("api-url.txt", newline='', encoding="utf-8") as fichier_csv:
+        # csv.reader yields an empty list for a blank line; skipping those
+        # rows avoids an IndexError on ``ligne[0]``.
+        return [ligne[0] for ligne in csv.reader(fichier_csv) if ligne]