Spaces:
Sleeping
Sleeping
=
committed on
Commit
•
ddf8478
1
Parent(s):
9b14109
adding new requirements
Browse files- app.py +12 -12
- pages/provide_sentences.py +15 -15
- pages/provide_sentences_mongo.py +6 -6
- requirements.txt +1 -2
- send_and_retrieve_data.ipynb +0 -1
- wolof-translate/setup.py +0 -5
- wolof-translate/wolof_translate.egg-info/PKG-INFO +0 -9
- wolof-translate/wolof_translate.egg-info/SOURCES.txt +0 -59
- wolof-translate/wolof_translate.egg-info/dependency_links.txt +0 -1
- wolof-translate/wolof_translate.egg-info/top_level.txt +0 -1
- wolof-translate/wolof_translate/checkpoints/t5_base_custom_train_results_fw_v3/best_checkpoints.pth +0 -3
- wolof-translate/wolof_translate/checkpoints/t5_small_custom_train_results_fw_v3/best_checkpoints.json +0 -13
- wolof-translate/wolof_translate/checkpoints/t5_small_custom_train_results_fw_v3/best_checkpoints.pth +0 -3
- wolof-translate/wolof_translate/checkpoints/t5_small_custom_train_results_wf_v3/best_checkpoints.json +0 -13
- wolof-translate/wolof_translate/checkpoints/t5_small_custom_train_results_wf_v3/best_checkpoints.pth +0 -3
- {wolof-translate/wolof_translate → wolof_translate}/__init__.py +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/__pycache__/__init__.cpython-310.pyc +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/__pycache__/dataset_v1.cpython-310.pyc +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/__pycache__/sent_transformers.cpython-310.pyc +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/data/sentences/deleted_lines.csv +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/data/sentences/french.csv +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/data/sentences/modified_lines.csv +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/data/sentences/wolof.csv +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/data/sentences/wolof_2.csv +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/data/sentences/wolof_french.csv +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/data/wolof_writing/definitions.csv +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/data/wolof_writing/wolof_special_chars.csv +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/__init__.py +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/__pycache__/__init__.cpython-310.pyc +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/adverse_tokenizer.json +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/fr_tokenizer_v1.json +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/tokenizer_v1.json +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/tokenizer_v2.json +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/tokenizer_v3.json +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/tokenizer_v4.json +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/wf_tokenizer_v1.json +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/tokenizers/tokenizer_v1.json +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/utils/__init__.py +0 -0
- {wolof-translate/wolof_translate → wolof_translate}/utils/database_manager.py +0 -0
app.py
CHANGED
@@ -16,30 +16,30 @@ st.markdown("Translation page 🔠")
|
|
16 |
# models = {
|
17 |
# "Version ✌️": {
|
18 |
# "French ➡️ Wolof": {
|
19 |
-
# "checkpoints": "
|
20 |
-
# "tokenizer": "
|
21 |
# "max_len": None
|
22 |
# }
|
23 |
# },
|
24 |
# "Version ☝️": {
|
25 |
# "French ➡️ Wolof": {
|
26 |
-
# "checkpoints": "
|
27 |
-
# "tokenizer": "
|
28 |
# "max_len": 51
|
29 |
# },
|
30 |
# "Wolof ➡️ French": {
|
31 |
-
# "checkpoints": "
|
32 |
-
# "tokenizer": "
|
33 |
# "max_len": 51
|
34 |
# }
|
35 |
# }
|
36 |
# }
|
37 |
|
38 |
# # add special characters from Wolof
|
39 |
-
# sp_wolof_chars = pd.read_csv('
|
40 |
|
41 |
# # add definitions
|
42 |
-
# sp_wolof_words = pd.read_csv('
|
43 |
|
44 |
# # let us add a callback function to change the input text
|
45 |
# def add_symbol_to_text():
|
@@ -78,10 +78,10 @@ st.markdown("Translation page 🔠")
|
|
78 |
# def get_modelfw_v3():
|
79 |
|
80 |
# # recuperate checkpoints
|
81 |
-
# checkpoints = torch.load(os.path.join('
|
82 |
|
83 |
# # recuperate the tokenizer
|
84 |
-
# tokenizer_file = "
|
85 |
|
86 |
# # initialize the tokenizer
|
87 |
# tokenizer = T5TokenizerFast(tokenizer_file=tokenizer_file)
|
@@ -99,10 +99,10 @@ st.markdown("Translation page 🔠")
|
|
99 |
# def get_modelwf_v3():
|
100 |
|
101 |
# # recuperate checkpoints
|
102 |
-
# checkpoints = torch.load(os.path.join('
|
103 |
|
104 |
# # recuperate the tokenizer
|
105 |
-
# tokenizer_file = "
|
106 |
|
107 |
# # initialize the tokenizer
|
108 |
# tokenizer = T5TokenizerFast(tokenizer_file=tokenizer_file)
|
|
|
16 |
# models = {
|
17 |
# "Version ✌️": {
|
18 |
# "French ➡️ Wolof": {
|
19 |
+
# "checkpoints": "wolof_translate/checkpoints/t5_small_custom_train_results_fw_v4",
|
20 |
+
# "tokenizer": "wolof_translate/tokenizers/t5_tokenizers/tokenizer_v4.json",
|
21 |
# "max_len": None
|
22 |
# }
|
23 |
# },
|
24 |
# "Version ☝️": {
|
25 |
# "French ➡️ Wolof": {
|
26 |
+
# "checkpoints": "wolof_translate/checkpoints/t5_small_custom_train_results_fw_v3",
|
27 |
+
# "tokenizer": "wolof_translate/tokenizers/t5_tokenizers/tokenizer_v3.json",
|
28 |
# "max_len": 51
|
29 |
# },
|
30 |
# "Wolof ➡️ French": {
|
31 |
+
# "checkpoints": "wolof_translate/checkpoints/t5_small_custom_train_results_wf_v3",
|
32 |
+
# "tokenizer": "wolof_translate/tokenizers/t5_tokenizers/tokenizer_v3.json",
|
33 |
# "max_len": 51
|
34 |
# }
|
35 |
# }
|
36 |
# }
|
37 |
|
38 |
# # add special characters from Wolof
|
39 |
+
# sp_wolof_chars = pd.read_csv('wolof_translate/data/wolof_writing/wolof_special_chars.csv')
|
40 |
|
41 |
# # add definitions
|
42 |
+
# sp_wolof_words = pd.read_csv('wolof_translate/data/wolof_writing/definitions.csv')
|
43 |
|
44 |
# # let us add a callback function to change the input text
|
45 |
# def add_symbol_to_text():
|
|
|
78 |
# def get_modelfw_v3():
|
79 |
|
80 |
# # recuperate checkpoints
|
81 |
+
# checkpoints = torch.load(os.path.join('wolof_translate/checkpoints/t5_small_custom_train_results_fw_v3', "best_checkpoints.pth"), map_location=torch.device('cpu'))
|
82 |
|
83 |
# # recuperate the tokenizer
|
84 |
+
# tokenizer_file = "wolof_translate/tokenizers/t5_tokenizers/tokenizer_v3.json"
|
85 |
|
86 |
# # initialize the tokenizer
|
87 |
# tokenizer = T5TokenizerFast(tokenizer_file=tokenizer_file)
|
|
|
99 |
# def get_modelwf_v3():
|
100 |
|
101 |
# # recuperate checkpoints
|
102 |
+
# checkpoints = torch.load(os.path.join('wolof_translate/checkpoints/t5_small_custom_train_results_wf_v3', "best_checkpoints.pth"), map_location=torch.device('cpu'))
|
103 |
|
104 |
# # recuperate the tokenizer
|
105 |
+
# tokenizer_file = "wolof_translate/tokenizers/t5_tokenizers/tokenizer_v3.json"
|
106 |
|
107 |
# # initialize the tokenizer
|
108 |
# tokenizer = T5TokenizerFast(tokenizer_file=tokenizer_file)
|
pages/provide_sentences.py
CHANGED
@@ -4,20 +4,20 @@ import pandas as pd
|
|
4 |
st.markdown("Provide your own 🤗 sentences")
|
5 |
|
6 |
# recuperate the already saved sentences (for the moment french/wolof)
|
7 |
-
sentences_ = pd.read_csv('
|
8 |
|
9 |
sentences = sentences_.copy()
|
10 |
|
11 |
# get french and wolof sentences
|
12 |
-
french_examples = pd.read_csv('
|
13 |
|
14 |
-
wolof_examples = pd.read_csv('
|
15 |
|
16 |
# add special characters from Wolof
|
17 |
-
sp_wolof_chars = pd.read_csv('
|
18 |
|
19 |
# add definitions
|
20 |
-
sp_wolof_words = pd.read_csv('
|
21 |
|
22 |
sp_wolof_words.sort_values(by = ['french', 'wolof'], inplace = True)
|
23 |
|
@@ -89,10 +89,10 @@ def add_new_sentences():
|
|
89 |
sentences = pd.DataFrame({sentences.columns.tolist()[0]: [sentence_1],
|
90 |
sentences.columns.tolist()[1]: [sentence_2]})
|
91 |
## save the result
|
92 |
-
sentences.to_csv('
|
93 |
|
94 |
# recuperate the already saved sentences (for the moment french/wolof)
|
95 |
-
sentences = pd.read_csv('
|
96 |
|
97 |
# add the last position to delete and modify
|
98 |
st.session_state.line1 = len(sentences) - 1
|
@@ -124,10 +124,10 @@ def add_new_sentences2():
|
|
124 |
sentences = pd.DataFrame({sentences.columns.tolist()[0]: [sentence_1],
|
125 |
sentences.columns.tolist()[1]: [sentence_2]})
|
126 |
## save the result
|
127 |
-
sentences.to_csv('
|
128 |
|
129 |
# recuperate the already saved sentences (for the moment french/wolof)
|
130 |
-
sentences = pd.read_csv('
|
131 |
|
132 |
# clean the inputs' contents
|
133 |
st.session_state.left_sentence = ''
|
@@ -148,7 +148,7 @@ def delete_line():
|
|
148 |
|
149 |
else:
|
150 |
|
151 |
-
deleted = pd.read_csv('
|
152 |
|
153 |
if not deleted.empty:
|
154 |
|
@@ -163,9 +163,9 @@ def delete_line():
|
|
163 |
sentences.drop(index = number, inplace=True)
|
164 |
|
165 |
## save the result
|
166 |
-
sentences.to_csv('
|
167 |
|
168 |
-
deleted.to_csv('
|
169 |
|
170 |
def modify_line():
|
171 |
|
@@ -177,7 +177,7 @@ def modify_line():
|
|
177 |
|
178 |
else:
|
179 |
|
180 |
-
modified = pd.read_csv('
|
181 |
|
182 |
if not modified.empty:
|
183 |
|
@@ -196,9 +196,9 @@ def modify_line():
|
|
196 |
sentences.drop(index = number, inplace=True)
|
197 |
|
198 |
## save the result
|
199 |
-
sentences.to_csv('
|
200 |
|
201 |
-
modified.to_csv('
|
202 |
|
203 |
|
204 |
left.header("French")
|
|
|
4 |
st.markdown("Provide your own 🤗 sentences")
|
5 |
|
6 |
# recuperate the already saved sentences (for the moment french/wolof)
|
7 |
+
sentences_ = pd.read_csv('wolof_translate/data/sentences/wolof_french.csv')
|
8 |
|
9 |
sentences = sentences_.copy()
|
10 |
|
11 |
# get french and wolof sentences
|
12 |
+
french_examples = pd.read_csv('wolof_translate/data/sentences/french.csv')
|
13 |
|
14 |
+
wolof_examples = pd.read_csv('wolof_translate/data/sentences/wolof_2.csv')
|
15 |
|
16 |
# add special characters from Wolof
|
17 |
+
sp_wolof_chars = pd.read_csv('wolof_translate/data/wolof_writing/wolof_special_chars.csv')
|
18 |
|
19 |
# add definitions
|
20 |
+
sp_wolof_words = pd.read_csv('wolof_translate/data/wolof_writing/definitions.csv')
|
21 |
|
22 |
sp_wolof_words.sort_values(by = ['french', 'wolof'], inplace = True)
|
23 |
|
|
|
89 |
sentences = pd.DataFrame({sentences.columns.tolist()[0]: [sentence_1],
|
90 |
sentences.columns.tolist()[1]: [sentence_2]})
|
91 |
## save the result
|
92 |
+
sentences.to_csv('wolof_translate/data/sentences/wolof_french.csv', index=False)
|
93 |
|
94 |
# recuperate the already saved sentences (for the moment french/wolof)
|
95 |
+
sentences = pd.read_csv('wolof_translate/data/sentences/wolof_french.csv')
|
96 |
|
97 |
# add the last position to delete and modify
|
98 |
st.session_state.line1 = len(sentences) - 1
|
|
|
124 |
sentences = pd.DataFrame({sentences.columns.tolist()[0]: [sentence_1],
|
125 |
sentences.columns.tolist()[1]: [sentence_2]})
|
126 |
## save the result
|
127 |
+
sentences.to_csv('wolof_translate/data/sentences/wolof_french.csv', index=False)
|
128 |
|
129 |
# recuperate the already saved sentences (for the moment french/wolof)
|
130 |
+
sentences = pd.read_csv('wolof_translate/data/sentences/wolof_french.csv')
|
131 |
|
132 |
# clean the inputs' contents
|
133 |
st.session_state.left_sentence = ''
|
|
|
148 |
|
149 |
else:
|
150 |
|
151 |
+
deleted = pd.read_csv('wolof_translate/data/sentences/deleted_lines.csv')
|
152 |
|
153 |
if not deleted.empty:
|
154 |
|
|
|
163 |
sentences.drop(index = number, inplace=True)
|
164 |
|
165 |
## save the result
|
166 |
+
sentences.to_csv('wolof_translate/data/sentences/wolof_french.csv', index=False)
|
167 |
|
168 |
+
deleted.to_csv('wolof_translate/data/sentences/deleted_lines.csv', index=False)
|
169 |
|
170 |
def modify_line():
|
171 |
|
|
|
177 |
|
178 |
else:
|
179 |
|
180 |
+
modified = pd.read_csv('wolof_translate/data/sentences/modified_lines.csv')
|
181 |
|
182 |
if not modified.empty:
|
183 |
|
|
|
196 |
sentences.drop(index = number, inplace=True)
|
197 |
|
198 |
## save the result
|
199 |
+
sentences.to_csv('wolof_translate/data/sentences/wolof_french.csv', index=False)
|
200 |
|
201 |
+
modified.to_csv('wolof_translate/data/sentences/deleted_lines.csv', index=False)
|
202 |
|
203 |
|
204 |
left.header("French")
|
pages/provide_sentences_mongo.py
CHANGED
@@ -20,15 +20,15 @@ sentences_, deleted = db_manager.load_data_frames()
|
|
20 |
sentences = sentences_.copy()
|
21 |
|
22 |
# get french and wolof sentences
|
23 |
-
french_examples = pd.read_csv('
|
24 |
|
25 |
-
wolof_examples = pd.read_csv('
|
26 |
|
27 |
# add special characters from Wolof
|
28 |
-
sp_wolof_chars = pd.read_csv('
|
29 |
|
30 |
# add definitions
|
31 |
-
sp_wolof_words = pd.read_csv('
|
32 |
|
33 |
sp_wolof_words.sort_values(by = ['french', 'wolof'], inplace = True)
|
34 |
|
@@ -93,10 +93,10 @@ def add_new_sentences():
|
|
93 |
|
94 |
|
95 |
## save the result
|
96 |
-
sentences.to_csv('
|
97 |
|
98 |
# recuperate the already saved sentences (for the moment french/wolof)
|
99 |
-
sentences = pd.read_csv('
|
100 |
|
101 |
# add the last position to delete and modify
|
102 |
st.session_state.line1 = len(sentences) - 1
|
|
|
20 |
sentences = sentences_.copy()
|
21 |
|
22 |
# get french and wolof sentences
|
23 |
+
french_examples = pd.read_csv('wolof_translate/data/sentences/french.csv')
|
24 |
|
25 |
+
wolof_examples = pd.read_csv('wolof_translate/data/sentences/wolof_2.csv')
|
26 |
|
27 |
# add special characters from Wolof
|
28 |
+
sp_wolof_chars = pd.read_csv('wolof_translate/data/wolof_writing/wolof_special_chars.csv')
|
29 |
|
30 |
# add definitions
|
31 |
+
sp_wolof_words = pd.read_csv('wolof_translate/data/wolof_writing/definitions.csv')
|
32 |
|
33 |
sp_wolof_words.sort_values(by = ['french', 'wolof'], inplace = True)
|
34 |
|
|
|
93 |
|
94 |
|
95 |
## save the result
|
96 |
+
sentences.to_csv('wolof_translate/data/sentences/wolof_french.csv', index=False)
|
97 |
|
98 |
# recuperate the already saved sentences (for the moment french/wolof)
|
99 |
+
sentences = pd.read_csv('wolof_translate/data/sentences/wolof_french.csv')
|
100 |
|
101 |
# add the last position to delete and modify
|
102 |
st.session_state.line1 = len(sentences) - 1
|
requirements.txt
CHANGED
@@ -1,5 +1,4 @@
|
|
1 |
altair<5
|
2 |
transformers
|
3 |
torch
|
4 |
-
pandas
|
5 |
-
wolof-translate
|
|
|
1 |
altair<5
|
2 |
transformers
|
3 |
torch
|
4 |
+
pandas
|
|
send_and_retrieve_data.ipynb
CHANGED
@@ -670,7 +670,6 @@
|
|
670 |
}
|
671 |
],
|
672 |
"source": [
|
673 |
-
"# %%writefile wolof-translate/wolof_translate/utils/database_manager.py\n",
|
674 |
"from pymongo.mongo_client import MongoClient\n",
|
675 |
"from pymongo.server_api import ServerApi\n",
|
676 |
"import pandas as pd\n",
|
|
|
670 |
}
|
671 |
],
|
672 |
"source": [
|
|
|
673 |
"from pymongo.mongo_client import MongoClient\n",
|
674 |
"from pymongo.server_api import ServerApi\n",
|
675 |
"import pandas as pd\n",
|
wolof-translate/setup.py
DELETED
@@ -1,5 +0,0 @@
|
|
1 |
-
from setuptools import setup
|
2 |
-
|
3 |
-
setup(name="wolof_translate", version="0.0.1", author="Oumar Kane", author_email="oumar.kane@univ-thies.sn",
|
4 |
-
description="Contain function and classes to process corpora for making translation between wolof text and other languages.",
|
5 |
-
requires=['spacy', 'nltk', 'gensim'])
|
|
|
|
|
|
|
|
|
|
|
|
wolof-translate/wolof_translate.egg-info/PKG-INFO
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
Metadata-Version: 2.1
|
2 |
-
Name: wolof-translate
|
3 |
-
Version: 0.0.1
|
4 |
-
Summary: Contain function and classes to process corpora for making translation between wolof text and other languages.
|
5 |
-
Author: Oumar Kane
|
6 |
-
Author-email: oumar.kane@univ-thies.sn
|
7 |
-
Requires: spacy
|
8 |
-
Requires: nltk
|
9 |
-
Requires: gensim
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
wolof-translate/wolof_translate.egg-info/SOURCES.txt
DELETED
@@ -1,59 +0,0 @@
|
|
1 |
-
setup.py
|
2 |
-
wolof_translate/__init__.py
|
3 |
-
wolof_translate.egg-info/PKG-INFO
|
4 |
-
wolof_translate.egg-info/SOURCES.txt
|
5 |
-
wolof_translate.egg-info/dependency_links.txt
|
6 |
-
wolof_translate.egg-info/top_level.txt
|
7 |
-
wolof_translate/__pycache__/__init__.cpython-310.pyc
|
8 |
-
wolof_translate/__pycache__/dataset_v1.cpython-310.pyc
|
9 |
-
wolof_translate/__pycache__/sent_transformers.cpython-310.pyc
|
10 |
-
wolof_translate/data/__init__.py
|
11 |
-
wolof_translate/data/dataset_v1.py
|
12 |
-
wolof_translate/data/dataset_v2.py
|
13 |
-
wolof_translate/data/dataset_v3.py
|
14 |
-
wolof_translate/data/__pycache__/__init__.cpython-310.pyc
|
15 |
-
wolof_translate/data/__pycache__/dataset_v1.cpython-310.pyc
|
16 |
-
wolof_translate/data/__pycache__/dataset_v2.cpython-310.pyc
|
17 |
-
wolof_translate/models/__init__.py
|
18 |
-
wolof_translate/models/__pycache__/__init__.cpython-310.pyc
|
19 |
-
wolof_translate/models/transformers/__init__.py
|
20 |
-
wolof_translate/models/transformers/main.py
|
21 |
-
wolof_translate/models/transformers/optimization.py
|
22 |
-
wolof_translate/models/transformers/position.py
|
23 |
-
wolof_translate/models/transformers/size.py
|
24 |
-
wolof_translate/models/transformers/__pycache__/__init__.cpython-310.pyc
|
25 |
-
wolof_translate/models/transformers/__pycache__/main.cpython-310.pyc
|
26 |
-
wolof_translate/models/transformers/__pycache__/optimization.cpython-310.pyc
|
27 |
-
wolof_translate/models/transformers/__pycache__/position.cpython-310.pyc
|
28 |
-
wolof_translate/models/transformers/__pycache__/size.cpython-310.pyc
|
29 |
-
wolof_translate/pipe/__init__.py
|
30 |
-
wolof_translate/pipe/nlp_pipeline.py
|
31 |
-
wolof_translate/tokenizers/__init__.py
|
32 |
-
wolof_translate/tokenizers/adverse_tokenizer.json
|
33 |
-
wolof_translate/tokenizers/tokenizer_v1.json
|
34 |
-
wolof_translate/tokenizers/__pycache__/__init__.cpython-310.pyc
|
35 |
-
wolof_translate/tokenizers/t5_tokenizers/fr_tokenizer_v1.json
|
36 |
-
wolof_translate/tokenizers/t5_tokenizers/tokenizer_v1.json
|
37 |
-
wolof_translate/tokenizers/t5_tokenizers/tokenizer_v2.json
|
38 |
-
wolof_translate/tokenizers/t5_tokenizers/tokenizer_v3.json
|
39 |
-
wolof_translate/tokenizers/t5_tokenizers/wf_tokenizer_v1.json
|
40 |
-
wolof_translate/trainers/__init__.py
|
41 |
-
wolof_translate/trainers/transformer_trainer.py
|
42 |
-
wolof_translate/trainers/__pycache__/__init__.cpython-310.pyc
|
43 |
-
wolof_translate/trainers/__pycache__/transformer_trainer.cpython-310.pyc
|
44 |
-
wolof_translate/utils/__init__.py
|
45 |
-
wolof_translate/utils/evaluation.py
|
46 |
-
wolof_translate/utils/extract_poems.py
|
47 |
-
wolof_translate/utils/extract_sentences.py
|
48 |
-
wolof_translate/utils/sent_corrections.py
|
49 |
-
wolof_translate/utils/sent_transformers.py
|
50 |
-
wolof_translate/utils/sent_unification.py
|
51 |
-
wolof_translate/utils/split_with_valid.py
|
52 |
-
wolof_translate/utils/tokenize_text.py
|
53 |
-
wolof_translate/utils/__pycache__/__init__.cpython-310.pyc
|
54 |
-
wolof_translate/utils/__pycache__/evaluation.cpython-310.pyc
|
55 |
-
wolof_translate/utils/__pycache__/sent_corrections.cpython-310.pyc
|
56 |
-
wolof_translate/utils/__pycache__/sent_transformers.cpython-310.pyc
|
57 |
-
wolof_translate/utils/__pycache__/sent_unification.cpython-310.pyc
|
58 |
-
wolof_translate/utils/__pycache__/split_with_valid.cpython-310.pyc
|
59 |
-
wolof_translate/utils/__pycache__/tokenize_text.cpython-310.pyc
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
wolof-translate/wolof_translate.egg-info/dependency_links.txt
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
|
|
|
|
wolof-translate/wolof_translate.egg-info/top_level.txt
DELETED
@@ -1 +0,0 @@
|
|
1 |
-
wolof_translate
|
|
|
|
wolof-translate/wolof_translate/checkpoints/t5_base_custom_train_results_fw_v3/best_checkpoints.pth
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:3c27c98fb26335a018a9e39fa61efe4b16e356439d266fee60f41e7c30ac9e95
|
3 |
-
size 801021373
|
|
|
|
|
|
|
|
wolof-translate/wolof_translate/checkpoints/t5_small_custom_train_results_fw_v3/best_checkpoints.json
DELETED
@@ -1,13 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"metrics": {
|
3 |
-
"train_loss": 0.003311718240206019,
|
4 |
-
"test_loss": 0.5539475262048654,
|
5 |
-
"bleu": 28.528,
|
6 |
-
"gen_len": 8.1575,
|
7 |
-
"current_epoch": 346
|
8 |
-
},
|
9 |
-
"best_performance": {
|
10 |
-
"best_score": 28.528,
|
11 |
-
"best_epoch": 346
|
12 |
-
}
|
13 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
wolof-translate/wolof_translate/checkpoints/t5_small_custom_train_results_fw_v3/best_checkpoints.pth
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:b30a787b8488fb4f230d37ee9fab553e95e18fbf7e7036920069997a5b975534
|
3 |
-
size 180980359
|
|
|
|
|
|
|
|
wolof-translate/wolof_translate/checkpoints/t5_small_custom_train_results_wf_v3/best_checkpoints.json
DELETED
@@ -1,13 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"metrics": {
|
3 |
-
"train_loss": 0.010352298853033019,
|
4 |
-
"test_loss": 0.5878886595368386,
|
5 |
-
"bleu": 22.9625,
|
6 |
-
"gen_len": 9.3562,
|
7 |
-
"current_epoch": 94
|
8 |
-
},
|
9 |
-
"best_performance": {
|
10 |
-
"best_score": 22.9625,
|
11 |
-
"best_epoch": 94
|
12 |
-
}
|
13 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
wolof-translate/wolof_translate/checkpoints/t5_small_custom_train_results_wf_v3/best_checkpoints.pth
DELETED
@@ -1,3 +0,0 @@
|
|
1 |
-
version https://git-lfs.github.com/spec/v1
|
2 |
-
oid sha256:5e543a1882f682a4fa84f6c6ff4d21e8afceb0cbee401bd934c7338f7515320f
|
3 |
-
size 180980103
|
|
|
|
|
|
|
|
{wolof-translate/wolof_translate → wolof_translate}/__init__.py
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/__pycache__/__init__.cpython-310.pyc
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/__pycache__/dataset_v1.cpython-310.pyc
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/__pycache__/sent_transformers.cpython-310.pyc
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/data/sentences/deleted_lines.csv
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/data/sentences/french.csv
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/data/sentences/modified_lines.csv
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/data/sentences/wolof.csv
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/data/sentences/wolof_2.csv
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/data/sentences/wolof_french.csv
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/data/wolof_writing/definitions.csv
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/data/wolof_writing/wolof_special_chars.csv
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/__init__.py
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/__pycache__/__init__.cpython-310.pyc
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/adverse_tokenizer.json
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/fr_tokenizer_v1.json
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/tokenizer_v1.json
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/tokenizer_v2.json
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/tokenizer_v3.json
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/tokenizer_v4.json
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/t5_tokenizers/wf_tokenizer_v1.json
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/tokenizers/tokenizer_v1.json
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/utils/__init__.py
RENAMED
File without changes
|
{wolof-translate/wolof_translate → wolof_translate}/utils/database_manager.py
RENAMED
File without changes
|