A-Roucher committed on
Commit
b19e82a
1 Parent(s): 72c879a

feat: full dataset

Browse files
Files changed (1) hide show
  1. app.py +1 -3
app.py CHANGED
@@ -8,9 +8,7 @@ import time
8
 
9
 
10
  if "initialized" not in st.session_state:
11
- dataset = datasets.load_dataset('A-Roucher/english_historical_quotes', download_mode="force_redownload")
12
- st.session_state.dataset = datasets.Dataset.from_dict(dataset['train'][:100])
13
-
14
  st.session_state.all_authors = list(set(st.session_state.dataset['author']))
15
  model_name = "sentence-transformers/all-MiniLM-L6-v2" # BAAI/bge-small-en-v1.5" # "Cohere/Cohere-embed-english-light-v3.0" # "sentence-transformers/all-MiniLM-L6-v2"
16
  st.session_state.encoder = SentenceTransformer(model_name)
 
8
 
9
 
10
  if "initialized" not in st.session_state:
11
+ st.session_state.dataset = datasets.load_dataset('A-Roucher/english_historical_quotes', download_mode="force_redownload")['train']
 
 
12
  st.session_state.all_authors = list(set(st.session_state.dataset['author']))
13
  model_name = "sentence-transformers/all-MiniLM-L6-v2" # BAAI/bge-small-en-v1.5" # "Cohere/Cohere-embed-english-light-v3.0" # "sentence-transformers/all-MiniLM-L6-v2"
14
  st.session_state.encoder = SentenceTransformer(model_name)