Spaces:
Sleeping
Sleeping
Commit
·
0f7ca6c
1
Parent(s):
6b90dc3
sort?
Browse files
app.py
CHANGED
@@ -188,7 +188,7 @@ def load_corpus_lookups(dataset_name):
|
|
188 |
corpus_lookups[dataset_name] += p_lookup
|
189 |
|
190 |
logger.info(f"Loaded corpus lookups for {dataset_name}. Total entries: {len(corpus_lookups[dataset_name])}")
|
191 |
-
logger.info(f"Sample corpus lookup entry: {corpus_lookups[dataset_name][
|
192 |
|
193 |
def load_queries(dataset_name):
|
194 |
global queries, q_lookups, qrels
|
@@ -244,8 +244,23 @@ def run_evaluation(dataset, postfix):
|
|
244 |
|
245 |
all_scores, psg_indices = search_queries(dataset, q_reps)
|
246 |
|
247 |
-
results = {
|
248 |
-
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
249 |
qrels[dataset] = {str(qid): {str(doc_id): rel for doc_id, rel in rels.items()}
|
250 |
for qid, rels in qrels[dataset].items()}
|
251 |
|
|
|
188 |
corpus_lookups[dataset_name] += p_lookup
|
189 |
|
190 |
logger.info(f"Loaded corpus lookups for {dataset_name}. Total entries: {len(corpus_lookups[dataset_name])}")
|
191 |
+
logger.info(f"Sample corpus lookup entry: {corpus_lookups[dataset_name][:10]}")
|
192 |
|
193 |
def load_queries(dataset_name):
|
194 |
global queries, q_lookups, qrels
|
|
|
244 |
|
245 |
all_scores, psg_indices = search_queries(dataset, q_reps)
|
246 |
|
247 |
+
results = {}
|
248 |
+
logging.info(f"Number of queries in q_lookups: {len(q_lookups[dataset])}")
|
249 |
+
logging.info("Size of all_scores: " + str(len(all_scores)))
|
250 |
+
logging.info("Size of psg_indices: " + str(len(psg_indices)))
|
251 |
+
for qid, scores, doc_ids in zip(q_lookups[dataset].keys(), all_scores, psg_indices):
|
252 |
+
qid_str = str(qid)
|
253 |
+
results[qid_str] = {}
|
254 |
+
for doc_id, score in zip(doc_ids, scores):
|
255 |
+
doc_id_str = str(doc_id)
|
256 |
+
results[qid_str][doc_id_str] = float(score)
|
257 |
+
|
258 |
+
if not results[qid_str]: # If no results for this query
|
259 |
+
logger.warning(f"No results for query {qid_str}")
|
260 |
+
|
261 |
+
logger.info(f"Number of queries in results: {len(results)}")
|
262 |
+
logger.info(f"Sample result: {next(iter(results.items()))}")
|
263 |
+
|
264 |
qrels[dataset] = {str(qid): {str(doc_id): rel for doc_id, rel in rels.items()}
|
265 |
for qid, rels in qrels[dataset].items()}
|
266 |
|