orionweller committed on
Commit
0f7ca6c
·
1 Parent(s): 6b90dc3
Files changed (1) hide show
  1. app.py +18 -3
app.py CHANGED
@@ -188,7 +188,7 @@ def load_corpus_lookups(dataset_name):
188
  corpus_lookups[dataset_name] += p_lookup
189
 
190
  logger.info(f"Loaded corpus lookups for {dataset_name}. Total entries: {len(corpus_lookups[dataset_name])}")
191
- logger.info(f"Sample corpus lookup entry: {corpus_lookups[dataset_name][0]}")
192
 
193
  def load_queries(dataset_name):
194
  global queries, q_lookups, qrels
@@ -244,8 +244,23 @@ def run_evaluation(dataset, postfix):
244
 
245
  all_scores, psg_indices = search_queries(dataset, q_reps)
246
 
247
- results = {str(qid): {str(doc_id): float(score) for doc_id, score in zip(doc_ids, scores)}
248
- for qid, scores, doc_ids in zip(q_lookups[dataset].keys(), all_scores, psg_indices)}
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
249
  qrels[dataset] = {str(qid): {str(doc_id): rel for doc_id, rel in rels.items()}
250
  for qid, rels in qrels[dataset].items()}
251
 
 
188
  corpus_lookups[dataset_name] += p_lookup
189
 
190
  logger.info(f"Loaded corpus lookups for {dataset_name}. Total entries: {len(corpus_lookups[dataset_name])}")
191
+ logger.info(f"Sample corpus lookup entry: {corpus_lookups[dataset_name][:10]}")
192
 
193
  def load_queries(dataset_name):
194
  global queries, q_lookups, qrels
 
244
 
245
  all_scores, psg_indices = search_queries(dataset, q_reps)
246
 
247
+ results = {}
248
+ logging.info(f"Number of queries in q_lookups: {len(q_lookups[dataset])}")
249
+ logging.info("Size of all_scores: " + str(len(all_scores)))
250
+ logging.info("Size of psg_indices: " + str(len(psg_indices)))
251
+ for qid, scores, doc_ids in zip(q_lookups[dataset].keys(), all_scores, psg_indices):
252
+ qid_str = str(qid)
253
+ results[qid_str] = {}
254
+ for doc_id, score in zip(doc_ids, scores):
255
+ doc_id_str = str(doc_id)
256
+ results[qid_str][doc_id_str] = float(score)
257
+
258
+ if not results[qid_str]: # If no results for this query
259
+ logger.warning(f"No results for query {qid_str}")
260
+
261
+ logger.info(f"Number of queries in results: {len(results)}")
262
+ logger.info(f"Sample result: {next(iter(results.items()))}")
263
+
264
  qrels[dataset] = {str(qid): {str(doc_id): rel for doc_id, rel in rels.items()}
265
  for qid, rels in qrels[dataset].items()}
266