multi-stage-retrieval-QA / data_preparation.py
Hyma7's picture
Update data_preparation.py
9fe5fd9 verified
raw
history blame
362 Bytes
from beir import util
from beir.datasets.data_loader import GenericDataLoader
# Base URL of the public BEIR dataset archives; each dataset is published
# there as "<dataset_name>.zip".
_BEIR_DATASETS_URL = "https://public.ukp.informatik.tu-darmstadt.de/thakur/BEIR/datasets"


def load_dataset(dataset_name="nq"):
    """Download a BEIR dataset archive and load its test split.

    The archive ``<dataset_name>.zip`` is fetched from the public BEIR
    server and unpacked under a local directory named after the dataset,
    then the ``test`` split is read with ``GenericDataLoader``.

    Args:
        dataset_name: Name of the BEIR dataset to fetch (the archive's file
            name without ``.zip``). Defaults to ``"nq"``.

    Returns:
        The ``(corpus, queries, qrels)`` tuple produced by
        ``GenericDataLoader.load(split="test")``.

    Raises:
        ValueError: If ``dataset_name`` is empty.
    """
    # Fail early with a clear message rather than requesting ".../.zip".
    if not dataset_name:
        raise ValueError("dataset_name must be a non-empty BEIR dataset name")

    # Previously the URL and output directory were hard-coded to "nq", so the
    # dataset_name argument was silently ignored.
    url = f"{_BEIR_DATASETS_URL}/{dataset_name}.zip"
    data_path = util.download_and_unzip(url, dataset_name)

    corpus, queries, qrels = GenericDataLoader(data_folder=data_path).load(split="test")
    return corpus, queries, qrels