datasets==2.18.0
evaluate==0.4.1
torch==2.2.2+cu121
tqdm==4.65.0
transformers==4.39.3