# Python dependencies, one requirement specifier per line as required by
# pip's requirements-file format (install with `pip install -r <this file>`).

# Pinned to exact versions.
numpy==1.24.4
Pillow==10.3.0
Requests==2.31.0
accelerate==0.30.0

# Unpinned: pip resolves whatever version is compatible at install time.
# NOTE(review): consider pinning these for reproducible installs — the
# intended versions cannot be determined from this file alone.
torch
torchvision
transformers
qwen-vl-utils