# Python dependencies for this project.
# pip's requirements-file format expects one requirement specifier per line;
# install with: pip install -r <this file>

# Minimum versions required (lower bound only).
huggingface_hub>=0.25.2
accelerate>=0.26.0

# Pinned to an exact release.
gradio==4.19.2

# Unpinned: pip resolves the newest release compatible with the constraints above.
torch
torchvision
transformers
Pillow
qwen_vl_utils