# Python dependencies for this project.
# pip's requirements format takes one requirement specifier per line;
# several specifiers on a single line are rejected as an invalid requirement.
gradio==3.35.2
transformers>=4.42
accelerate>=0.33
sentencepiece
timm
einops
hydra-core
pillow
torch
deepspeed==0.14.2
# Installed straight from the Git repository. No branch, tag, or commit is
# given, so pip checks out the repository's default branch at install time.
git+https://github.com/Efficient-Large-Model/VILA.git