transformers>=4.40.0
accelerate>=0.28.0
torch
flask
sentencepiece
pynvml

[vllm]
vllm>=0.3.0
