kernels
transformers>=4.40.0
accelerate>=0.28.0
torch==2.10
flask
sentencepiece
nvidia-ml-py

[vllm]
vllm>=0.3.0
