torch>=2.10.0
cuda-python
nvidia-cutlass-dsl[cu13]==4.4.1
apache-tvm-ffi!=0.1.8,!=0.1.8.post0,<0.2,>=0.1.6
rich>=13

[dev]
pytest
