Metadata-Version: 2.4
Name: dmx-runtime
Version: 0.1.0
Summary: DMX inference runtime — load compressed models with HuggingFace transformers
Requires-Python: >=3.10
Requires-Dist: torch>=2.0
Requires-Dist: numpy
Requires-Dist: dmx-compress>=1.2.0
Requires-Dist: transformers>=4.40
Provides-Extra: cuda
Requires-Dist: triton; extra == "cuda"
