# Base requirements: every specifier listed before the first [section] header.
# Each entry sets only a minimum version (>=); nothing here is pinned or capped.
# NOTE(review): the layout (bare requirement specifiers followed by [extra]-style
# sections) looks like a setuptools-generated egg-info requires.txt rather than
# TOML - confirm. If so, this file is rewritten on every build and lasting
# changes belong in the project's setup.py / setup.cfg / pyproject.toml.
torch>=1.12.0
transformers>=4.21.0
datasets>=2.0.0
numpy>=1.21.0
pandas>=1.3.0
scipy>=1.7.0
accelerate>=0.20.0
deepspeed>=0.9.0
tensorboard>=2.8.0
wandb>=0.13.0
evaluate>=0.4.0
scikit-learn>=1.0.0
seaborn>=0.11.0
matplotlib>=3.5.0
tokenizers>=0.13.0
sentencepiece>=0.1.96
protobuf>=3.20.0
psutil>=5.8.0
pynvml>=11.4.0
tqdm>=4.64.0
click>=8.0.0
pyyaml>=6.0
jsonlines>=3.0.0
llamafactory>=0.7.0
lm_eval>=0.4.0

# Aggregate section: repeats, with identical specifiers, the ten requirements
# listed under [inference], [mamba], [megatron], [quantization] and [rwkv].
# The [dev] tooling is not part of it.
# NOTE(review): the `apex` and `text-generation-inference` entries may not
# resolve to the intended projects on the public package index - verify what
# `pip install` actually fetches for each before relying on this section.
[all]
megatron-core[dev]>=0.7.0
apex>=0.1
mamba-ssm>=1.2.0
causal-conv1d>=1.4.0
rwkv>=0.8.0
bitsandbytes>=0.41.0
auto-gptq>=0.4.0
optimum>=1.12.0
vllm>=0.2.0
text-generation-inference>=1.0.0

# Developer tooling, grouped here by role:
#   testing        - pytest, pytest-cov
#   formatting     - black, isort
#   linting/typing - flake8, mypy
#   documentation  - sphinx, sphinx-rtd-theme
# None of these entries appear in the [all] section of this file.
[dev]
pytest>=7.1.0
pytest-cov>=4.0.0
black>=22.0.0
isort>=5.10.0
flake8>=5.0.0
mypy>=0.991
sphinx>=5.0.0
sphinx-rtd-theme>=1.0.0

# Inference/serving backends; both entries are also listed under [all].
# NOTE(review): confirm that `text-generation-inference` is actually published
# under this name on the package index. The server is commonly distributed as a
# container image or source build, and its Python client may use a different
# distribution name - verify before depending on this section.
[inference]
vllm>=0.2.0
text-generation-inference>=1.0.0

# Requirements for the `mamba` section; both entries are also listed under [all].
# NOTE(review): these packages presumably build native/CUDA extensions at
# install time - confirm the toolchain expectations with the project docs.
[mamba]
mamba-ssm>=1.2.0
causal-conv1d>=1.4.0

# Requirements for the `megatron` section; both entries are also listed under [all].
# `megatron-core[dev]` additionally requests megatron-core's own `dev` extra.
# NOTE(review): the distribution named `apex` on the public package index may be
# unrelated to NVIDIA Apex, which is normally installed from its GitHub source.
# Verify what `apex>=0.1` resolves to before relying on this section.
[megatron]
megatron-core[dev]>=0.7.0
apex>=0.1

# Quantization backends; all three entries are also listed under [all].
# NOTE(review): check whether `auto-gptq` is still maintained upstream; a
# successor package may be the better dependency - confirm before updating.
[quantization]
bitsandbytes>=0.41.0
auto-gptq>=0.4.0
optimum>=1.12.0

# Single-requirement section; the same specifier is also listed under [all].
[rwkv]
rwkv>=0.8.0
