torch
torchdiffeq
torchvision
transformers
datasets==3.6.0
tensor_parallel
numpy
pandas
einops
opt_einsum
rotary_embedding_torch
wandb
pyyaml
tqdm
zstandard

[cuda]
mamba-ssm
causal-conv1d
