# Python package dependencies, one requirement specifier per line
# (pip requirements-file format).
# NOTE(review): presumably installed with `pip install -r <this file>` — confirm
# against the project's setup/CI instructions.

# Unconstrained entries: no version specifier, so any available release
# satisfies them.
# NOTE(review): consider adding lower bounds or pins if reproducible installs
# matter for this project.
numpy
torch
ninja
requests
pynvml
einops
click
tqdm
tabulate

# Entries with an explicit minimum version (`>=`); no upper bound is set.
packaging>=24.2
nvidia-cudnn-frontend>=1.13.0
