flashinfer

Flash Infer for arm64

  • https://arxiv.org/abs/2501.01005

git clone https://github.com/flashinfer-ai/flashinfer.git --recursive

pip install ninja

export TORCH_CUDA_ARCH_LIST="90"

cd flashinfer pip install --no-build-isolation --verbose .

python -m flashinfer.aot # Compile AOT kernels python -m pip install --no-build-isolation --verbose .