{
  description = "Flake for Hopper Flash Attention kernel";

  # Single flake input: kernel-builder, fetched at the `torch-2.8` ref.
  inputs.kernel-builder.url = "github:huggingface/kernel-builder/torch-2.8";

  outputs =
    { self, kernel-builder }:
    let
      # Revision label handed to the builder: `self.shortRev` if that
      # attribute exists, otherwise `self.dirtyShortRev`, otherwise
      # `self.lastModifiedDate`.
      revision = self.shortRev or self.dirtyShortRev or self.lastModifiedDate;

      # Building with CUDA later than 12.4 fails with:
      #
      #   error: 'ptxas' died due to signal 11 (Invalid memory reference)
      #
      # So, build for CUDA 12.4 only and copy the result to all the other
      # build variants by hand (which works fine thanks to backward compat).
      cuda124Build = {
        torchVersion = "2.8";
        cudaVersion = "12.4";
        cxx11Abi = true;
        systems = [
          "x86_64-linux"
          "aarch64-linux"
        ];
        upstreamVariant = true;
      };
    in
    kernel-builder.lib.genFlakeOutputs {
      path = ./.;
      rev = revision;
      torchVersions = [ cuda124Build ];
    };
}